diff --git "a/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" "b/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 6.1577, "train/learning_rate": 2.5664739884393065e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 9544, "_timestamp": 1646237227, "_step": 1500, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 8.0, 7.0, 3.0, 38.0, 81.0, 20.0, 8.0, 5.0, 30160.0, 112.0, 33.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.125, -239.849609375, -229.57421875, -219.298828125, -209.0234375, -198.748046875, -188.47265625, -178.197265625, -167.921875, -157.646484375, -147.37109375, -137.095703125, -126.8203125, -116.544921875, -106.26953125, -95.994140625, -85.71875, -75.443359375, -65.16796875, -54.892578125, -44.6171875, -34.341796875, -24.06640625, -13.791015625, -3.515625, 6.759765625, 17.03515625, 27.310546875, 37.5859375, 47.861328125, 58.13671875, 68.412109375, 78.6875, 88.962890625, 99.23828125, 109.513671875, 119.7890625, 130.064453125, 140.33984375, 150.615234375, 160.890625, 171.166015625, 181.44140625, 191.716796875, 201.9921875, 212.267578125, 222.54296875, 232.818359375, 243.09375, 253.369140625, 263.64453125, 273.919921875, 284.1953125, 294.470703125, 304.74609375, 315.021484375, 325.296875, 335.572265625, 345.84765625, 356.123046875, 366.3984375, 376.673828125, 386.94921875, 397.224609375, 407.5]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 10.0, 12.0, 15.0, 13.0, 17.0, 29.0, 29.0, 45.0, 35.0, 38.0, 40.0, 41.0, 55.0, 51.0, 55.0, 57.0, 49.0, 51.0, 55.0, 50.0, 32.0, 48.0, 25.0, 31.0, 15.0, 18.0, 15.0, 9.0, 10.0, 9.0, 4.0, 3.0, 4.0, 6.0, 8.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-81.83889770507812, -79.4573974609375, -77.07589721679688, -74.69439697265625, -72.31289672851562, -69.931396484375, -67.54989624023438, -65.16839599609375, -62.78689956665039, -60.405399322509766, -58.02389907836914, -55.642398834228516, -53.260902404785156, -50.87940216064453, -48.497901916503906, -46.11640167236328, -43.734901428222656, -41.35340118408203, -38.971900939941406, -36.59040069580078, -34.208900451660156, -31.827402114868164, -29.445903778076172, -27.064403533935547, -24.682903289794922, -22.301403045654297, -19.919902801513672, -17.53840446472168, -15.156904220581055, -12.77540397644043, -10.393904685974121, -8.012405395507812, -5.630897521972656, -3.2493977546691895, -0.8678979873657227, 1.5136017799377441, 3.895101547241211, 6.276601791381836, 8.658101081848145, 11.039600372314453, 13.421100616455078, 15.802600860595703, 18.184101104736328, 20.56559944152832, 22.947099685668945, 25.32859992980957, 27.710098266601562, 30.091598510742188, 32.47309875488281, 34.85459899902344, 37.23609924316406, 39.61759948730469, 41.99909973144531, 44.38059997558594, 46.7620964050293, 49.14359664916992, 51.52509689331055, 53.90659713745117, 56.2880973815918, 58.66959762573242, 61.05109405517578, 63.432594299316406, 65.81409454345703, 68.19559478759766, 70.57709503173828]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 10.0, 4.0, 10.0, 10.0, 12.0, 18.0, 18.0, 31.0, 23.0, 24.0, 28.0, 38.0, 26.0, 31.0, 38.0, 43.0, 38.0, 41.0, 33.0, 34.0, 46.0, 39.0, 34.0, 32.0, 35.0, 23.0, 28.0, 29.0, 22.0, 21.0, 27.0, 27.0, 25.0, 16.0, 17.0, 11.0, 14.0, 9.0, 7.0, 3.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-62.31097412109375, -60.19524383544922, -58.07950973510742, -55.963775634765625, -53.848045349121094, -51.73231506347656, -49.616580963134766, -47.50084686279297, -45.38511657714844, -43.269386291503906, -41.15365219116211, -39.03791809082031, -36.92218780517578, -34.80645751953125, -32.69072341918945, -30.57499122619629, -28.459259033203125, -26.34352684020996, -24.227794647216797, -22.112062454223633, -19.99633026123047, -17.880598068237305, -15.76486587524414, -13.649133682250977, -11.533401489257812, -9.417669296264648, -7.301937103271484, -5.18620491027832, -3.0704727172851562, -0.9547405242919922, 1.1609916687011719, 3.276723861694336, 5.392448425292969, 7.508180618286133, 9.623912811279297, 11.739645004272461, 13.855377197265625, 15.971109390258789, 18.086841583251953, 20.202573776245117, 22.31830596923828, 24.434038162231445, 26.54977035522461, 28.665502548217773, 30.781234741210938, 32.89696502685547, 35.012699127197266, 37.12843322753906, 39.244163513183594, 41.359893798828125, 43.47562789916992, 45.59136199951172, 47.70709228515625, 49.82282257080078, 51.93855667114258, 54.054290771484375, 56.170021057128906, 58.28575134277344, 60.401485443115234, 62.51721954345703, 64.63294982910156, 66.7486801147461, 68.86441040039062, 70.98014831542969, 73.09587860107422]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 18.0, 16.0, 27.0, 43.0, 72.0, 87.0, 120.0, 192.0, 267.0, 359.0, 517.0, 718.0, 1065.0, 1399.0, 2046.0, 2905.0, 4144.0, 6199.0, 9128.0, 13158.0, 19021.0, 28108.0, 41056.0, 60765.0, 91054.0, 152873.0, 230445.0, 129096.0, 81039.0, 54646.0, 37007.0, 25345.0, 17256.0, 11864.0, 8051.0, 5570.0, 3833.0, 2718.0, 1878.0, 1322.0, 921.0, 643.0, 438.0, 339.0, 262.0, 144.0, 124.0, 85.0, 69.0, 39.0, 21.0, 21.0, 10.0, 5.0, 3.0, 2.0, 4.0], "bins": [-186.625, -181.03125, -175.4375, -169.84375, -164.25, -158.65625, -153.0625, -147.46875, -141.875, -136.28125, -130.6875, -125.09375, -119.5, -113.90625, -108.3125, -102.71875, -97.125, -91.53125, -85.9375, -80.34375, -74.75, -69.15625, -63.5625, -57.96875, -52.375, -46.78125, -41.1875, -35.59375, -30.0, -24.40625, -18.8125, -13.21875, -7.625, -2.03125, 3.5625, 9.15625, 14.75, 20.34375, 25.9375, 31.53125, 37.125, 42.71875, 48.3125, 53.90625, 59.5, 65.09375, 70.6875, 76.28125, 81.875, 87.46875, 93.0625, 98.65625, 104.25, 109.84375, 115.4375, 121.03125, 126.625, 132.21875, 137.8125, 143.40625, 149.0, 154.59375, 160.1875, 165.78125, 171.375]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 10.0, 4.0, 8.0, 10.0, 16.0, 8.0, 17.0, 19.0, 23.0, 20.0, 28.0, 25.0, 25.0, 36.0, 49.0, 60.0, 66.0, 89.0, 80.0, 55.0, 46.0, 38.0, 41.0, 33.0, 31.0, 16.0, 19.0, 16.0, 20.0, 13.0, 9.0, 5.0, 9.0, 7.0, 6.0, 3.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-80.8125, -78.3515625, -75.890625, -73.4296875, -70.96875, -68.5078125, -66.046875, -63.5859375, -61.125, -58.6640625, -56.203125, -53.7421875, -51.28125, -48.8203125, -46.359375, -43.8984375, -41.4375, -38.9765625, -36.515625, -34.0546875, -31.59375, -29.1328125, -26.671875, -24.2109375, -21.75, -19.2890625, -16.828125, -14.3671875, -11.90625, -9.4453125, -6.984375, -4.5234375, -2.0625, 0.3984375, 2.859375, 5.3203125, 7.78125, 10.2421875, 12.703125, 15.1640625, 17.625, 20.0859375, 22.546875, 25.0078125, 27.46875, 29.9296875, 32.390625, 34.8515625, 37.3125, 39.7734375, 42.234375, 44.6953125, 47.15625, 49.6171875, 52.078125, 54.5390625, 57.0, 59.4609375, 61.921875, 64.3828125, 66.84375, 69.3046875, 71.765625, 74.2265625, 76.6875]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 9.0, 5.0, 13.0, 17.0, 15.0, 20.0, 22.0, 25.0, 28.0, 38.0, 38.0, 49.0, 53.0, 48.0, 67.0, 74.0, 57.0, 61.0, 49.0, 49.0, 48.0, 40.0, 31.0, 21.0, 20.0, 23.0, 16.0, 9.0, 11.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.32265090942383, -51.65584182739258, -49.98903274536133, -48.32222366333008, -46.65541458129883, -44.98860549926758, -43.32179641723633, -41.65498733520508, -39.98817825317383, -38.32136917114258, -36.65456008911133, -34.98775100708008, -33.32094192504883, -31.654132843017578, -29.987323760986328, -28.320514678955078, -26.653705596923828, -24.986896514892578, -23.320087432861328, -21.653278350830078, -19.986469268798828, -18.319660186767578, -16.652851104736328, -14.986042022705078, -13.319232940673828, -11.652423858642578, -9.985614776611328, -8.318805694580078, -6.651996612548828, -4.985187530517578, -3.318378448486328, -1.6515693664550781, 0.015239715576171875, 1.6820487976074219, 3.348857879638672, 5.015666961669922, 6.682476043701172, 8.349285125732422, 10.016094207763672, 11.682903289794922, 13.349712371826172, 15.016521453857422, 16.683330535888672, 18.350139617919922, 20.016948699951172, 21.683757781982422, 23.350566864013672, 25.017375946044922, 26.684185028076172, 28.350994110107422, 30.017803192138672, 31.684612274169922, 33.35142135620117, 35.01823043823242, 36.68503952026367, 38.35184860229492, 40.01865768432617, 41.68546676635742, 43.35227584838867, 45.01908493041992, 46.68589401245117, 48.35270309448242, 50.01951217651367, 51.68632125854492, 53.35313034057617]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 4.0, 3.0, 8.0, 6.0, 12.0, 16.0, 14.0, 13.0, 19.0, 25.0, 23.0, 25.0, 22.0, 35.0, 38.0, 35.0, 33.0, 41.0, 43.0, 42.0, 41.0, 40.0, 40.0, 42.0, 42.0, 38.0, 32.0, 39.0, 29.0, 24.0, 21.0, 18.0, 19.0, 17.0, 24.0, 13.0, 18.0, 16.0, 6.0, 7.0, 5.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.65802764892578, -42.214752197265625, -40.77147674560547, -39.32820129394531, -37.88492965698242, -36.441654205322266, -34.99837875366211, -33.55510330200195, -32.1118278503418, -30.66855239868164, -29.225278854370117, -27.78200340270996, -26.338727951049805, -24.89545440673828, -23.452178955078125, -22.00890350341797, -20.565629959106445, -19.12235450744629, -17.679080963134766, -16.23580551147461, -14.792530059814453, -13.349255561828613, -11.905981063842773, -10.462705612182617, -9.019431114196777, -7.576156139373779, -6.132881164550781, -4.689606666564941, -3.2463316917419434, -1.8030567169189453, -0.35978221893310547, 1.0834932327270508, 2.5267677307128906, 3.9700427055358887, 5.413317680358887, 6.856592178344727, 8.299867630004883, 9.743142127990723, 11.186416625976562, 12.629692077636719, 14.072966575622559, 15.516241073608398, 16.959516525268555, 18.402790069580078, 19.846065521240234, 21.28934097290039, 22.732616424560547, 24.175891876220703, 25.619165420532227, 27.062440872192383, 28.505714416503906, 29.948989868164062, 31.39226531982422, 32.835540771484375, 34.27881622314453, 35.72209167480469, 37.16536331176758, 38.608638763427734, 40.05191421508789, 41.49518585205078, 42.93846130371094, 44.381736755371094, 45.82501220703125, 47.268287658691406, 48.71156311035156]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 14.0, 27.0, 38.0, 70.0, 86.0, 121.0, 197.0, 307.0, 452.0, 651.0, 1007.0, 1571.0, 2455.0, 3780.0, 5978.0, 9690.0, 15818.0, 26084.0, 44547.0, 78273.0, 149105.0, 327291.0, 740951.0, 1128057.0, 864436.0, 402763.0, 175831.0, 89503.0, 49640.0, 28953.0, 17354.0, 10657.0, 6670.0, 4156.0, 2721.0, 1752.0, 1141.0, 686.0, 482.0, 347.0, 217.0, 135.0, 87.0, 69.0, 37.0, 19.0, 22.0, 16.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-44.0625, -42.6689453125, -41.275390625, -39.8818359375, -38.48828125, -37.0947265625, -35.701171875, -34.3076171875, -32.9140625, -31.5205078125, -30.126953125, -28.7333984375, -27.33984375, -25.9462890625, -24.552734375, -23.1591796875, -21.765625, -20.3720703125, -18.978515625, -17.5849609375, -16.19140625, -14.7978515625, -13.404296875, -12.0107421875, -10.6171875, -9.2236328125, -7.830078125, -6.4365234375, -5.04296875, -3.6494140625, -2.255859375, -0.8623046875, 0.53125, 1.9248046875, 3.318359375, 4.7119140625, 6.10546875, 7.4990234375, 8.892578125, 10.2861328125, 11.6796875, 13.0732421875, 14.466796875, 15.8603515625, 17.25390625, 18.6474609375, 20.041015625, 21.4345703125, 22.828125, 24.2216796875, 25.615234375, 27.0087890625, 28.40234375, 29.7958984375, 31.189453125, 32.5830078125, 33.9765625, 35.3701171875, 36.763671875, 38.1572265625, 39.55078125, 40.9443359375, 42.337890625, 43.7314453125, 45.125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 10.0, 10.0, 12.0, 10.0, 9.0, 24.0, 18.0, 24.0, 20.0, 32.0, 23.0, 29.0, 38.0, 39.0, 32.0, 36.0, 47.0, 41.0, 43.0, 41.0, 47.0, 38.0, 45.0, 41.0, 30.0, 28.0, 30.0, 25.0, 26.0, 22.0, 22.0, 15.0, 20.0, 7.0, 13.0, 14.0, 6.0, 5.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.640625, -27.677490234375, -26.71435546875, -25.751220703125, -24.7880859375, -23.824951171875, -22.86181640625, -21.898681640625, -20.935546875, -19.972412109375, -19.00927734375, -18.046142578125, -17.0830078125, -16.119873046875, -15.15673828125, -14.193603515625, -13.23046875, -12.267333984375, -11.30419921875, -10.341064453125, -9.3779296875, -8.414794921875, -7.45166015625, -6.488525390625, -5.525390625, -4.562255859375, -3.59912109375, -2.635986328125, -1.6728515625, -0.709716796875, 0.25341796875, 1.216552734375, 2.1796875, 3.142822265625, 4.10595703125, 5.069091796875, 6.0322265625, 6.995361328125, 7.95849609375, 8.921630859375, 9.884765625, 10.847900390625, 11.81103515625, 12.774169921875, 13.7373046875, 14.700439453125, 15.66357421875, 16.626708984375, 17.58984375, 18.552978515625, 19.51611328125, 20.479248046875, 21.4423828125, 22.405517578125, 23.36865234375, 24.331787109375, 25.294921875, 26.258056640625, 27.22119140625, 28.184326171875, 29.1474609375, 30.110595703125, 31.07373046875, 32.036865234375, 33.0]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 1.0, 16.0, 16.0, 15.0, 37.0, 58.0, 105.0, 124.0, 203.0, 340.0, 480.0, 731.0, 1108.0, 1716.0, 2695.0, 4139.0, 6567.0, 10518.0, 16907.0, 27851.0, 46038.0, 77831.0, 133795.0, 234927.0, 413778.0, 724549.0, 954178.0, 653609.0, 371580.0, 210412.0, 120540.0, 70414.0, 42132.0, 25006.0, 15487.0, 9480.0, 6017.0, 3807.0, 2534.0, 1529.0, 1019.0, 706.0, 422.0, 314.0, 196.0, 138.0, 84.0, 48.0, 25.0, 24.0, 16.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-37.59375, -36.43359375, -35.2734375, -34.11328125, -32.953125, -31.79296875, -30.6328125, -29.47265625, -28.3125, -27.15234375, -25.9921875, -24.83203125, -23.671875, -22.51171875, -21.3515625, -20.19140625, -19.03125, -17.87109375, -16.7109375, -15.55078125, -14.390625, -13.23046875, -12.0703125, -10.91015625, -9.75, -8.58984375, -7.4296875, -6.26953125, -5.109375, -3.94921875, -2.7890625, -1.62890625, -0.46875, 0.69140625, 1.8515625, 3.01171875, 4.171875, 5.33203125, 6.4921875, 7.65234375, 8.8125, 9.97265625, 11.1328125, 12.29296875, 13.453125, 14.61328125, 15.7734375, 16.93359375, 18.09375, 19.25390625, 20.4140625, 21.57421875, 22.734375, 23.89453125, 25.0546875, 26.21484375, 27.375, 28.53515625, 29.6953125, 30.85546875, 32.015625, 33.17578125, 34.3359375, 35.49609375, 36.65625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 1.0, 4.0, 11.0, 9.0, 13.0, 9.0, 21.0, 15.0, 28.0, 35.0, 45.0, 42.0, 58.0, 66.0, 80.0, 95.0, 102.0, 151.0, 187.0, 229.0, 289.0, 339.0, 368.0, 320.0, 274.0, 252.0, 201.0, 165.0, 135.0, 109.0, 83.0, 55.0, 60.0, 55.0, 33.0, 28.0, 22.0, 21.0, 9.0, 13.0, 16.0, 4.0, 7.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.96875, -16.464111328125, -15.95947265625, -15.454833984375, -14.9501953125, -14.445556640625, -13.94091796875, -13.436279296875, -12.931640625, -12.427001953125, -11.92236328125, -11.417724609375, -10.9130859375, -10.408447265625, -9.90380859375, -9.399169921875, -8.89453125, -8.389892578125, -7.88525390625, -7.380615234375, -6.8759765625, -6.371337890625, -5.86669921875, -5.362060546875, -4.857421875, -4.352783203125, -3.84814453125, -3.343505859375, -2.8388671875, -2.334228515625, -1.82958984375, -1.324951171875, -0.8203125, -0.315673828125, 0.18896484375, 0.693603515625, 1.1982421875, 1.702880859375, 2.20751953125, 2.712158203125, 3.216796875, 3.721435546875, 4.22607421875, 4.730712890625, 5.2353515625, 5.739990234375, 6.24462890625, 6.749267578125, 7.25390625, 7.758544921875, 8.26318359375, 8.767822265625, 9.2724609375, 9.777099609375, 10.28173828125, 10.786376953125, 11.291015625, 11.795654296875, 12.30029296875, 12.804931640625, 13.3095703125, 13.814208984375, 14.31884765625, 14.823486328125, 15.328125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 4.0, 9.0, 5.0, 12.0, 10.0, 13.0, 13.0, 24.0, 19.0, 33.0, 25.0, 36.0, 38.0, 59.0, 59.0, 71.0, 60.0, 66.0, 57.0, 60.0, 59.0, 44.0, 31.0, 39.0, 27.0, 26.0, 24.0, 17.0, 10.0, 7.0, 5.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-45.41942596435547, -44.107601165771484, -42.795772552490234, -41.48394775390625, -40.172119140625, -38.860294342041016, -37.54846954345703, -36.23664093017578, -34.9248161315918, -33.61299133300781, -32.30116271972656, -30.989337921142578, -29.67751121520996, -28.365684509277344, -27.05385971069336, -25.742033004760742, -24.430206298828125, -23.118379592895508, -21.80655288696289, -20.494728088378906, -19.18290138244629, -17.871074676513672, -16.559249877929688, -15.24742317199707, -13.935596466064453, -12.623769760131836, -11.311944007873535, -10.000118255615234, -8.688291549682617, -7.376465320587158, -6.064639091491699, -4.752813339233398, -3.4409828186035156, -2.1291565895080566, -0.8173303604125977, 0.49449586868286133, 1.8063220977783203, 3.1181483268737793, 4.429974555969238, 5.741800308227539, 7.053627014160156, 8.365453720092773, 9.677279472351074, 10.989105224609375, 12.300931930541992, 13.61275863647461, 14.92458438873291, 16.23641014099121, 17.548236846923828, 18.860063552856445, 20.171890258789062, 21.483715057373047, 22.795541763305664, 24.10736846923828, 25.419193267822266, 26.731019973754883, 28.0428466796875, 29.354673385620117, 30.666500091552734, 31.97832489013672, 33.29015350341797, 34.60197830200195, 35.91380310058594, 37.22563171386719, 38.53745651245117]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 7.0, 14.0, 7.0, 9.0, 12.0, 12.0, 22.0, 16.0, 31.0, 40.0, 34.0, 42.0, 39.0, 34.0, 37.0, 27.0, 45.0, 63.0, 31.0, 48.0, 36.0, 45.0, 41.0, 35.0, 37.0, 32.0, 28.0, 32.0, 27.0, 22.0, 8.0, 12.0, 11.0, 12.0, 6.0, 6.0, 7.0, 6.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.09469985961914, -32.88338088989258, -31.67205810546875, -30.460739135742188, -29.249418258666992, -28.038097381591797, -26.8267765045166, -25.615455627441406, -24.404136657714844, -23.19281578063965, -21.981494903564453, -20.77017593383789, -19.558855056762695, -18.3475341796875, -17.136213302612305, -15.924893379211426, -14.713571548461914, -13.502250671386719, -12.29093074798584, -11.079609870910645, -9.868289947509766, -8.65696907043457, -7.445648193359375, -6.234328269958496, -5.023007392883301, -3.8116869926452637, -2.6003663539886475, -1.3890457153320312, -0.17772531509399414, 1.033595085144043, 2.2449159622192383, 3.456235885620117, 4.6675567626953125, 5.87887716293335, 7.090197563171387, 8.301518440246582, 9.512838363647461, 10.724159240722656, 11.935480117797852, 13.14680004119873, 14.358120918273926, 15.569441795349121, 16.78076171875, 17.992082595825195, 19.20340347290039, 20.414722442626953, 21.62604522705078, 22.837364196777344, 24.04868507385254, 25.260005950927734, 26.47132682800293, 27.682647705078125, 28.893966674804688, 30.105287551879883, 31.316608428955078, 32.52792739868164, 33.73925018310547, 34.95056915283203, 36.16189193725586, 37.37321090698242, 38.58453369140625, 39.79585266113281, 41.007171630859375, 42.2184944152832, 43.429813385009766]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 4.0, 10.0, 13.0, 12.0, 18.0, 26.0, 39.0, 69.0, 96.0, 151.0, 200.0, 320.0, 524.0, 733.0, 1204.0, 1987.0, 3173.0, 5366.0, 9466.0, 21833.0, 109397.0, 663694.0, 175058.0, 28699.0, 11010.0, 5870.0, 3513.0, 2280.0, 1375.0, 872.0, 531.0, 324.0, 225.0, 137.0, 92.0, 74.0, 41.0, 33.0, 21.0, 15.0, 11.0, 12.0, 8.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.1875, -58.283203125, -56.37890625, -54.474609375, -52.5703125, -50.666015625, -48.76171875, -46.857421875, -44.953125, -43.048828125, -41.14453125, -39.240234375, -37.3359375, -35.431640625, -33.52734375, -31.623046875, -29.71875, -27.814453125, -25.91015625, -24.005859375, -22.1015625, -20.197265625, -18.29296875, -16.388671875, -14.484375, -12.580078125, -10.67578125, -8.771484375, -6.8671875, -4.962890625, -3.05859375, -1.154296875, 0.75, 2.654296875, 4.55859375, 6.462890625, 8.3671875, 10.271484375, 12.17578125, 14.080078125, 15.984375, 17.888671875, 19.79296875, 21.697265625, 23.6015625, 25.505859375, 27.41015625, 29.314453125, 31.21875, 33.123046875, 35.02734375, 36.931640625, 38.8359375, 40.740234375, 42.64453125, 44.548828125, 46.453125, 48.357421875, 50.26171875, 52.166015625, 54.0703125, 55.974609375, 57.87890625, 59.783203125, 61.6875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 4.0, 6.0, 8.0, 11.0, 8.0, 9.0, 22.0, 16.0, 22.0, 20.0, 26.0, 44.0, 46.0, 34.0, 32.0, 37.0, 39.0, 35.0, 47.0, 40.0, 37.0, 44.0, 39.0, 42.0, 43.0, 33.0, 26.0, 34.0, 25.0, 32.0, 23.0, 24.0, 11.0, 8.0, 10.0, 14.0, 11.0, 3.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.484375, -30.349365234375, -29.21435546875, -28.079345703125, -26.9443359375, -25.809326171875, -24.67431640625, -23.539306640625, -22.404296875, -21.269287109375, -20.13427734375, -18.999267578125, -17.8642578125, -16.729248046875, -15.59423828125, -14.459228515625, -13.32421875, -12.189208984375, -11.05419921875, -9.919189453125, -8.7841796875, -7.649169921875, -6.51416015625, -5.379150390625, -4.244140625, -3.109130859375, -1.97412109375, -0.839111328125, 0.2958984375, 1.430908203125, 2.56591796875, 3.700927734375, 4.8359375, 5.970947265625, 7.10595703125, 8.240966796875, 9.3759765625, 10.510986328125, 11.64599609375, 12.781005859375, 13.916015625, 15.051025390625, 16.18603515625, 17.321044921875, 18.4560546875, 19.591064453125, 20.72607421875, 21.861083984375, 22.99609375, 24.131103515625, 25.26611328125, 26.401123046875, 27.5361328125, 28.671142578125, 29.80615234375, 30.941162109375, 32.076171875, 33.211181640625, 34.34619140625, 35.481201171875, 36.6162109375, 37.751220703125, 38.88623046875, 40.021240234375, 41.15625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 14.0, 16.0, 13.0, 31.0, 28.0, 44.0, 58.0, 97.0, 124.0, 164.0, 275.0, 363.0, 583.0, 778.0, 1410.0, 2262.0, 3761.0, 6932.0, 16835.0, 90410.0, 783276.0, 105498.0, 17751.0, 7520.0, 3953.0, 2229.0, 1317.0, 893.0, 605.0, 400.0, 273.0, 212.0, 109.0, 82.0, 60.0, 53.0, 37.0, 27.0, 13.0, 10.0, 6.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.0625, -45.46875, -43.875, -42.28125, -40.6875, -39.09375, -37.5, -35.90625, -34.3125, -32.71875, -31.125, -29.53125, -27.9375, -26.34375, -24.75, -23.15625, -21.5625, -19.96875, -18.375, -16.78125, -15.1875, -13.59375, -12.0, -10.40625, -8.8125, -7.21875, -5.625, -4.03125, -2.4375, -0.84375, 0.75, 2.34375, 3.9375, 5.53125, 7.125, 8.71875, 10.3125, 11.90625, 13.5, 15.09375, 16.6875, 18.28125, 19.875, 21.46875, 23.0625, 24.65625, 26.25, 27.84375, 29.4375, 31.03125, 32.625, 34.21875, 35.8125, 37.40625, 39.0, 40.59375, 42.1875, 43.78125, 45.375, 46.96875, 48.5625, 50.15625, 51.75, 53.34375, 54.9375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 4.0, 8.0, 8.0, 12.0, 4.0, 14.0, 18.0, 15.0, 22.0, 24.0, 18.0, 25.0, 33.0, 37.0, 27.0, 39.0, 38.0, 31.0, 32.0, 32.0, 36.0, 34.0, 31.0, 42.0, 30.0, 41.0, 29.0, 34.0, 28.0, 32.0, 22.0, 34.0, 23.0, 16.0, 19.0, 23.0, 16.0, 10.0, 12.0, 6.0, 6.0, 8.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-23.9375, -23.165771484375, -22.39404296875, -21.622314453125, -20.8505859375, -20.078857421875, -19.30712890625, -18.535400390625, -17.763671875, -16.991943359375, -16.22021484375, -15.448486328125, -14.6767578125, -13.905029296875, -13.13330078125, -12.361572265625, -11.58984375, -10.818115234375, -10.04638671875, -9.274658203125, -8.5029296875, -7.731201171875, -6.95947265625, -6.187744140625, -5.416015625, -4.644287109375, -3.87255859375, -3.100830078125, -2.3291015625, -1.557373046875, -0.78564453125, -0.013916015625, 0.7578125, 1.529541015625, 2.30126953125, 3.072998046875, 3.8447265625, 4.616455078125, 5.38818359375, 6.159912109375, 6.931640625, 7.703369140625, 8.47509765625, 9.246826171875, 10.0185546875, 10.790283203125, 11.56201171875, 12.333740234375, 13.10546875, 13.877197265625, 14.64892578125, 15.420654296875, 16.1923828125, 16.964111328125, 17.73583984375, 18.507568359375, 19.279296875, 20.051025390625, 20.82275390625, 21.594482421875, 22.3662109375, 23.137939453125, 23.90966796875, 24.681396484375, 25.453125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 8.0, 6.0, 16.0, 21.0, 18.0, 43.0, 47.0, 79.0, 110.0, 190.0, 279.0, 466.0, 774.0, 1457.0, 2941.0, 8648.0, 102788.0, 907697.0, 14832.0, 3899.0, 1766.0, 962.0, 543.0, 342.0, 206.0, 140.0, 101.0, 49.0, 36.0, 26.0, 14.0, 18.0, 10.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.90625, -57.85205078125, -55.7978515625, -53.74365234375, -51.689453125, -49.63525390625, -47.5810546875, -45.52685546875, -43.47265625, -41.41845703125, -39.3642578125, -37.31005859375, -35.255859375, -33.20166015625, -31.1474609375, -29.09326171875, -27.0390625, -24.98486328125, -22.9306640625, -20.87646484375, -18.822265625, -16.76806640625, -14.7138671875, -12.65966796875, -10.60546875, -8.55126953125, -6.4970703125, -4.44287109375, -2.388671875, -0.33447265625, 1.7197265625, 3.77392578125, 5.828125, 7.88232421875, 9.9365234375, 11.99072265625, 14.044921875, 16.09912109375, 18.1533203125, 20.20751953125, 22.26171875, 24.31591796875, 26.3701171875, 28.42431640625, 30.478515625, 32.53271484375, 34.5869140625, 36.64111328125, 38.6953125, 40.74951171875, 42.8037109375, 44.85791015625, 46.912109375, 48.96630859375, 51.0205078125, 53.07470703125, 55.12890625, 57.18310546875, 59.2373046875, 61.29150390625, 63.345703125, 65.39990234375, 67.4541015625, 69.50830078125, 71.5625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 13.0, 24.0, 22.0, 37.0, 65.0, 350.0, 331.0, 61.0, 27.0, 17.0, 8.0, 11.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023250579833984375, -0.002244889736175537, -0.0021647214889526367, -0.0020845532417297363, -0.002004384994506836, -0.0019242167472839355, -0.0018440485000610352, -0.0017638802528381348, -0.0016837120056152344, -0.001603543758392334, -0.0015233755111694336, -0.0014432072639465332, -0.0013630390167236328, -0.0012828707695007324, -0.001202702522277832, -0.0011225342750549316, -0.0010423660278320312, -0.0009621977806091309, -0.0008820295333862305, -0.0008018612861633301, -0.0007216930389404297, -0.0006415247917175293, -0.0005613565444946289, -0.0004811882972717285, -0.0004010200500488281, -0.00032085180282592773, -0.00024068355560302734, -0.00016051530838012695, -8.034706115722656e-05, -1.7881393432617188e-07, 7.998943328857422e-05, 0.0001601576805114746, 0.000240325927734375, 0.0003204941749572754, 0.0004006624221801758, 0.00048083066940307617, 0.0005609989166259766, 0.000641167163848877, 0.0007213354110717773, 0.0008015036582946777, 0.0008816719055175781, 0.0009618401527404785, 0.001042008399963379, 0.0011221766471862793, 0.0012023448944091797, 0.00128251314163208, 0.0013626813888549805, 0.0014428496360778809, 0.0015230178833007812, 0.0016031861305236816, 0.001683354377746582, 0.0017635226249694824, 0.0018436908721923828, 0.0019238591194152832, 0.0020040273666381836, 0.002084195613861084, 0.0021643638610839844, 0.0022445321083068848, 0.002324700355529785, 0.0024048686027526855, 0.002485036849975586, 0.0025652050971984863, 0.0026453733444213867, 0.002725541591644287, 0.0028057098388671875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 20.0, 25.0, 20.0, 47.0, 55.0, 63.0, 108.0, 132.0, 150.0, 221.0, 294.0, 422.0, 587.0, 907.0, 1373.0, 2036.0, 3665.0, 8903.0, 31338.0, 246393.0, 683327.0, 44964.0, 11774.0, 4488.0, 2399.0, 1494.0, 999.0, 689.0, 420.0, 307.0, 242.0, 167.0, 132.0, 102.0, 69.0, 55.0, 57.0, 28.0, 23.0, 10.0, 13.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.578125, -27.6884765625, -26.798828125, -25.9091796875, -25.01953125, -24.1298828125, -23.240234375, -22.3505859375, -21.4609375, -20.5712890625, -19.681640625, -18.7919921875, -17.90234375, -17.0126953125, -16.123046875, -15.2333984375, -14.34375, -13.4541015625, -12.564453125, -11.6748046875, -10.78515625, -9.8955078125, -9.005859375, -8.1162109375, -7.2265625, -6.3369140625, -5.447265625, -4.5576171875, -3.66796875, -2.7783203125, -1.888671875, -0.9990234375, -0.109375, 0.7802734375, 1.669921875, 2.5595703125, 3.44921875, 4.3388671875, 5.228515625, 6.1181640625, 7.0078125, 7.8974609375, 8.787109375, 9.6767578125, 10.56640625, 11.4560546875, 12.345703125, 13.2353515625, 14.125, 15.0146484375, 15.904296875, 16.7939453125, 17.68359375, 18.5732421875, 19.462890625, 20.3525390625, 21.2421875, 22.1318359375, 23.021484375, 23.9111328125, 24.80078125, 25.6904296875, 26.580078125, 27.4697265625, 28.359375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 12.0, 34.0, 43.0, 60.0, 102.0, 475.0, 119.0, 64.0, 29.0, 20.0, 13.0, 4.0, 4.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5859375, -10.2603759765625, -9.934814453125, -9.6092529296875, -9.28369140625, -8.9581298828125, -8.632568359375, -8.3070068359375, -7.9814453125, -7.6558837890625, -7.330322265625, -7.0047607421875, -6.67919921875, -6.3536376953125, -6.028076171875, -5.7025146484375, -5.376953125, -5.0513916015625, -4.725830078125, -4.4002685546875, -4.07470703125, -3.7491455078125, -3.423583984375, -3.0980224609375, -2.7724609375, -2.4468994140625, -2.121337890625, -1.7957763671875, -1.47021484375, -1.1446533203125, -0.819091796875, -0.4935302734375, -0.16796875, 0.1575927734375, 0.483154296875, 0.8087158203125, 1.13427734375, 1.4598388671875, 1.785400390625, 2.1109619140625, 2.4365234375, 2.7620849609375, 3.087646484375, 3.4132080078125, 3.73876953125, 4.0643310546875, 4.389892578125, 4.7154541015625, 5.041015625, 5.3665771484375, 5.692138671875, 6.0177001953125, 6.34326171875, 6.6688232421875, 6.994384765625, 7.3199462890625, 7.6455078125, 7.9710693359375, 8.296630859375, 8.6221923828125, 8.94775390625, 9.2733154296875, 9.598876953125, 9.9244384765625, 10.25]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 3.0, 5.0, 7.0, 3.0, 9.0, 9.0, 16.0, 7.0, 20.0, 19.0, 17.0, 24.0, 39.0, 49.0, 55.0, 46.0, 56.0, 63.0, 56.0, 55.0, 60.0, 62.0, 55.0, 41.0, 41.0, 34.0, 22.0, 20.0, 25.0, 18.0, 10.0, 7.0, 9.0, 8.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.69671630859375, -36.48967742919922, -35.28263473510742, -34.07559585571289, -32.868553161621094, -31.661514282226562, -30.45447540283203, -29.247434616088867, -28.040393829345703, -26.83335304260254, -25.626312255859375, -24.419273376464844, -23.21223258972168, -22.005191802978516, -20.798152923583984, -19.59111213684082, -18.384071350097656, -17.177030563354492, -15.969990730285645, -14.762950897216797, -13.555910110473633, -12.348869323730469, -11.141829490661621, -9.934789657592773, -8.72774887084961, -7.5207085609436035, -6.313668251037598, -5.106627941131592, -3.899587631225586, -2.69254732131958, -1.4855070114135742, -0.27846717834472656, 0.9285697937011719, 2.1356101036071777, 3.3426504135131836, 4.5496907234191895, 5.756731033325195, 6.963771343231201, 8.170811653137207, 9.377851486206055, 10.584892272949219, 11.791933059692383, 12.99897289276123, 14.206012725830078, 15.413053512573242, 16.620094299316406, 17.827133178710938, 19.0341739654541, 20.241214752197266, 21.44825553894043, 22.655296325683594, 23.862335205078125, 25.06937599182129, 26.276416778564453, 27.483455657958984, 28.69049644470215, 29.897537231445312, 31.104578018188477, 32.31161880493164, 33.51865768432617, 34.72570037841797, 35.9327392578125, 37.13977813720703, 38.34681701660156, 39.55385971069336]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 11.0, 7.0, 8.0, 9.0, 17.0, 14.0, 15.0, 24.0, 35.0, 37.0, 36.0, 27.0, 39.0, 37.0, 41.0, 41.0, 39.0, 45.0, 50.0, 38.0, 41.0, 45.0, 33.0, 33.0, 41.0, 31.0, 35.0, 26.0, 27.0, 22.0, 13.0, 12.0, 7.0, 13.0, 9.0, 6.0, 6.0, 6.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.781715393066406, -31.619911193847656, -30.458106994628906, -29.296300888061523, -28.134496688842773, -26.972692489624023, -25.81088638305664, -24.64908218383789, -23.48727798461914, -22.32547378540039, -21.16366958618164, -20.001863479614258, -18.840059280395508, -17.678255081176758, -16.516448974609375, -15.354644775390625, -14.192840576171875, -13.031036376953125, -11.869231224060059, -10.707426071166992, -9.545621871948242, -8.383817672729492, -7.222012519836426, -6.060207366943359, -4.898403167724609, -3.736598491668701, -2.574793815612793, -1.4129891395568848, -0.25118446350097656, 0.9106202125549316, 2.07242488861084, 3.2342300415039062, 4.396034240722656, 5.5578389167785645, 6.719643592834473, 7.881448268890381, 9.043252944946289, 10.205057144165039, 11.366862297058105, 12.528667449951172, 13.690471649169922, 14.852275848388672, 16.014080047607422, 17.175886154174805, 18.337690353393555, 19.499494552612305, 20.661300659179688, 21.823104858398438, 22.984909057617188, 24.146713256835938, 25.308517456054688, 26.47032356262207, 27.63212776184082, 28.79393196105957, 29.955738067626953, 31.117542266845703, 32.27934646606445, 33.4411506652832, 34.60295486450195, 35.7647590637207, 36.92656707763672, 38.08837127685547, 39.25017547607422, 40.41197967529297, 41.57378387451172]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 4.0, 5.0, 10.0, 17.0, 22.0, 24.0, 34.0, 55.0, 119.0, 151.0, 200.0, 306.0, 466.0, 662.0, 1025.0, 1577.0, 2560.0, 3966.0, 6678.0, 10828.0, 18236.0, 30767.0, 52250.0, 87150.0, 134164.0, 175579.0, 173134.0, 133311.0, 86182.0, 51957.0, 30494.0, 17896.0, 10843.0, 6627.0, 3932.0, 2536.0, 1658.0, 1043.0, 627.0, 487.0, 321.0, 218.0, 126.0, 89.0, 65.0, 49.0, 37.0, 23.0, 28.0, 11.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.4375, -35.1806640625, -33.923828125, -32.6669921875, -31.41015625, -30.1533203125, -28.896484375, -27.6396484375, -26.3828125, -25.1259765625, -23.869140625, -22.6123046875, -21.35546875, -20.0986328125, -18.841796875, -17.5849609375, -16.328125, -15.0712890625, -13.814453125, -12.5576171875, -11.30078125, -10.0439453125, -8.787109375, -7.5302734375, -6.2734375, -5.0166015625, -3.759765625, -2.5029296875, -1.24609375, 0.0107421875, 1.267578125, 2.5244140625, 3.78125, 5.0380859375, 6.294921875, 7.5517578125, 8.80859375, 10.0654296875, 11.322265625, 12.5791015625, 13.8359375, 15.0927734375, 16.349609375, 17.6064453125, 18.86328125, 20.1201171875, 21.376953125, 22.6337890625, 23.890625, 25.1474609375, 26.404296875, 27.6611328125, 28.91796875, 30.1748046875, 31.431640625, 32.6884765625, 33.9453125, 35.2021484375, 36.458984375, 37.7158203125, 38.97265625, 40.2294921875, 41.486328125, 42.7431640625, 44.0]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 2.0, 9.0, 9.0, 19.0, 11.0, 15.0, 23.0, 29.0, 27.0, 26.0, 28.0, 38.0, 38.0, 43.0, 38.0, 39.0, 47.0, 46.0, 38.0, 42.0, 46.0, 39.0, 32.0, 41.0, 26.0, 36.0, 30.0, 29.0, 26.0, 13.0, 21.0, 10.0, 9.0, 12.0, 12.0, 7.0, 5.0, 6.0, 5.0, 1.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.125, -27.1220703125, -26.119140625, -25.1162109375, -24.11328125, -23.1103515625, -22.107421875, -21.1044921875, -20.1015625, -19.0986328125, -18.095703125, -17.0927734375, -16.08984375, -15.0869140625, -14.083984375, -13.0810546875, -12.078125, -11.0751953125, -10.072265625, -9.0693359375, -8.06640625, -7.0634765625, -6.060546875, -5.0576171875, -4.0546875, -3.0517578125, -2.048828125, -1.0458984375, -0.04296875, 0.9599609375, 1.962890625, 2.9658203125, 3.96875, 4.9716796875, 5.974609375, 6.9775390625, 7.98046875, 8.9833984375, 9.986328125, 10.9892578125, 11.9921875, 12.9951171875, 13.998046875, 15.0009765625, 16.00390625, 17.0068359375, 18.009765625, 19.0126953125, 20.015625, 21.0185546875, 22.021484375, 23.0244140625, 24.02734375, 25.0302734375, 26.033203125, 27.0361328125, 28.0390625, 29.0419921875, 30.044921875, 31.0478515625, 32.05078125, 33.0537109375, 34.056640625, 35.0595703125, 36.0625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 10.0, 18.0, 23.0, 38.0, 66.0, 76.0, 125.0, 179.0, 249.0, 390.0, 604.0, 924.0, 1388.0, 2185.0, 3386.0, 5350.0, 8812.0, 14075.0, 22990.0, 38525.0, 64481.0, 103849.0, 150990.0, 177233.0, 158311.0, 113072.0, 70949.0, 42919.0, 25742.0, 15472.0, 9405.0, 6040.0, 3793.0, 2383.0, 1496.0, 1041.0, 633.0, 445.0, 260.0, 205.0, 122.0, 102.0, 62.0, 39.0, 38.0, 20.0, 13.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-37.0, -35.75, -34.5, -33.25, -32.0, -30.75, -29.5, -28.25, -27.0, -25.75, -24.5, -23.25, -22.0, -20.75, -19.5, -18.25, -17.0, -15.75, -14.5, -13.25, -12.0, -10.75, -9.5, -8.25, -7.0, -5.75, -4.5, -3.25, -2.0, -0.75, 0.5, 1.75, 3.0, 4.25, 5.5, 6.75, 8.0, 9.25, 10.5, 11.75, 13.0, 14.25, 15.5, 16.75, 18.0, 19.25, 20.5, 21.75, 23.0, 24.25, 25.5, 26.75, 28.0, 29.25, 30.5, 31.75, 33.0, 34.25, 35.5, 36.75, 38.0, 39.25, 40.5, 41.75, 43.0]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 12.0, 9.0, 11.0, 16.0, 12.0, 21.0, 16.0, 30.0, 27.0, 25.0, 33.0, 29.0, 48.0, 43.0, 38.0, 57.0, 39.0, 37.0, 45.0, 55.0, 43.0, 43.0, 37.0, 33.0, 38.0, 23.0, 24.0, 28.0, 24.0, 21.0, 22.0, 14.0, 11.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.5, -26.746826171875, -25.99365234375, -25.240478515625, -24.4873046875, -23.734130859375, -22.98095703125, -22.227783203125, -21.474609375, -20.721435546875, -19.96826171875, -19.215087890625, -18.4619140625, -17.708740234375, -16.95556640625, -16.202392578125, -15.44921875, -14.696044921875, -13.94287109375, -13.189697265625, -12.4365234375, -11.683349609375, -10.93017578125, -10.177001953125, -9.423828125, -8.670654296875, -7.91748046875, -7.164306640625, -6.4111328125, -5.657958984375, -4.90478515625, -4.151611328125, -3.3984375, -2.645263671875, -1.89208984375, -1.138916015625, -0.3857421875, 0.367431640625, 1.12060546875, 1.873779296875, 2.626953125, 3.380126953125, 4.13330078125, 4.886474609375, 5.6396484375, 6.392822265625, 7.14599609375, 7.899169921875, 8.65234375, 9.405517578125, 10.15869140625, 10.911865234375, 11.6650390625, 12.418212890625, 13.17138671875, 13.924560546875, 14.677734375, 15.430908203125, 16.18408203125, 16.937255859375, 17.6904296875, 18.443603515625, 19.19677734375, 19.949951171875, 20.703125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 9.0, 15.0, 24.0, 45.0, 41.0, 73.0, 115.0, 192.0, 307.0, 429.0, 774.0, 1258.0, 2087.0, 3497.0, 6020.0, 10921.0, 19956.0, 36266.0, 67031.0, 120059.0, 186781.0, 213850.0, 162279.0, 97634.0, 53060.0, 28751.0, 15814.0, 8854.0, 5046.0, 2845.0, 1748.0, 1036.0, 628.0, 413.0, 254.0, 164.0, 84.0, 62.0, 49.0, 33.0, 22.0, 15.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4765625, -9.1639404296875, -8.851318359375, -8.5386962890625, -8.22607421875, -7.9134521484375, -7.600830078125, -7.2882080078125, -6.9755859375, -6.6629638671875, -6.350341796875, -6.0377197265625, -5.72509765625, -5.4124755859375, -5.099853515625, -4.7872314453125, -4.474609375, -4.1619873046875, -3.849365234375, -3.5367431640625, -3.22412109375, -2.9114990234375, -2.598876953125, -2.2862548828125, -1.9736328125, -1.6610107421875, -1.348388671875, -1.0357666015625, -0.72314453125, -0.4105224609375, -0.097900390625, 0.2147216796875, 0.52734375, 0.8399658203125, 1.152587890625, 1.4652099609375, 1.77783203125, 2.0904541015625, 2.403076171875, 2.7156982421875, 3.0283203125, 3.3409423828125, 3.653564453125, 3.9661865234375, 4.27880859375, 4.5914306640625, 4.904052734375, 5.2166748046875, 5.529296875, 5.8419189453125, 6.154541015625, 6.4671630859375, 6.77978515625, 7.0924072265625, 7.405029296875, 7.7176513671875, 8.0302734375, 8.3428955078125, 8.655517578125, 8.9681396484375, 9.28076171875, 9.5933837890625, 9.906005859375, 10.2186279296875, 10.53125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 9.0, 4.0, 6.0, 9.0, 12.0, 7.0, 20.0, 32.0, 28.0, 24.0, 44.0, 35.0, 66.0, 60.0, 57.0, 58.0, 63.0, 76.0, 75.0, 50.0, 52.0, 53.0, 32.0, 30.0, 17.0, 24.0, 18.0, 11.0, 14.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008258819580078125, -0.0008001178503036499, -0.0007743537425994873, -0.0007485896348953247, -0.0007228255271911621, -0.0006970614194869995, -0.0006712973117828369, -0.0006455332040786743, -0.0006197690963745117, -0.0005940049886703491, -0.0005682408809661865, -0.0005424767732620239, -0.0005167126655578613, -0.0004909485578536987, -0.00046518445014953613, -0.00043942034244537354, -0.00041365623474121094, -0.00038789212703704834, -0.00036212801933288574, -0.00033636391162872314, -0.00031059980392456055, -0.00028483569622039795, -0.00025907158851623535, -0.00023330748081207275, -0.00020754337310791016, -0.00018177926540374756, -0.00015601515769958496, -0.00013025104999542236, -0.00010448694229125977, -7.872283458709717e-05, -5.295872688293457e-05, -2.7194619178771973e-05, -1.430511474609375e-06, 2.4333596229553223e-05, 5.009770393371582e-05, 7.586181163787842e-05, 0.00010162591934204102, 0.0001273900270462036, 0.0001531541347503662, 0.0001789182424545288, 0.0002046823501586914, 0.000230446457862854, 0.0002562105655670166, 0.0002819746732711792, 0.0003077387809753418, 0.0003335028886795044, 0.000359266996383667, 0.0003850311040878296, 0.0004107952117919922, 0.0004365593194961548, 0.0004623234272003174, 0.00048808753490448, 0.0005138516426086426, 0.0005396157503128052, 0.0005653798580169678, 0.0005911439657211304, 0.000616908073425293, 0.0006426721811294556, 0.0006684362888336182, 0.0006942003965377808, 0.0007199645042419434, 0.000745728611946106, 0.0007714927196502686, 0.0007972568273544312, 0.0008230209350585938]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 7.0, 9.0, 20.0, 37.0, 43.0, 83.0, 99.0, 201.0, 271.0, 430.0, 692.0, 1122.0, 1883.0, 2875.0, 4795.0, 8087.0, 13724.0, 23847.0, 40825.0, 68346.0, 111612.0, 160656.0, 183811.0, 157197.0, 107084.0, 66103.0, 38802.0, 22748.0, 13284.0, 7856.0, 4646.0, 2727.0, 1709.0, 1039.0, 745.0, 404.0, 267.0, 153.0, 110.0, 68.0, 53.0, 40.0, 15.0, 14.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.171875, -7.912109375, -7.65234375, -7.392578125, -7.1328125, -6.873046875, -6.61328125, -6.353515625, -6.09375, -5.833984375, -5.57421875, -5.314453125, -5.0546875, -4.794921875, -4.53515625, -4.275390625, -4.015625, -3.755859375, -3.49609375, -3.236328125, -2.9765625, -2.716796875, -2.45703125, -2.197265625, -1.9375, -1.677734375, -1.41796875, -1.158203125, -0.8984375, -0.638671875, -0.37890625, -0.119140625, 0.140625, 0.400390625, 0.66015625, 0.919921875, 1.1796875, 1.439453125, 1.69921875, 1.958984375, 2.21875, 2.478515625, 2.73828125, 2.998046875, 3.2578125, 3.517578125, 3.77734375, 4.037109375, 4.296875, 4.556640625, 4.81640625, 5.076171875, 5.3359375, 5.595703125, 5.85546875, 6.115234375, 6.375, 6.634765625, 6.89453125, 7.154296875, 7.4140625, 7.673828125, 7.93359375, 8.193359375, 8.453125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 9.0, 1.0, 11.0, 18.0, 13.0, 14.0, 26.0, 22.0, 22.0, 29.0, 31.0, 31.0, 38.0, 35.0, 39.0, 46.0, 57.0, 45.0, 57.0, 40.0, 49.0, 45.0, 44.0, 34.0, 43.0, 35.0, 25.0, 21.0, 16.0, 16.0, 16.0, 14.0, 6.0, 8.0, 5.0, 13.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-3.4296875, -3.328765869140625, -3.22784423828125, -3.126922607421875, -3.0260009765625, -2.925079345703125, -2.82415771484375, -2.723236083984375, -2.622314453125, -2.521392822265625, -2.42047119140625, -2.319549560546875, -2.2186279296875, -2.117706298828125, -2.01678466796875, -1.915863037109375, -1.81494140625, -1.714019775390625, -1.61309814453125, -1.512176513671875, -1.4112548828125, -1.310333251953125, -1.20941162109375, -1.108489990234375, -1.007568359375, -0.906646728515625, -0.80572509765625, -0.704803466796875, -0.6038818359375, -0.502960205078125, -0.40203857421875, -0.301116943359375, -0.2001953125, -0.099273681640625, 0.00164794921875, 0.102569580078125, 0.2034912109375, 0.304412841796875, 0.40533447265625, 0.506256103515625, 0.607177734375, 0.708099365234375, 0.80902099609375, 0.909942626953125, 1.0108642578125, 1.111785888671875, 1.21270751953125, 1.313629150390625, 1.41455078125, 1.515472412109375, 1.61639404296875, 1.717315673828125, 1.8182373046875, 1.919158935546875, 2.02008056640625, 2.121002197265625, 2.221923828125, 2.322845458984375, 2.42376708984375, 2.524688720703125, 2.6256103515625, 2.726531982421875, 2.82745361328125, 2.928375244140625, 3.029296875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 0.0, 8.0, 9.0, 11.0, 12.0, 11.0, 18.0, 12.0, 24.0, 30.0, 32.0, 36.0, 54.0, 60.0, 58.0, 71.0, 45.0, 71.0, 61.0, 49.0, 40.0, 55.0, 37.0, 30.0, 30.0, 31.0, 20.0, 16.0, 14.0, 11.0, 9.0, 6.0, 7.0, 6.0, 6.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.45931625366211, -36.3232421875, -35.187171936035156, -34.05110168457031, -32.9150276184082, -31.778955459594727, -30.64288330078125, -29.506811141967773, -28.370738983154297, -27.23466682434082, -26.098594665527344, -24.962522506713867, -23.82645034790039, -22.690378189086914, -21.554306030273438, -20.41823387145996, -19.282161712646484, -18.146089553833008, -17.01001739501953, -15.873945236206055, -14.737873077392578, -13.601800918579102, -12.465728759765625, -11.329656600952148, -10.193584442138672, -9.057512283325195, -7.921440124511719, -6.785367965698242, -5.649295806884766, -4.513223648071289, -3.3771514892578125, -2.241079330444336, -1.1050033569335938, 0.031068801879882812, 1.1671409606933594, 2.303213119506836, 3.4392852783203125, 4.575357437133789, 5.711429595947266, 6.847501754760742, 7.983573913574219, 9.119646072387695, 10.255718231201172, 11.391790390014648, 12.527862548828125, 13.663934707641602, 14.800006866455078, 15.936079025268555, 17.07215118408203, 18.208223342895508, 19.344295501708984, 20.48036766052246, 21.616439819335938, 22.752511978149414, 23.88858413696289, 25.024656295776367, 26.160728454589844, 27.29680061340332, 28.432872772216797, 29.568944931030273, 30.70501708984375, 31.841089248657227, 32.9771614074707, 34.11323547363281, 35.249305725097656]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 6.0, 15.0, 19.0, 18.0, 15.0, 27.0, 46.0, 33.0, 47.0, 42.0, 37.0, 43.0, 50.0, 37.0, 33.0, 50.0, 50.0, 42.0, 32.0, 45.0, 41.0, 48.0, 39.0, 24.0, 21.0, 20.0, 25.0, 11.0, 14.0, 11.0, 11.0, 13.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.975374221801758, -30.690818786621094, -29.406261444091797, -28.121706008911133, -26.83715057373047, -25.552593231201172, -24.268037796020508, -22.983482360839844, -21.698925018310547, -20.414369583129883, -19.129812240600586, -17.845256805419922, -16.560701370239258, -15.276144981384277, -13.991588592529297, -12.707033157348633, -11.422477722167969, -10.137921333312988, -8.853365898132324, -7.568809509277344, -6.2842535972595215, -4.999697685241699, -3.7151412963867188, -2.4305858612060547, -1.1460294723510742, 0.1385265588760376, 1.4230825901031494, 2.707638740539551, 3.992194652557373, 5.276750564575195, 6.561306953430176, 7.84586238861084, 9.130416870117188, 10.414973258972168, 11.699528694152832, 12.984085083007812, 14.268640518188477, 15.553196907043457, 16.837753295898438, 18.1223087310791, 19.406864166259766, 20.69141960144043, 21.975976943969727, 23.26053237915039, 24.545087814331055, 25.82964324951172, 27.114200592041016, 28.39875602722168, 29.683313369750977, 30.96786880493164, 32.25242614746094, 33.53697967529297, 34.821537017822266, 36.10609436035156, 37.390647888183594, 38.67520523071289, 39.95976257324219, 41.244319915771484, 42.528873443603516, 43.81343078613281, 45.09798812866211, 46.38254165649414, 47.66709899902344, 48.95165252685547, 50.236209869384766]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 12.0, 9.0, 19.0, 41.0, 54.0, 105.0, 139.0, 227.0, 335.0, 571.0, 932.0, 1642.0, 2618.0, 4377.0, 7678.0, 13334.0, 23921.0, 42728.0, 78991.0, 151710.0, 305273.0, 612788.0, 969583.0, 909666.0, 523559.0, 256087.0, 129163.0, 68252.0, 37773.0, 21398.0, 12260.0, 7314.0, 4295.0, 2783.0, 1644.0, 1046.0, 670.0, 416.0, 320.0, 191.0, 139.0, 91.0, 49.0, 26.0, 15.0, 19.0, 6.0, 5.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.859375, -28.860107421875, -27.86083984375, -26.861572265625, -25.8623046875, -24.863037109375, -23.86376953125, -22.864501953125, -21.865234375, -20.865966796875, -19.86669921875, -18.867431640625, -17.8681640625, -16.868896484375, -15.86962890625, -14.870361328125, -13.87109375, -12.871826171875, -11.87255859375, -10.873291015625, -9.8740234375, -8.874755859375, -7.87548828125, -6.876220703125, -5.876953125, -4.877685546875, -3.87841796875, -2.879150390625, -1.8798828125, -0.880615234375, 0.11865234375, 1.117919921875, 2.1171875, 3.116455078125, 4.11572265625, 5.114990234375, 6.1142578125, 7.113525390625, 8.11279296875, 9.112060546875, 10.111328125, 11.110595703125, 12.10986328125, 13.109130859375, 14.1083984375, 15.107666015625, 16.10693359375, 17.106201171875, 18.10546875, 19.104736328125, 20.10400390625, 21.103271484375, 22.1025390625, 23.101806640625, 24.10107421875, 25.100341796875, 26.099609375, 27.098876953125, 28.09814453125, 29.097412109375, 30.0966796875, 31.095947265625, 32.09521484375, 33.094482421875, 34.09375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 11.0, 6.0, 9.0, 11.0, 25.0, 18.0, 25.0, 33.0, 30.0, 36.0, 38.0, 46.0, 35.0, 31.0, 53.0, 47.0, 39.0, 40.0, 39.0, 54.0, 35.0, 34.0, 46.0, 39.0, 28.0, 33.0, 27.0, 25.0, 25.0, 16.0, 12.0, 12.0, 6.0, 9.0, 6.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.689697265625, -19.86376953125, -19.037841796875, -18.2119140625, -17.385986328125, -16.56005859375, -15.734130859375, -14.908203125, -14.082275390625, -13.25634765625, -12.430419921875, -11.6044921875, -10.778564453125, -9.95263671875, -9.126708984375, -8.30078125, -7.474853515625, -6.64892578125, -5.822998046875, -4.9970703125, -4.171142578125, -3.34521484375, -2.519287109375, -1.693359375, -0.867431640625, -0.04150390625, 0.784423828125, 1.6103515625, 2.436279296875, 3.26220703125, 4.088134765625, 4.9140625, 5.739990234375, 6.56591796875, 7.391845703125, 8.2177734375, 9.043701171875, 9.86962890625, 10.695556640625, 11.521484375, 12.347412109375, 13.17333984375, 13.999267578125, 14.8251953125, 15.651123046875, 16.47705078125, 17.302978515625, 18.12890625, 18.954833984375, 19.78076171875, 20.606689453125, 21.4326171875, 22.258544921875, 23.08447265625, 23.910400390625, 24.736328125, 25.562255859375, 26.38818359375, 27.214111328125, 28.0400390625, 28.865966796875, 29.69189453125, 30.517822265625, 31.34375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 10.0, 10.0, 11.0, 36.0, 48.0, 72.0, 123.0, 185.0, 312.0, 568.0, 980.0, 1590.0, 2870.0, 5076.0, 9051.0, 16365.0, 29735.0, 54366.0, 101023.0, 182683.0, 324457.0, 537580.0, 763596.0, 786804.0, 576999.0, 354365.0, 201164.0, 110506.0, 59794.0, 32360.0, 17896.0, 9972.0, 5722.0, 3159.0, 1935.0, 1172.0, 653.0, 368.0, 256.0, 151.0, 86.0, 64.0, 36.0, 30.0, 20.0, 9.0, 3.0, 7.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.65625, -22.8427734375, -22.029296875, -21.2158203125, -20.40234375, -19.5888671875, -18.775390625, -17.9619140625, -17.1484375, -16.3349609375, -15.521484375, -14.7080078125, -13.89453125, -13.0810546875, -12.267578125, -11.4541015625, -10.640625, -9.8271484375, -9.013671875, -8.2001953125, -7.38671875, -6.5732421875, -5.759765625, -4.9462890625, -4.1328125, -3.3193359375, -2.505859375, -1.6923828125, -0.87890625, -0.0654296875, 0.748046875, 1.5615234375, 2.375, 3.1884765625, 4.001953125, 4.8154296875, 5.62890625, 6.4423828125, 7.255859375, 8.0693359375, 8.8828125, 9.6962890625, 10.509765625, 11.3232421875, 12.13671875, 12.9501953125, 13.763671875, 14.5771484375, 15.390625, 16.2041015625, 17.017578125, 17.8310546875, 18.64453125, 19.4580078125, 20.271484375, 21.0849609375, 21.8984375, 22.7119140625, 23.525390625, 24.3388671875, 25.15234375, 25.9658203125, 26.779296875, 27.5927734375, 28.40625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 2.0, 1.0, 8.0, 9.0, 12.0, 9.0, 9.0, 16.0, 22.0, 16.0, 17.0, 30.0, 35.0, 39.0, 48.0, 55.0, 60.0, 92.0, 101.0, 108.0, 116.0, 137.0, 150.0, 177.0, 211.0, 231.0, 235.0, 261.0, 238.0, 204.0, 238.0, 203.0, 167.0, 149.0, 131.0, 96.0, 94.0, 78.0, 55.0, 36.0, 36.0, 43.0, 26.0, 22.0, 18.0, 12.0, 2.0, 7.0, 5.0, 4.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0078125, -9.68212890625, -9.3564453125, -9.03076171875, -8.705078125, -8.37939453125, -8.0537109375, -7.72802734375, -7.40234375, -7.07666015625, -6.7509765625, -6.42529296875, -6.099609375, -5.77392578125, -5.4482421875, -5.12255859375, -4.796875, -4.47119140625, -4.1455078125, -3.81982421875, -3.494140625, -3.16845703125, -2.8427734375, -2.51708984375, -2.19140625, -1.86572265625, -1.5400390625, -1.21435546875, -0.888671875, -0.56298828125, -0.2373046875, 0.08837890625, 0.4140625, 0.73974609375, 1.0654296875, 1.39111328125, 1.716796875, 2.04248046875, 2.3681640625, 2.69384765625, 3.01953125, 3.34521484375, 3.6708984375, 3.99658203125, 4.322265625, 4.64794921875, 4.9736328125, 5.29931640625, 5.625, 5.95068359375, 6.2763671875, 6.60205078125, 6.927734375, 7.25341796875, 7.5791015625, 7.90478515625, 8.23046875, 8.55615234375, 8.8818359375, 9.20751953125, 9.533203125, 9.85888671875, 10.1845703125, 10.51025390625, 10.8359375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 9.0, 17.0, 22.0, 25.0, 35.0, 35.0, 55.0, 41.0, 61.0, 53.0, 68.0, 83.0, 75.0, 74.0, 62.0, 58.0, 48.0, 35.0, 21.0, 18.0, 20.0, 21.0, 8.0, 11.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.94266128540039, -37.9105224609375, -36.878387451171875, -35.846248626708984, -34.81411361694336, -33.78197479248047, -32.749839782714844, -31.717700958251953, -30.685564041137695, -29.653427124023438, -28.62129020690918, -27.589153289794922, -26.55701446533203, -25.524879455566406, -24.492740631103516, -23.460603713989258, -22.428466796875, -21.396329879760742, -20.364192962646484, -19.332056045532227, -18.29991912841797, -17.267780303955078, -16.23564338684082, -15.203506469726562, -14.171369552612305, -13.139232635498047, -12.107095718383789, -11.074957847595215, -10.042820930480957, -9.0106840133667, -7.978546619415283, -6.946409225463867, -5.914268493652344, -4.882131576538086, -3.84999418258667, -2.817857027053833, -1.785719871520996, -0.7535829544067383, 0.27855443954467773, 1.3106918334960938, 2.3428287506103516, 3.3749659061431885, 4.407103061676025, 5.439240455627441, 6.471377372741699, 7.503514289855957, 8.535652160644531, 9.567789077758789, 10.599925994873047, 11.632062911987305, 12.664199829101562, 13.696337699890137, 14.728474617004395, 15.760611534118652, 16.792749404907227, 17.824886322021484, 18.857023239135742, 19.88916015625, 20.921297073364258, 21.953433990478516, 22.985572814941406, 24.01770782470703, 25.049846649169922, 26.08198356628418, 27.114120483398438]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 2.0, 10.0, 9.0, 12.0, 16.0, 18.0, 27.0, 23.0, 15.0, 30.0, 25.0, 37.0, 33.0, 34.0, 31.0, 49.0, 36.0, 31.0, 50.0, 44.0, 52.0, 32.0, 43.0, 31.0, 25.0, 34.0, 30.0, 28.0, 25.0, 33.0, 24.0, 20.0, 16.0, 11.0, 13.0, 7.0, 12.0, 3.0, 8.0, 5.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.3282413482666, -23.398025512695312, -22.467811584472656, -21.537595748901367, -20.607379913330078, -19.677165985107422, -18.746950149536133, -17.816734313964844, -16.886520385742188, -15.956305503845215, -15.026089668273926, -14.095874786376953, -13.165658950805664, -12.235444068908691, -11.305229187011719, -10.37501335144043, -9.44479751586914, -8.514582633972168, -7.584366798400879, -6.654151916503906, -5.723936557769775, -4.7937211990356445, -3.863506317138672, -2.933290958404541, -2.00307559967041, -1.0728603601455688, -0.14264512062072754, 0.7875699996948242, 1.717785358428955, 2.648000717163086, 3.5782155990600586, 4.5084309577941895, 5.438648223876953, 6.368863582611084, 7.299078941345215, 8.229293823242188, 9.159509658813477, 10.08972454071045, 11.019939422607422, 11.950155258178711, 12.880370140075684, 13.810585021972656, 14.740800857543945, 15.671015739440918, 16.60123062133789, 17.53144645690918, 18.46166229248047, 19.391876220703125, 20.322092056274414, 21.252307891845703, 22.18252182006836, 23.11273765563965, 24.042953491210938, 24.973167419433594, 25.903383255004883, 26.833599090576172, 27.763813018798828, 28.694028854370117, 29.624242782592773, 30.554458618164062, 31.48467445373535, 32.41489028930664, 33.3451042175293, 34.27531814575195, 35.205535888671875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 9.0, 14.0, 17.0, 16.0, 46.0, 65.0, 105.0, 172.0, 275.0, 458.0, 681.0, 1036.0, 1695.0, 2759.0, 4350.0, 6971.0, 11477.0, 19018.0, 31212.0, 52241.0, 86174.0, 137516.0, 197345.0, 182974.0, 121554.0, 75500.0, 44977.0, 27127.0, 16417.0, 10033.0, 6049.0, 3773.0, 2436.0, 1518.0, 881.0, 637.0, 361.0, 232.0, 169.0, 92.0, 56.0, 48.0, 29.0, 16.0, 14.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-8.3828125, -8.1490478515625, -7.915283203125, -7.6815185546875, -7.44775390625, -7.2139892578125, -6.980224609375, -6.7464599609375, -6.5126953125, -6.2789306640625, -6.045166015625, -5.8114013671875, -5.57763671875, -5.3438720703125, -5.110107421875, -4.8763427734375, -4.642578125, -4.4088134765625, -4.175048828125, -3.9412841796875, -3.70751953125, -3.4737548828125, -3.239990234375, -3.0062255859375, -2.7724609375, -2.5386962890625, -2.304931640625, -2.0711669921875, -1.83740234375, -1.6036376953125, -1.369873046875, -1.1361083984375, -0.90234375, -0.6685791015625, -0.434814453125, -0.2010498046875, 0.03271484375, 0.2664794921875, 0.500244140625, 0.7340087890625, 0.9677734375, 1.2015380859375, 1.435302734375, 1.6690673828125, 1.90283203125, 2.1365966796875, 2.370361328125, 2.6041259765625, 2.837890625, 3.0716552734375, 3.305419921875, 3.5391845703125, 3.77294921875, 4.0067138671875, 4.240478515625, 4.4742431640625, 4.7080078125, 4.9417724609375, 5.175537109375, 5.4093017578125, 5.64306640625, 5.8768310546875, 6.110595703125, 6.3443603515625, 6.578125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 7.0, 9.0, 16.0, 13.0, 16.0, 21.0, 22.0, 17.0, 32.0, 32.0, 32.0, 20.0, 36.0, 43.0, 33.0, 37.0, 41.0, 51.0, 45.0, 51.0, 39.0, 37.0, 27.0, 30.0, 25.0, 36.0, 32.0, 23.0, 29.0, 20.0, 22.0, 21.0, 10.0, 14.0, 7.0, 10.0, 6.0, 9.0, 3.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.3271484375, -22.404296875, -21.4814453125, -20.55859375, -19.6357421875, -18.712890625, -17.7900390625, -16.8671875, -15.9443359375, -15.021484375, -14.0986328125, -13.17578125, -12.2529296875, -11.330078125, -10.4072265625, -9.484375, -8.5615234375, -7.638671875, -6.7158203125, -5.79296875, -4.8701171875, -3.947265625, -3.0244140625, -2.1015625, -1.1787109375, -0.255859375, 0.6669921875, 1.58984375, 2.5126953125, 3.435546875, 4.3583984375, 5.28125, 6.2041015625, 7.126953125, 8.0498046875, 8.97265625, 9.8955078125, 10.818359375, 11.7412109375, 12.6640625, 13.5869140625, 14.509765625, 15.4326171875, 16.35546875, 17.2783203125, 18.201171875, 19.1240234375, 20.046875, 20.9697265625, 21.892578125, 22.8154296875, 23.73828125, 24.6611328125, 25.583984375, 26.5068359375, 27.4296875, 28.3525390625, 29.275390625, 30.1982421875, 31.12109375, 32.0439453125, 32.966796875, 33.8896484375, 34.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 3.0, 5.0, 7.0, 18.0, 23.0, 41.0, 43.0, 76.0, 111.0, 186.0, 310.0, 523.0, 933.0, 1651.0, 3054.0, 6017.0, 12412.0, 26266.0, 58670.0, 134308.0, 292768.0, 279975.0, 126286.0, 55430.0, 25002.0, 11840.0, 5797.0, 2974.0, 1612.0, 887.0, 499.0, 330.0, 175.0, 107.0, 75.0, 45.0, 23.0, 26.0, 14.0, 7.0, 5.0, 8.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.515625, -9.24346923828125, -8.9713134765625, -8.69915771484375, -8.427001953125, -8.15484619140625, -7.8826904296875, -7.61053466796875, -7.33837890625, -7.06622314453125, -6.7940673828125, -6.52191162109375, -6.249755859375, -5.97760009765625, -5.7054443359375, -5.43328857421875, -5.1611328125, -4.88897705078125, -4.6168212890625, -4.34466552734375, -4.072509765625, -3.80035400390625, -3.5281982421875, -3.25604248046875, -2.98388671875, -2.71173095703125, -2.4395751953125, -2.16741943359375, -1.895263671875, -1.62310791015625, -1.3509521484375, -1.07879638671875, -0.806640625, -0.53448486328125, -0.2623291015625, 0.00982666015625, 0.281982421875, 0.55413818359375, 0.8262939453125, 1.09844970703125, 1.37060546875, 1.64276123046875, 1.9149169921875, 2.18707275390625, 2.459228515625, 2.73138427734375, 3.0035400390625, 3.27569580078125, 3.5478515625, 3.82000732421875, 4.0921630859375, 4.36431884765625, 4.636474609375, 4.90863037109375, 5.1807861328125, 5.45294189453125, 5.72509765625, 5.99725341796875, 6.2694091796875, 6.54156494140625, 6.813720703125, 7.08587646484375, 7.3580322265625, 7.63018798828125, 7.90234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 6.0, 6.0, 7.0, 9.0, 15.0, 12.0, 16.0, 19.0, 27.0, 22.0, 31.0, 38.0, 36.0, 44.0, 46.0, 28.0, 48.0, 34.0, 32.0, 42.0, 42.0, 31.0, 36.0, 46.0, 33.0, 24.0, 21.0, 28.0, 30.0, 31.0, 19.0, 16.0, 17.0, 11.0, 9.0, 17.0, 16.0, 7.0, 9.0, 9.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.84375, -20.18994140625, -19.5361328125, -18.88232421875, -18.228515625, -17.57470703125, -16.9208984375, -16.26708984375, -15.61328125, -14.95947265625, -14.3056640625, -13.65185546875, -12.998046875, -12.34423828125, -11.6904296875, -11.03662109375, -10.3828125, -9.72900390625, -9.0751953125, -8.42138671875, -7.767578125, -7.11376953125, -6.4599609375, -5.80615234375, -5.15234375, -4.49853515625, -3.8447265625, -3.19091796875, -2.537109375, -1.88330078125, -1.2294921875, -0.57568359375, 0.078125, 0.73193359375, 1.3857421875, 2.03955078125, 2.693359375, 3.34716796875, 4.0009765625, 4.65478515625, 5.30859375, 5.96240234375, 6.6162109375, 7.27001953125, 7.923828125, 8.57763671875, 9.2314453125, 9.88525390625, 10.5390625, 11.19287109375, 11.8466796875, 12.50048828125, 13.154296875, 13.80810546875, 14.4619140625, 15.11572265625, 15.76953125, 16.42333984375, 17.0771484375, 17.73095703125, 18.384765625, 19.03857421875, 19.6923828125, 20.34619140625, 21.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 9.0, 15.0, 17.0, 28.0, 30.0, 35.0, 68.0, 87.0, 129.0, 169.0, 254.0, 297.0, 462.0, 716.0, 976.0, 1464.0, 2297.0, 3512.0, 5842.0, 10252.0, 20772.0, 50748.0, 211410.0, 563889.0, 104744.0, 33485.0, 15221.0, 7892.0, 4783.0, 2933.0, 1879.0, 1259.0, 895.0, 558.0, 422.0, 271.0, 203.0, 161.0, 104.0, 75.0, 42.0, 37.0, 29.0, 30.0, 16.0, 10.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0], "bins": [-5.6328125, -5.47320556640625, -5.3135986328125, -5.15399169921875, -4.994384765625, -4.83477783203125, -4.6751708984375, -4.51556396484375, -4.35595703125, -4.19635009765625, -4.0367431640625, -3.87713623046875, -3.717529296875, -3.55792236328125, -3.3983154296875, -3.23870849609375, -3.0791015625, -2.91949462890625, -2.7598876953125, -2.60028076171875, -2.440673828125, -2.28106689453125, -2.1214599609375, -1.96185302734375, -1.80224609375, -1.64263916015625, -1.4830322265625, -1.32342529296875, -1.163818359375, -1.00421142578125, -0.8446044921875, -0.68499755859375, -0.525390625, -0.36578369140625, -0.2061767578125, -0.04656982421875, 0.113037109375, 0.27264404296875, 0.4322509765625, 0.59185791015625, 0.75146484375, 0.91107177734375, 1.0706787109375, 1.23028564453125, 1.389892578125, 1.54949951171875, 1.7091064453125, 1.86871337890625, 2.0283203125, 2.18792724609375, 2.3475341796875, 2.50714111328125, 2.666748046875, 2.82635498046875, 2.9859619140625, 3.14556884765625, 3.30517578125, 3.46478271484375, 3.6243896484375, 3.78399658203125, 3.943603515625, 4.10321044921875, 4.2628173828125, 4.42242431640625, 4.58203125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 7.0, 12.0, 13.0, 36.0, 21.0, 59.0, 82.0, 119.0, 131.0, 114.0, 111.0, 74.0, 59.0, 34.0, 23.0, 21.0, 12.0, 7.0, 6.0, 6.0, 9.0, 8.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004911422729492188, -0.0004762187600135803, -0.0004612952470779419, -0.00044637173414230347, -0.00043144822120666504, -0.0004165247082710266, -0.0004016011953353882, -0.00038667768239974976, -0.00037175416946411133, -0.0003568306565284729, -0.00034190714359283447, -0.00032698363065719604, -0.0003120601177215576, -0.0002971366047859192, -0.00028221309185028076, -0.00026728957891464233, -0.0002523660659790039, -0.00023744255304336548, -0.00022251904010772705, -0.00020759552717208862, -0.0001926720142364502, -0.00017774850130081177, -0.00016282498836517334, -0.0001479014754295349, -0.00013297796249389648, -0.00011805444955825806, -0.00010313093662261963, -8.82074236869812e-05, -7.328391075134277e-05, -5.8360397815704346e-05, -4.343688488006592e-05, -2.851337194442749e-05, -1.3589859008789062e-05, 1.3336539268493652e-06, 1.6257166862487793e-05, 3.118067979812622e-05, 4.610419273376465e-05, 6.1027705669403076e-05, 7.59512186050415e-05, 9.087473154067993e-05, 0.00010579824447631836, 0.00012072175741195679, 0.00013564527034759521, 0.00015056878328323364, 0.00016549229621887207, 0.0001804158091545105, 0.00019533932209014893, 0.00021026283502578735, 0.00022518634796142578, 0.0002401098608970642, 0.00025503337383270264, 0.00026995688676834106, 0.0002848803997039795, 0.0002998039126396179, 0.00031472742557525635, 0.0003296509385108948, 0.0003445744514465332, 0.00035949796438217163, 0.00037442147731781006, 0.0003893449902534485, 0.0004042685031890869, 0.00041919201612472534, 0.00043411552906036377, 0.0004490390419960022, 0.0004639625549316406]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 11.0, 25.0, 21.0, 27.0, 41.0, 63.0, 92.0, 114.0, 178.0, 253.0, 353.0, 516.0, 713.0, 979.0, 1441.0, 2143.0, 3070.0, 4632.0, 6978.0, 11090.0, 17273.0, 29244.0, 53258.0, 108540.0, 231935.0, 279005.0, 137486.0, 66352.0, 34958.0, 20531.0, 12428.0, 8159.0, 5209.0, 3515.0, 2468.0, 1661.0, 1137.0, 764.0, 536.0, 415.0, 279.0, 196.0, 135.0, 89.0, 78.0, 42.0, 35.0, 20.0, 18.0, 18.0, 10.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0], "bins": [-3.541015625, -3.4273681640625, -3.313720703125, -3.2000732421875, -3.08642578125, -2.9727783203125, -2.859130859375, -2.7454833984375, -2.6318359375, -2.5181884765625, -2.404541015625, -2.2908935546875, -2.17724609375, -2.0635986328125, -1.949951171875, -1.8363037109375, -1.72265625, -1.6090087890625, -1.495361328125, -1.3817138671875, -1.26806640625, -1.1544189453125, -1.040771484375, -0.9271240234375, -0.8134765625, -0.6998291015625, -0.586181640625, -0.4725341796875, -0.35888671875, -0.2452392578125, -0.131591796875, -0.0179443359375, 0.095703125, 0.2093505859375, 0.322998046875, 0.4366455078125, 0.55029296875, 0.6639404296875, 0.777587890625, 0.8912353515625, 1.0048828125, 1.1185302734375, 1.232177734375, 1.3458251953125, 1.45947265625, 1.5731201171875, 1.686767578125, 1.8004150390625, 1.9140625, 2.0277099609375, 2.141357421875, 2.2550048828125, 2.36865234375, 2.4822998046875, 2.595947265625, 2.7095947265625, 2.8232421875, 2.9368896484375, 3.050537109375, 3.1641845703125, 3.27783203125, 3.3914794921875, 3.505126953125, 3.6187744140625, 3.732421875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 1.0, 6.0, 14.0, 4.0, 9.0, 7.0, 14.0, 15.0, 20.0, 24.0, 27.0, 36.0, 32.0, 41.0, 47.0, 53.0, 68.0, 65.0, 79.0, 68.0, 55.0, 51.0, 43.0, 37.0, 32.0, 26.0, 18.0, 20.0, 18.0, 15.0, 7.0, 9.0, 9.0, 7.0, 1.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4091796875, -1.3639984130859375, -1.318817138671875, -1.2736358642578125, -1.22845458984375, -1.1832733154296875, -1.138092041015625, -1.0929107666015625, -1.0477294921875, -1.0025482177734375, -0.957366943359375, -0.9121856689453125, -0.86700439453125, -0.8218231201171875, -0.776641845703125, -0.7314605712890625, -0.686279296875, -0.6410980224609375, -0.595916748046875, -0.5507354736328125, -0.50555419921875, -0.4603729248046875, -0.415191650390625, -0.3700103759765625, -0.3248291015625, -0.2796478271484375, -0.234466552734375, -0.1892852783203125, -0.14410400390625, -0.0989227294921875, -0.053741455078125, -0.0085601806640625, 0.03662109375, 0.0818023681640625, 0.126983642578125, 0.1721649169921875, 0.21734619140625, 0.2625274658203125, 0.307708740234375, 0.3528900146484375, 0.3980712890625, 0.4432525634765625, 0.488433837890625, 0.5336151123046875, 0.57879638671875, 0.6239776611328125, 0.669158935546875, 0.7143402099609375, 0.759521484375, 0.8047027587890625, 0.849884033203125, 0.8950653076171875, 0.94024658203125, 0.9854278564453125, 1.030609130859375, 1.0757904052734375, 1.1209716796875, 1.1661529541015625, 1.211334228515625, 1.2565155029296875, 1.30169677734375, 1.3468780517578125, 1.392059326171875, 1.4372406005859375, 1.482421875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 10.0, 19.0, 16.0, 27.0, 42.0, 39.0, 38.0, 50.0, 60.0, 59.0, 70.0, 69.0, 74.0, 70.0, 70.0, 47.0, 58.0, 30.0, 21.0, 19.0, 20.0, 17.0, 12.0, 9.0, 9.0, 6.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-37.694522857666016, -36.71260070800781, -35.73067855834961, -34.74875259399414, -33.76683044433594, -32.784908294677734, -31.80298614501953, -30.821062088012695, -29.83913803100586, -28.857215881347656, -27.87529182434082, -26.893369674682617, -25.91144561767578, -24.929523468017578, -23.947601318359375, -22.96567726135254, -21.983755111694336, -21.001832962036133, -20.019908905029297, -19.037986755371094, -18.056062698364258, -17.074140548706055, -16.09221649169922, -15.110294342041016, -14.128371238708496, -13.146448135375977, -12.164525032043457, -11.182601928710938, -10.200679779052734, -9.218755722045898, -8.236833572387695, -7.254910469055176, -6.272985458374023, -5.291062355041504, -4.309139251708984, -3.327216625213623, -2.3452935218811035, -1.363370418548584, -0.38144779205322266, 0.6004753112792969, 1.5823984146118164, 2.564321517944336, 3.5462443828582764, 4.528167247772217, 5.510090351104736, 6.492013454437256, 7.473936080932617, 8.455859184265137, 9.437782287597656, 10.419705390930176, 11.401628494262695, 12.383550643920898, 13.365474700927734, 14.347396850585938, 15.329319953918457, 16.311243057250977, 17.293167114257812, 18.275089263916016, 19.25701332092285, 20.238935470581055, 21.22085952758789, 22.202781677246094, 23.184703826904297, 24.166627883911133, 25.148550033569336]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 10.0, 9.0, 16.0, 23.0, 23.0, 19.0, 23.0, 21.0, 32.0, 40.0, 29.0, 31.0, 27.0, 51.0, 36.0, 37.0, 46.0, 45.0, 47.0, 42.0, 33.0, 33.0, 28.0, 31.0, 32.0, 25.0, 23.0, 34.0, 27.0, 21.0, 18.0, 11.0, 12.0, 10.0, 8.0, 6.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.64194679260254, -22.739032745361328, -21.836118698120117, -20.933204650878906, -20.030290603637695, -19.127376556396484, -18.224462509155273, -17.321548461914062, -16.41863441467285, -15.51572036743164, -14.61280632019043, -13.709892272949219, -12.806978225708008, -11.904064178466797, -11.001150131225586, -10.098236083984375, -9.195322036743164, -8.292407989501953, -7.389493942260742, -6.486579895019531, -5.58366584777832, -4.680751800537109, -3.7778377532958984, -2.8749237060546875, -1.9720096588134766, -1.0690956115722656, -0.1661815643310547, 0.7367324829101562, 1.6396465301513672, 2.542560577392578, 3.445474624633789, 4.348388671875, 5.251300811767578, 6.154214859008789, 7.05712890625, 7.960042953491211, 8.862957000732422, 9.765871047973633, 10.668785095214844, 11.571699142456055, 12.474613189697266, 13.377527236938477, 14.280441284179688, 15.183355331420898, 16.08626937866211, 16.98918342590332, 17.89209747314453, 18.795011520385742, 19.697925567626953, 20.600839614868164, 21.503753662109375, 22.406667709350586, 23.309581756591797, 24.212495803833008, 25.11540985107422, 26.01832389831543, 26.92123794555664, 27.82415199279785, 28.727066040039062, 29.629980087280273, 30.532894134521484, 31.435808181762695, 32.338722229003906, 33.24163818359375, 34.14455032348633]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 15.0, 20.0, 31.0, 41.0, 77.0, 120.0, 166.0, 305.0, 432.0, 737.0, 1239.0, 1977.0, 3202.0, 5255.0, 8511.0, 13781.0, 22225.0, 36603.0, 57987.0, 89769.0, 125556.0, 153898.0, 153782.0, 127104.0, 90176.0, 59387.0, 37096.0, 22823.0, 13836.0, 8555.0, 5235.0, 3315.0, 2016.0, 1217.0, 756.0, 490.0, 307.0, 180.0, 129.0, 66.0, 57.0, 29.0, 12.0, 13.0, 12.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.453125, -25.65185546875, -24.8505859375, -24.04931640625, -23.248046875, -22.44677734375, -21.6455078125, -20.84423828125, -20.04296875, -19.24169921875, -18.4404296875, -17.63916015625, -16.837890625, -16.03662109375, -15.2353515625, -14.43408203125, -13.6328125, -12.83154296875, -12.0302734375, -11.22900390625, -10.427734375, -9.62646484375, -8.8251953125, -8.02392578125, -7.22265625, -6.42138671875, -5.6201171875, -4.81884765625, -4.017578125, -3.21630859375, -2.4150390625, -1.61376953125, -0.8125, -0.01123046875, 0.7900390625, 1.59130859375, 2.392578125, 3.19384765625, 3.9951171875, 4.79638671875, 5.59765625, 6.39892578125, 7.2001953125, 8.00146484375, 8.802734375, 9.60400390625, 10.4052734375, 11.20654296875, 12.0078125, 12.80908203125, 13.6103515625, 14.41162109375, 15.212890625, 16.01416015625, 16.8154296875, 17.61669921875, 18.41796875, 19.21923828125, 20.0205078125, 20.82177734375, 21.623046875, 22.42431640625, 23.2255859375, 24.02685546875, 24.828125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 12.0, 6.0, 11.0, 18.0, 18.0, 15.0, 23.0, 24.0, 30.0, 23.0, 28.0, 34.0, 30.0, 43.0, 34.0, 34.0, 51.0, 44.0, 49.0, 40.0, 44.0, 32.0, 29.0, 25.0, 34.0, 32.0, 26.0, 30.0, 27.0, 30.0, 20.0, 16.0, 10.0, 15.0, 15.0, 11.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.96875, -22.134765625, -21.30078125, -20.466796875, -19.6328125, -18.798828125, -17.96484375, -17.130859375, -16.296875, -15.462890625, -14.62890625, -13.794921875, -12.9609375, -12.126953125, -11.29296875, -10.458984375, -9.625, -8.791015625, -7.95703125, -7.123046875, -6.2890625, -5.455078125, -4.62109375, -3.787109375, -2.953125, -2.119140625, -1.28515625, -0.451171875, 0.3828125, 1.216796875, 2.05078125, 2.884765625, 3.71875, 4.552734375, 5.38671875, 6.220703125, 7.0546875, 7.888671875, 8.72265625, 9.556640625, 10.390625, 11.224609375, 12.05859375, 12.892578125, 13.7265625, 14.560546875, 15.39453125, 16.228515625, 17.0625, 17.896484375, 18.73046875, 19.564453125, 20.3984375, 21.232421875, 22.06640625, 22.900390625, 23.734375, 24.568359375, 25.40234375, 26.236328125, 27.0703125, 27.904296875, 28.73828125, 29.572265625, 30.40625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 8.0, 5.0, 9.0, 17.0, 23.0, 26.0, 42.0, 69.0, 107.0, 160.0, 244.0, 366.0, 544.0, 774.0, 1164.0, 1791.0, 2824.0, 4216.0, 6484.0, 10105.0, 15339.0, 24156.0, 37117.0, 55985.0, 81829.0, 111401.0, 135519.0, 140796.0, 123659.0, 96116.0, 67678.0, 45623.0, 29545.0, 19206.0, 12443.0, 7918.0, 5235.0, 3438.0, 2221.0, 1501.0, 959.0, 645.0, 402.0, 294.0, 202.0, 124.0, 96.0, 52.0, 29.0, 16.0, 12.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-23.109375, -22.392578125, -21.67578125, -20.958984375, -20.2421875, -19.525390625, -18.80859375, -18.091796875, -17.375, -16.658203125, -15.94140625, -15.224609375, -14.5078125, -13.791015625, -13.07421875, -12.357421875, -11.640625, -10.923828125, -10.20703125, -9.490234375, -8.7734375, -8.056640625, -7.33984375, -6.623046875, -5.90625, -5.189453125, -4.47265625, -3.755859375, -3.0390625, -2.322265625, -1.60546875, -0.888671875, -0.171875, 0.544921875, 1.26171875, 1.978515625, 2.6953125, 3.412109375, 4.12890625, 4.845703125, 5.5625, 6.279296875, 6.99609375, 7.712890625, 8.4296875, 9.146484375, 9.86328125, 10.580078125, 11.296875, 12.013671875, 12.73046875, 13.447265625, 14.1640625, 14.880859375, 15.59765625, 16.314453125, 17.03125, 17.748046875, 18.46484375, 19.181640625, 19.8984375, 20.615234375, 21.33203125, 22.048828125, 22.765625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 7.0, 12.0, 7.0, 6.0, 9.0, 9.0, 13.0, 9.0, 12.0, 20.0, 23.0, 17.0, 22.0, 27.0, 26.0, 30.0, 33.0, 32.0, 28.0, 25.0, 35.0, 37.0, 36.0, 41.0, 34.0, 36.0, 39.0, 29.0, 44.0, 24.0, 33.0, 27.0, 18.0, 16.0, 30.0, 14.0, 18.0, 19.0, 21.0, 12.0, 17.0, 8.0, 8.0, 8.0, 2.0, 3.0, 6.0, 5.0, 1.0, 12.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.0703125, -14.58837890625, -14.1064453125, -13.62451171875, -13.142578125, -12.66064453125, -12.1787109375, -11.69677734375, -11.21484375, -10.73291015625, -10.2509765625, -9.76904296875, -9.287109375, -8.80517578125, -8.3232421875, -7.84130859375, -7.359375, -6.87744140625, -6.3955078125, -5.91357421875, -5.431640625, -4.94970703125, -4.4677734375, -3.98583984375, -3.50390625, -3.02197265625, -2.5400390625, -2.05810546875, -1.576171875, -1.09423828125, -0.6123046875, -0.13037109375, 0.3515625, 0.83349609375, 1.3154296875, 1.79736328125, 2.279296875, 2.76123046875, 3.2431640625, 3.72509765625, 4.20703125, 4.68896484375, 5.1708984375, 5.65283203125, 6.134765625, 6.61669921875, 7.0986328125, 7.58056640625, 8.0625, 8.54443359375, 9.0263671875, 9.50830078125, 9.990234375, 10.47216796875, 10.9541015625, 11.43603515625, 11.91796875, 12.39990234375, 12.8818359375, 13.36376953125, 13.845703125, 14.32763671875, 14.8095703125, 15.29150390625, 15.7734375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 8.0, 11.0, 30.0, 48.0, 64.0, 103.0, 177.0, 286.0, 540.0, 965.0, 1638.0, 3148.0, 5686.0, 11009.0, 21767.0, 44960.0, 93908.0, 181107.0, 253210.0, 206301.0, 114193.0, 55246.0, 26217.0, 13066.0, 6898.0, 3521.0, 1891.0, 1063.0, 615.0, 345.0, 206.0, 122.0, 68.0, 52.0, 30.0, 20.0, 9.0, 8.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.862548828125, -8.52978515625, -8.197021484375, -7.8642578125, -7.531494140625, -7.19873046875, -6.865966796875, -6.533203125, -6.200439453125, -5.86767578125, -5.534912109375, -5.2021484375, -4.869384765625, -4.53662109375, -4.203857421875, -3.87109375, -3.538330078125, -3.20556640625, -2.872802734375, -2.5400390625, -2.207275390625, -1.87451171875, -1.541748046875, -1.208984375, -0.876220703125, -0.54345703125, -0.210693359375, 0.1220703125, 0.454833984375, 0.78759765625, 1.120361328125, 1.453125, 1.785888671875, 2.11865234375, 2.451416015625, 2.7841796875, 3.116943359375, 3.44970703125, 3.782470703125, 4.115234375, 4.447998046875, 4.78076171875, 5.113525390625, 5.4462890625, 5.779052734375, 6.11181640625, 6.444580078125, 6.77734375, 7.110107421875, 7.44287109375, 7.775634765625, 8.1083984375, 8.441162109375, 8.77392578125, 9.106689453125, 9.439453125, 9.772216796875, 10.10498046875, 10.437744140625, 10.7705078125, 11.103271484375, 11.43603515625, 11.768798828125, 12.1015625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 9.0, 10.0, 14.0, 23.0, 26.0, 25.0, 21.0, 41.0, 38.0, 53.0, 62.0, 47.0, 70.0, 67.0, 55.0, 66.0, 54.0, 56.0, 46.0, 42.0, 38.0, 31.0, 18.0, 15.0, 12.0, 17.0, 12.0, 6.0, 7.0, 4.0, 8.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000560760498046875, -0.0005390569567680359, -0.0005173534154891968, -0.0004956498742103577, -0.00047394633293151855, -0.00045224279165267944, -0.00043053925037384033, -0.0004088357090950012, -0.0003871321678161621, -0.000365428626537323, -0.0003437250852584839, -0.0003220215439796448, -0.00030031800270080566, -0.00027861446142196655, -0.00025691092014312744, -0.00023520737886428833, -0.00021350383758544922, -0.0001918002963066101, -0.000170096755027771, -0.00014839321374893188, -0.00012668967247009277, -0.00010498613119125366, -8.328258991241455e-05, -6.157904863357544e-05, -3.987550735473633e-05, -1.8171966075897217e-05, 3.5315752029418945e-06, 2.5235116481781006e-05, 4.693865776062012e-05, 6.864219903945923e-05, 9.034574031829834e-05, 0.00011204928159713745, 0.00013375282287597656, 0.00015545636415481567, 0.00017715990543365479, 0.0001988634467124939, 0.000220566987991333, 0.00024227052927017212, 0.00026397407054901123, 0.00028567761182785034, 0.00030738115310668945, 0.00032908469438552856, 0.0003507882356643677, 0.0003724917769432068, 0.0003941953182220459, 0.000415898859500885, 0.0004376024007797241, 0.00045930594205856323, 0.00048100948333740234, 0.0005027130246162415, 0.0005244165658950806, 0.0005461201071739197, 0.0005678236484527588, 0.0005895271897315979, 0.000611230731010437, 0.0006329342722892761, 0.0006546378135681152, 0.0006763413548469543, 0.0006980448961257935, 0.0007197484374046326, 0.0007414519786834717, 0.0007631555199623108, 0.0007848590612411499, 0.000806562602519989, 0.0008282661437988281]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 13.0, 16.0, 15.0, 33.0, 35.0, 59.0, 81.0, 147.0, 198.0, 307.0, 535.0, 861.0, 1382.0, 2440.0, 4350.0, 7488.0, 13574.0, 24332.0, 44055.0, 80251.0, 134999.0, 192487.0, 197543.0, 145589.0, 87359.0, 48860.0, 26827.0, 14759.0, 8370.0, 4713.0, 2765.0, 1639.0, 956.0, 566.0, 328.0, 212.0, 148.0, 84.0, 63.0, 29.0, 22.0, 25.0, 11.0, 15.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.8106689453125, -7.551025390625, -7.2913818359375, -7.03173828125, -6.7720947265625, -6.512451171875, -6.2528076171875, -5.9931640625, -5.7335205078125, -5.473876953125, -5.2142333984375, -4.95458984375, -4.6949462890625, -4.435302734375, -4.1756591796875, -3.916015625, -3.6563720703125, -3.396728515625, -3.1370849609375, -2.87744140625, -2.6177978515625, -2.358154296875, -2.0985107421875, -1.8388671875, -1.5792236328125, -1.319580078125, -1.0599365234375, -0.80029296875, -0.5406494140625, -0.281005859375, -0.0213623046875, 0.23828125, 0.4979248046875, 0.757568359375, 1.0172119140625, 1.27685546875, 1.5364990234375, 1.796142578125, 2.0557861328125, 2.3154296875, 2.5750732421875, 2.834716796875, 3.0943603515625, 3.35400390625, 3.6136474609375, 3.873291015625, 4.1329345703125, 4.392578125, 4.6522216796875, 4.911865234375, 5.1715087890625, 5.43115234375, 5.6907958984375, 5.950439453125, 6.2100830078125, 6.4697265625, 6.7293701171875, 6.989013671875, 7.2486572265625, 7.50830078125, 7.7679443359375, 8.027587890625, 8.2872314453125, 8.546875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 14.0, 13.0, 20.0, 14.0, 25.0, 27.0, 31.0, 35.0, 29.0, 51.0, 55.0, 59.0, 47.0, 45.0, 54.0, 46.0, 50.0, 43.0, 57.0, 45.0, 34.0, 27.0, 32.0, 20.0, 15.0, 12.0, 9.0, 17.0, 9.0, 3.0, 6.0, 3.0, 7.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.65234375, -3.545074462890625, -3.43780517578125, -3.330535888671875, -3.2232666015625, -3.115997314453125, -3.00872802734375, -2.901458740234375, -2.794189453125, -2.686920166015625, -2.57965087890625, -2.472381591796875, -2.3651123046875, -2.257843017578125, -2.15057373046875, -2.043304443359375, -1.93603515625, -1.828765869140625, -1.72149658203125, -1.614227294921875, -1.5069580078125, -1.399688720703125, -1.29241943359375, -1.185150146484375, -1.077880859375, -0.970611572265625, -0.86334228515625, -0.756072998046875, -0.6488037109375, -0.541534423828125, -0.43426513671875, -0.326995849609375, -0.2197265625, -0.112457275390625, -0.00518798828125, 0.102081298828125, 0.2093505859375, 0.316619873046875, 0.42388916015625, 0.531158447265625, 0.638427734375, 0.745697021484375, 0.85296630859375, 0.960235595703125, 1.0675048828125, 1.174774169921875, 1.28204345703125, 1.389312744140625, 1.49658203125, 1.603851318359375, 1.71112060546875, 1.818389892578125, 1.9256591796875, 2.032928466796875, 2.14019775390625, 2.247467041015625, 2.354736328125, 2.462005615234375, 2.56927490234375, 2.676544189453125, 2.7838134765625, 2.891082763671875, 2.99835205078125, 3.105621337890625, 3.212890625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 6.0, 3.0, 10.0, 11.0, 21.0, 17.0, 19.0, 28.0, 36.0, 28.0, 45.0, 47.0, 54.0, 60.0, 55.0, 55.0, 74.0, 56.0, 59.0, 56.0, 41.0, 45.0, 29.0, 24.0, 23.0, 20.0, 17.0, 13.0, 5.0, 8.0, 11.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.568029403686523, -26.745563507080078, -25.923099517822266, -25.10063362121582, -24.278167724609375, -23.455703735351562, -22.633237838745117, -21.810771942138672, -20.98830795288086, -20.165842056274414, -19.3433780670166, -18.520912170410156, -17.698448181152344, -16.8759822845459, -16.053516387939453, -15.231051445007324, -14.408586502075195, -13.586121559143066, -12.763656616210938, -11.941190719604492, -11.118725776672363, -10.296260833740234, -9.473794937133789, -8.65132999420166, -7.828865051269531, -7.006400108337402, -6.183934688568115, -5.361469268798828, -4.539004325866699, -3.7165393829345703, -2.894073963165283, -2.071608543395996, -1.2491455078125, -0.426680326461792, 0.395784854888916, 1.218250036239624, 2.040715217590332, 2.863180160522461, 3.685645580291748, 4.508111000061035, 5.330575942993164, 6.153040885925293, 6.97550630569458, 7.797971725463867, 8.620436668395996, 9.442901611328125, 10.26536750793457, 11.0878324508667, 11.910297393798828, 12.732762336730957, 13.555227279663086, 14.377693176269531, 15.20015811920166, 16.02262306213379, 16.845088958740234, 17.667552947998047, 18.490018844604492, 19.312484741210938, 20.13494873046875, 20.957414627075195, 21.77988052368164, 22.602344512939453, 23.4248104095459, 24.247276306152344, 25.069740295410156]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 9.0, 8.0, 7.0, 17.0, 12.0, 23.0, 17.0, 19.0, 21.0, 18.0, 24.0, 28.0, 47.0, 27.0, 34.0, 37.0, 36.0, 31.0, 27.0, 35.0, 43.0, 27.0, 34.0, 37.0, 49.0, 36.0, 26.0, 37.0, 32.0, 28.0, 27.0, 22.0, 18.0, 16.0, 12.0, 13.0, 16.0, 18.0, 8.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.698118209838867, -24.790882110595703, -23.883644104003906, -22.97640609741211, -22.069169998168945, -21.16193389892578, -20.254695892333984, -19.347457885742188, -18.440221786499023, -17.53298568725586, -16.625747680664062, -15.718510627746582, -14.811273574829102, -13.904036521911621, -12.99679946899414, -12.08956241607666, -11.18232536315918, -10.2750883102417, -9.367851257324219, -8.460614204406738, -7.553377151489258, -6.646140098571777, -5.738903045654297, -4.831665992736816, -3.924428939819336, -3.0171918869018555, -2.109954833984375, -1.2027177810668945, -0.29548072814941406, 0.6117563247680664, 1.5189933776855469, 2.4262304306030273, 3.333465576171875, 4.2407026290893555, 5.147939682006836, 6.055176734924316, 6.962413787841797, 7.869650840759277, 8.776887893676758, 9.684124946594238, 10.591361999511719, 11.4985990524292, 12.40583610534668, 13.31307315826416, 14.22031021118164, 15.127547264099121, 16.0347843170166, 16.942020416259766, 17.849258422851562, 18.75649642944336, 19.663732528686523, 20.570968627929688, 21.478206634521484, 22.38544464111328, 23.292680740356445, 24.19991683959961, 25.107154846191406, 26.014392852783203, 26.921628952026367, 27.82886505126953, 28.736103057861328, 29.643341064453125, 30.55057716369629, 31.457813262939453, 32.36505126953125]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 14.0, 26.0, 30.0, 58.0, 81.0, 132.0, 182.0, 298.0, 454.0, 771.0, 1109.0, 1792.0, 2719.0, 4215.0, 6451.0, 10387.0, 16335.0, 26415.0, 43798.0, 72264.0, 121480.0, 206166.0, 350143.0, 558434.0, 743303.0, 721941.0, 521029.0, 317539.0, 185731.0, 109738.0, 64195.0, 39220.0, 24586.0, 15102.0, 9626.0, 6277.0, 4086.0, 2701.0, 1753.0, 1245.0, 827.0, 550.0, 357.0, 236.0, 169.0, 115.0, 72.0, 44.0, 34.0, 14.0, 17.0, 10.0, 4.0, 1.0, 1.0, 1.0, 3.0], "bins": [-19.296875, -18.692138671875, -18.08740234375, -17.482666015625, -16.8779296875, -16.273193359375, -15.66845703125, -15.063720703125, -14.458984375, -13.854248046875, -13.24951171875, -12.644775390625, -12.0400390625, -11.435302734375, -10.83056640625, -10.225830078125, -9.62109375, -9.016357421875, -8.41162109375, -7.806884765625, -7.2021484375, -6.597412109375, -5.99267578125, -5.387939453125, -4.783203125, -4.178466796875, -3.57373046875, -2.968994140625, -2.3642578125, -1.759521484375, -1.15478515625, -0.550048828125, 0.0546875, 0.659423828125, 1.26416015625, 1.868896484375, 2.4736328125, 3.078369140625, 3.68310546875, 4.287841796875, 4.892578125, 5.497314453125, 6.10205078125, 6.706787109375, 7.3115234375, 7.916259765625, 8.52099609375, 9.125732421875, 9.73046875, 10.335205078125, 10.93994140625, 11.544677734375, 12.1494140625, 12.754150390625, 13.35888671875, 13.963623046875, 14.568359375, 15.173095703125, 15.77783203125, 16.382568359375, 16.9873046875, 17.592041015625, 18.19677734375, 18.801513671875, 19.40625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 9.0, 5.0, 13.0, 18.0, 20.0, 16.0, 21.0, 18.0, 25.0, 22.0, 37.0, 38.0, 34.0, 31.0, 28.0, 28.0, 39.0, 38.0, 40.0, 37.0, 20.0, 36.0, 39.0, 44.0, 42.0, 31.0, 49.0, 23.0, 31.0, 21.0, 18.0, 18.0, 10.0, 17.0, 14.0, 15.0, 10.0, 12.0, 5.0, 5.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.3125, -15.732421875, -15.15234375, -14.572265625, -13.9921875, -13.412109375, -12.83203125, -12.251953125, -11.671875, -11.091796875, -10.51171875, -9.931640625, -9.3515625, -8.771484375, -8.19140625, -7.611328125, -7.03125, -6.451171875, -5.87109375, -5.291015625, -4.7109375, -4.130859375, -3.55078125, -2.970703125, -2.390625, -1.810546875, -1.23046875, -0.650390625, -0.0703125, 0.509765625, 1.08984375, 1.669921875, 2.25, 2.830078125, 3.41015625, 3.990234375, 4.5703125, 5.150390625, 5.73046875, 6.310546875, 6.890625, 7.470703125, 8.05078125, 8.630859375, 9.2109375, 9.791015625, 10.37109375, 10.951171875, 11.53125, 12.111328125, 12.69140625, 13.271484375, 13.8515625, 14.431640625, 15.01171875, 15.591796875, 16.171875, 16.751953125, 17.33203125, 17.912109375, 18.4921875, 19.072265625, 19.65234375, 20.232421875, 20.8125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 6.0, 11.0, 12.0, 20.0, 30.0, 40.0, 67.0, 107.0, 171.0, 254.0, 435.0, 647.0, 1012.0, 1717.0, 2701.0, 4342.0, 7188.0, 11397.0, 19153.0, 31868.0, 53007.0, 89210.0, 145915.0, 236659.0, 365073.0, 514071.0, 626281.0, 623366.0, 506639.0, 359171.0, 231371.0, 143743.0, 86629.0, 51996.0, 31228.0, 18633.0, 11383.0, 7118.0, 4141.0, 2714.0, 1654.0, 1093.0, 758.0, 428.0, 282.0, 189.0, 115.0, 83.0, 52.0, 31.0, 24.0, 24.0, 12.0, 6.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-15.5390625, -15.0374755859375, -14.535888671875, -14.0343017578125, -13.53271484375, -13.0311279296875, -12.529541015625, -12.0279541015625, -11.5263671875, -11.0247802734375, -10.523193359375, -10.0216064453125, -9.52001953125, -9.0184326171875, -8.516845703125, -8.0152587890625, -7.513671875, -7.0120849609375, -6.510498046875, -6.0089111328125, -5.50732421875, -5.0057373046875, -4.504150390625, -4.0025634765625, -3.5009765625, -2.9993896484375, -2.497802734375, -1.9962158203125, -1.49462890625, -0.9930419921875, -0.491455078125, 0.0101318359375, 0.51171875, 1.0133056640625, 1.514892578125, 2.0164794921875, 2.51806640625, 3.0196533203125, 3.521240234375, 4.0228271484375, 4.5244140625, 5.0260009765625, 5.527587890625, 6.0291748046875, 6.53076171875, 7.0323486328125, 7.533935546875, 8.0355224609375, 8.537109375, 9.0386962890625, 9.540283203125, 10.0418701171875, 10.54345703125, 11.0450439453125, 11.546630859375, 12.0482177734375, 12.5498046875, 13.0513916015625, 13.552978515625, 14.0545654296875, 14.55615234375, 15.0577392578125, 15.559326171875, 16.0609130859375, 16.5625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 7.0, 7.0, 11.0, 14.0, 28.0, 27.0, 24.0, 35.0, 50.0, 47.0, 62.0, 104.0, 96.0, 110.0, 127.0, 132.0, 160.0, 215.0, 199.0, 248.0, 237.0, 241.0, 250.0, 227.0, 232.0, 209.0, 178.0, 156.0, 135.0, 96.0, 94.0, 71.0, 53.0, 44.0, 31.0, 31.0, 21.0, 17.0, 16.0, 7.0, 8.0, 3.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.75, -10.4576416015625, -10.165283203125, -9.8729248046875, -9.58056640625, -9.2882080078125, -8.995849609375, -8.7034912109375, -8.4111328125, -8.1187744140625, -7.826416015625, -7.5340576171875, -7.24169921875, -6.9493408203125, -6.656982421875, -6.3646240234375, -6.072265625, -5.7799072265625, -5.487548828125, -5.1951904296875, -4.90283203125, -4.6104736328125, -4.318115234375, -4.0257568359375, -3.7333984375, -3.4410400390625, -3.148681640625, -2.8563232421875, -2.56396484375, -2.2716064453125, -1.979248046875, -1.6868896484375, -1.39453125, -1.1021728515625, -0.809814453125, -0.5174560546875, -0.22509765625, 0.0672607421875, 0.359619140625, 0.6519775390625, 0.9443359375, 1.2366943359375, 1.529052734375, 1.8214111328125, 2.11376953125, 2.4061279296875, 2.698486328125, 2.9908447265625, 3.283203125, 3.5755615234375, 3.867919921875, 4.1602783203125, 4.45263671875, 4.7449951171875, 5.037353515625, 5.3297119140625, 5.6220703125, 5.9144287109375, 6.206787109375, 6.4991455078125, 6.79150390625, 7.0838623046875, 7.376220703125, 7.6685791015625, 7.9609375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 3.0, 7.0, 8.0, 6.0, 11.0, 19.0, 22.0, 28.0, 33.0, 55.0, 45.0, 56.0, 64.0, 77.0, 80.0, 67.0, 67.0, 64.0, 66.0, 52.0, 38.0, 30.0, 26.0, 12.0, 20.0, 10.0, 10.0, 5.0, 8.0, 4.0, 1.0, 6.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.038768768310547, -25.254058837890625, -24.469348907470703, -23.68463897705078, -22.89992904663086, -22.11522102355957, -21.33051109313965, -20.545801162719727, -19.761091232299805, -18.976381301879883, -18.19167137145996, -17.40696144104004, -16.62225341796875, -15.837542533874512, -15.052833557128906, -14.268123626708984, -13.483413696289062, -12.69870376586914, -11.913993835449219, -11.129284858703613, -10.344574928283691, -9.55986499786377, -8.775156021118164, -7.990446090698242, -7.20573616027832, -6.421026229858398, -5.636316776275635, -4.851607322692871, -4.066897392272949, -3.2821877002716064, -2.4974780082702637, -1.7127685546875, -0.9280605316162109, -0.14335083961486816, 0.6413588523864746, 1.4260685443878174, 2.21077823638916, 2.995487928390503, 3.7801976203918457, 4.564907073974609, 5.349617004394531, 6.134326934814453, 6.919036388397217, 7.7037458419799805, 8.488455772399902, 9.273165702819824, 10.05787467956543, 10.842584609985352, 11.627294540405273, 12.412004470825195, 13.196714401245117, 13.981423377990723, 14.766133308410645, 15.550843238830566, 16.335552215576172, 17.120262145996094, 17.904972076416016, 18.689682006835938, 19.47439193725586, 20.25910186767578, 21.043811798095703, 21.828519821166992, 22.613229751586914, 23.397939682006836, 24.182649612426758]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 5.0, 6.0, 10.0, 3.0, 9.0, 4.0, 9.0, 13.0, 18.0, 16.0, 19.0, 29.0, 31.0, 27.0, 24.0, 43.0, 26.0, 46.0, 27.0, 47.0, 38.0, 42.0, 32.0, 37.0, 36.0, 36.0, 51.0, 41.0, 23.0, 34.0, 32.0, 26.0, 20.0, 27.0, 22.0, 24.0, 6.0, 16.0, 13.0, 9.0, 10.0, 8.0, 6.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.271156311035156, -19.50245475769043, -18.733755111694336, -17.96505355834961, -17.196352005004883, -16.427650451660156, -15.658950805664062, -14.890249252319336, -14.121548652648926, -13.352848052978516, -12.584146499633789, -11.815445899963379, -11.046745300292969, -10.278043746948242, -9.509343147277832, -8.740642547607422, -7.971940994262695, -7.203239917755127, -6.434538841247559, -5.665838241577148, -4.89713716506958, -4.128436088562012, -3.3597354888916016, -2.591034412384033, -1.8223333358764648, -1.053632378578186, -0.2849314212799072, 0.48376941680908203, 1.2524704933166504, 2.0211715698242188, 2.789872169494629, 3.5585732460021973, 4.327272415161133, 5.095973491668701, 5.8646745681762695, 6.63337516784668, 7.402076244354248, 8.170777320861816, 8.939477920532227, 9.708179473876953, 10.476880073547363, 11.245580673217773, 12.0142822265625, 12.78298282623291, 13.55168342590332, 14.320384979248047, 15.089085578918457, 15.857786178588867, 16.626487731933594, 17.39518928527832, 18.163888931274414, 18.93259048461914, 19.701292037963867, 20.469993591308594, 21.238693237304688, 22.007394790649414, 22.77609634399414, 23.544797897338867, 24.31349754333496, 25.082199096679688, 25.850900650024414, 26.61960220336914, 27.388301849365234, 28.15700340270996, 28.925703048706055]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 4.0, 13.0, 14.0, 33.0, 25.0, 45.0, 66.0, 113.0, 118.0, 214.0, 367.0, 589.0, 891.0, 1580.0, 2571.0, 4361.0, 8567.0, 17667.0, 38155.0, 86518.0, 196665.0, 324338.0, 200671.0, 88038.0, 38902.0, 17845.0, 8875.0, 4579.0, 2570.0, 1520.0, 972.0, 609.0, 361.0, 231.0, 162.0, 104.0, 50.0, 42.0, 26.0, 22.0, 18.0, 11.0, 12.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.109375, -9.82470703125, -9.5400390625, -9.25537109375, -8.970703125, -8.68603515625, -8.4013671875, -8.11669921875, -7.83203125, -7.54736328125, -7.2626953125, -6.97802734375, -6.693359375, -6.40869140625, -6.1240234375, -5.83935546875, -5.5546875, -5.27001953125, -4.9853515625, -4.70068359375, -4.416015625, -4.13134765625, -3.8466796875, -3.56201171875, -3.27734375, -2.99267578125, -2.7080078125, -2.42333984375, -2.138671875, -1.85400390625, -1.5693359375, -1.28466796875, -1.0, -0.71533203125, -0.4306640625, -0.14599609375, 0.138671875, 0.42333984375, 0.7080078125, 0.99267578125, 1.27734375, 1.56201171875, 1.8466796875, 2.13134765625, 2.416015625, 2.70068359375, 2.9853515625, 3.27001953125, 3.5546875, 3.83935546875, 4.1240234375, 4.40869140625, 4.693359375, 4.97802734375, 5.2626953125, 5.54736328125, 5.83203125, 6.11669921875, 6.4013671875, 6.68603515625, 6.970703125, 7.25537109375, 7.5400390625, 7.82470703125, 8.109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 10.0, 6.0, 5.0, 11.0, 5.0, 20.0, 12.0, 21.0, 23.0, 21.0, 37.0, 21.0, 37.0, 34.0, 31.0, 42.0, 46.0, 37.0, 32.0, 39.0, 31.0, 47.0, 37.0, 44.0, 37.0, 28.0, 30.0, 44.0, 25.0, 26.0, 26.0, 13.0, 21.0, 18.0, 17.0, 12.0, 11.0, 9.0, 7.0, 5.0, 5.0, 3.0, 6.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.03125, -19.264892578125, -18.49853515625, -17.732177734375, -16.9658203125, -16.199462890625, -15.43310546875, -14.666748046875, -13.900390625, -13.134033203125, -12.36767578125, -11.601318359375, -10.8349609375, -10.068603515625, -9.30224609375, -8.535888671875, -7.76953125, -7.003173828125, -6.23681640625, -5.470458984375, -4.7041015625, -3.937744140625, -3.17138671875, -2.405029296875, -1.638671875, -0.872314453125, -0.10595703125, 0.660400390625, 1.4267578125, 2.193115234375, 2.95947265625, 3.725830078125, 4.4921875, 5.258544921875, 6.02490234375, 6.791259765625, 7.5576171875, 8.323974609375, 9.09033203125, 9.856689453125, 10.623046875, 11.389404296875, 12.15576171875, 12.922119140625, 13.6884765625, 14.454833984375, 15.22119140625, 15.987548828125, 16.75390625, 17.520263671875, 18.28662109375, 19.052978515625, 19.8193359375, 20.585693359375, 21.35205078125, 22.118408203125, 22.884765625, 23.651123046875, 24.41748046875, 25.183837890625, 25.9501953125, 26.716552734375, 27.48291015625, 28.249267578125, 29.015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 7.0, 10.0, 17.0, 33.0, 39.0, 55.0, 82.0, 147.0, 220.0, 436.0, 742.0, 1466.0, 3109.0, 7860.0, 21438.0, 65969.0, 225955.0, 456016.0, 181478.0, 53788.0, 17610.0, 6415.0, 2765.0, 1244.0, 690.0, 362.0, 219.0, 127.0, 89.0, 55.0, 39.0, 22.0, 13.0, 13.0, 8.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.375, -11.04443359375, -10.7138671875, -10.38330078125, -10.052734375, -9.72216796875, -9.3916015625, -9.06103515625, -8.73046875, -8.39990234375, -8.0693359375, -7.73876953125, -7.408203125, -7.07763671875, -6.7470703125, -6.41650390625, -6.0859375, -5.75537109375, -5.4248046875, -5.09423828125, -4.763671875, -4.43310546875, -4.1025390625, -3.77197265625, -3.44140625, -3.11083984375, -2.7802734375, -2.44970703125, -2.119140625, -1.78857421875, -1.4580078125, -1.12744140625, -0.796875, -0.46630859375, -0.1357421875, 0.19482421875, 0.525390625, 0.85595703125, 1.1865234375, 1.51708984375, 1.84765625, 2.17822265625, 2.5087890625, 2.83935546875, 3.169921875, 3.50048828125, 3.8310546875, 4.16162109375, 4.4921875, 4.82275390625, 5.1533203125, 5.48388671875, 5.814453125, 6.14501953125, 6.4755859375, 6.80615234375, 7.13671875, 7.46728515625, 7.7978515625, 8.12841796875, 8.458984375, 8.78955078125, 9.1201171875, 9.45068359375, 9.78125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 7.0, 3.0, 10.0, 5.0, 10.0, 3.0, 8.0, 12.0, 15.0, 10.0, 15.0, 12.0, 14.0, 23.0, 30.0, 29.0, 25.0, 25.0, 23.0, 24.0, 33.0, 26.0, 26.0, 34.0, 42.0, 37.0, 51.0, 29.0, 43.0, 32.0, 38.0, 41.0, 32.0, 27.0, 31.0, 18.0, 21.0, 19.0, 19.0, 6.0, 10.0, 11.0, 12.0, 8.0, 15.0, 6.0, 11.0, 6.0, 6.0, 2.0, 0.0, 3.0, 5.0, 0.0, 0.0, 2.0], "bins": [-16.625, -16.124755859375, -15.62451171875, -15.124267578125, -14.6240234375, -14.123779296875, -13.62353515625, -13.123291015625, -12.623046875, -12.122802734375, -11.62255859375, -11.122314453125, -10.6220703125, -10.121826171875, -9.62158203125, -9.121337890625, -8.62109375, -8.120849609375, -7.62060546875, -7.120361328125, -6.6201171875, -6.119873046875, -5.61962890625, -5.119384765625, -4.619140625, -4.118896484375, -3.61865234375, -3.118408203125, -2.6181640625, -2.117919921875, -1.61767578125, -1.117431640625, -0.6171875, -0.116943359375, 0.38330078125, 0.883544921875, 1.3837890625, 1.884033203125, 2.38427734375, 2.884521484375, 3.384765625, 3.885009765625, 4.38525390625, 4.885498046875, 5.3857421875, 5.885986328125, 6.38623046875, 6.886474609375, 7.38671875, 7.886962890625, 8.38720703125, 8.887451171875, 9.3876953125, 9.887939453125, 10.38818359375, 10.888427734375, 11.388671875, 11.888916015625, 12.38916015625, 12.889404296875, 13.3896484375, 13.889892578125, 14.39013671875, 14.890380859375, 15.390625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 9.0, 3.0, 8.0, 12.0, 15.0, 21.0, 36.0, 42.0, 61.0, 79.0, 107.0, 160.0, 248.0, 330.0, 486.0, 741.0, 1201.0, 1866.0, 3137.0, 5483.0, 10992.0, 28703.0, 406210.0, 532165.0, 30544.0, 11427.0, 5664.0, 3199.0, 1966.0, 1217.0, 770.0, 494.0, 342.0, 239.0, 170.0, 107.0, 84.0, 60.0, 49.0, 24.0, 23.0, 21.0, 12.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.5, -10.19140625, -9.8828125, -9.57421875, -9.265625, -8.95703125, -8.6484375, -8.33984375, -8.03125, -7.72265625, -7.4140625, -7.10546875, -6.796875, -6.48828125, -6.1796875, -5.87109375, -5.5625, -5.25390625, -4.9453125, -4.63671875, -4.328125, -4.01953125, -3.7109375, -3.40234375, -3.09375, -2.78515625, -2.4765625, -2.16796875, -1.859375, -1.55078125, -1.2421875, -0.93359375, -0.625, -0.31640625, -0.0078125, 0.30078125, 0.609375, 0.91796875, 1.2265625, 1.53515625, 1.84375, 2.15234375, 2.4609375, 2.76953125, 3.078125, 3.38671875, 3.6953125, 4.00390625, 4.3125, 4.62109375, 4.9296875, 5.23828125, 5.546875, 5.85546875, 6.1640625, 6.47265625, 6.78125, 7.08984375, 7.3984375, 7.70703125, 8.015625, 8.32421875, 8.6328125, 8.94140625, 9.25]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 4.0, 2.0, 8.0, 6.0, 5.0, 15.0, 23.0, 45.0, 112.0, 309.0, 275.0, 95.0, 30.0, 23.0, 12.0, 9.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009140968322753906, -0.0008854269981384277, -0.0008567571640014648, -0.000828087329864502, -0.0007994174957275391, -0.0007707476615905762, -0.0007420778274536133, -0.0007134079933166504, -0.0006847381591796875, -0.0006560683250427246, -0.0006273984909057617, -0.0005987286567687988, -0.0005700588226318359, -0.000541388988494873, -0.0005127191543579102, -0.00048404932022094727, -0.0004553794860839844, -0.0004267096519470215, -0.0003980398178100586, -0.0003693699836730957, -0.0003407001495361328, -0.0003120303153991699, -0.00028336048126220703, -0.00025469064712524414, -0.00022602081298828125, -0.00019735097885131836, -0.00016868114471435547, -0.00014001131057739258, -0.00011134147644042969, -8.26716423034668e-05, -5.4001808166503906e-05, -2.5331974029541016e-05, 3.337860107421875e-06, 3.2007694244384766e-05, 6.0677528381347656e-05, 8.934736251831055e-05, 0.00011801719665527344, 0.00014668703079223633, 0.00017535686492919922, 0.0002040266990661621, 0.000232696533203125, 0.0002613663673400879, 0.0002900362014770508, 0.00031870603561401367, 0.00034737586975097656, 0.00037604570388793945, 0.00040471553802490234, 0.00043338537216186523, 0.0004620552062988281, 0.000490725040435791, 0.0005193948745727539, 0.0005480647087097168, 0.0005767345428466797, 0.0006054043769836426, 0.0006340742111206055, 0.0006627440452575684, 0.0006914138793945312, 0.0007200837135314941, 0.000748753547668457, 0.0007774233818054199, 0.0008060932159423828, 0.0008347630500793457, 0.0008634328842163086, 0.0008921027183532715, 0.0009207725524902344]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 8.0, 9.0, 18.0, 26.0, 37.0, 52.0, 67.0, 108.0, 120.0, 189.0, 245.0, 392.0, 542.0, 819.0, 1259.0, 1885.0, 2978.0, 4779.0, 7500.0, 13166.0, 27888.0, 80089.0, 299012.0, 417866.0, 112900.0, 36686.0, 15999.0, 8657.0, 5302.0, 3381.0, 2122.0, 1438.0, 946.0, 657.0, 435.0, 283.0, 197.0, 145.0, 96.0, 61.0, 64.0, 39.0, 32.0, 16.0, 12.0, 13.0, 12.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.765625, -4.62603759765625, -4.4864501953125, -4.34686279296875, -4.207275390625, -4.06768798828125, -3.9281005859375, -3.78851318359375, -3.64892578125, -3.50933837890625, -3.3697509765625, -3.23016357421875, -3.090576171875, -2.95098876953125, -2.8114013671875, -2.67181396484375, -2.5322265625, -2.39263916015625, -2.2530517578125, -2.11346435546875, -1.973876953125, -1.83428955078125, -1.6947021484375, -1.55511474609375, -1.41552734375, -1.27593994140625, -1.1363525390625, -0.99676513671875, -0.857177734375, -0.71759033203125, -0.5780029296875, -0.43841552734375, -0.298828125, -0.15924072265625, -0.0196533203125, 0.11993408203125, 0.259521484375, 0.39910888671875, 0.5386962890625, 0.67828369140625, 0.81787109375, 0.95745849609375, 1.0970458984375, 1.23663330078125, 1.376220703125, 1.51580810546875, 1.6553955078125, 1.79498291015625, 1.9345703125, 2.07415771484375, 2.2137451171875, 2.35333251953125, 2.492919921875, 2.63250732421875, 2.7720947265625, 2.91168212890625, 3.05126953125, 3.19085693359375, 3.3304443359375, 3.47003173828125, 3.609619140625, 3.74920654296875, 3.8887939453125, 4.02838134765625, 4.16796875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 9.0, 5.0, 11.0, 8.0, 7.0, 16.0, 10.0, 28.0, 29.0, 68.0, 76.0, 120.0, 149.0, 128.0, 89.0, 52.0, 52.0, 34.0, 32.0, 12.0, 10.0, 9.0, 7.0, 8.0, 4.0, 5.0, 7.0, 1.0, 1.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.904296875, -1.83587646484375, -1.7674560546875, -1.69903564453125, -1.630615234375, -1.56219482421875, -1.4937744140625, -1.42535400390625, -1.35693359375, -1.28851318359375, -1.2200927734375, -1.15167236328125, -1.083251953125, -1.01483154296875, -0.9464111328125, -0.87799072265625, -0.8095703125, -0.74114990234375, -0.6727294921875, -0.60430908203125, -0.535888671875, -0.46746826171875, -0.3990478515625, -0.33062744140625, -0.26220703125, -0.19378662109375, -0.1253662109375, -0.05694580078125, 0.011474609375, 0.07989501953125, 0.1483154296875, 0.21673583984375, 0.28515625, 0.35357666015625, 0.4219970703125, 0.49041748046875, 0.558837890625, 0.62725830078125, 0.6956787109375, 0.76409912109375, 0.83251953125, 0.90093994140625, 0.9693603515625, 1.03778076171875, 1.106201171875, 1.17462158203125, 1.2430419921875, 1.31146240234375, 1.3798828125, 1.44830322265625, 1.5167236328125, 1.58514404296875, 1.653564453125, 1.72198486328125, 1.7904052734375, 1.85882568359375, 1.92724609375, 1.99566650390625, 2.0640869140625, 2.13250732421875, 2.200927734375, 2.26934814453125, 2.3377685546875, 2.40618896484375, 2.474609375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 6.0, 12.0, 16.0, 21.0, 35.0, 37.0, 52.0, 46.0, 65.0, 61.0, 72.0, 89.0, 57.0, 62.0, 69.0, 57.0, 57.0, 42.0, 20.0, 30.0, 15.0, 14.0, 13.0, 6.0, 6.0, 10.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.518566131591797, -23.74705696105957, -22.975547790527344, -22.204036712646484, -21.432527542114258, -20.66101837158203, -19.889507293701172, -19.117998123168945, -18.34648895263672, -17.574979782104492, -16.803470611572266, -16.031959533691406, -15.26045036315918, -14.488941192626953, -13.71743106842041, -12.945920944213867, -12.17441177368164, -11.402902603149414, -10.631392478942871, -9.859882354736328, -9.088373184204102, -8.316864013671875, -7.545353889465332, -6.773844242095947, -6.0023345947265625, -5.230824947357178, -4.459315299987793, -3.687805652618408, -2.9162960052490234, -2.1447863578796387, -1.373276710510254, -0.6017670631408691, 0.16974449157714844, 0.9412541389465332, 1.712763786315918, 2.4842734336853027, 3.2557830810546875, 4.027292728424072, 4.798802375793457, 5.570312023162842, 6.341821670532227, 7.113331317901611, 7.884840965270996, 8.656351089477539, 9.427860260009766, 10.199369430541992, 10.970879554748535, 11.742389678955078, 12.513898849487305, 13.285408020019531, 14.056918144226074, 14.828428268432617, 15.599937438964844, 16.37144660949707, 17.142955780029297, 17.914466857910156, 18.685976028442383, 19.45748519897461, 20.22899627685547, 21.000505447387695, 21.772014617919922, 22.54352378845215, 23.315032958984375, 24.086544036865234, 24.85805320739746]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 8.0, 3.0, 5.0, 8.0, 8.0, 17.0, 19.0, 16.0, 30.0, 25.0, 26.0, 30.0, 35.0, 32.0, 32.0, 37.0, 42.0, 51.0, 30.0, 32.0, 46.0, 38.0, 29.0, 52.0, 38.0, 34.0, 35.0, 29.0, 27.0, 28.0, 22.0, 22.0, 19.0, 19.0, 9.0, 17.0, 12.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.785240173339844, -20.018680572509766, -19.252120971679688, -18.48556137084961, -17.719003677368164, -16.952444076538086, -16.185884475708008, -15.41932487487793, -14.652766227722168, -13.88620662689209, -13.119647979736328, -12.35308837890625, -11.586528778076172, -10.81997013092041, -10.053410530090332, -9.28685188293457, -8.520292282104492, -7.753733158111572, -6.987174034118652, -6.220614433288574, -5.454055309295654, -4.687496185302734, -3.9209365844726562, -3.1543774604797363, -2.3878183364868164, -1.621259093284607, -0.8546998500823975, -0.08814048767089844, 0.6784186363220215, 1.4449777603149414, 2.2115373611450195, 2.9780964851379395, 3.7446537017822266, 4.5112128257751465, 5.277771949768066, 6.0443315505981445, 6.8108906745910645, 7.577449798583984, 8.344009399414062, 9.11056900024414, 9.877127647399902, 10.64368724822998, 11.410245895385742, 12.17680549621582, 12.943365097045898, 13.70992374420166, 14.476483345031738, 15.2430419921875, 16.009601593017578, 16.776161193847656, 17.542720794677734, 18.309280395507812, 19.075838088989258, 19.842397689819336, 20.608957290649414, 21.375516891479492, 22.142074584960938, 22.908634185791016, 23.675193786621094, 24.441753387451172, 25.208311080932617, 25.974870681762695, 26.741430282592773, 27.50798988342285, 28.27454948425293]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 7.0, 5.0, 2.0, 12.0, 20.0, 26.0, 31.0, 52.0, 64.0, 120.0, 181.0, 253.0, 451.0, 708.0, 1019.0, 1634.0, 2485.0, 4000.0, 6326.0, 9762.0, 15576.0, 24718.0, 38490.0, 58543.0, 84890.0, 115195.0, 138764.0, 142298.0, 123186.0, 94169.0, 65504.0, 43345.0, 27835.0, 17692.0, 11378.0, 7182.0, 4565.0, 2889.0, 1854.0, 1236.0, 727.0, 498.0, 311.0, 191.0, 145.0, 93.0, 43.0, 29.0, 20.0, 21.0, 4.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-16.375, -15.831787109375, -15.28857421875, -14.745361328125, -14.2021484375, -13.658935546875, -13.11572265625, -12.572509765625, -12.029296875, -11.486083984375, -10.94287109375, -10.399658203125, -9.8564453125, -9.313232421875, -8.77001953125, -8.226806640625, -7.68359375, -7.140380859375, -6.59716796875, -6.053955078125, -5.5107421875, -4.967529296875, -4.42431640625, -3.881103515625, -3.337890625, -2.794677734375, -2.25146484375, -1.708251953125, -1.1650390625, -0.621826171875, -0.07861328125, 0.464599609375, 1.0078125, 1.551025390625, 2.09423828125, 2.637451171875, 3.1806640625, 3.723876953125, 4.26708984375, 4.810302734375, 5.353515625, 5.896728515625, 6.43994140625, 6.983154296875, 7.5263671875, 8.069580078125, 8.61279296875, 9.156005859375, 9.69921875, 10.242431640625, 10.78564453125, 11.328857421875, 11.8720703125, 12.415283203125, 12.95849609375, 13.501708984375, 14.044921875, 14.588134765625, 15.13134765625, 15.674560546875, 16.2177734375, 16.760986328125, 17.30419921875, 17.847412109375, 18.390625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 7.0, 5.0, 7.0, 7.0, 10.0, 19.0, 13.0, 17.0, 25.0, 28.0, 26.0, 27.0, 40.0, 29.0, 26.0, 32.0, 51.0, 35.0, 48.0, 33.0, 37.0, 39.0, 39.0, 41.0, 40.0, 40.0, 33.0, 32.0, 23.0, 34.0, 21.0, 21.0, 16.0, 19.0, 17.0, 13.0, 13.0, 6.0, 10.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -18.948974609375, -18.22607421875, -17.503173828125, -16.7802734375, -16.057373046875, -15.33447265625, -14.611572265625, -13.888671875, -13.165771484375, -12.44287109375, -11.719970703125, -10.9970703125, -10.274169921875, -9.55126953125, -8.828369140625, -8.10546875, -7.382568359375, -6.65966796875, -5.936767578125, -5.2138671875, -4.490966796875, -3.76806640625, -3.045166015625, -2.322265625, -1.599365234375, -0.87646484375, -0.153564453125, 0.5693359375, 1.292236328125, 2.01513671875, 2.738037109375, 3.4609375, 4.183837890625, 4.90673828125, 5.629638671875, 6.3525390625, 7.075439453125, 7.79833984375, 8.521240234375, 9.244140625, 9.967041015625, 10.68994140625, 11.412841796875, 12.1357421875, 12.858642578125, 13.58154296875, 14.304443359375, 15.02734375, 15.750244140625, 16.47314453125, 17.196044921875, 17.9189453125, 18.641845703125, 19.36474609375, 20.087646484375, 20.810546875, 21.533447265625, 22.25634765625, 22.979248046875, 23.7021484375, 24.425048828125, 25.14794921875, 25.870849609375, 26.59375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 8.0, 6.0, 11.0, 12.0, 14.0, 29.0, 49.0, 68.0, 110.0, 186.0, 261.0, 397.0, 526.0, 906.0, 1286.0, 2216.0, 3384.0, 5347.0, 8289.0, 13115.0, 20566.0, 32155.0, 49188.0, 72492.0, 99897.0, 126636.0, 139565.0, 131126.0, 106750.0, 79385.0, 54737.0, 36065.0, 23148.0, 14801.0, 9287.0, 6011.0, 3714.0, 2384.0, 1573.0, 981.0, 632.0, 384.0, 296.0, 198.0, 111.0, 79.0, 66.0, 33.0, 35.0, 14.0, 14.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.609375, -16.084228515625, -15.55908203125, -15.033935546875, -14.5087890625, -13.983642578125, -13.45849609375, -12.933349609375, -12.408203125, -11.883056640625, -11.35791015625, -10.832763671875, -10.3076171875, -9.782470703125, -9.25732421875, -8.732177734375, -8.20703125, -7.681884765625, -7.15673828125, -6.631591796875, -6.1064453125, -5.581298828125, -5.05615234375, -4.531005859375, -4.005859375, -3.480712890625, -2.95556640625, -2.430419921875, -1.9052734375, -1.380126953125, -0.85498046875, -0.329833984375, 0.1953125, 0.720458984375, 1.24560546875, 1.770751953125, 2.2958984375, 2.821044921875, 3.34619140625, 3.871337890625, 4.396484375, 4.921630859375, 5.44677734375, 5.971923828125, 6.4970703125, 7.022216796875, 7.54736328125, 8.072509765625, 8.59765625, 9.122802734375, 9.64794921875, 10.173095703125, 10.6982421875, 11.223388671875, 11.74853515625, 12.273681640625, 12.798828125, 13.323974609375, 13.84912109375, 14.374267578125, 14.8994140625, 15.424560546875, 15.94970703125, 16.474853515625, 17.0]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 5.0, 4.0, 6.0, 5.0, 8.0, 22.0, 14.0, 17.0, 25.0, 22.0, 28.0, 29.0, 38.0, 38.0, 27.0, 41.0, 32.0, 52.0, 40.0, 43.0, 44.0, 37.0, 32.0, 22.0, 36.0, 40.0, 41.0, 27.0, 41.0, 21.0, 16.0, 22.0, 20.0, 26.0, 17.0, 8.0, 10.0, 8.0, 10.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.171875, -12.7109375, -12.25, -11.7890625, -11.328125, -10.8671875, -10.40625, -9.9453125, -9.484375, -9.0234375, -8.5625, -8.1015625, -7.640625, -7.1796875, -6.71875, -6.2578125, -5.796875, -5.3359375, -4.875, -4.4140625, -3.953125, -3.4921875, -3.03125, -2.5703125, -2.109375, -1.6484375, -1.1875, -0.7265625, -0.265625, 0.1953125, 0.65625, 1.1171875, 1.578125, 2.0390625, 2.5, 2.9609375, 3.421875, 3.8828125, 4.34375, 4.8046875, 5.265625, 5.7265625, 6.1875, 6.6484375, 7.109375, 7.5703125, 8.03125, 8.4921875, 8.953125, 9.4140625, 9.875, 10.3359375, 10.796875, 11.2578125, 11.71875, 12.1796875, 12.640625, 13.1015625, 13.5625, 14.0234375, 14.484375, 14.9453125, 15.40625, 15.8671875, 16.328125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 4.0, 7.0, 7.0, 9.0, 16.0, 22.0, 33.0, 64.0, 109.0, 133.0, 213.0, 342.0, 484.0, 764.0, 1102.0, 1871.0, 2920.0, 4584.0, 7336.0, 11738.0, 19173.0, 31104.0, 52009.0, 84377.0, 130404.0, 171507.0, 173054.0, 132145.0, 86545.0, 52711.0, 31882.0, 19352.0, 12121.0, 7344.0, 4713.0, 3039.0, 1877.0, 1219.0, 784.0, 492.0, 309.0, 242.0, 132.0, 88.0, 62.0, 46.0, 25.0, 19.0, 9.0, 6.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.3984375, -6.185302734375, -5.97216796875, -5.759033203125, -5.5458984375, -5.332763671875, -5.11962890625, -4.906494140625, -4.693359375, -4.480224609375, -4.26708984375, -4.053955078125, -3.8408203125, -3.627685546875, -3.41455078125, -3.201416015625, -2.98828125, -2.775146484375, -2.56201171875, -2.348876953125, -2.1357421875, -1.922607421875, -1.70947265625, -1.496337890625, -1.283203125, -1.070068359375, -0.85693359375, -0.643798828125, -0.4306640625, -0.217529296875, -0.00439453125, 0.208740234375, 0.421875, 0.635009765625, 0.84814453125, 1.061279296875, 1.2744140625, 1.487548828125, 1.70068359375, 1.913818359375, 2.126953125, 2.340087890625, 2.55322265625, 2.766357421875, 2.9794921875, 3.192626953125, 3.40576171875, 3.618896484375, 3.83203125, 4.045166015625, 4.25830078125, 4.471435546875, 4.6845703125, 4.897705078125, 5.11083984375, 5.323974609375, 5.537109375, 5.750244140625, 5.96337890625, 6.176513671875, 6.3896484375, 6.602783203125, 6.81591796875, 7.029052734375, 7.2421875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 10.0, 11.0, 13.0, 11.0, 22.0, 24.0, 24.0, 32.0, 28.0, 49.0, 53.0, 58.0, 61.0, 76.0, 58.0, 67.0, 66.0, 42.0, 52.0, 37.0, 39.0, 38.0, 26.0, 17.0, 14.0, 10.0, 9.0, 8.0, 9.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005183219909667969, -0.0005004033446311951, -0.00048248469829559326, -0.00046456605195999146, -0.00044664740562438965, -0.00042872875928878784, -0.00041081011295318604, -0.00039289146661758423, -0.0003749728202819824, -0.0003570541739463806, -0.0003391355276107788, -0.000321216881275177, -0.0003032982349395752, -0.0002853795886039734, -0.0002674609422683716, -0.0002495422959327698, -0.00023162364959716797, -0.00021370500326156616, -0.00019578635692596436, -0.00017786771059036255, -0.00015994906425476074, -0.00014203041791915894, -0.00012411177158355713, -0.00010619312524795532, -8.827447891235352e-05, -7.035583257675171e-05, -5.24371862411499e-05, -3.4518539905548096e-05, -1.659989356994629e-05, 1.3187527656555176e-06, 1.9237399101257324e-05, 3.715604543685913e-05, 5.507469177246094e-05, 7.299333810806274e-05, 9.091198444366455e-05, 0.00010883063077926636, 0.00012674927711486816, 0.00014466792345046997, 0.00016258656978607178, 0.00018050521612167358, 0.0001984238624572754, 0.0002163425087928772, 0.000234261155128479, 0.0002521798014640808, 0.0002700984477996826, 0.0002880170941352844, 0.00030593574047088623, 0.00032385438680648804, 0.00034177303314208984, 0.00035969167947769165, 0.00037761032581329346, 0.00039552897214889526, 0.00041344761848449707, 0.0004313662648200989, 0.0004492849111557007, 0.0004672035574913025, 0.0004851222038269043, 0.0005030408501625061, 0.0005209594964981079, 0.0005388781428337097, 0.0005567967891693115, 0.0005747154355049133, 0.0005926340818405151, 0.0006105527281761169, 0.0006284713745117188]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 10.0, 30.0, 27.0, 50.0, 59.0, 117.0, 151.0, 208.0, 296.0, 504.0, 819.0, 1250.0, 2085.0, 3449.0, 6055.0, 10650.0, 18595.0, 33422.0, 59423.0, 102276.0, 159942.0, 197269.0, 174609.0, 116887.0, 69349.0, 39194.0, 22001.0, 12235.0, 7095.0, 4039.0, 2428.0, 1426.0, 926.0, 542.0, 393.0, 238.0, 163.0, 112.0, 73.0, 56.0, 34.0, 20.0, 23.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0546875, -6.816650390625, -6.57861328125, -6.340576171875, -6.1025390625, -5.864501953125, -5.62646484375, -5.388427734375, -5.150390625, -4.912353515625, -4.67431640625, -4.436279296875, -4.1982421875, -3.960205078125, -3.72216796875, -3.484130859375, -3.24609375, -3.008056640625, -2.77001953125, -2.531982421875, -2.2939453125, -2.055908203125, -1.81787109375, -1.579833984375, -1.341796875, -1.103759765625, -0.86572265625, -0.627685546875, -0.3896484375, -0.151611328125, 0.08642578125, 0.324462890625, 0.5625, 0.800537109375, 1.03857421875, 1.276611328125, 1.5146484375, 1.752685546875, 1.99072265625, 2.228759765625, 2.466796875, 2.704833984375, 2.94287109375, 3.180908203125, 3.4189453125, 3.656982421875, 3.89501953125, 4.133056640625, 4.37109375, 4.609130859375, 4.84716796875, 5.085205078125, 5.3232421875, 5.561279296875, 5.79931640625, 6.037353515625, 6.275390625, 6.513427734375, 6.75146484375, 6.989501953125, 7.2275390625, 7.465576171875, 7.70361328125, 7.941650390625, 8.1796875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 4.0, 9.0, 10.0, 14.0, 14.0, 22.0, 20.0, 30.0, 29.0, 40.0, 44.0, 38.0, 49.0, 53.0, 43.0, 45.0, 39.0, 51.0, 54.0, 49.0, 33.0, 39.0, 30.0, 42.0, 23.0, 21.0, 19.0, 18.0, 22.0, 14.0, 12.0, 10.0, 14.0, 10.0, 6.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.681640625, -2.585052490234375, -2.48846435546875, -2.391876220703125, -2.2952880859375, -2.198699951171875, -2.10211181640625, -2.005523681640625, -1.908935546875, -1.812347412109375, -1.71575927734375, -1.619171142578125, -1.5225830078125, -1.425994873046875, -1.32940673828125, -1.232818603515625, -1.13623046875, -1.039642333984375, -0.94305419921875, -0.846466064453125, -0.7498779296875, -0.653289794921875, -0.55670166015625, -0.460113525390625, -0.363525390625, -0.266937255859375, -0.17034912109375, -0.073760986328125, 0.0228271484375, 0.119415283203125, 0.21600341796875, 0.312591552734375, 0.4091796875, 0.505767822265625, 0.60235595703125, 0.698944091796875, 0.7955322265625, 0.892120361328125, 0.98870849609375, 1.085296630859375, 1.181884765625, 1.278472900390625, 1.37506103515625, 1.471649169921875, 1.5682373046875, 1.664825439453125, 1.76141357421875, 1.858001708984375, 1.95458984375, 2.051177978515625, 2.14776611328125, 2.244354248046875, 2.3409423828125, 2.437530517578125, 2.53411865234375, 2.630706787109375, 2.727294921875, 2.823883056640625, 2.92047119140625, 3.017059326171875, 3.1136474609375, 3.210235595703125, 3.30682373046875, 3.403411865234375, 3.5]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 9.0, 11.0, 11.0, 16.0, 12.0, 27.0, 26.0, 42.0, 36.0, 58.0, 71.0, 68.0, 65.0, 84.0, 75.0, 63.0, 53.0, 68.0, 44.0, 42.0, 22.0, 28.0, 10.0, 11.0, 13.0, 9.0, 6.0, 10.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.39774513244629, -22.63043975830078, -21.86313247680664, -21.095827102661133, -20.328521728515625, -19.561216354370117, -18.79391098022461, -18.02660369873047, -17.25929832458496, -16.491992950439453, -15.724686622619629, -14.957380294799805, -14.190074920654297, -13.422769546508789, -12.655463218688965, -11.88815689086914, -11.120851516723633, -10.353546142578125, -9.5862398147583, -8.818933486938477, -8.051628112792969, -7.284322261810303, -6.517016410827637, -5.749710559844971, -4.982404708862305, -4.215098857879639, -3.4477930068969727, -2.6804871559143066, -1.9131813049316406, -1.1458754539489746, -0.3785696029663086, 0.3887362480163574, 1.1560401916503906, 1.9233460426330566, 2.6906518936157227, 3.4579577445983887, 4.225263595581055, 4.992569446563721, 5.759875297546387, 6.527181148529053, 7.294486999511719, 8.061792373657227, 8.82909870147705, 9.596405029296875, 10.363710403442383, 11.13101577758789, 11.898322105407715, 12.665628433227539, 13.432933807373047, 14.200239181518555, 14.967545509338379, 15.734851837158203, 16.50215721130371, 17.26946258544922, 18.03676986694336, 18.804075241088867, 19.571380615234375, 20.338685989379883, 21.10599136352539, 21.87329864501953, 22.64060401916504, 23.407909393310547, 24.175216674804688, 24.942522048950195, 25.709827423095703]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 8.0, 9.0, 12.0, 13.0, 19.0, 24.0, 15.0, 27.0, 23.0, 39.0, 24.0, 29.0, 38.0, 36.0, 32.0, 40.0, 38.0, 36.0, 36.0, 44.0, 43.0, 39.0, 25.0, 36.0, 36.0, 27.0, 25.0, 29.0, 31.0, 24.0, 19.0, 18.0, 12.0, 23.0, 10.0, 15.0, 8.0, 6.0, 7.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.135269165039062, -21.365734100341797, -20.59619903564453, -19.826663970947266, -19.05712890625, -18.287593841552734, -17.51805877685547, -16.748523712158203, -15.978988647460938, -15.209453582763672, -14.439918518066406, -13.67038345336914, -12.900848388671875, -12.13131332397461, -11.361778259277344, -10.592243194580078, -9.822708129882812, -9.053173065185547, -8.283638000488281, -7.514102935791016, -6.74456787109375, -5.975032806396484, -5.205497741699219, -4.435962677001953, -3.6664276123046875, -2.896892547607422, -2.1273574829101562, -1.3578224182128906, -0.588287353515625, 0.18124771118164062, 0.9507827758789062, 1.7203178405761719, 2.4898548126220703, 3.259389877319336, 4.028924942016602, 4.798460006713867, 5.567995071411133, 6.337530136108398, 7.107065200805664, 7.87660026550293, 8.646135330200195, 9.415670394897461, 10.185205459594727, 10.954740524291992, 11.724275588989258, 12.493810653686523, 13.263345718383789, 14.032880783081055, 14.80241584777832, 15.571950912475586, 16.34148597717285, 17.111021041870117, 17.880556106567383, 18.65009117126465, 19.419626235961914, 20.18916130065918, 20.958696365356445, 21.72823143005371, 22.497766494750977, 23.267301559448242, 24.036836624145508, 24.806371688842773, 25.57590675354004, 26.345441818237305, 27.11497688293457]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 8.0, 20.0, 22.0, 38.0, 66.0, 88.0, 180.0, 299.0, 536.0, 887.0, 1414.0, 2432.0, 4057.0, 6709.0, 11258.0, 18836.0, 31140.0, 52644.0, 89661.0, 153073.0, 265083.0, 444455.0, 674960.0, 782243.0, 642398.0, 414706.0, 243767.0, 142431.0, 83168.0, 49036.0, 29940.0, 18018.0, 11327.0, 6818.0, 4424.0, 2920.0, 1739.0, 1167.0, 763.0, 478.0, 327.0, 218.0, 171.0, 128.0, 69.0, 55.0, 48.0, 25.0, 15.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.25, -14.73193359375, -14.2138671875, -13.69580078125, -13.177734375, -12.65966796875, -12.1416015625, -11.62353515625, -11.10546875, -10.58740234375, -10.0693359375, -9.55126953125, -9.033203125, -8.51513671875, -7.9970703125, -7.47900390625, -6.9609375, -6.44287109375, -5.9248046875, -5.40673828125, -4.888671875, -4.37060546875, -3.8525390625, -3.33447265625, -2.81640625, -2.29833984375, -1.7802734375, -1.26220703125, -0.744140625, -0.22607421875, 0.2919921875, 0.81005859375, 1.328125, 1.84619140625, 2.3642578125, 2.88232421875, 3.400390625, 3.91845703125, 4.4365234375, 4.95458984375, 5.47265625, 5.99072265625, 6.5087890625, 7.02685546875, 7.544921875, 8.06298828125, 8.5810546875, 9.09912109375, 9.6171875, 10.13525390625, 10.6533203125, 11.17138671875, 11.689453125, 12.20751953125, 12.7255859375, 13.24365234375, 13.76171875, 14.27978515625, 14.7978515625, 15.31591796875, 15.833984375, 16.35205078125, 16.8701171875, 17.38818359375, 17.90625]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 10.0, 7.0, 14.0, 12.0, 14.0, 15.0, 16.0, 11.0, 29.0, 27.0, 26.0, 36.0, 36.0, 33.0, 22.0, 42.0, 37.0, 36.0, 45.0, 46.0, 37.0, 35.0, 27.0, 40.0, 35.0, 24.0, 36.0, 25.0, 22.0, 36.0, 18.0, 18.0, 18.0, 22.0, 17.0, 11.0, 9.0, 14.0, 7.0, 6.0, 10.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.6328125, -13.1451416015625, -12.657470703125, -12.1697998046875, -11.68212890625, -11.1944580078125, -10.706787109375, -10.2191162109375, -9.7314453125, -9.2437744140625, -8.756103515625, -8.2684326171875, -7.78076171875, -7.2930908203125, -6.805419921875, -6.3177490234375, -5.830078125, -5.3424072265625, -4.854736328125, -4.3670654296875, -3.87939453125, -3.3917236328125, -2.904052734375, -2.4163818359375, -1.9287109375, -1.4410400390625, -0.953369140625, -0.4656982421875, 0.02197265625, 0.5096435546875, 0.997314453125, 1.4849853515625, 1.97265625, 2.4603271484375, 2.947998046875, 3.4356689453125, 3.92333984375, 4.4110107421875, 4.898681640625, 5.3863525390625, 5.8740234375, 6.3616943359375, 6.849365234375, 7.3370361328125, 7.82470703125, 8.3123779296875, 8.800048828125, 9.2877197265625, 9.775390625, 10.2630615234375, 10.750732421875, 11.2384033203125, 11.72607421875, 12.2137451171875, 12.701416015625, 13.1890869140625, 13.6767578125, 14.1644287109375, 14.652099609375, 15.1397705078125, 15.62744140625, 16.1151123046875, 16.602783203125, 17.0904541015625, 17.578125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 17.0, 34.0, 36.0, 66.0, 101.0, 143.0, 246.0, 350.0, 579.0, 924.0, 1523.0, 2467.0, 4232.0, 7006.0, 11765.0, 19919.0, 34972.0, 61072.0, 106601.0, 183920.0, 305258.0, 467943.0, 625165.0, 683032.0, 592978.0, 426550.0, 272121.0, 162297.0, 94163.0, 53861.0, 30736.0, 17796.0, 10562.0, 6288.0, 3690.0, 2239.0, 1387.0, 818.0, 508.0, 309.0, 189.0, 128.0, 99.0, 63.0, 50.0, 21.0, 20.0, 4.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-13.734375, -13.2967529296875, -12.859130859375, -12.4215087890625, -11.98388671875, -11.5462646484375, -11.108642578125, -10.6710205078125, -10.2333984375, -9.7957763671875, -9.358154296875, -8.9205322265625, -8.48291015625, -8.0452880859375, -7.607666015625, -7.1700439453125, -6.732421875, -6.2947998046875, -5.857177734375, -5.4195556640625, -4.98193359375, -4.5443115234375, -4.106689453125, -3.6690673828125, -3.2314453125, -2.7938232421875, -2.356201171875, -1.9185791015625, -1.48095703125, -1.0433349609375, -0.605712890625, -0.1680908203125, 0.26953125, 0.7071533203125, 1.144775390625, 1.5823974609375, 2.02001953125, 2.4576416015625, 2.895263671875, 3.3328857421875, 3.7705078125, 4.2081298828125, 4.645751953125, 5.0833740234375, 5.52099609375, 5.9586181640625, 6.396240234375, 6.8338623046875, 7.271484375, 7.7091064453125, 8.146728515625, 8.5843505859375, 9.02197265625, 9.4595947265625, 9.897216796875, 10.3348388671875, 10.7724609375, 11.2100830078125, 11.647705078125, 12.0853271484375, 12.52294921875, 12.9605712890625, 13.398193359375, 13.8358154296875, 14.2734375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 6.0, 7.0, 14.0, 15.0, 23.0, 20.0, 36.0, 41.0, 51.0, 55.0, 51.0, 86.0, 107.0, 141.0, 148.0, 162.0, 178.0, 202.0, 220.0, 197.0, 228.0, 215.0, 238.0, 233.0, 198.0, 203.0, 189.0, 153.0, 125.0, 99.0, 96.0, 72.0, 54.0, 45.0, 41.0, 30.0, 15.0, 27.0, 11.0, 17.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.829345703125, -7.58837890625, -7.347412109375, -7.1064453125, -6.865478515625, -6.62451171875, -6.383544921875, -6.142578125, -5.901611328125, -5.66064453125, -5.419677734375, -5.1787109375, -4.937744140625, -4.69677734375, -4.455810546875, -4.21484375, -3.973876953125, -3.73291015625, -3.491943359375, -3.2509765625, -3.010009765625, -2.76904296875, -2.528076171875, -2.287109375, -2.046142578125, -1.80517578125, -1.564208984375, -1.3232421875, -1.082275390625, -0.84130859375, -0.600341796875, -0.359375, -0.118408203125, 0.12255859375, 0.363525390625, 0.6044921875, 0.845458984375, 1.08642578125, 1.327392578125, 1.568359375, 1.809326171875, 2.05029296875, 2.291259765625, 2.5322265625, 2.773193359375, 3.01416015625, 3.255126953125, 3.49609375, 3.737060546875, 3.97802734375, 4.218994140625, 4.4599609375, 4.700927734375, 4.94189453125, 5.182861328125, 5.423828125, 5.664794921875, 5.90576171875, 6.146728515625, 6.3876953125, 6.628662109375, 6.86962890625, 7.110595703125, 7.3515625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 9.0, 18.0, 20.0, 24.0, 35.0, 20.0, 38.0, 47.0, 65.0, 74.0, 73.0, 67.0, 76.0, 75.0, 70.0, 43.0, 43.0, 33.0, 34.0, 30.0, 19.0, 20.0, 14.0, 7.0, 10.0, 4.0, 9.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.388673782348633, -16.778060913085938, -16.16744613647461, -15.556832313537598, -14.946218490600586, -14.33560562133789, -13.724991798400879, -13.114377975463867, -12.503764152526855, -11.893150329589844, -11.282536506652832, -10.67192268371582, -10.061309814453125, -9.450695037841797, -8.840082168579102, -8.22946834564209, -7.618854522705078, -7.008240699768066, -6.397626876831055, -5.787013530731201, -5.1763997077941895, -4.565785884857178, -3.955172300338745, -3.3445587158203125, -2.733944892883301, -2.123331069946289, -1.5127174854278564, -0.9021037817001343, -0.2914900779724121, 0.3191237449645996, 0.9297373294830322, 1.5403509140014648, 2.1509628295898438, 2.7615766525268555, 3.372190237045288, 3.9828038215637207, 4.593417644500732, 5.204031467437744, 5.814644813537598, 6.425258636474609, 7.035872459411621, 7.646486282348633, 8.257100105285645, 8.867713928222656, 9.478326797485352, 10.08894157409668, 10.699554443359375, 11.310168266296387, 11.920782089233398, 12.53139591217041, 13.142009735107422, 13.752623558044434, 14.363237380981445, 14.97385025024414, 15.584464073181152, 16.195077896118164, 16.80569076538086, 17.416303634643555, 18.026918411254883, 18.637531280517578, 19.248146057128906, 19.8587589263916, 20.46937370300293, 21.079986572265625, 21.690601348876953]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 8.0, 9.0, 16.0, 11.0, 19.0, 12.0, 24.0, 25.0, 33.0, 26.0, 32.0, 41.0, 31.0, 39.0, 47.0, 42.0, 38.0, 28.0, 42.0, 39.0, 36.0, 41.0, 30.0, 38.0, 39.0, 26.0, 31.0, 25.0, 19.0, 28.0, 25.0, 17.0, 12.0, 11.0, 13.0, 6.0, 11.0, 9.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.551782608032227, -18.901512145996094, -18.251239776611328, -17.600969314575195, -16.950698852539062, -16.300426483154297, -15.650156021118164, -14.999884605407715, -14.349613189697266, -13.699341773986816, -13.049070358276367, -12.398799896240234, -11.748528480529785, -11.098257064819336, -10.447986602783203, -9.797715187072754, -9.147443771362305, -8.497172355651855, -7.8469014167785645, -7.196630477905273, -6.546359062194824, -5.896087646484375, -5.245816707611084, -4.595545768737793, -3.9452743530273438, -3.2950031757354736, -2.6447319984436035, -1.9944608211517334, -1.3441896438598633, -0.6939184665679932, -0.04364728927612305, 0.606623649597168, 1.2568950653076172, 1.9071662425994873, 2.5574374198913574, 3.2077085971832275, 3.8579797744750977, 4.508251190185547, 5.158522129058838, 5.808793067932129, 6.459064483642578, 7.109335899353027, 7.759606838226318, 8.40987777709961, 9.060149192810059, 9.710420608520508, 10.36069107055664, 11.01096248626709, 11.661233901977539, 12.311505317687988, 12.961776733398438, 13.61204719543457, 14.26231861114502, 14.912590026855469, 15.562860488891602, 16.213130950927734, 16.8634033203125, 17.513673782348633, 18.1639461517334, 18.81421661376953, 19.464488983154297, 20.11475944519043, 20.765029907226562, 21.415302276611328, 22.06557273864746]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 8.0, 12.0, 16.0, 23.0, 32.0, 46.0, 70.0, 98.0, 154.0, 206.0, 282.0, 454.0, 768.0, 1236.0, 2081.0, 3438.0, 5795.0, 10139.0, 18525.0, 34735.0, 68876.0, 139162.0, 264604.0, 243093.0, 122784.0, 61212.0, 31310.0, 16754.0, 9222.0, 5273.0, 3150.0, 1854.0, 1125.0, 699.0, 446.0, 295.0, 179.0, 119.0, 84.0, 54.0, 43.0, 28.0, 29.0, 12.0, 6.0, 4.0, 12.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-6.1171875, -5.93133544921875, -5.7454833984375, -5.55963134765625, -5.373779296875, -5.18792724609375, -5.0020751953125, -4.81622314453125, -4.63037109375, -4.44451904296875, -4.2586669921875, -4.07281494140625, -3.886962890625, -3.70111083984375, -3.5152587890625, -3.32940673828125, -3.1435546875, -2.95770263671875, -2.7718505859375, -2.58599853515625, -2.400146484375, -2.21429443359375, -2.0284423828125, -1.84259033203125, -1.65673828125, -1.47088623046875, -1.2850341796875, -1.09918212890625, -0.913330078125, -0.72747802734375, -0.5416259765625, -0.35577392578125, -0.169921875, 0.01593017578125, 0.2017822265625, 0.38763427734375, 0.573486328125, 0.75933837890625, 0.9451904296875, 1.13104248046875, 1.31689453125, 1.50274658203125, 1.6885986328125, 1.87445068359375, 2.060302734375, 2.24615478515625, 2.4320068359375, 2.61785888671875, 2.8037109375, 2.98956298828125, 3.1754150390625, 3.36126708984375, 3.547119140625, 3.73297119140625, 3.9188232421875, 4.10467529296875, 4.29052734375, 4.47637939453125, 4.6622314453125, 4.84808349609375, 5.033935546875, 5.21978759765625, 5.4056396484375, 5.59149169921875, 5.77734375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 11.0, 10.0, 12.0, 16.0, 18.0, 20.0, 25.0, 32.0, 34.0, 31.0, 30.0, 37.0, 44.0, 46.0, 42.0, 40.0, 30.0, 40.0, 39.0, 38.0, 45.0, 48.0, 37.0, 25.0, 34.0, 28.0, 25.0, 25.0, 28.0, 20.0, 15.0, 12.0, 10.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.453125, -20.770263671875, -20.08740234375, -19.404541015625, -18.7216796875, -18.038818359375, -17.35595703125, -16.673095703125, -15.990234375, -15.307373046875, -14.62451171875, -13.941650390625, -13.2587890625, -12.575927734375, -11.89306640625, -11.210205078125, -10.52734375, -9.844482421875, -9.16162109375, -8.478759765625, -7.7958984375, -7.113037109375, -6.43017578125, -5.747314453125, -5.064453125, -4.381591796875, -3.69873046875, -3.015869140625, -2.3330078125, -1.650146484375, -0.96728515625, -0.284423828125, 0.3984375, 1.081298828125, 1.76416015625, 2.447021484375, 3.1298828125, 3.812744140625, 4.49560546875, 5.178466796875, 5.861328125, 6.544189453125, 7.22705078125, 7.909912109375, 8.5927734375, 9.275634765625, 9.95849609375, 10.641357421875, 11.32421875, 12.007080078125, 12.68994140625, 13.372802734375, 14.0556640625, 14.738525390625, 15.42138671875, 16.104248046875, 16.787109375, 17.469970703125, 18.15283203125, 18.835693359375, 19.5185546875, 20.201416015625, 20.88427734375, 21.567138671875, 22.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 12.0, 22.0, 33.0, 40.0, 98.0, 165.0, 310.0, 706.0, 1444.0, 3536.0, 9232.0, 26737.0, 87094.0, 292220.0, 420320.0, 141437.0, 42507.0, 13796.0, 5012.0, 1982.0, 903.0, 445.0, 202.0, 106.0, 71.0, 37.0, 28.0, 18.0, 9.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.584228515625, -8.30908203125, -8.033935546875, -7.7587890625, -7.483642578125, -7.20849609375, -6.933349609375, -6.658203125, -6.383056640625, -6.10791015625, -5.832763671875, -5.5576171875, -5.282470703125, -5.00732421875, -4.732177734375, -4.45703125, -4.181884765625, -3.90673828125, -3.631591796875, -3.3564453125, -3.081298828125, -2.80615234375, -2.531005859375, -2.255859375, -1.980712890625, -1.70556640625, -1.430419921875, -1.1552734375, -0.880126953125, -0.60498046875, -0.329833984375, -0.0546875, 0.220458984375, 0.49560546875, 0.770751953125, 1.0458984375, 1.321044921875, 1.59619140625, 1.871337890625, 2.146484375, 2.421630859375, 2.69677734375, 2.971923828125, 3.2470703125, 3.522216796875, 3.79736328125, 4.072509765625, 4.34765625, 4.622802734375, 4.89794921875, 5.173095703125, 5.4482421875, 5.723388671875, 5.99853515625, 6.273681640625, 6.548828125, 6.823974609375, 7.09912109375, 7.374267578125, 7.6494140625, 7.924560546875, 8.19970703125, 8.474853515625, 8.75]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 1.0, 5.0, 9.0, 7.0, 6.0, 14.0, 10.0, 20.0, 19.0, 24.0, 23.0, 24.0, 28.0, 28.0, 38.0, 48.0, 43.0, 45.0, 44.0, 41.0, 41.0, 38.0, 40.0, 39.0, 52.0, 36.0, 32.0, 49.0, 28.0, 21.0, 21.0, 17.0, 28.0, 19.0, 7.0, 15.0, 8.0, 7.0, 5.0, 10.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6484375, -14.1143798828125, -13.580322265625, -13.0462646484375, -12.51220703125, -11.9781494140625, -11.444091796875, -10.9100341796875, -10.3759765625, -9.8419189453125, -9.307861328125, -8.7738037109375, -8.23974609375, -7.7056884765625, -7.171630859375, -6.6375732421875, -6.103515625, -5.5694580078125, -5.035400390625, -4.5013427734375, -3.96728515625, -3.4332275390625, -2.899169921875, -2.3651123046875, -1.8310546875, -1.2969970703125, -0.762939453125, -0.2288818359375, 0.30517578125, 0.8392333984375, 1.373291015625, 1.9073486328125, 2.44140625, 2.9754638671875, 3.509521484375, 4.0435791015625, 4.57763671875, 5.1116943359375, 5.645751953125, 6.1798095703125, 6.7138671875, 7.2479248046875, 7.781982421875, 8.3160400390625, 8.85009765625, 9.3841552734375, 9.918212890625, 10.4522705078125, 10.986328125, 11.5203857421875, 12.054443359375, 12.5885009765625, 13.12255859375, 13.6566162109375, 14.190673828125, 14.7247314453125, 15.2587890625, 15.7928466796875, 16.326904296875, 16.8609619140625, 17.39501953125, 17.9290771484375, 18.463134765625, 18.9971923828125, 19.53125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 12.0, 10.0, 14.0, 23.0, 28.0, 57.0, 68.0, 83.0, 127.0, 160.0, 241.0, 379.0, 546.0, 793.0, 1103.0, 1767.0, 2844.0, 4783.0, 8511.0, 17082.0, 41308.0, 142170.0, 605515.0, 141682.0, 40538.0, 17166.0, 8593.0, 4685.0, 2887.0, 1725.0, 1123.0, 763.0, 537.0, 337.0, 248.0, 171.0, 115.0, 107.0, 67.0, 48.0, 30.0, 28.0, 22.0, 14.0, 12.0, 12.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.1015625, -3.00897216796875, -2.9163818359375, -2.82379150390625, -2.731201171875, -2.63861083984375, -2.5460205078125, -2.45343017578125, -2.36083984375, -2.26824951171875, -2.1756591796875, -2.08306884765625, -1.990478515625, -1.89788818359375, -1.8052978515625, -1.71270751953125, -1.6201171875, -1.52752685546875, -1.4349365234375, -1.34234619140625, -1.249755859375, -1.15716552734375, -1.0645751953125, -0.97198486328125, -0.87939453125, -0.78680419921875, -0.6942138671875, -0.60162353515625, -0.509033203125, -0.41644287109375, -0.3238525390625, -0.23126220703125, -0.138671875, -0.04608154296875, 0.0465087890625, 0.13909912109375, 0.231689453125, 0.32427978515625, 0.4168701171875, 0.50946044921875, 0.60205078125, 0.69464111328125, 0.7872314453125, 0.87982177734375, 0.972412109375, 1.06500244140625, 1.1575927734375, 1.25018310546875, 1.3427734375, 1.43536376953125, 1.5279541015625, 1.62054443359375, 1.713134765625, 1.80572509765625, 1.8983154296875, 1.99090576171875, 2.08349609375, 2.17608642578125, 2.2686767578125, 2.36126708984375, 2.453857421875, 2.54644775390625, 2.6390380859375, 2.73162841796875, 2.82421875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 6.0, 9.0, 8.0, 6.0, 17.0, 17.0, 26.0, 31.0, 42.0, 56.0, 62.0, 100.0, 119.0, 119.0, 82.0, 81.0, 57.0, 35.0, 19.0, 27.0, 16.0, 8.0, 8.0, 12.0, 6.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000316619873046875, -0.0003085099160671234, -0.0003003999590873718, -0.00029229000210762024, -0.00028418004512786865, -0.00027607008814811707, -0.0002679601311683655, -0.0002598501741886139, -0.0002517402172088623, -0.00024363026022911072, -0.00023552030324935913, -0.00022741034626960754, -0.00021930038928985596, -0.00021119043231010437, -0.00020308047533035278, -0.0001949705183506012, -0.0001868605613708496, -0.00017875060439109802, -0.00017064064741134644, -0.00016253069043159485, -0.00015442073345184326, -0.00014631077647209167, -0.0001382008194923401, -0.0001300908625125885, -0.00012198090553283691, -0.00011387094855308533, -0.00010576099157333374, -9.765103459358215e-05, -8.954107761383057e-05, -8.143112063407898e-05, -7.332116365432739e-05, -6.52112066745758e-05, -5.710124969482422e-05, -4.899129271507263e-05, -4.0881335735321045e-05, -3.277137875556946e-05, -2.466142177581787e-05, -1.6551464796066284e-05, -8.441507816314697e-06, -3.3155083656311035e-07, 7.778406143188477e-06, 1.5888363122940063e-05, 2.399832010269165e-05, 3.210827708244324e-05, 4.0218234062194824e-05, 4.832819104194641e-05, 5.6438148021698e-05, 6.454810500144958e-05, 7.265806198120117e-05, 8.076801896095276e-05, 8.887797594070435e-05, 9.698793292045593e-05, 0.00010509788990020752, 0.0001132078468799591, 0.0001213178038597107, 0.00012942776083946228, 0.00013753771781921387, 0.00014564767479896545, 0.00015375763177871704, 0.00016186758875846863, 0.00016997754573822021, 0.0001780875027179718, 0.0001861974596977234, 0.00019430741667747498, 0.00020241737365722656]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 4.0, 8.0, 10.0, 19.0, 28.0, 48.0, 60.0, 84.0, 126.0, 196.0, 298.0, 390.0, 614.0, 903.0, 1241.0, 1816.0, 2568.0, 3762.0, 5592.0, 8278.0, 13044.0, 21646.0, 39306.0, 82643.0, 193530.0, 333835.0, 171491.0, 74183.0, 35889.0, 20114.0, 12275.0, 7866.0, 5209.0, 3498.0, 2447.0, 1655.0, 1181.0, 824.0, 576.0, 417.0, 275.0, 192.0, 149.0, 82.0, 69.0, 48.0, 28.0, 17.0, 7.0, 8.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-2.46484375, -2.39111328125, -2.3173828125, -2.24365234375, -2.169921875, -2.09619140625, -2.0224609375, -1.94873046875, -1.875, -1.80126953125, -1.7275390625, -1.65380859375, -1.580078125, -1.50634765625, -1.4326171875, -1.35888671875, -1.28515625, -1.21142578125, -1.1376953125, -1.06396484375, -0.990234375, -0.91650390625, -0.8427734375, -0.76904296875, -0.6953125, -0.62158203125, -0.5478515625, -0.47412109375, -0.400390625, -0.32666015625, -0.2529296875, -0.17919921875, -0.10546875, -0.03173828125, 0.0419921875, 0.11572265625, 0.189453125, 0.26318359375, 0.3369140625, 0.41064453125, 0.484375, 0.55810546875, 0.6318359375, 0.70556640625, 0.779296875, 0.85302734375, 0.9267578125, 1.00048828125, 1.07421875, 1.14794921875, 1.2216796875, 1.29541015625, 1.369140625, 1.44287109375, 1.5166015625, 1.59033203125, 1.6640625, 1.73779296875, 1.8115234375, 1.88525390625, 1.958984375, 2.03271484375, 2.1064453125, 2.18017578125, 2.25390625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 8.0, 8.0, 2.0, 5.0, 7.0, 10.0, 8.0, 8.0, 15.0, 14.0, 13.0, 17.0, 17.0, 30.0, 27.0, 34.0, 34.0, 46.0, 45.0, 43.0, 38.0, 54.0, 39.0, 49.0, 49.0, 40.0, 44.0, 37.0, 46.0, 28.0, 23.0, 32.0, 17.0, 21.0, 19.0, 16.0, 8.0, 10.0, 5.0, 7.0, 7.0, 7.0, 3.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.9150390625, -0.8857421875, -0.8564453125, -0.8271484375, -0.7978515625, -0.7685546875, -0.7392578125, -0.7099609375, -0.6806640625, -0.6513671875, -0.6220703125, -0.5927734375, -0.5634765625, -0.5341796875, -0.5048828125, -0.4755859375, -0.4462890625, -0.4169921875, -0.3876953125, -0.3583984375, -0.3291015625, -0.2998046875, -0.2705078125, -0.2412109375, -0.2119140625, -0.1826171875, -0.1533203125, -0.1240234375, -0.0947265625, -0.0654296875, -0.0361328125, -0.0068359375, 0.0224609375, 0.0517578125, 0.0810546875, 0.1103515625, 0.1396484375, 0.1689453125, 0.1982421875, 0.2275390625, 0.2568359375, 0.2861328125, 0.3154296875, 0.3447265625, 0.3740234375, 0.4033203125, 0.4326171875, 0.4619140625, 0.4912109375, 0.5205078125, 0.5498046875, 0.5791015625, 0.6083984375, 0.6376953125, 0.6669921875, 0.6962890625, 0.7255859375, 0.7548828125, 0.7841796875, 0.8134765625, 0.8427734375, 0.8720703125, 0.9013671875, 0.9306640625, 0.9599609375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 11.0, 3.0, 16.0, 23.0, 27.0, 27.0, 24.0, 40.0, 43.0, 60.0, 64.0, 63.0, 78.0, 68.0, 71.0, 81.0, 45.0, 46.0, 37.0, 37.0, 16.0, 31.0, 21.0, 15.0, 11.0, 8.0, 6.0, 4.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.738319396972656, -16.148845672607422, -15.55937385559082, -14.969901084899902, -14.380428314208984, -13.790955543518066, -13.201482772827148, -12.61201000213623, -12.022537231445312, -11.433064460754395, -10.843591690063477, -10.254118919372559, -9.66464614868164, -9.075173377990723, -8.485700607299805, -7.896227836608887, -7.306755065917969, -6.717282295227051, -6.127809524536133, -5.538336753845215, -4.948863983154297, -4.359391212463379, -3.769918441772461, -3.180445671081543, -2.590972900390625, -2.001500129699707, -1.412027359008789, -0.8225545883178711, -0.23308181762695312, 0.35639095306396484, 0.9458637237548828, 1.5353364944458008, 2.1248092651367188, 2.7142820358276367, 3.3037548065185547, 3.8932275772094727, 4.482700347900391, 5.072173118591309, 5.661645889282227, 6.2511186599731445, 6.8405914306640625, 7.4300642013549805, 8.019536972045898, 8.609009742736816, 9.198482513427734, 9.787955284118652, 10.37742805480957, 10.966900825500488, 11.556373596191406, 12.145846366882324, 12.735319137573242, 13.32479190826416, 13.914264678955078, 14.503737449645996, 15.093210220336914, 15.682682991027832, 16.27215576171875, 16.861629486083984, 17.451101303100586, 18.040573120117188, 18.630046844482422, 19.219520568847656, 19.808992385864258, 20.39846420288086, 20.987937927246094]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 12.0, 7.0, 8.0, 16.0, 13.0, 19.0, 14.0, 24.0, 25.0, 30.0, 29.0, 32.0, 33.0, 42.0, 36.0, 43.0, 48.0, 30.0, 32.0, 44.0, 36.0, 33.0, 41.0, 33.0, 37.0, 36.0, 34.0, 25.0, 19.0, 27.0, 23.0, 29.0, 16.0, 12.0, 12.0, 14.0, 5.0, 11.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.3096866607666, -18.66994285583496, -18.030197143554688, -17.390453338623047, -16.750709533691406, -16.110963821411133, -15.471220016479492, -14.831475257873535, -14.191730499267578, -13.551985740661621, -12.912240982055664, -12.272497177124023, -11.632752418518066, -10.99300765991211, -10.353263854980469, -9.713519096374512, -9.073774337768555, -8.434029579162598, -7.794285297393799, -7.154541015625, -6.514796257019043, -5.875051498413086, -5.235307216644287, -4.595562934875488, -3.9558181762695312, -3.3160736560821533, -2.6763291358947754, -2.0365846157073975, -1.3968400955200195, -0.7570955753326416, -0.11735105514526367, 0.5223932266235352, 1.162139892578125, 1.801884412765503, 2.441628932952881, 3.081373453140259, 3.7211179733276367, 4.360862731933594, 5.000607013702393, 5.640351295471191, 6.280096054077148, 6.9198408126831055, 7.559585094451904, 8.199329376220703, 8.83907413482666, 9.478818893432617, 10.118562698364258, 10.758307456970215, 11.398052215576172, 12.037796974182129, 12.677541732788086, 13.317285537719727, 13.957030296325684, 14.59677505493164, 15.236518859863281, 15.876263618469238, 16.516008377075195, 17.155752182006836, 17.79549789428711, 18.43524169921875, 19.07498550415039, 19.714731216430664, 20.354475021362305, 20.994220733642578, 21.63396453857422]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 7.0, 3.0, 7.0, 14.0, 28.0, 21.0, 41.0, 70.0, 109.0, 184.0, 275.0, 405.0, 592.0, 1067.0, 1669.0, 2744.0, 4683.0, 7860.0, 13508.0, 22727.0, 38108.0, 61111.0, 93734.0, 130166.0, 154881.0, 152784.0, 125838.0, 89293.0, 58408.0, 35796.0, 21274.0, 12612.0, 7427.0, 4261.0, 2668.0, 1546.0, 977.0, 593.0, 363.0, 246.0, 159.0, 97.0, 55.0, 61.0, 29.0, 31.0, 13.0, 8.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.484375, -13.98388671875, -13.4833984375, -12.98291015625, -12.482421875, -11.98193359375, -11.4814453125, -10.98095703125, -10.48046875, -9.97998046875, -9.4794921875, -8.97900390625, -8.478515625, -7.97802734375, -7.4775390625, -6.97705078125, -6.4765625, -5.97607421875, -5.4755859375, -4.97509765625, -4.474609375, -3.97412109375, -3.4736328125, -2.97314453125, -2.47265625, -1.97216796875, -1.4716796875, -0.97119140625, -0.470703125, 0.02978515625, 0.5302734375, 1.03076171875, 1.53125, 2.03173828125, 2.5322265625, 3.03271484375, 3.533203125, 4.03369140625, 4.5341796875, 5.03466796875, 5.53515625, 6.03564453125, 6.5361328125, 7.03662109375, 7.537109375, 8.03759765625, 8.5380859375, 9.03857421875, 9.5390625, 10.03955078125, 10.5400390625, 11.04052734375, 11.541015625, 12.04150390625, 12.5419921875, 13.04248046875, 13.54296875, 14.04345703125, 14.5439453125, 15.04443359375, 15.544921875, 16.04541015625, 16.5458984375, 17.04638671875, 17.546875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 10.0, 18.0, 9.0, 20.0, 14.0, 21.0, 18.0, 27.0, 28.0, 24.0, 32.0, 31.0, 34.0, 49.0, 36.0, 37.0, 48.0, 35.0, 37.0, 34.0, 35.0, 43.0, 28.0, 37.0, 35.0, 34.0, 23.0, 25.0, 24.0, 17.0, 19.0, 27.0, 20.0, 7.0, 13.0, 10.0, 6.0, 5.0, 7.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.890625, -18.304931640625, -17.71923828125, -17.133544921875, -16.5478515625, -15.962158203125, -15.37646484375, -14.790771484375, -14.205078125, -13.619384765625, -13.03369140625, -12.447998046875, -11.8623046875, -11.276611328125, -10.69091796875, -10.105224609375, -9.51953125, -8.933837890625, -8.34814453125, -7.762451171875, -7.1767578125, -6.591064453125, -6.00537109375, -5.419677734375, -4.833984375, -4.248291015625, -3.66259765625, -3.076904296875, -2.4912109375, -1.905517578125, -1.31982421875, -0.734130859375, -0.1484375, 0.437255859375, 1.02294921875, 1.608642578125, 2.1943359375, 2.780029296875, 3.36572265625, 3.951416015625, 4.537109375, 5.122802734375, 5.70849609375, 6.294189453125, 6.8798828125, 7.465576171875, 8.05126953125, 8.636962890625, 9.22265625, 9.808349609375, 10.39404296875, 10.979736328125, 11.5654296875, 12.151123046875, 12.73681640625, 13.322509765625, 13.908203125, 14.493896484375, 15.07958984375, 15.665283203125, 16.2509765625, 16.836669921875, 17.42236328125, 18.008056640625, 18.59375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 1.0, 9.0, 5.0, 6.0, 21.0, 45.0, 42.0, 71.0, 127.0, 197.0, 348.0, 523.0, 909.0, 1435.0, 2588.0, 4416.0, 7803.0, 13321.0, 23791.0, 41162.0, 69632.0, 109164.0, 151446.0, 172714.0, 155341.0, 115212.0, 73851.0, 44377.0, 25593.0, 14713.0, 8388.0, 4844.0, 2601.0, 1502.0, 934.0, 547.0, 340.0, 208.0, 112.0, 63.0, 43.0, 33.0, 23.0, 20.0, 7.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-16.40625, -15.886474609375, -15.36669921875, -14.846923828125, -14.3271484375, -13.807373046875, -13.28759765625, -12.767822265625, -12.248046875, -11.728271484375, -11.20849609375, -10.688720703125, -10.1689453125, -9.649169921875, -9.12939453125, -8.609619140625, -8.08984375, -7.570068359375, -7.05029296875, -6.530517578125, -6.0107421875, -5.490966796875, -4.97119140625, -4.451416015625, -3.931640625, -3.411865234375, -2.89208984375, -2.372314453125, -1.8525390625, -1.332763671875, -0.81298828125, -0.293212890625, 0.2265625, 0.746337890625, 1.26611328125, 1.785888671875, 2.3056640625, 2.825439453125, 3.34521484375, 3.864990234375, 4.384765625, 4.904541015625, 5.42431640625, 5.944091796875, 6.4638671875, 6.983642578125, 7.50341796875, 8.023193359375, 8.54296875, 9.062744140625, 9.58251953125, 10.102294921875, 10.6220703125, 11.141845703125, 11.66162109375, 12.181396484375, 12.701171875, 13.220947265625, 13.74072265625, 14.260498046875, 14.7802734375, 15.300048828125, 15.81982421875, 16.339599609375, 16.859375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 4.0, 10.0, 7.0, 8.0, 7.0, 17.0, 19.0, 20.0, 19.0, 26.0, 28.0, 30.0, 31.0, 34.0, 38.0, 43.0, 38.0, 36.0, 43.0, 44.0, 41.0, 40.0, 34.0, 36.0, 44.0, 35.0, 36.0, 26.0, 34.0, 21.0, 22.0, 18.0, 17.0, 11.0, 15.0, 8.0, 10.0, 8.0, 6.0, 7.0, 7.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.5, -11.1229248046875, -10.745849609375, -10.3687744140625, -9.99169921875, -9.6146240234375, -9.237548828125, -8.8604736328125, -8.4833984375, -8.1063232421875, -7.729248046875, -7.3521728515625, -6.97509765625, -6.5980224609375, -6.220947265625, -5.8438720703125, -5.466796875, -5.0897216796875, -4.712646484375, -4.3355712890625, -3.95849609375, -3.5814208984375, -3.204345703125, -2.8272705078125, -2.4501953125, -2.0731201171875, -1.696044921875, -1.3189697265625, -0.94189453125, -0.5648193359375, -0.187744140625, 0.1893310546875, 0.56640625, 0.9434814453125, 1.320556640625, 1.6976318359375, 2.07470703125, 2.4517822265625, 2.828857421875, 3.2059326171875, 3.5830078125, 3.9600830078125, 4.337158203125, 4.7142333984375, 5.09130859375, 5.4683837890625, 5.845458984375, 6.2225341796875, 6.599609375, 6.9766845703125, 7.353759765625, 7.7308349609375, 8.10791015625, 8.4849853515625, 8.862060546875, 9.2391357421875, 9.6162109375, 9.9932861328125, 10.370361328125, 10.7474365234375, 11.12451171875, 11.5015869140625, 11.878662109375, 12.2557373046875, 12.6328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 10.0, 7.0, 23.0, 38.0, 43.0, 104.0, 161.0, 279.0, 402.0, 594.0, 1052.0, 1817.0, 2812.0, 4721.0, 8013.0, 13913.0, 23800.0, 40951.0, 71027.0, 115423.0, 168793.0, 189372.0, 155833.0, 102128.0, 61684.0, 35622.0, 20573.0, 11934.0, 6864.0, 4201.0, 2439.0, 1525.0, 932.0, 569.0, 347.0, 204.0, 121.0, 89.0, 49.0, 34.0, 24.0, 18.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.44854736328125, -5.2564697265625, -5.06439208984375, -4.872314453125, -4.68023681640625, -4.4881591796875, -4.29608154296875, -4.10400390625, -3.91192626953125, -3.7198486328125, -3.52777099609375, -3.335693359375, -3.14361572265625, -2.9515380859375, -2.75946044921875, -2.5673828125, -2.37530517578125, -2.1832275390625, -1.99114990234375, -1.799072265625, -1.60699462890625, -1.4149169921875, -1.22283935546875, -1.03076171875, -0.83868408203125, -0.6466064453125, -0.45452880859375, -0.262451171875, -0.07037353515625, 0.1217041015625, 0.31378173828125, 0.505859375, 0.69793701171875, 0.8900146484375, 1.08209228515625, 1.274169921875, 1.46624755859375, 1.6583251953125, 1.85040283203125, 2.04248046875, 2.23455810546875, 2.4266357421875, 2.61871337890625, 2.810791015625, 3.00286865234375, 3.1949462890625, 3.38702392578125, 3.5791015625, 3.77117919921875, 3.9632568359375, 4.15533447265625, 4.347412109375, 4.53948974609375, 4.7315673828125, 4.92364501953125, 5.11572265625, 5.30780029296875, 5.4998779296875, 5.69195556640625, 5.884033203125, 6.07611083984375, 6.2681884765625, 6.46026611328125, 6.65234375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 5.0, 3.0, 6.0, 9.0, 16.0, 17.0, 22.0, 18.0, 24.0, 38.0, 21.0, 48.0, 48.0, 35.0, 47.0, 47.0, 54.0, 61.0, 47.0, 50.0, 45.0, 45.0, 54.0, 39.0, 30.0, 33.0, 26.0, 22.0, 17.0, 15.0, 15.0, 12.0, 6.0, 6.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 1.0, 2.0], "bins": [-0.0004887580871582031, -0.0004761144518852234, -0.00046347081661224365, -0.0004508271813392639, -0.0004381835460662842, -0.00042553991079330444, -0.0004128962755203247, -0.00040025264024734497, -0.00038760900497436523, -0.0003749653697013855, -0.00036232173442840576, -0.000349678099155426, -0.0003370344638824463, -0.00032439082860946655, -0.0003117471933364868, -0.0002991035580635071, -0.00028645992279052734, -0.0002738162875175476, -0.00026117265224456787, -0.00024852901697158813, -0.0002358853816986084, -0.00022324174642562866, -0.00021059811115264893, -0.0001979544758796692, -0.00018531084060668945, -0.00017266720533370972, -0.00016002357006072998, -0.00014737993478775024, -0.0001347362995147705, -0.00012209266424179077, -0.00010944902896881104, -9.68053936958313e-05, -8.416175842285156e-05, -7.151812314987183e-05, -5.887448787689209e-05, -4.6230852603912354e-05, -3.358721733093262e-05, -2.094358205795288e-05, -8.299946784973145e-06, 4.343688488006592e-06, 1.6987323760986328e-05, 2.9630959033966064e-05, 4.22745943069458e-05, 5.491822957992554e-05, 6.756186485290527e-05, 8.020550012588501e-05, 9.284913539886475e-05, 0.00010549277067184448, 0.00011813640594482422, 0.00013078004121780396, 0.0001434236764907837, 0.00015606731176376343, 0.00016871094703674316, 0.0001813545823097229, 0.00019399821758270264, 0.00020664185285568237, 0.0002192854881286621, 0.00023192912340164185, 0.0002445727586746216, 0.0002572163939476013, 0.00026986002922058105, 0.0002825036644935608, 0.00029514729976654053, 0.00030779093503952026, 0.0003204345703125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 13.0, 13.0, 34.0, 44.0, 57.0, 98.0, 144.0, 215.0, 351.0, 538.0, 810.0, 1328.0, 2202.0, 3557.0, 5926.0, 9860.0, 17008.0, 29462.0, 49197.0, 80484.0, 123811.0, 164922.0, 173196.0, 141544.0, 96025.0, 60123.0, 35682.0, 20838.0, 12479.0, 7204.0, 4427.0, 2613.0, 1597.0, 984.0, 646.0, 357.0, 257.0, 164.0, 122.0, 72.0, 49.0, 33.0, 21.0, 12.0, 10.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.08148193359375, -4.9012451171875, -4.72100830078125, -4.540771484375, -4.36053466796875, -4.1802978515625, -4.00006103515625, -3.81982421875, -3.63958740234375, -3.4593505859375, -3.27911376953125, -3.098876953125, -2.91864013671875, -2.7384033203125, -2.55816650390625, -2.3779296875, -2.19769287109375, -2.0174560546875, -1.83721923828125, -1.656982421875, -1.47674560546875, -1.2965087890625, -1.11627197265625, -0.93603515625, -0.75579833984375, -0.5755615234375, -0.39532470703125, -0.215087890625, -0.03485107421875, 0.1453857421875, 0.32562255859375, 0.505859375, 0.68609619140625, 0.8663330078125, 1.04656982421875, 1.226806640625, 1.40704345703125, 1.5872802734375, 1.76751708984375, 1.94775390625, 2.12799072265625, 2.3082275390625, 2.48846435546875, 2.668701171875, 2.84893798828125, 3.0291748046875, 3.20941162109375, 3.3896484375, 3.56988525390625, 3.7501220703125, 3.93035888671875, 4.110595703125, 4.29083251953125, 4.4710693359375, 4.65130615234375, 4.83154296875, 5.01177978515625, 5.1920166015625, 5.37225341796875, 5.552490234375, 5.73272705078125, 5.9129638671875, 6.09320068359375, 6.2734375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 8.0, 9.0, 13.0, 14.0, 9.0, 18.0, 15.0, 19.0, 41.0, 29.0, 38.0, 43.0, 52.0, 69.0, 63.0, 62.0, 59.0, 52.0, 56.0, 45.0, 40.0, 46.0, 30.0, 30.0, 30.0, 21.0, 18.0, 15.0, 9.0, 6.0, 5.0, 4.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6796875, -2.58050537109375, -2.4813232421875, -2.38214111328125, -2.282958984375, -2.18377685546875, -2.0845947265625, -1.98541259765625, -1.88623046875, -1.78704833984375, -1.6878662109375, -1.58868408203125, -1.489501953125, -1.39031982421875, -1.2911376953125, -1.19195556640625, -1.0927734375, -0.99359130859375, -0.8944091796875, -0.79522705078125, -0.696044921875, -0.59686279296875, -0.4976806640625, -0.39849853515625, -0.29931640625, -0.20013427734375, -0.1009521484375, -0.00177001953125, 0.097412109375, 0.19659423828125, 0.2957763671875, 0.39495849609375, 0.494140625, 0.59332275390625, 0.6925048828125, 0.79168701171875, 0.890869140625, 0.99005126953125, 1.0892333984375, 1.18841552734375, 1.28759765625, 1.38677978515625, 1.4859619140625, 1.58514404296875, 1.684326171875, 1.78350830078125, 1.8826904296875, 1.98187255859375, 2.0810546875, 2.18023681640625, 2.2794189453125, 2.37860107421875, 2.477783203125, 2.57696533203125, 2.6761474609375, 2.77532958984375, 2.87451171875, 2.97369384765625, 3.0728759765625, 3.17205810546875, 3.271240234375, 3.37042236328125, 3.4696044921875, 3.56878662109375, 3.66796875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 11.0, 3.0, 8.0, 14.0, 15.0, 28.0, 19.0, 31.0, 45.0, 66.0, 69.0, 65.0, 58.0, 78.0, 69.0, 69.0, 60.0, 50.0, 48.0, 37.0, 34.0, 26.0, 23.0, 17.0, 7.0, 16.0, 6.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.831884384155273, -15.239635467529297, -14.64738655090332, -14.055137634277344, -13.462888717651367, -12.87063980102539, -12.278390884399414, -11.686141967773438, -11.093893051147461, -10.501644134521484, -9.909395217895508, -9.317146301269531, -8.724897384643555, -8.132648468017578, -7.540399551391602, -6.948150634765625, -6.355901718139648, -5.763652801513672, -5.171403884887695, -4.579154968261719, -3.986906051635742, -3.3946571350097656, -2.802408218383789, -2.2101593017578125, -1.617910385131836, -1.0256614685058594, -0.4334125518798828, 0.15883636474609375, 0.7510852813720703, 1.3433341979980469, 1.9355831146240234, 2.52783203125, 3.1200790405273438, 3.7123279571533203, 4.304576873779297, 4.896825790405273, 5.48907470703125, 6.081323623657227, 6.673572540283203, 7.26582145690918, 7.858070373535156, 8.450319290161133, 9.04256820678711, 9.634817123413086, 10.227066040039062, 10.819314956665039, 11.411563873291016, 12.003812789916992, 12.596061706542969, 13.188310623168945, 13.780559539794922, 14.372808456420898, 14.965057373046875, 15.557306289672852, 16.149555206298828, 16.741804122924805, 17.33405303955078, 17.926301956176758, 18.518550872802734, 19.11079978942871, 19.703048706054688, 20.295297622680664, 20.88754653930664, 21.479795455932617, 22.072044372558594]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 7.0, 7.0, 4.0, 5.0, 17.0, 13.0, 19.0, 20.0, 19.0, 23.0, 30.0, 30.0, 30.0, 34.0, 31.0, 45.0, 35.0, 43.0, 39.0, 37.0, 42.0, 40.0, 41.0, 30.0, 32.0, 31.0, 36.0, 42.0, 32.0, 22.0, 28.0, 22.0, 25.0, 12.0, 19.0, 13.0, 12.0, 10.0, 11.0, 6.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.034460067749023, -19.355653762817383, -18.676849365234375, -17.998043060302734, -17.319236755371094, -16.640430450439453, -15.961625099182129, -15.282819747924805, -14.604013442993164, -13.925207138061523, -13.2464017868042, -12.567596435546875, -11.888790130615234, -11.209983825683594, -10.53117847442627, -9.852373123168945, -9.173566818237305, -8.494760513305664, -7.81595516204834, -7.137149333953857, -6.458343505859375, -5.779537677764893, -5.10073184967041, -4.421926021575928, -3.7431201934814453, -3.064314365386963, -2.3855085372924805, -1.706702709197998, -1.0278968811035156, -0.3490910530090332, 0.3297147750854492, 1.0085206031799316, 1.6873245239257812, 2.3661303520202637, 3.044936180114746, 3.7237420082092285, 4.402547836303711, 5.081353664398193, 5.760159492492676, 6.438965320587158, 7.117771148681641, 7.796576976776123, 8.475382804870605, 9.15418815612793, 9.83299446105957, 10.511800765991211, 11.190606117248535, 11.86941146850586, 12.5482177734375, 13.22702407836914, 13.905829429626465, 14.584634780883789, 15.26344108581543, 15.94224739074707, 16.621051788330078, 17.29985809326172, 17.97866439819336, 18.657470703125, 19.33627700805664, 20.01508140563965, 20.69388771057129, 21.37269401550293, 22.051498413085938, 22.730304718017578, 23.40911102294922]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 7.0, 9.0, 6.0, 16.0, 24.0, 48.0, 75.0, 124.0, 195.0, 291.0, 511.0, 769.0, 1391.0, 2249.0, 3746.0, 6327.0, 10677.0, 18327.0, 31996.0, 55559.0, 97553.0, 172316.0, 301379.0, 510522.0, 748650.0, 797591.0, 594655.0, 359008.0, 203717.0, 116528.0, 66103.0, 38099.0, 22253.0, 12992.0, 7896.0, 4746.0, 2894.0, 1768.0, 1187.0, 729.0, 451.0, 317.0, 184.0, 137.0, 92.0, 59.0, 31.0, 34.0, 15.0, 14.0, 8.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.7109375, -12.2596435546875, -11.808349609375, -11.3570556640625, -10.90576171875, -10.4544677734375, -10.003173828125, -9.5518798828125, -9.1005859375, -8.6492919921875, -8.197998046875, -7.7467041015625, -7.29541015625, -6.8441162109375, -6.392822265625, -5.9415283203125, -5.490234375, -5.0389404296875, -4.587646484375, -4.1363525390625, -3.68505859375, -3.2337646484375, -2.782470703125, -2.3311767578125, -1.8798828125, -1.4285888671875, -0.977294921875, -0.5260009765625, -0.07470703125, 0.3765869140625, 0.827880859375, 1.2791748046875, 1.73046875, 2.1817626953125, 2.633056640625, 3.0843505859375, 3.53564453125, 3.9869384765625, 4.438232421875, 4.8895263671875, 5.3408203125, 5.7921142578125, 6.243408203125, 6.6947021484375, 7.14599609375, 7.5972900390625, 8.048583984375, 8.4998779296875, 8.951171875, 9.4024658203125, 9.853759765625, 10.3050537109375, 10.75634765625, 11.2076416015625, 11.658935546875, 12.1102294921875, 12.5615234375, 13.0128173828125, 13.464111328125, 13.9154052734375, 14.36669921875, 14.8179931640625, 15.269287109375, 15.7205810546875, 16.171875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 9.0, 12.0, 11.0, 12.0, 21.0, 22.0, 24.0, 27.0, 32.0, 29.0, 31.0, 36.0, 28.0, 41.0, 50.0, 39.0, 41.0, 39.0, 32.0, 54.0, 31.0, 34.0, 34.0, 34.0, 35.0, 41.0, 30.0, 24.0, 23.0, 21.0, 15.0, 15.0, 18.0, 11.0, 10.0, 7.0, 5.0, 4.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.2686767578125, -11.826416015625, -11.3841552734375, -10.94189453125, -10.4996337890625, -10.057373046875, -9.6151123046875, -9.1728515625, -8.7305908203125, -8.288330078125, -7.8460693359375, -7.40380859375, -6.9615478515625, -6.519287109375, -6.0770263671875, -5.634765625, -5.1925048828125, -4.750244140625, -4.3079833984375, -3.86572265625, -3.4234619140625, -2.981201171875, -2.5389404296875, -2.0966796875, -1.6544189453125, -1.212158203125, -0.7698974609375, -0.32763671875, 0.1146240234375, 0.556884765625, 0.9991455078125, 1.44140625, 1.8836669921875, 2.325927734375, 2.7681884765625, 3.21044921875, 3.6527099609375, 4.094970703125, 4.5372314453125, 4.9794921875, 5.4217529296875, 5.864013671875, 6.3062744140625, 6.74853515625, 7.1907958984375, 7.633056640625, 8.0753173828125, 8.517578125, 8.9598388671875, 9.402099609375, 9.8443603515625, 10.28662109375, 10.7288818359375, 11.171142578125, 11.6134033203125, 12.0556640625, 12.4979248046875, 12.940185546875, 13.3824462890625, 13.82470703125, 14.2669677734375, 14.709228515625, 15.1514892578125, 15.59375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 3.0, 7.0, 5.0, 16.0, 18.0, 29.0, 39.0, 67.0, 110.0, 137.0, 196.0, 333.0, 538.0, 793.0, 1171.0, 1950.0, 2987.0, 4843.0, 7718.0, 12474.0, 20172.0, 33237.0, 54887.0, 89848.0, 146836.0, 232484.0, 352017.0, 489700.0, 593412.0, 602355.0, 510733.0, 374472.0, 250797.0, 158303.0, 97330.0, 59290.0, 36844.0, 21985.0, 13516.0, 8254.0, 5234.0, 3215.0, 2156.0, 1290.0, 855.0, 571.0, 371.0, 233.0, 158.0, 104.0, 61.0, 50.0, 34.0, 17.0, 15.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0], "bins": [-10.4609375, -10.1348876953125, -9.808837890625, -9.4827880859375, -9.15673828125, -8.8306884765625, -8.504638671875, -8.1785888671875, -7.8525390625, -7.5264892578125, -7.200439453125, -6.8743896484375, -6.54833984375, -6.2222900390625, -5.896240234375, -5.5701904296875, -5.244140625, -4.9180908203125, -4.592041015625, -4.2659912109375, -3.93994140625, -3.6138916015625, -3.287841796875, -2.9617919921875, -2.6357421875, -2.3096923828125, -1.983642578125, -1.6575927734375, -1.33154296875, -1.0054931640625, -0.679443359375, -0.3533935546875, -0.02734375, 0.2987060546875, 0.624755859375, 0.9508056640625, 1.27685546875, 1.6029052734375, 1.928955078125, 2.2550048828125, 2.5810546875, 2.9071044921875, 3.233154296875, 3.5592041015625, 3.88525390625, 4.2113037109375, 4.537353515625, 4.8634033203125, 5.189453125, 5.5155029296875, 5.841552734375, 6.1676025390625, 6.49365234375, 6.8197021484375, 7.145751953125, 7.4718017578125, 7.7978515625, 8.1239013671875, 8.449951171875, 8.7760009765625, 9.10205078125, 9.4281005859375, 9.754150390625, 10.0802001953125, 10.40625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 9.0, 11.0, 13.0, 12.0, 23.0, 28.0, 44.0, 37.0, 45.0, 63.0, 80.0, 94.0, 110.0, 121.0, 158.0, 147.0, 169.0, 173.0, 215.0, 209.0, 210.0, 213.0, 210.0, 191.0, 187.0, 201.0, 143.0, 126.0, 145.0, 120.0, 101.0, 81.0, 74.0, 49.0, 49.0, 46.0, 36.0, 33.0, 27.0, 16.0, 12.0, 13.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.28125, -6.09478759765625, -5.9083251953125, -5.72186279296875, -5.535400390625, -5.34893798828125, -5.1624755859375, -4.97601318359375, -4.78955078125, -4.60308837890625, -4.4166259765625, -4.23016357421875, -4.043701171875, -3.85723876953125, -3.6707763671875, -3.48431396484375, -3.2978515625, -3.11138916015625, -2.9249267578125, -2.73846435546875, -2.552001953125, -2.36553955078125, -2.1790771484375, -1.99261474609375, -1.80615234375, -1.61968994140625, -1.4332275390625, -1.24676513671875, -1.060302734375, -0.87384033203125, -0.6873779296875, -0.50091552734375, -0.314453125, -0.12799072265625, 0.0584716796875, 0.24493408203125, 0.431396484375, 0.61785888671875, 0.8043212890625, 0.99078369140625, 1.17724609375, 1.36370849609375, 1.5501708984375, 1.73663330078125, 1.923095703125, 2.10955810546875, 2.2960205078125, 2.48248291015625, 2.6689453125, 2.85540771484375, 3.0418701171875, 3.22833251953125, 3.414794921875, 3.60125732421875, 3.7877197265625, 3.97418212890625, 4.16064453125, 4.34710693359375, 4.5335693359375, 4.72003173828125, 4.906494140625, 5.09295654296875, 5.2794189453125, 5.46588134765625, 5.65234375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 10.0, 12.0, 13.0, 16.0, 15.0, 22.0, 34.0, 40.0, 33.0, 56.0, 56.0, 54.0, 78.0, 50.0, 65.0, 61.0, 54.0, 41.0, 50.0, 43.0, 34.0, 40.0, 28.0, 22.0, 11.0, 10.0, 12.0, 5.0, 5.0, 10.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.619202613830566, -15.163493156433105, -14.707784652709961, -14.2520751953125, -13.796365737915039, -13.340657234191895, -12.884947776794434, -12.429239273071289, -11.973529815673828, -11.517820358276367, -11.062111854553223, -10.606402397155762, -10.150693893432617, -9.694984436035156, -9.239274978637695, -8.783565521240234, -8.32785701751709, -7.872148036956787, -7.416439056396484, -6.960729598999023, -6.505020618438721, -6.049311637878418, -5.593602180480957, -5.137893199920654, -4.682184219360352, -4.226475238800049, -3.770766019821167, -3.315056800842285, -2.8593478202819824, -2.4036388397216797, -1.9479296207427979, -1.492220401763916, -1.0365114212036133, -0.580802321434021, -0.1250932216644287, 0.3306158781051636, 0.7863249778747559, 1.2420339584350586, 1.6977431774139404, 2.1534523963928223, 2.609161376953125, 3.0648703575134277, 3.5205795764923096, 3.9762887954711914, 4.431997776031494, 4.887706756591797, 5.343416213989258, 5.7991251945495605, 6.254834175109863, 6.710543155670166, 7.166252136230469, 7.62196159362793, 8.07767105102539, 8.533379554748535, 8.989089012145996, 9.44479751586914, 9.900506973266602, 10.356216430664062, 10.811924934387207, 11.267634391784668, 11.723342895507812, 12.179052352905273, 12.634761810302734, 13.090471267700195, 13.54617977142334]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 11.0, 9.0, 11.0, 10.0, 12.0, 15.0, 13.0, 13.0, 19.0, 29.0, 25.0, 30.0, 34.0, 29.0, 29.0, 45.0, 35.0, 60.0, 47.0, 47.0, 48.0, 41.0, 38.0, 45.0, 41.0, 43.0, 26.0, 25.0, 31.0, 26.0, 14.0, 32.0, 14.0, 9.0, 14.0, 10.0, 6.0, 2.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.786739349365234, -15.18981647491455, -14.592893600463867, -13.995970726013184, -13.3990478515625, -12.8021240234375, -12.205201148986816, -11.608278274536133, -11.01135540008545, -10.414432525634766, -9.817509651184082, -9.220586776733398, -8.623662948608398, -8.026741027832031, -7.429817199707031, -6.832894325256348, -6.235971450805664, -5.6390485763549805, -5.042125701904297, -4.445202350616455, -3.8482794761657715, -3.251356601715088, -2.654433488845825, -2.0575103759765625, -1.460587501525879, -0.8636645078659058, -0.2667415142059326, 0.3301814794540405, 0.9271044731140137, 1.5240273475646973, 2.12095046043396, 2.7178735733032227, 3.3147964477539062, 3.91171932220459, 4.508642196655273, 5.105565547943115, 5.702488422393799, 6.299411296844482, 6.896334648132324, 7.493257522583008, 8.090180397033691, 8.687103271484375, 9.284026145935059, 9.880949020385742, 10.477872848510742, 11.07479476928711, 11.67171859741211, 12.268641471862793, 12.865564346313477, 13.46248722076416, 14.059410095214844, 14.656332969665527, 15.253255844116211, 15.850179672241211, 16.447101593017578, 17.044025421142578, 17.640949249267578, 18.237873077392578, 18.834794998168945, 19.431718826293945, 20.028640747070312, 20.625564575195312, 21.22248649597168, 21.81941032409668, 22.416332244873047]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 12.0, 9.0, 11.0, 14.0, 25.0, 38.0, 56.0, 116.0, 172.0, 322.0, 639.0, 1228.0, 2763.0, 7022.0, 20012.0, 68180.0, 272963.0, 472069.0, 144188.0, 38075.0, 12257.0, 4492.0, 1865.0, 954.0, 458.0, 247.0, 135.0, 74.0, 51.0, 26.0, 23.0, 15.0, 14.0, 8.0, 8.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.78125, -9.5115966796875, -9.241943359375, -8.9722900390625, -8.70263671875, -8.4329833984375, -8.163330078125, -7.8936767578125, -7.6240234375, -7.3543701171875, -7.084716796875, -6.8150634765625, -6.54541015625, -6.2757568359375, -6.006103515625, -5.7364501953125, -5.466796875, -5.1971435546875, -4.927490234375, -4.6578369140625, -4.38818359375, -4.1185302734375, -3.848876953125, -3.5792236328125, -3.3095703125, -3.0399169921875, -2.770263671875, -2.5006103515625, -2.23095703125, -1.9613037109375, -1.691650390625, -1.4219970703125, -1.15234375, -0.8826904296875, -0.613037109375, -0.3433837890625, -0.07373046875, 0.1959228515625, 0.465576171875, 0.7352294921875, 1.0048828125, 1.2745361328125, 1.544189453125, 1.8138427734375, 2.08349609375, 2.3531494140625, 2.622802734375, 2.8924560546875, 3.162109375, 3.4317626953125, 3.701416015625, 3.9710693359375, 4.24072265625, 4.5103759765625, 4.780029296875, 5.0496826171875, 5.3193359375, 5.5889892578125, 5.858642578125, 6.1282958984375, 6.39794921875, 6.6676025390625, 6.937255859375, 7.2069091796875, 7.4765625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 9.0, 9.0, 9.0, 19.0, 13.0, 13.0, 22.0, 26.0, 24.0, 36.0, 31.0, 27.0, 38.0, 36.0, 48.0, 53.0, 56.0, 49.0, 53.0, 40.0, 41.0, 38.0, 33.0, 48.0, 33.0, 27.0, 29.0, 28.0, 15.0, 18.0, 17.0, 12.0, 13.0, 13.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.328125, -16.700927734375, -16.07373046875, -15.446533203125, -14.8193359375, -14.192138671875, -13.56494140625, -12.937744140625, -12.310546875, -11.683349609375, -11.05615234375, -10.428955078125, -9.8017578125, -9.174560546875, -8.54736328125, -7.920166015625, -7.29296875, -6.665771484375, -6.03857421875, -5.411376953125, -4.7841796875, -4.156982421875, -3.52978515625, -2.902587890625, -2.275390625, -1.648193359375, -1.02099609375, -0.393798828125, 0.2333984375, 0.860595703125, 1.48779296875, 2.114990234375, 2.7421875, 3.369384765625, 3.99658203125, 4.623779296875, 5.2509765625, 5.878173828125, 6.50537109375, 7.132568359375, 7.759765625, 8.386962890625, 9.01416015625, 9.641357421875, 10.2685546875, 10.895751953125, 11.52294921875, 12.150146484375, 12.77734375, 13.404541015625, 14.03173828125, 14.658935546875, 15.2861328125, 15.913330078125, 16.54052734375, 17.167724609375, 17.794921875, 18.422119140625, 19.04931640625, 19.676513671875, 20.3037109375, 20.930908203125, 21.55810546875, 22.185302734375, 22.8125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 6.0, 6.0, 10.0, 15.0, 25.0, 36.0, 47.0, 69.0, 72.0, 117.0, 215.0, 345.0, 586.0, 1055.0, 2235.0, 5264.0, 12645.0, 33143.0, 92889.0, 264473.0, 389435.0, 155857.0, 54696.0, 20333.0, 7959.0, 3409.0, 1554.0, 847.0, 416.0, 269.0, 153.0, 118.0, 79.0, 38.0, 38.0, 27.0, 19.0, 18.0, 12.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.31060791015625, -5.1290283203125, -4.94744873046875, -4.765869140625, -4.58428955078125, -4.4027099609375, -4.22113037109375, -4.03955078125, -3.85797119140625, -3.6763916015625, -3.49481201171875, -3.313232421875, -3.13165283203125, -2.9500732421875, -2.76849365234375, -2.5869140625, -2.40533447265625, -2.2237548828125, -2.04217529296875, -1.860595703125, -1.67901611328125, -1.4974365234375, -1.31585693359375, -1.13427734375, -0.95269775390625, -0.7711181640625, -0.58953857421875, -0.407958984375, -0.22637939453125, -0.0447998046875, 0.13677978515625, 0.318359375, 0.49993896484375, 0.6815185546875, 0.86309814453125, 1.044677734375, 1.22625732421875, 1.4078369140625, 1.58941650390625, 1.77099609375, 1.95257568359375, 2.1341552734375, 2.31573486328125, 2.497314453125, 2.67889404296875, 2.8604736328125, 3.04205322265625, 3.2236328125, 3.40521240234375, 3.5867919921875, 3.76837158203125, 3.949951171875, 4.13153076171875, 4.3131103515625, 4.49468994140625, 4.67626953125, 4.85784912109375, 5.0394287109375, 5.22100830078125, 5.402587890625, 5.58416748046875, 5.7657470703125, 5.94732666015625, 6.12890625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 4.0, 5.0, 10.0, 13.0, 5.0, 18.0, 17.0, 12.0, 15.0, 24.0, 25.0, 30.0, 21.0, 38.0, 31.0, 36.0, 30.0, 37.0, 53.0, 44.0, 55.0, 29.0, 39.0, 49.0, 34.0, 32.0, 31.0, 30.0, 27.0, 32.0, 27.0, 26.0, 21.0, 16.0, 11.0, 13.0, 9.0, 10.0, 9.0, 8.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.45556640625, -12.0751953125, -11.69482421875, -11.314453125, -10.93408203125, -10.5537109375, -10.17333984375, -9.79296875, -9.41259765625, -9.0322265625, -8.65185546875, -8.271484375, -7.89111328125, -7.5107421875, -7.13037109375, -6.75, -6.36962890625, -5.9892578125, -5.60888671875, -5.228515625, -4.84814453125, -4.4677734375, -4.08740234375, -3.70703125, -3.32666015625, -2.9462890625, -2.56591796875, -2.185546875, -1.80517578125, -1.4248046875, -1.04443359375, -0.6640625, -0.28369140625, 0.0966796875, 0.47705078125, 0.857421875, 1.23779296875, 1.6181640625, 1.99853515625, 2.37890625, 2.75927734375, 3.1396484375, 3.52001953125, 3.900390625, 4.28076171875, 4.6611328125, 5.04150390625, 5.421875, 5.80224609375, 6.1826171875, 6.56298828125, 6.943359375, 7.32373046875, 7.7041015625, 8.08447265625, 8.46484375, 8.84521484375, 9.2255859375, 9.60595703125, 9.986328125, 10.36669921875, 10.7470703125, 11.12744140625, 11.5078125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 2.0, 6.0, 18.0, 12.0, 10.0, 24.0, 50.0, 47.0, 69.0, 97.0, 156.0, 205.0, 366.0, 607.0, 904.0, 1527.0, 2790.0, 5348.0, 12255.0, 38958.0, 371130.0, 538905.0, 47895.0, 13954.0, 5884.0, 2954.0, 1579.0, 1018.0, 597.0, 398.0, 250.0, 171.0, 127.0, 72.0, 51.0, 39.0, 19.0, 19.0, 16.0, 12.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.417633056640625, -2.33721923828125, -2.256805419921875, -2.1763916015625, -2.095977783203125, -2.01556396484375, -1.935150146484375, -1.854736328125, -1.774322509765625, -1.69390869140625, -1.613494873046875, -1.5330810546875, -1.452667236328125, -1.37225341796875, -1.291839599609375, -1.21142578125, -1.131011962890625, -1.05059814453125, -0.970184326171875, -0.8897705078125, -0.809356689453125, -0.72894287109375, -0.648529052734375, -0.568115234375, -0.487701416015625, -0.40728759765625, -0.326873779296875, -0.2464599609375, -0.166046142578125, -0.08563232421875, -0.005218505859375, 0.0751953125, 0.155609130859375, 0.23602294921875, 0.316436767578125, 0.3968505859375, 0.477264404296875, 0.55767822265625, 0.638092041015625, 0.718505859375, 0.798919677734375, 0.87933349609375, 0.959747314453125, 1.0401611328125, 1.120574951171875, 1.20098876953125, 1.281402587890625, 1.36181640625, 1.442230224609375, 1.52264404296875, 1.603057861328125, 1.6834716796875, 1.763885498046875, 1.84429931640625, 1.924713134765625, 2.005126953125, 2.085540771484375, 2.16595458984375, 2.246368408203125, 2.3267822265625, 2.407196044921875, 2.48760986328125, 2.568023681640625, 2.6484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 9.0, 18.0, 24.0, 55.0, 67.0, 126.0, 167.0, 150.0, 112.0, 96.0, 58.0, 38.0, 19.0, 14.0, 9.0, 8.0, 6.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020325183868408203, -0.00019712559878826141, -0.0001909993588924408, -0.00018487311899662018, -0.00017874687910079956, -0.00017262063920497894, -0.00016649439930915833, -0.0001603681594133377, -0.0001542419195175171, -0.00014811567962169647, -0.00014198943972587585, -0.00013586319983005524, -0.00012973695993423462, -0.000123610720038414, -0.00011748448014259338, -0.00011135824024677277, -0.00010523200035095215, -9.910576045513153e-05, -9.297952055931091e-05, -8.68532806634903e-05, -8.072704076766968e-05, -7.460080087184906e-05, -6.847456097602844e-05, -6.234832108020782e-05, -5.622208118438721e-05, -5.009584128856659e-05, -4.396960139274597e-05, -3.7843361496925354e-05, -3.1717121601104736e-05, -2.559088170528412e-05, -1.94646418094635e-05, -1.3338401913642883e-05, -7.212162017822266e-06, -1.085922122001648e-06, 5.04031777381897e-06, 1.1166557669639587e-05, 1.7292797565460205e-05, 2.3419037461280823e-05, 2.954527735710144e-05, 3.567151725292206e-05, 4.1797757148742676e-05, 4.7923997044563293e-05, 5.405023694038391e-05, 6.017647683620453e-05, 6.630271673202515e-05, 7.242895662784576e-05, 7.855519652366638e-05, 8.4681436419487e-05, 9.080767631530762e-05, 9.693391621112823e-05, 0.00010306015610694885, 0.00010918639600276947, 0.00011531263589859009, 0.0001214388757944107, 0.00012756511569023132, 0.00013369135558605194, 0.00013981759548187256, 0.00014594383537769318, 0.0001520700752735138, 0.0001581963151693344, 0.00016432255506515503, 0.00017044879496097565, 0.00017657503485679626, 0.00018270127475261688, 0.0001888275146484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 12.0, 26.0, 29.0, 43.0, 75.0, 97.0, 163.0, 224.0, 302.0, 435.0, 567.0, 887.0, 1289.0, 1790.0, 2734.0, 4095.0, 6437.0, 10569.0, 18586.0, 35138.0, 71081.0, 159419.0, 318987.0, 216810.0, 95181.0, 44991.0, 23323.0, 12700.0, 7794.0, 4759.0, 3171.0, 2223.0, 1399.0, 983.0, 719.0, 434.0, 310.0, 244.0, 160.0, 118.0, 86.0, 52.0, 32.0, 33.0, 17.0, 13.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3681640625, -1.324981689453125, -1.28179931640625, -1.238616943359375, -1.1954345703125, -1.152252197265625, -1.10906982421875, -1.065887451171875, -1.022705078125, -0.979522705078125, -0.93634033203125, -0.893157958984375, -0.8499755859375, -0.806793212890625, -0.76361083984375, -0.720428466796875, -0.67724609375, -0.634063720703125, -0.59088134765625, -0.547698974609375, -0.5045166015625, -0.461334228515625, -0.41815185546875, -0.374969482421875, -0.331787109375, -0.288604736328125, -0.24542236328125, -0.202239990234375, -0.1590576171875, -0.115875244140625, -0.07269287109375, -0.029510498046875, 0.013671875, 0.056854248046875, 0.10003662109375, 0.143218994140625, 0.1864013671875, 0.229583740234375, 0.27276611328125, 0.315948486328125, 0.359130859375, 0.402313232421875, 0.44549560546875, 0.488677978515625, 0.5318603515625, 0.575042724609375, 0.61822509765625, 0.661407470703125, 0.70458984375, 0.747772216796875, 0.79095458984375, 0.834136962890625, 0.8773193359375, 0.920501708984375, 0.96368408203125, 1.006866455078125, 1.050048828125, 1.093231201171875, 1.13641357421875, 1.179595947265625, 1.2227783203125, 1.265960693359375, 1.30914306640625, 1.352325439453125, 1.3955078125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 7.0, 4.0, 8.0, 11.0, 10.0, 16.0, 16.0, 23.0, 22.0, 29.0, 24.0, 25.0, 33.0, 26.0, 42.0, 56.0, 60.0, 62.0, 54.0, 65.0, 58.0, 47.0, 45.0, 38.0, 29.0, 25.0, 27.0, 20.0, 18.0, 12.0, 12.0, 13.0, 10.0, 6.0, 12.0, 3.0, 7.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53076171875, -0.5125503540039062, -0.4943389892578125, -0.47612762451171875, -0.457916259765625, -0.43970489501953125, -0.4214935302734375, -0.40328216552734375, -0.38507080078125, -0.36685943603515625, -0.3486480712890625, -0.33043670654296875, -0.312225341796875, -0.29401397705078125, -0.2758026123046875, -0.25759124755859375, -0.2393798828125, -0.22116851806640625, -0.2029571533203125, -0.18474578857421875, -0.166534423828125, -0.14832305908203125, -0.1301116943359375, -0.11190032958984375, -0.09368896484375, -0.07547760009765625, -0.0572662353515625, -0.03905487060546875, -0.020843505859375, -0.00263214111328125, 0.0155792236328125, 0.03379058837890625, 0.052001953125, 0.07021331787109375, 0.0884246826171875, 0.10663604736328125, 0.124847412109375, 0.14305877685546875, 0.1612701416015625, 0.17948150634765625, 0.19769287109375, 0.21590423583984375, 0.2341156005859375, 0.25232696533203125, 0.270538330078125, 0.28874969482421875, 0.3069610595703125, 0.32517242431640625, 0.3433837890625, 0.36159515380859375, 0.3798065185546875, 0.39801788330078125, 0.416229248046875, 0.43444061279296875, 0.4526519775390625, 0.47086334228515625, 0.48907470703125, 0.5072860717773438, 0.5254974365234375, 0.5437088012695312, 0.561920166015625, 0.5801315307617188, 0.5983428955078125, 0.6165542602539062, 0.634765625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 6.0, 12.0, 12.0, 11.0, 10.0, 18.0, 19.0, 29.0, 34.0, 31.0, 40.0, 50.0, 45.0, 67.0, 65.0, 56.0, 61.0, 62.0, 46.0, 49.0, 41.0, 47.0, 30.0, 38.0, 30.0, 19.0, 19.0, 11.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-15.251289367675781, -14.81523323059082, -14.37917709350586, -13.943120956420898, -13.507064819335938, -13.071008682250977, -12.634952545166016, -12.198896408081055, -11.762840270996094, -11.326784133911133, -10.890727996826172, -10.454671859741211, -10.01861572265625, -9.582559585571289, -9.146503448486328, -8.710447311401367, -8.27439022064209, -7.838334083557129, -7.402277946472168, -6.966221809387207, -6.530165672302246, -6.094109535217285, -5.658052921295166, -5.221996784210205, -4.785940647125244, -4.349884510040283, -3.9138283729553223, -3.4777719974517822, -3.0417158603668213, -2.6056597232818604, -2.1696033477783203, -1.7335472106933594, -1.297490119934082, -0.8614339232444763, -0.4253777265548706, 0.010678529739379883, 0.4467346668243408, 0.8827908039093018, 1.3188471794128418, 1.7549033164978027, 2.1909594535827637, 2.6270155906677246, 3.0630717277526855, 3.4991281032562256, 3.9351842403411865, 4.371240615844727, 4.8072967529296875, 5.243352890014648, 5.679409027099609, 6.11546516418457, 6.551521301269531, 6.987577438354492, 7.423633575439453, 7.859689712524414, 8.295745849609375, 8.731801986694336, 9.167858123779297, 9.603914260864258, 10.039970397949219, 10.47602653503418, 10.91208267211914, 11.348138809204102, 11.784194946289062, 12.220251083374023, 12.6563081741333]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 9.0, 9.0, 9.0, 14.0, 12.0, 10.0, 16.0, 11.0, 20.0, 31.0, 24.0, 33.0, 31.0, 24.0, 34.0, 38.0, 50.0, 46.0, 53.0, 45.0, 54.0, 43.0, 31.0, 51.0, 39.0, 36.0, 26.0, 29.0, 31.0, 24.0, 16.0, 27.0, 15.0, 14.0, 10.0, 9.0, 9.0, 2.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.681159973144531, -15.089672088623047, -14.498184204101562, -13.906696319580078, -13.315207481384277, -12.723719596862793, -12.132231712341309, -11.540742874145508, -10.949254989624023, -10.357767105102539, -9.766279220581055, -9.17479133605957, -8.58330249786377, -7.991814613342285, -7.400326728820801, -6.808838367462158, -6.217350959777832, -5.625863075256348, -5.034374713897705, -4.442886829376221, -3.8513987064361572, -3.2599105834960938, -2.6684226989746094, -2.076934337615967, -1.4854464530944824, -0.8939583897590637, -0.302470326423645, 0.2890176773071289, 0.8805058002471924, 1.4719939231872559, 2.0634818077087402, 2.654970169067383, 3.246458053588867, 3.8379461765289307, 4.429434299468994, 5.0209221839904785, 5.612410545349121, 6.2038984298706055, 6.79538631439209, 7.386874675750732, 7.978362560272217, 8.56985092163086, 9.161338806152344, 9.752826690673828, 10.344314575195312, 10.935802459716797, 11.527290344238281, 12.118779182434082, 12.710267066955566, 13.30175495147705, 13.893242835998535, 14.484731674194336, 15.07621955871582, 15.667707443237305, 16.25919532775879, 16.850683212280273, 17.442171096801758, 18.033658981323242, 18.625146865844727, 19.21663475036621, 19.808122634887695, 20.399612426757812, 20.991100311279297, 21.58258819580078, 22.174076080322266]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 5.0, 11.0, 8.0, 14.0, 28.0, 38.0, 45.0, 83.0, 127.0, 201.0, 351.0, 510.0, 869.0, 1352.0, 2251.0, 3784.0, 6450.0, 11389.0, 20110.0, 35542.0, 61597.0, 100802.0, 146997.0, 176744.0, 165917.0, 124494.0, 78975.0, 47005.0, 26783.0, 15152.0, 8606.0, 4900.0, 2887.0, 1705.0, 1044.0, 638.0, 420.0, 234.0, 159.0, 104.0, 88.0, 42.0, 38.0, 21.0, 14.0, 11.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.3131103515625, -11.852783203125, -11.3924560546875, -10.93212890625, -10.4718017578125, -10.011474609375, -9.5511474609375, -9.0908203125, -8.6304931640625, -8.170166015625, -7.7098388671875, -7.24951171875, -6.7891845703125, -6.328857421875, -5.8685302734375, -5.408203125, -4.9478759765625, -4.487548828125, -4.0272216796875, -3.56689453125, -3.1065673828125, -2.646240234375, -2.1859130859375, -1.7255859375, -1.2652587890625, -0.804931640625, -0.3446044921875, 0.11572265625, 0.5760498046875, 1.036376953125, 1.4967041015625, 1.95703125, 2.4173583984375, 2.877685546875, 3.3380126953125, 3.79833984375, 4.2586669921875, 4.718994140625, 5.1793212890625, 5.6396484375, 6.0999755859375, 6.560302734375, 7.0206298828125, 7.48095703125, 7.9412841796875, 8.401611328125, 8.8619384765625, 9.322265625, 9.7825927734375, 10.242919921875, 10.7032470703125, 11.16357421875, 11.6239013671875, 12.084228515625, 12.5445556640625, 13.0048828125, 13.4652099609375, 13.925537109375, 14.3858642578125, 14.84619140625, 15.3065185546875, 15.766845703125, 16.2271728515625, 16.6875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 12.0, 7.0, 8.0, 16.0, 13.0, 14.0, 19.0, 15.0, 24.0, 23.0, 27.0, 27.0, 40.0, 34.0, 36.0, 36.0, 55.0, 47.0, 48.0, 62.0, 46.0, 40.0, 35.0, 52.0, 32.0, 29.0, 25.0, 41.0, 26.0, 19.0, 19.0, 13.0, 12.0, 15.0, 11.0, 5.0, 4.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.53125, -14.9501953125, -14.369140625, -13.7880859375, -13.20703125, -12.6259765625, -12.044921875, -11.4638671875, -10.8828125, -10.3017578125, -9.720703125, -9.1396484375, -8.55859375, -7.9775390625, -7.396484375, -6.8154296875, -6.234375, -5.6533203125, -5.072265625, -4.4912109375, -3.91015625, -3.3291015625, -2.748046875, -2.1669921875, -1.5859375, -1.0048828125, -0.423828125, 0.1572265625, 0.73828125, 1.3193359375, 1.900390625, 2.4814453125, 3.0625, 3.6435546875, 4.224609375, 4.8056640625, 5.38671875, 5.9677734375, 6.548828125, 7.1298828125, 7.7109375, 8.2919921875, 8.873046875, 9.4541015625, 10.03515625, 10.6162109375, 11.197265625, 11.7783203125, 12.359375, 12.9404296875, 13.521484375, 14.1025390625, 14.68359375, 15.2646484375, 15.845703125, 16.4267578125, 17.0078125, 17.5888671875, 18.169921875, 18.7509765625, 19.33203125, 19.9130859375, 20.494140625, 21.0751953125, 21.65625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 8.0, 17.0, 19.0, 33.0, 51.0, 79.0, 104.0, 162.0, 278.0, 466.0, 686.0, 1137.0, 1786.0, 2808.0, 4578.0, 7438.0, 11834.0, 19599.0, 31352.0, 50952.0, 77911.0, 113686.0, 146887.0, 156225.0, 136464.0, 102045.0, 68167.0, 43501.0, 27073.0, 16368.0, 10157.0, 6375.0, 3797.0, 2351.0, 1477.0, 931.0, 640.0, 393.0, 245.0, 168.0, 119.0, 60.0, 45.0, 26.0, 19.0, 13.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.8828125, -12.484375, -12.0859375, -11.6875, -11.2890625, -10.890625, -10.4921875, -10.09375, -9.6953125, -9.296875, -8.8984375, -8.5, -8.1015625, -7.703125, -7.3046875, -6.90625, -6.5078125, -6.109375, -5.7109375, -5.3125, -4.9140625, -4.515625, -4.1171875, -3.71875, -3.3203125, -2.921875, -2.5234375, -2.125, -1.7265625, -1.328125, -0.9296875, -0.53125, -0.1328125, 0.265625, 0.6640625, 1.0625, 1.4609375, 1.859375, 2.2578125, 2.65625, 3.0546875, 3.453125, 3.8515625, 4.25, 4.6484375, 5.046875, 5.4453125, 5.84375, 6.2421875, 6.640625, 7.0390625, 7.4375, 7.8359375, 8.234375, 8.6328125, 9.03125, 9.4296875, 9.828125, 10.2265625, 10.625, 11.0234375, 11.421875, 11.8203125, 12.21875, 12.6171875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 1.0, 5.0, 7.0, 10.0, 11.0, 11.0, 11.0, 12.0, 20.0, 19.0, 24.0, 40.0, 34.0, 25.0, 35.0, 34.0, 31.0, 41.0, 47.0, 40.0, 49.0, 35.0, 41.0, 32.0, 43.0, 38.0, 31.0, 40.0, 34.0, 28.0, 26.0, 33.0, 18.0, 21.0, 14.0, 7.0, 9.0, 6.0, 4.0, 8.0, 7.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.10693359375, -9.7607421875, -9.41455078125, -9.068359375, -8.72216796875, -8.3759765625, -8.02978515625, -7.68359375, -7.33740234375, -6.9912109375, -6.64501953125, -6.298828125, -5.95263671875, -5.6064453125, -5.26025390625, -4.9140625, -4.56787109375, -4.2216796875, -3.87548828125, -3.529296875, -3.18310546875, -2.8369140625, -2.49072265625, -2.14453125, -1.79833984375, -1.4521484375, -1.10595703125, -0.759765625, -0.41357421875, -0.0673828125, 0.27880859375, 0.625, 0.97119140625, 1.3173828125, 1.66357421875, 2.009765625, 2.35595703125, 2.7021484375, 3.04833984375, 3.39453125, 3.74072265625, 4.0869140625, 4.43310546875, 4.779296875, 5.12548828125, 5.4716796875, 5.81787109375, 6.1640625, 6.51025390625, 6.8564453125, 7.20263671875, 7.548828125, 7.89501953125, 8.2412109375, 8.58740234375, 8.93359375, 9.27978515625, 9.6259765625, 9.97216796875, 10.318359375, 10.66455078125, 11.0107421875, 11.35693359375, 11.703125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 11.0, 12.0, 32.0, 35.0, 48.0, 80.0, 110.0, 167.0, 249.0, 396.0, 774.0, 1215.0, 2060.0, 3931.0, 7144.0, 13340.0, 25350.0, 47904.0, 88288.0, 151505.0, 212120.0, 199611.0, 132274.0, 74938.0, 40467.0, 21144.0, 11426.0, 6109.0, 3219.0, 1924.0, 1063.0, 587.0, 346.0, 235.0, 140.0, 99.0, 57.0, 39.0, 28.0, 17.0, 22.0, 10.0, 5.0, 4.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.40625, -6.2052001953125, -6.004150390625, -5.8031005859375, -5.60205078125, -5.4010009765625, -5.199951171875, -4.9989013671875, -4.7978515625, -4.5968017578125, -4.395751953125, -4.1947021484375, -3.99365234375, -3.7926025390625, -3.591552734375, -3.3905029296875, -3.189453125, -2.9884033203125, -2.787353515625, -2.5863037109375, -2.38525390625, -2.1842041015625, -1.983154296875, -1.7821044921875, -1.5810546875, -1.3800048828125, -1.178955078125, -0.9779052734375, -0.77685546875, -0.5758056640625, -0.374755859375, -0.1737060546875, 0.02734375, 0.2283935546875, 0.429443359375, 0.6304931640625, 0.83154296875, 1.0325927734375, 1.233642578125, 1.4346923828125, 1.6357421875, 1.8367919921875, 2.037841796875, 2.2388916015625, 2.43994140625, 2.6409912109375, 2.842041015625, 3.0430908203125, 3.244140625, 3.4451904296875, 3.646240234375, 3.8472900390625, 4.04833984375, 4.2493896484375, 4.450439453125, 4.6514892578125, 4.8525390625, 5.0535888671875, 5.254638671875, 5.4556884765625, 5.65673828125, 5.8577880859375, 6.058837890625, 6.2598876953125, 6.4609375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 1.0, 5.0, 18.0, 9.0, 18.0, 25.0, 35.0, 35.0, 37.0, 60.0, 51.0, 58.0, 90.0, 72.0, 81.0, 55.0, 59.0, 43.0, 49.0, 35.0, 23.0, 20.0, 24.0, 16.0, 14.0, 12.0, 4.0, 12.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004425048828125, -0.0004275888204574585, -0.000412672758102417, -0.0003977566957473755, -0.000382840633392334, -0.0003679245710372925, -0.000353008508682251, -0.00033809244632720947, -0.00032317638397216797, -0.00030826032161712646, -0.00029334425926208496, -0.00027842819690704346, -0.00026351213455200195, -0.00024859607219696045, -0.00023368000984191895, -0.00021876394748687744, -0.00020384788513183594, -0.00018893182277679443, -0.00017401576042175293, -0.00015909969806671143, -0.00014418363571166992, -0.00012926757335662842, -0.00011435151100158691, -9.943544864654541e-05, -8.45193862915039e-05, -6.96033239364624e-05, -5.46872615814209e-05, -3.9771199226379395e-05, -2.485513687133789e-05, -9.939074516296387e-06, 4.976987838745117e-06, 1.989305019378662e-05, 3.4809112548828125e-05, 4.972517490386963e-05, 6.464123725891113e-05, 7.955729961395264e-05, 9.447336196899414e-05, 0.00010938942432403564, 0.00012430548667907715, 0.00013922154903411865, 0.00015413761138916016, 0.00016905367374420166, 0.00018396973609924316, 0.00019888579845428467, 0.00021380186080932617, 0.00022871792316436768, 0.00024363398551940918, 0.0002585500478744507, 0.0002734661102294922, 0.0002883821725845337, 0.0003032982349395752, 0.0003182142972946167, 0.0003331303596496582, 0.0003480464220046997, 0.0003629624843597412, 0.0003778785467147827, 0.0003927946090698242, 0.0004077106714248657, 0.0004226267337799072, 0.00043754279613494873, 0.00045245885848999023, 0.00046737492084503174, 0.00048229098320007324, 0.0004972070455551147, 0.0005121231079101562]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 4.0, 9.0, 14.0, 16.0, 20.0, 37.0, 47.0, 57.0, 94.0, 131.0, 171.0, 283.0, 378.0, 552.0, 893.0, 1295.0, 1932.0, 3011.0, 4656.0, 7066.0, 11435.0, 18435.0, 29048.0, 45960.0, 69990.0, 103667.0, 139360.0, 157738.0, 141578.0, 106829.0, 72773.0, 47835.0, 30236.0, 19134.0, 11914.0, 7666.0, 5032.0, 3208.0, 1958.0, 1301.0, 904.0, 608.0, 416.0, 257.0, 196.0, 128.0, 87.0, 49.0, 49.0, 34.0, 20.0, 18.0, 6.0, 9.0, 4.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0], "bins": [-4.26953125, -4.1297607421875, -3.989990234375, -3.8502197265625, -3.71044921875, -3.5706787109375, -3.430908203125, -3.2911376953125, -3.1513671875, -3.0115966796875, -2.871826171875, -2.7320556640625, -2.59228515625, -2.4525146484375, -2.312744140625, -2.1729736328125, -2.033203125, -1.8934326171875, -1.753662109375, -1.6138916015625, -1.47412109375, -1.3343505859375, -1.194580078125, -1.0548095703125, -0.9150390625, -0.7752685546875, -0.635498046875, -0.4957275390625, -0.35595703125, -0.2161865234375, -0.076416015625, 0.0633544921875, 0.203125, 0.3428955078125, 0.482666015625, 0.6224365234375, 0.76220703125, 0.9019775390625, 1.041748046875, 1.1815185546875, 1.3212890625, 1.4610595703125, 1.600830078125, 1.7406005859375, 1.88037109375, 2.0201416015625, 2.159912109375, 2.2996826171875, 2.439453125, 2.5792236328125, 2.718994140625, 2.8587646484375, 2.99853515625, 3.1383056640625, 3.278076171875, 3.4178466796875, 3.5576171875, 3.6973876953125, 3.837158203125, 3.9769287109375, 4.11669921875, 4.2564697265625, 4.396240234375, 4.5360107421875, 4.67578125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 10.0, 6.0, 7.0, 16.0, 20.0, 24.0, 16.0, 35.0, 46.0, 55.0, 52.0, 60.0, 70.0, 69.0, 60.0, 67.0, 61.0, 48.0, 55.0, 50.0, 28.0, 30.0, 24.0, 18.0, 14.0, 4.0, 11.0, 8.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.86328125, -2.767669677734375, -2.67205810546875, -2.576446533203125, -2.4808349609375, -2.385223388671875, -2.28961181640625, -2.194000244140625, -2.098388671875, -2.002777099609375, -1.90716552734375, -1.811553955078125, -1.7159423828125, -1.620330810546875, -1.52471923828125, -1.429107666015625, -1.33349609375, -1.237884521484375, -1.14227294921875, -1.046661376953125, -0.9510498046875, -0.855438232421875, -0.75982666015625, -0.664215087890625, -0.568603515625, -0.472991943359375, -0.37738037109375, -0.281768798828125, -0.1861572265625, -0.090545654296875, 0.00506591796875, 0.100677490234375, 0.1962890625, 0.291900634765625, 0.38751220703125, 0.483123779296875, 0.5787353515625, 0.674346923828125, 0.76995849609375, 0.865570068359375, 0.961181640625, 1.056793212890625, 1.15240478515625, 1.248016357421875, 1.3436279296875, 1.439239501953125, 1.53485107421875, 1.630462646484375, 1.72607421875, 1.821685791015625, 1.91729736328125, 2.012908935546875, 2.1085205078125, 2.204132080078125, 2.29974365234375, 2.395355224609375, 2.490966796875, 2.586578369140625, 2.68218994140625, 2.777801513671875, 2.8734130859375, 2.969024658203125, 3.06463623046875, 3.160247802734375, 3.255859375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 11.0, 6.0, 6.0, 13.0, 12.0, 20.0, 28.0, 23.0, 25.0, 34.0, 42.0, 48.0, 41.0, 59.0, 57.0, 49.0, 45.0, 54.0, 49.0, 43.0, 41.0, 44.0, 36.0, 37.0, 32.0, 23.0, 22.0, 18.0, 16.0, 13.0, 13.0, 9.0, 5.0, 5.0, 2.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.755647659301758, -11.367426872253418, -10.979205131530762, -10.590984344482422, -10.202763557434082, -9.814541816711426, -9.426321029663086, -9.03809928894043, -8.64987850189209, -8.26165771484375, -7.873436450958252, -7.485215187072754, -7.096993923187256, -6.708772659301758, -6.320551872253418, -5.93233060836792, -5.54410982131958, -5.155888557434082, -4.767667770385742, -4.379446506500244, -3.991225242614746, -3.603004217147827, -3.214783191680908, -2.82656192779541, -2.438340902328491, -2.0501198768615723, -1.6618986129760742, -1.2736775875091553, -0.8854564428329468, -0.4972352981567383, -0.10901427268981934, 0.2792069911956787, 0.6674280166625977, 1.0556491613388062, 1.4438703060150146, 1.8320913314819336, 2.2203125953674316, 2.6085336208343506, 2.9967546463012695, 3.3849759101867676, 3.7731969356536865, 4.1614179611206055, 4.5496392250061035, 4.937860488891602, 5.326081275939941, 5.7143025398254395, 6.1025238037109375, 6.490744590759277, 6.878965854644775, 7.267187118530273, 7.655407905578613, 8.043628692626953, 8.43185043334961, 8.82007122039795, 9.208292007446289, 9.596513748168945, 9.984734535217285, 10.372955322265625, 10.761177062988281, 11.149397850036621, 11.537618637084961, 11.925840377807617, 12.314061164855957, 12.702281951904297, 13.090503692626953]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 11.0, 11.0, 14.0, 11.0, 10.0, 19.0, 18.0, 24.0, 16.0, 29.0, 36.0, 31.0, 40.0, 49.0, 48.0, 44.0, 53.0, 50.0, 47.0, 38.0, 49.0, 41.0, 40.0, 47.0, 29.0, 35.0, 33.0, 18.0, 18.0, 20.0, 10.0, 17.0, 6.0, 12.0, 3.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.087594985961914, -19.45000648498535, -18.812419891357422, -18.17483139038086, -17.53724479675293, -16.899656295776367, -16.262069702148438, -15.624481201171875, -14.986893653869629, -14.349306106567383, -13.711718559265137, -13.07413101196289, -12.436542510986328, -11.798955917358398, -11.161367416381836, -10.52377986907959, -9.886192321777344, -9.248604774475098, -8.611017227172852, -7.973429203033447, -7.335841655731201, -6.698254108428955, -6.060666084289551, -5.423078536987305, -4.785490989685059, -4.1479034423828125, -3.5103156566619873, -2.872727870941162, -2.235140323638916, -1.59755277633667, -0.9599649906158447, -0.32237720489501953, 0.31521034240722656, 0.9527980089187622, 1.5903856754302979, 2.227973461151123, 2.865561008453369, 3.5031485557556152, 4.1407365798950195, 4.778324127197266, 5.415911674499512, 6.053499221801758, 6.691086769104004, 7.328674793243408, 7.966262340545654, 8.603849411010742, 9.241437911987305, 9.87902545928955, 10.516613006591797, 11.154200553894043, 11.791788101196289, 12.429375648498535, 13.066963195800781, 13.704551696777344, 14.34213924407959, 14.979726791381836, 15.617314338684082, 16.254901885986328, 16.89249038696289, 17.53007698059082, 18.167665481567383, 18.805252075195312, 19.442840576171875, 20.080429077148438, 20.718015670776367]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 11.0, 16.0, 31.0, 49.0, 56.0, 109.0, 184.0, 248.0, 427.0, 584.0, 935.0, 1437.0, 2305.0, 3846.0, 6115.0, 10206.0, 16593.0, 28420.0, 48045.0, 81582.0, 140559.0, 242868.0, 408836.0, 635978.0, 782343.0, 679752.0, 452059.0, 270564.0, 156705.0, 90841.0, 52849.0, 31347.0, 18555.0, 11389.0, 6896.0, 4206.0, 2665.0, 1717.0, 1041.0, 717.0, 442.0, 277.0, 170.0, 100.0, 78.0, 48.0, 33.0, 20.0, 10.0, 8.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.625, -11.257080078125, -10.88916015625, -10.521240234375, -10.1533203125, -9.785400390625, -9.41748046875, -9.049560546875, -8.681640625, -8.313720703125, -7.94580078125, -7.577880859375, -7.2099609375, -6.842041015625, -6.47412109375, -6.106201171875, -5.73828125, -5.370361328125, -5.00244140625, -4.634521484375, -4.2666015625, -3.898681640625, -3.53076171875, -3.162841796875, -2.794921875, -2.427001953125, -2.05908203125, -1.691162109375, -1.3232421875, -0.955322265625, -0.58740234375, -0.219482421875, 0.1484375, 0.516357421875, 0.88427734375, 1.252197265625, 1.6201171875, 1.988037109375, 2.35595703125, 2.723876953125, 3.091796875, 3.459716796875, 3.82763671875, 4.195556640625, 4.5634765625, 4.931396484375, 5.29931640625, 5.667236328125, 6.03515625, 6.403076171875, 6.77099609375, 7.138916015625, 7.5068359375, 7.874755859375, 8.24267578125, 8.610595703125, 8.978515625, 9.346435546875, 9.71435546875, 10.082275390625, 10.4501953125, 10.818115234375, 11.18603515625, 11.553955078125, 11.921875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 7.0, 8.0, 9.0, 14.0, 11.0, 11.0, 10.0, 19.0, 23.0, 18.0, 22.0, 30.0, 35.0, 36.0, 43.0, 40.0, 66.0, 45.0, 55.0, 45.0, 41.0, 39.0, 45.0, 41.0, 53.0, 35.0, 30.0, 37.0, 27.0, 20.0, 22.0, 8.0, 12.0, 14.0, 7.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.340087890625, -11.93017578125, -11.520263671875, -11.1103515625, -10.700439453125, -10.29052734375, -9.880615234375, -9.470703125, -9.060791015625, -8.65087890625, -8.240966796875, -7.8310546875, -7.421142578125, -7.01123046875, -6.601318359375, -6.19140625, -5.781494140625, -5.37158203125, -4.961669921875, -4.5517578125, -4.141845703125, -3.73193359375, -3.322021484375, -2.912109375, -2.502197265625, -2.09228515625, -1.682373046875, -1.2724609375, -0.862548828125, -0.45263671875, -0.042724609375, 0.3671875, 0.777099609375, 1.18701171875, 1.596923828125, 2.0068359375, 2.416748046875, 2.82666015625, 3.236572265625, 3.646484375, 4.056396484375, 4.46630859375, 4.876220703125, 5.2861328125, 5.696044921875, 6.10595703125, 6.515869140625, 6.92578125, 7.335693359375, 7.74560546875, 8.155517578125, 8.5654296875, 8.975341796875, 9.38525390625, 9.795166015625, 10.205078125, 10.614990234375, 11.02490234375, 11.434814453125, 11.8447265625, 12.254638671875, 12.66455078125, 13.074462890625, 13.484375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 2.0, 18.0, 10.0, 27.0, 47.0, 97.0, 113.0, 189.0, 375.0, 633.0, 1130.0, 1943.0, 3507.0, 6359.0, 11611.0, 21530.0, 40297.0, 77190.0, 147936.0, 273604.0, 471721.0, 699407.0, 795390.0, 667571.0, 437274.0, 250280.0, 134569.0, 71009.0, 36587.0, 19803.0, 10872.0, 5731.0, 3168.0, 1766.0, 992.0, 622.0, 354.0, 194.0, 124.0, 81.0, 66.0, 23.0, 21.0, 13.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.0859375, -12.716552734375, -12.34716796875, -11.977783203125, -11.6083984375, -11.239013671875, -10.86962890625, -10.500244140625, -10.130859375, -9.761474609375, -9.39208984375, -9.022705078125, -8.6533203125, -8.283935546875, -7.91455078125, -7.545166015625, -7.17578125, -6.806396484375, -6.43701171875, -6.067626953125, -5.6982421875, -5.328857421875, -4.95947265625, -4.590087890625, -4.220703125, -3.851318359375, -3.48193359375, -3.112548828125, -2.7431640625, -2.373779296875, -2.00439453125, -1.635009765625, -1.265625, -0.896240234375, -0.52685546875, -0.157470703125, 0.2119140625, 0.581298828125, 0.95068359375, 1.320068359375, 1.689453125, 2.058837890625, 2.42822265625, 2.797607421875, 3.1669921875, 3.536376953125, 3.90576171875, 4.275146484375, 4.64453125, 5.013916015625, 5.38330078125, 5.752685546875, 6.1220703125, 6.491455078125, 6.86083984375, 7.230224609375, 7.599609375, 7.968994140625, 8.33837890625, 8.707763671875, 9.0771484375, 9.446533203125, 9.81591796875, 10.185302734375, 10.5546875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 5.0, 6.0, 4.0, 8.0, 12.0, 17.0, 21.0, 28.0, 33.0, 38.0, 35.0, 54.0, 61.0, 80.0, 90.0, 82.0, 117.0, 129.0, 147.0, 161.0, 182.0, 203.0, 214.0, 238.0, 201.0, 202.0, 209.0, 159.0, 199.0, 172.0, 145.0, 130.0, 126.0, 84.0, 86.0, 75.0, 65.0, 60.0, 38.0, 38.0, 27.0, 20.0, 14.0, 16.0, 13.0, 8.0, 7.0, 9.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-5.29296875, -5.1363525390625, -4.979736328125, -4.8231201171875, -4.66650390625, -4.5098876953125, -4.353271484375, -4.1966552734375, -4.0400390625, -3.8834228515625, -3.726806640625, -3.5701904296875, -3.41357421875, -3.2569580078125, -3.100341796875, -2.9437255859375, -2.787109375, -2.6304931640625, -2.473876953125, -2.3172607421875, -2.16064453125, -2.0040283203125, -1.847412109375, -1.6907958984375, -1.5341796875, -1.3775634765625, -1.220947265625, -1.0643310546875, -0.90771484375, -0.7510986328125, -0.594482421875, -0.4378662109375, -0.28125, -0.1246337890625, 0.031982421875, 0.1885986328125, 0.34521484375, 0.5018310546875, 0.658447265625, 0.8150634765625, 0.9716796875, 1.1282958984375, 1.284912109375, 1.4415283203125, 1.59814453125, 1.7547607421875, 1.911376953125, 2.0679931640625, 2.224609375, 2.3812255859375, 2.537841796875, 2.6944580078125, 2.85107421875, 3.0076904296875, 3.164306640625, 3.3209228515625, 3.4775390625, 3.6341552734375, 3.790771484375, 3.9473876953125, 4.10400390625, 4.2606201171875, 4.417236328125, 4.5738525390625, 4.73046875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 8.0, 12.0, 15.0, 16.0, 18.0, 25.0, 35.0, 37.0, 33.0, 52.0, 39.0, 61.0, 54.0, 69.0, 48.0, 53.0, 56.0, 54.0, 44.0, 40.0, 37.0, 26.0, 35.0, 11.0, 27.0, 14.0, 16.0, 10.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.863256454467773, -9.505494117736816, -9.14773178100586, -8.789968490600586, -8.432206153869629, -8.074443817138672, -7.716681480407715, -7.358919143676758, -7.001156330108643, -6.6433939933776855, -6.28563117980957, -5.927868843078613, -5.570106506347656, -5.212343692779541, -4.854581356048584, -4.496818542480469, -4.139056205749512, -3.7812936305999756, -3.4235310554504395, -3.0657687187194824, -2.7080061435699463, -2.35024356842041, -1.9924812316894531, -1.634718656539917, -1.2769560813903809, -0.9191935658454895, -0.5614310503005981, -0.20366859436035156, 0.15409398078918457, 0.5118565559387207, 0.8696188926696777, 1.2273814678192139, 1.58514404296875, 1.9429066181182861, 2.3006691932678223, 2.6584315299987793, 3.0161941051483154, 3.3739566802978516, 3.7317190170288086, 4.089481353759766, 4.447244167327881, 4.805006504058838, 5.162769317626953, 5.52053165435791, 5.878293991088867, 6.236056804656982, 6.5938191413879395, 6.951581954956055, 7.309344291687012, 7.667106628417969, 8.024868965148926, 8.382631301879883, 8.740394592285156, 9.098156929016113, 9.45591926574707, 9.813681602478027, 10.171443939208984, 10.529206275939941, 10.886968612670898, 11.244731903076172, 11.602494239807129, 11.960256576538086, 12.318018913269043, 12.67578125, 13.033544540405273]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 7.0, 7.0, 7.0, 15.0, 1.0, 13.0, 15.0, 12.0, 18.0, 19.0, 19.0, 20.0, 28.0, 28.0, 25.0, 34.0, 47.0, 38.0, 44.0, 37.0, 34.0, 39.0, 42.0, 47.0, 47.0, 51.0, 23.0, 45.0, 29.0, 32.0, 32.0, 25.0, 25.0, 16.0, 14.0, 10.0, 11.0, 9.0, 6.0, 8.0, 8.0, 2.0, 5.0, 3.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 3.0], "bins": [-15.982383728027344, -15.50396728515625, -15.02554988861084, -14.547133445739746, -14.068717002868652, -13.590299606323242, -13.111883163452148, -12.633466720581055, -12.155050277709961, -11.676633834838867, -11.198216438293457, -10.719799995422363, -10.24138355255127, -9.76296615600586, -9.284549713134766, -8.806133270263672, -8.327716827392578, -7.849299907684326, -7.370883464813232, -6.8924665451049805, -6.414050102233887, -5.935633182525635, -5.457216262817383, -4.978799819946289, -4.500382423400879, -4.021965503692627, -3.543549060821533, -3.0651321411132812, -2.5867156982421875, -2.1082987785339355, -1.6298820972442627, -1.1514654159545898, -0.6730489730834961, -0.19463226199150085, 0.2837844491004944, 0.762201189994812, 1.2406178712844849, 1.7190346717834473, 2.19745135307312, 2.675868034362793, 3.154284715652466, 3.6327013969421387, 4.111118316650391, 4.589534759521484, 5.067951679229736, 5.546368598937988, 6.024785041809082, 6.503201484680176, 6.981618404388428, 7.46003532409668, 7.938451766967773, 8.416868209838867, 8.895285606384277, 9.373702049255371, 9.852118492126465, 10.330535888671875, 10.808952331542969, 11.287368774414062, 11.765786170959473, 12.244202613830566, 12.72261905670166, 13.20103645324707, 13.679452896118164, 14.157869338989258, 14.636285781860352]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 8.0, 17.0, 22.0, 38.0, 48.0, 78.0, 113.0, 174.0, 233.0, 401.0, 575.0, 819.0, 1181.0, 1849.0, 2758.0, 4165.0, 6342.0, 10067.0, 16145.0, 26009.0, 42209.0, 70466.0, 117228.0, 185611.0, 204863.0, 138861.0, 84133.0, 50962.0, 30868.0, 18694.0, 11880.0, 7388.0, 4883.0, 3108.0, 2066.0, 1391.0, 896.0, 636.0, 426.0, 277.0, 203.0, 134.0, 112.0, 85.0, 50.0, 33.0, 16.0, 17.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.509765625, -2.434112548828125, -2.35845947265625, -2.282806396484375, -2.2071533203125, -2.131500244140625, -2.05584716796875, -1.980194091796875, -1.904541015625, -1.828887939453125, -1.75323486328125, -1.677581787109375, -1.6019287109375, -1.526275634765625, -1.45062255859375, -1.374969482421875, -1.29931640625, -1.223663330078125, -1.14801025390625, -1.072357177734375, -0.9967041015625, -0.921051025390625, -0.84539794921875, -0.769744873046875, -0.694091796875, -0.618438720703125, -0.54278564453125, -0.467132568359375, -0.3914794921875, -0.315826416015625, -0.24017333984375, -0.164520263671875, -0.0888671875, -0.013214111328125, 0.06243896484375, 0.138092041015625, 0.2137451171875, 0.289398193359375, 0.36505126953125, 0.440704345703125, 0.516357421875, 0.592010498046875, 0.66766357421875, 0.743316650390625, 0.8189697265625, 0.894622802734375, 0.97027587890625, 1.045928955078125, 1.12158203125, 1.197235107421875, 1.27288818359375, 1.348541259765625, 1.4241943359375, 1.499847412109375, 1.57550048828125, 1.651153564453125, 1.726806640625, 1.802459716796875, 1.87811279296875, 1.953765869140625, 2.0294189453125, 2.105072021484375, 2.18072509765625, 2.256378173828125, 2.33203125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 8.0, 9.0, 9.0, 6.0, 11.0, 13.0, 19.0, 14.0, 20.0, 23.0, 18.0, 31.0, 26.0, 23.0, 34.0, 34.0, 46.0, 45.0, 36.0, 49.0, 33.0, 40.0, 35.0, 40.0, 50.0, 45.0, 36.0, 32.0, 27.0, 30.0, 22.0, 28.0, 12.0, 11.0, 16.0, 11.0, 4.0, 9.0, 12.0, 8.0, 3.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-14.671875, -14.205322265625, -13.73876953125, -13.272216796875, -12.8056640625, -12.339111328125, -11.87255859375, -11.406005859375, -10.939453125, -10.472900390625, -10.00634765625, -9.539794921875, -9.0732421875, -8.606689453125, -8.14013671875, -7.673583984375, -7.20703125, -6.740478515625, -6.27392578125, -5.807373046875, -5.3408203125, -4.874267578125, -4.40771484375, -3.941162109375, -3.474609375, -3.008056640625, -2.54150390625, -2.074951171875, -1.6083984375, -1.141845703125, -0.67529296875, -0.208740234375, 0.2578125, 0.724365234375, 1.19091796875, 1.657470703125, 2.1240234375, 2.590576171875, 3.05712890625, 3.523681640625, 3.990234375, 4.456787109375, 4.92333984375, 5.389892578125, 5.8564453125, 6.322998046875, 6.78955078125, 7.256103515625, 7.72265625, 8.189208984375, 8.65576171875, 9.122314453125, 9.5888671875, 10.055419921875, 10.52197265625, 10.988525390625, 11.455078125, 11.921630859375, 12.38818359375, 12.854736328125, 13.3212890625, 13.787841796875, 14.25439453125, 14.720947265625, 15.1875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 7.0, 12.0, 18.0, 19.0, 25.0, 37.0, 72.0, 91.0, 124.0, 207.0, 326.0, 506.0, 749.0, 1149.0, 1821.0, 2953.0, 4791.0, 7665.0, 12644.0, 21145.0, 36069.0, 62363.0, 105601.0, 171940.0, 219835.0, 160498.0, 97073.0, 57076.0, 33044.0, 19748.0, 11899.0, 7124.0, 4337.0, 2689.0, 1726.0, 1126.0, 710.0, 460.0, 284.0, 205.0, 126.0, 79.0, 53.0, 32.0, 36.0, 16.0, 16.0, 5.0, 12.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.181640625, -2.10992431640625, -2.0382080078125, -1.96649169921875, -1.894775390625, -1.82305908203125, -1.7513427734375, -1.67962646484375, -1.60791015625, -1.53619384765625, -1.4644775390625, -1.39276123046875, -1.321044921875, -1.24932861328125, -1.1776123046875, -1.10589599609375, -1.0341796875, -0.96246337890625, -0.8907470703125, -0.81903076171875, -0.747314453125, -0.67559814453125, -0.6038818359375, -0.53216552734375, -0.46044921875, -0.38873291015625, -0.3170166015625, -0.24530029296875, -0.173583984375, -0.10186767578125, -0.0301513671875, 0.04156494140625, 0.11328125, 0.18499755859375, 0.2567138671875, 0.32843017578125, 0.400146484375, 0.47186279296875, 0.5435791015625, 0.61529541015625, 0.68701171875, 0.75872802734375, 0.8304443359375, 0.90216064453125, 0.973876953125, 1.04559326171875, 1.1173095703125, 1.18902587890625, 1.2607421875, 1.33245849609375, 1.4041748046875, 1.47589111328125, 1.547607421875, 1.61932373046875, 1.6910400390625, 1.76275634765625, 1.83447265625, 1.90618896484375, 1.9779052734375, 2.04962158203125, 2.121337890625, 2.19305419921875, 2.2647705078125, 2.33648681640625, 2.408203125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 3.0, 5.0, 7.0, 11.0, 10.0, 12.0, 20.0, 23.0, 16.0, 19.0, 24.0, 22.0, 28.0, 23.0, 28.0, 32.0, 35.0, 27.0, 41.0, 34.0, 28.0, 33.0, 42.0, 37.0, 27.0, 33.0, 39.0, 36.0, 30.0, 26.0, 25.0, 22.0, 19.0, 26.0, 24.0, 20.0, 13.0, 8.0, 18.0, 10.0, 12.0, 9.0, 7.0, 6.0, 4.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0], "bins": [-9.625, -9.32373046875, -9.0224609375, -8.72119140625, -8.419921875, -8.11865234375, -7.8173828125, -7.51611328125, -7.21484375, -6.91357421875, -6.6123046875, -6.31103515625, -6.009765625, -5.70849609375, -5.4072265625, -5.10595703125, -4.8046875, -4.50341796875, -4.2021484375, -3.90087890625, -3.599609375, -3.29833984375, -2.9970703125, -2.69580078125, -2.39453125, -2.09326171875, -1.7919921875, -1.49072265625, -1.189453125, -0.88818359375, -0.5869140625, -0.28564453125, 0.015625, 0.31689453125, 0.6181640625, 0.91943359375, 1.220703125, 1.52197265625, 1.8232421875, 2.12451171875, 2.42578125, 2.72705078125, 3.0283203125, 3.32958984375, 3.630859375, 3.93212890625, 4.2333984375, 4.53466796875, 4.8359375, 5.13720703125, 5.4384765625, 5.73974609375, 6.041015625, 6.34228515625, 6.6435546875, 6.94482421875, 7.24609375, 7.54736328125, 7.8486328125, 8.14990234375, 8.451171875, 8.75244140625, 9.0537109375, 9.35498046875, 9.65625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 5.0, 8.0, 8.0, 10.0, 21.0, 19.0, 17.0, 25.0, 50.0, 60.0, 67.0, 85.0, 127.0, 194.0, 276.0, 393.0, 616.0, 1134.0, 2041.0, 3951.0, 9586.0, 28975.0, 134851.0, 601552.0, 202962.0, 39109.0, 11945.0, 4708.0, 2286.0, 1277.0, 675.0, 433.0, 325.0, 214.0, 143.0, 94.0, 82.0, 70.0, 40.0, 31.0, 26.0, 21.0, 8.0, 11.0, 4.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.0, -0.9673309326171875, -0.934661865234375, -0.9019927978515625, -0.86932373046875, -0.8366546630859375, -0.803985595703125, -0.7713165283203125, -0.7386474609375, -0.7059783935546875, -0.673309326171875, -0.6406402587890625, -0.60797119140625, -0.5753021240234375, -0.542633056640625, -0.5099639892578125, -0.477294921875, -0.4446258544921875, -0.411956787109375, -0.3792877197265625, -0.34661865234375, -0.3139495849609375, -0.281280517578125, -0.2486114501953125, -0.2159423828125, -0.1832733154296875, -0.150604248046875, -0.1179351806640625, -0.08526611328125, -0.0525970458984375, -0.019927978515625, 0.0127410888671875, 0.04541015625, 0.0780792236328125, 0.110748291015625, 0.1434173583984375, 0.17608642578125, 0.2087554931640625, 0.241424560546875, 0.2740936279296875, 0.3067626953125, 0.3394317626953125, 0.372100830078125, 0.4047698974609375, 0.43743896484375, 0.4701080322265625, 0.502777099609375, 0.5354461669921875, 0.568115234375, 0.6007843017578125, 0.633453369140625, 0.6661224365234375, 0.69879150390625, 0.7314605712890625, 0.764129638671875, 0.7967987060546875, 0.8294677734375, 0.8621368408203125, 0.894805908203125, 0.9274749755859375, 0.96014404296875, 0.9928131103515625, 1.025482177734375, 1.0581512451171875, 1.0908203125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 6.0, 10.0, 9.0, 10.0, 11.0, 18.0, 17.0, 44.0, 31.0, 32.0, 54.0, 58.0, 69.0, 71.0, 82.0, 61.0, 65.0, 82.0, 44.0, 40.0, 38.0, 24.0, 29.0, 21.0, 15.0, 15.0, 6.0, 11.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.066394805908203e-05, -4.888512194156647e-05, -4.71062958240509e-05, -4.532746970653534e-05, -4.3548643589019775e-05, -4.176981747150421e-05, -3.999099135398865e-05, -3.8212165236473083e-05, -3.643333911895752e-05, -3.4654513001441956e-05, -3.287568688392639e-05, -3.109686076641083e-05, -2.9318034648895264e-05, -2.75392085313797e-05, -2.5760382413864136e-05, -2.3981556296348572e-05, -2.2202730178833008e-05, -2.0423904061317444e-05, -1.864507794380188e-05, -1.6866251826286316e-05, -1.5087425708770752e-05, -1.3308599591255188e-05, -1.1529773473739624e-05, -9.75094735622406e-06, -7.972121238708496e-06, -6.193295121192932e-06, -4.414469003677368e-06, -2.635642886161804e-06, -8.568167686462402e-07, 9.220093488693237e-07, 2.7008354663848877e-06, 4.479661583900452e-06, 6.258487701416016e-06, 8.03731381893158e-06, 9.816139936447144e-06, 1.1594966053962708e-05, 1.3373792171478271e-05, 1.5152618288993835e-05, 1.69314444065094e-05, 1.8710270524024963e-05, 2.0489096641540527e-05, 2.226792275905609e-05, 2.4046748876571655e-05, 2.582557499408722e-05, 2.7604401111602783e-05, 2.9383227229118347e-05, 3.116205334663391e-05, 3.2940879464149475e-05, 3.471970558166504e-05, 3.64985316991806e-05, 3.827735781669617e-05, 4.005618393421173e-05, 4.1835010051727295e-05, 4.361383616924286e-05, 4.539266228675842e-05, 4.717148840427399e-05, 4.895031452178955e-05, 5.0729140639305115e-05, 5.250796675682068e-05, 5.428679287433624e-05, 5.606561899185181e-05, 5.784444510936737e-05, 5.9623271226882935e-05, 6.14020973443985e-05, 6.318092346191406e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 5.0, 14.0, 19.0, 35.0, 62.0, 65.0, 103.0, 164.0, 223.0, 328.0, 526.0, 840.0, 1353.0, 2357.0, 4075.0, 7397.0, 13450.0, 24576.0, 45789.0, 86751.0, 166016.0, 275394.0, 196265.0, 103708.0, 53673.0, 29056.0, 15838.0, 8579.0, 4865.0, 2714.0, 1607.0, 991.0, 565.0, 373.0, 235.0, 164.0, 119.0, 80.0, 51.0, 39.0, 27.0, 20.0, 12.0, 11.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8577423095703125, -0.829742431640625, -0.8017425537109375, -0.77374267578125, -0.7457427978515625, -0.717742919921875, -0.6897430419921875, -0.6617431640625, -0.6337432861328125, -0.605743408203125, -0.5777435302734375, -0.54974365234375, -0.5217437744140625, -0.493743896484375, -0.4657440185546875, -0.437744140625, -0.4097442626953125, -0.381744384765625, -0.3537445068359375, -0.32574462890625, -0.2977447509765625, -0.269744873046875, -0.2417449951171875, -0.2137451171875, -0.1857452392578125, -0.157745361328125, -0.1297454833984375, -0.10174560546875, -0.0737457275390625, -0.045745849609375, -0.0177459716796875, 0.01025390625, 0.0382537841796875, 0.066253662109375, 0.0942535400390625, 0.12225341796875, 0.1502532958984375, 0.178253173828125, 0.2062530517578125, 0.2342529296875, 0.2622528076171875, 0.290252685546875, 0.3182525634765625, 0.34625244140625, 0.3742523193359375, 0.402252197265625, 0.4302520751953125, 0.458251953125, 0.4862518310546875, 0.514251708984375, 0.5422515869140625, 0.57025146484375, 0.5982513427734375, 0.626251220703125, 0.6542510986328125, 0.6822509765625, 0.7102508544921875, 0.738250732421875, 0.7662506103515625, 0.79425048828125, 0.8222503662109375, 0.850250244140625, 0.8782501220703125, 0.90625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 10.0, 8.0, 14.0, 14.0, 11.0, 19.0, 23.0, 23.0, 27.0, 36.0, 45.0, 41.0, 32.0, 32.0, 39.0, 35.0, 47.0, 45.0, 39.0, 46.0, 39.0, 36.0, 43.0, 20.0, 37.0, 26.0, 36.0, 32.0, 30.0, 25.0, 20.0, 13.0, 12.0, 14.0, 8.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.445068359375, -0.43117523193359375, -0.4172821044921875, -0.40338897705078125, -0.389495849609375, -0.37560272216796875, -0.3617095947265625, -0.34781646728515625, -0.33392333984375, -0.32003021240234375, -0.3061370849609375, -0.29224395751953125, -0.278350830078125, -0.26445770263671875, -0.2505645751953125, -0.23667144775390625, -0.2227783203125, -0.20888519287109375, -0.1949920654296875, -0.18109893798828125, -0.167205810546875, -0.15331268310546875, -0.1394195556640625, -0.12552642822265625, -0.11163330078125, -0.09774017333984375, -0.0838470458984375, -0.06995391845703125, -0.056060791015625, -0.04216766357421875, -0.0282745361328125, -0.01438140869140625, -0.00048828125, 0.01340484619140625, 0.0272979736328125, 0.04119110107421875, 0.055084228515625, 0.06897735595703125, 0.0828704833984375, 0.09676361083984375, 0.11065673828125, 0.12454986572265625, 0.1384429931640625, 0.15233612060546875, 0.166229248046875, 0.18012237548828125, 0.1940155029296875, 0.20790863037109375, 0.2218017578125, 0.23569488525390625, 0.2495880126953125, 0.26348114013671875, 0.277374267578125, 0.29126739501953125, 0.3051605224609375, 0.31905364990234375, 0.33294677734375, 0.34683990478515625, 0.3607330322265625, 0.37462615966796875, 0.388519287109375, 0.40241241455078125, 0.4163055419921875, 0.43019866943359375, 0.444091796875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 6.0, 11.0, 12.0, 17.0, 14.0, 27.0, 36.0, 27.0, 34.0, 41.0, 45.0, 51.0, 66.0, 56.0, 61.0, 58.0, 54.0, 49.0, 55.0, 35.0, 37.0, 26.0, 37.0, 19.0, 17.0, 21.0, 19.0, 12.0, 8.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.541988372802734, -9.186993598937988, -8.831997871398926, -8.47700309753418, -8.122007369995117, -7.767012596130371, -7.412017822265625, -7.057022571563721, -6.702027320861816, -6.347032070159912, -5.992036819458008, -5.637042045593262, -5.282046794891357, -4.927051544189453, -4.572056770324707, -4.217061519622803, -3.8620662689208984, -3.507071018218994, -3.152076005935669, -2.7970809936523438, -2.4420857429504395, -2.087090492248535, -1.73209547996521, -1.3771004676818848, -1.0221052169799805, -0.6671100854873657, -0.312114953994751, 0.04288017749786377, 0.3978753089904785, 0.7528704404830933, 1.107865571975708, 1.4628605842590332, 1.817854881286621, 2.1728501319885254, 2.5278451442718506, 2.882840156555176, 3.23783540725708, 3.5928306579589844, 3.9478256702423096, 4.302820682525635, 4.657815933227539, 5.012811183929443, 5.367806434631348, 5.722801208496094, 6.077796459197998, 6.432791709899902, 6.787786483764648, 7.142781734466553, 7.497776985168457, 7.852772235870361, 8.207767486572266, 8.562762260437012, 8.917757034301758, 9.27275276184082, 9.627747535705566, 9.982742309570312, 10.337738037109375, 10.692732810974121, 11.047728538513184, 11.40272331237793, 11.757719039916992, 12.112713813781738, 12.467708587646484, 12.822704315185547, 13.177699089050293]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 8.0, 13.0, 7.0, 6.0, 12.0, 11.0, 14.0, 21.0, 19.0, 18.0, 20.0, 23.0, 26.0, 36.0, 24.0, 44.0, 40.0, 37.0, 41.0, 41.0, 39.0, 38.0, 37.0, 44.0, 49.0, 39.0, 45.0, 25.0, 35.0, 33.0, 29.0, 21.0, 20.0, 15.0, 9.0, 8.0, 12.0, 9.0, 6.0, 8.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-15.990324974060059, -15.517355918884277, -15.04438591003418, -14.571416854858398, -14.0984468460083, -13.62547779083252, -13.152507781982422, -12.67953872680664, -12.206568717956543, -11.733599662780762, -11.260629653930664, -10.787660598754883, -10.314690589904785, -9.841721534729004, -9.368751525878906, -8.895782470703125, -8.422813415527344, -7.949843883514404, -7.476874351501465, -7.003904819488525, -6.530935287475586, -6.057966232299805, -5.584996223449707, -5.112027168273926, -4.639057159423828, -4.166087627410889, -3.693118095397949, -3.2201485633850098, -2.7471790313720703, -2.27420973777771, -1.8012402057647705, -1.328270673751831, -0.8553009033203125, -0.38233140110969543, 0.09063810110092163, 0.5636075735092163, 1.0365771055221558, 1.5095465183258057, 1.9825160503387451, 2.4554855823516846, 2.928455114364624, 3.4014246463775635, 3.874394178390503, 4.347363471984863, 4.820333003997803, 5.293302536010742, 5.766272068023682, 6.239241600036621, 6.7122111320495605, 7.1851806640625, 7.6581501960754395, 8.131119728088379, 8.60408878326416, 9.077058792114258, 9.550027847290039, 10.022997856140137, 10.495966911315918, 10.9689359664917, 11.441905975341797, 11.914875030517578, 12.387845039367676, 12.860814094543457, 13.333784103393555, 13.806753158569336, 14.279723167419434]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 11.0, 11.0, 21.0, 26.0, 55.0, 56.0, 109.0, 159.0, 230.0, 358.0, 496.0, 743.0, 1175.0, 1814.0, 2801.0, 4313.0, 6730.0, 10315.0, 16017.0, 24790.0, 37725.0, 56647.0, 80183.0, 108241.0, 130982.0, 136362.0, 122636.0, 97122.0, 69907.0, 47781.0, 31835.0, 20576.0, 13455.0, 8642.0, 5658.0, 3595.0, 2468.0, 1542.0, 995.0, 605.0, 454.0, 304.0, 194.0, 139.0, 98.0, 66.0, 50.0, 28.0, 13.0, 10.0, 2.0, 5.0, 2.0, 0.0, 0.0, 4.0], "bins": [-9.3359375, -9.0555419921875, -8.775146484375, -8.4947509765625, -8.21435546875, -7.9339599609375, -7.653564453125, -7.3731689453125, -7.0927734375, -6.8123779296875, -6.531982421875, -6.2515869140625, -5.97119140625, -5.6907958984375, -5.410400390625, -5.1300048828125, -4.849609375, -4.5692138671875, -4.288818359375, -4.0084228515625, -3.72802734375, -3.4476318359375, -3.167236328125, -2.8868408203125, -2.6064453125, -2.3260498046875, -2.045654296875, -1.7652587890625, -1.48486328125, -1.2044677734375, -0.924072265625, -0.6436767578125, -0.36328125, -0.0828857421875, 0.197509765625, 0.4779052734375, 0.75830078125, 1.0386962890625, 1.319091796875, 1.5994873046875, 1.8798828125, 2.1602783203125, 2.440673828125, 2.7210693359375, 3.00146484375, 3.2818603515625, 3.562255859375, 3.8426513671875, 4.123046875, 4.4034423828125, 4.683837890625, 4.9642333984375, 5.24462890625, 5.5250244140625, 5.805419921875, 6.0858154296875, 6.3662109375, 6.6466064453125, 6.927001953125, 7.2073974609375, 7.48779296875, 7.7681884765625, 8.048583984375, 8.3289794921875, 8.609375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 9.0, 6.0, 6.0, 6.0, 10.0, 13.0, 15.0, 14.0, 17.0, 17.0, 27.0, 27.0, 24.0, 34.0, 29.0, 35.0, 31.0, 43.0, 47.0, 38.0, 44.0, 44.0, 50.0, 39.0, 41.0, 35.0, 43.0, 35.0, 37.0, 28.0, 25.0, 24.0, 23.0, 13.0, 14.0, 10.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.96875, -14.500244140625, -14.03173828125, -13.563232421875, -13.0947265625, -12.626220703125, -12.15771484375, -11.689208984375, -11.220703125, -10.752197265625, -10.28369140625, -9.815185546875, -9.3466796875, -8.878173828125, -8.40966796875, -7.941162109375, -7.47265625, -7.004150390625, -6.53564453125, -6.067138671875, -5.5986328125, -5.130126953125, -4.66162109375, -4.193115234375, -3.724609375, -3.256103515625, -2.78759765625, -2.319091796875, -1.8505859375, -1.382080078125, -0.91357421875, -0.445068359375, 0.0234375, 0.491943359375, 0.96044921875, 1.428955078125, 1.8974609375, 2.365966796875, 2.83447265625, 3.302978515625, 3.771484375, 4.239990234375, 4.70849609375, 5.177001953125, 5.6455078125, 6.114013671875, 6.58251953125, 7.051025390625, 7.51953125, 7.988037109375, 8.45654296875, 8.925048828125, 9.3935546875, 9.862060546875, 10.33056640625, 10.799072265625, 11.267578125, 11.736083984375, 12.20458984375, 12.673095703125, 13.1416015625, 13.610107421875, 14.07861328125, 14.547119140625, 15.015625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [5.0, 7.0, 5.0, 10.0, 8.0, 9.0, 17.0, 14.0, 32.0, 51.0, 66.0, 84.0, 152.0, 215.0, 301.0, 436.0, 680.0, 1083.0, 1613.0, 2389.0, 3616.0, 5591.0, 8610.0, 12957.0, 20056.0, 30061.0, 44903.0, 64420.0, 88339.0, 112782.0, 129007.0, 127965.0, 111731.0, 87352.0, 63526.0, 43866.0, 29496.0, 19572.0, 12705.0, 8424.0, 5759.0, 3655.0, 2346.0, 1566.0, 1022.0, 662.0, 453.0, 302.0, 193.0, 129.0, 92.0, 65.0, 50.0, 40.0, 25.0, 20.0, 11.0, 9.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0], "bins": [-8.0546875, -7.794677734375, -7.53466796875, -7.274658203125, -7.0146484375, -6.754638671875, -6.49462890625, -6.234619140625, -5.974609375, -5.714599609375, -5.45458984375, -5.194580078125, -4.9345703125, -4.674560546875, -4.41455078125, -4.154541015625, -3.89453125, -3.634521484375, -3.37451171875, -3.114501953125, -2.8544921875, -2.594482421875, -2.33447265625, -2.074462890625, -1.814453125, -1.554443359375, -1.29443359375, -1.034423828125, -0.7744140625, -0.514404296875, -0.25439453125, 0.005615234375, 0.265625, 0.525634765625, 0.78564453125, 1.045654296875, 1.3056640625, 1.565673828125, 1.82568359375, 2.085693359375, 2.345703125, 2.605712890625, 2.86572265625, 3.125732421875, 3.3857421875, 3.645751953125, 3.90576171875, 4.165771484375, 4.42578125, 4.685791015625, 4.94580078125, 5.205810546875, 5.4658203125, 5.725830078125, 5.98583984375, 6.245849609375, 6.505859375, 6.765869140625, 7.02587890625, 7.285888671875, 7.5458984375, 7.805908203125, 8.06591796875, 8.325927734375, 8.5859375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 14.0, 9.0, 4.0, 13.0, 8.0, 15.0, 20.0, 20.0, 30.0, 22.0, 23.0, 23.0, 35.0, 20.0, 37.0, 40.0, 26.0, 57.0, 37.0, 40.0, 48.0, 36.0, 39.0, 27.0, 42.0, 45.0, 28.0, 31.0, 17.0, 24.0, 23.0, 21.0, 17.0, 21.0, 22.0, 7.0, 9.0, 8.0, 15.0, 3.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-9.28125, -9.0084228515625, -8.735595703125, -8.4627685546875, -8.18994140625, -7.9171142578125, -7.644287109375, -7.3714599609375, -7.0986328125, -6.8258056640625, -6.552978515625, -6.2801513671875, -6.00732421875, -5.7344970703125, -5.461669921875, -5.1888427734375, -4.916015625, -4.6431884765625, -4.370361328125, -4.0975341796875, -3.82470703125, -3.5518798828125, -3.279052734375, -3.0062255859375, -2.7333984375, -2.4605712890625, -2.187744140625, -1.9149169921875, -1.64208984375, -1.3692626953125, -1.096435546875, -0.8236083984375, -0.55078125, -0.2779541015625, -0.005126953125, 0.2677001953125, 0.54052734375, 0.8133544921875, 1.086181640625, 1.3590087890625, 1.6318359375, 1.9046630859375, 2.177490234375, 2.4503173828125, 2.72314453125, 2.9959716796875, 3.268798828125, 3.5416259765625, 3.814453125, 4.0872802734375, 4.360107421875, 4.6329345703125, 4.90576171875, 5.1785888671875, 5.451416015625, 5.7242431640625, 5.9970703125, 6.2698974609375, 6.542724609375, 6.8155517578125, 7.08837890625, 7.3612060546875, 7.634033203125, 7.9068603515625, 8.1796875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 6.0, 4.0, 2.0, 6.0, 8.0, 11.0, 12.0, 26.0, 23.0, 43.0, 69.0, 100.0, 143.0, 236.0, 345.0, 525.0, 841.0, 1396.0, 2389.0, 3848.0, 6387.0, 11143.0, 19464.0, 34263.0, 59935.0, 101675.0, 156626.0, 192910.0, 171692.0, 117613.0, 70897.0, 40720.0, 22914.0, 12903.0, 7671.0, 4533.0, 2720.0, 1678.0, 999.0, 634.0, 383.0, 249.0, 170.0, 108.0, 82.0, 44.0, 40.0, 23.0, 26.0, 7.0, 6.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-4.51171875, -4.37353515625, -4.2353515625, -4.09716796875, -3.958984375, -3.82080078125, -3.6826171875, -3.54443359375, -3.40625, -3.26806640625, -3.1298828125, -2.99169921875, -2.853515625, -2.71533203125, -2.5771484375, -2.43896484375, -2.30078125, -2.16259765625, -2.0244140625, -1.88623046875, -1.748046875, -1.60986328125, -1.4716796875, -1.33349609375, -1.1953125, -1.05712890625, -0.9189453125, -0.78076171875, -0.642578125, -0.50439453125, -0.3662109375, -0.22802734375, -0.08984375, 0.04833984375, 0.1865234375, 0.32470703125, 0.462890625, 0.60107421875, 0.7392578125, 0.87744140625, 1.015625, 1.15380859375, 1.2919921875, 1.43017578125, 1.568359375, 1.70654296875, 1.8447265625, 1.98291015625, 2.12109375, 2.25927734375, 2.3974609375, 2.53564453125, 2.673828125, 2.81201171875, 2.9501953125, 3.08837890625, 3.2265625, 3.36474609375, 3.5029296875, 3.64111328125, 3.779296875, 3.91748046875, 4.0556640625, 4.19384765625, 4.33203125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 4.0, 4.0, 9.0, 7.0, 11.0, 13.0, 17.0, 26.0, 30.0, 31.0, 37.0, 41.0, 30.0, 52.0, 57.0, 51.0, 56.0, 67.0, 34.0, 48.0, 53.0, 47.0, 45.0, 34.0, 32.0, 25.0, 19.0, 21.0, 20.0, 16.0, 10.0, 10.0, 9.0, 6.0, 3.0, 1.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025153160095214844, -0.0002433769404888153, -0.00023522228002548218, -0.00022706761956214905, -0.00021891295909881592, -0.0002107582986354828, -0.00020260363817214966, -0.00019444897770881653, -0.0001862943172454834, -0.00017813965678215027, -0.00016998499631881714, -0.000161830335855484, -0.00015367567539215088, -0.00014552101492881775, -0.00013736635446548462, -0.0001292116940021515, -0.00012105703353881836, -0.00011290237307548523, -0.0001047477126121521, -9.659305214881897e-05, -8.843839168548584e-05, -8.028373122215271e-05, -7.212907075881958e-05, -6.397441029548645e-05, -5.581974983215332e-05, -4.766508936882019e-05, -3.951042890548706e-05, -3.135576844215393e-05, -2.32011079788208e-05, -1.5046447515487671e-05, -6.891787052154541e-06, 1.2628734111785889e-06, 9.417533874511719e-06, 1.757219433784485e-05, 2.572685480117798e-05, 3.388151526451111e-05, 4.203617572784424e-05, 5.019083619117737e-05, 5.83454966545105e-05, 6.650015711784363e-05, 7.465481758117676e-05, 8.280947804450989e-05, 9.096413850784302e-05, 9.911879897117615e-05, 0.00010727345943450928, 0.00011542811989784241, 0.00012358278036117554, 0.00013173744082450867, 0.0001398921012878418, 0.00014804676175117493, 0.00015620142221450806, 0.0001643560826778412, 0.00017251074314117432, 0.00018066540360450745, 0.00018882006406784058, 0.0001969747245311737, 0.00020512938499450684, 0.00021328404545783997, 0.0002214387059211731, 0.00022959336638450623, 0.00023774802684783936, 0.0002459026873111725, 0.0002540573477745056, 0.00026221200823783875, 0.0002703666687011719]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 8.0, 10.0, 20.0, 21.0, 39.0, 42.0, 77.0, 107.0, 170.0, 189.0, 295.0, 466.0, 680.0, 1022.0, 1553.0, 2266.0, 3520.0, 5835.0, 8956.0, 14768.0, 23744.0, 39306.0, 63772.0, 99765.0, 143062.0, 170821.0, 156365.0, 115215.0, 74438.0, 46445.0, 28398.0, 17370.0, 10744.0, 6842.0, 4245.0, 2650.0, 1769.0, 1133.0, 771.0, 491.0, 358.0, 263.0, 175.0, 124.0, 71.0, 65.0, 30.0, 25.0, 23.0, 8.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0], "bins": [-3.978515625, -3.85675048828125, -3.7349853515625, -3.61322021484375, -3.491455078125, -3.36968994140625, -3.2479248046875, -3.12615966796875, -3.00439453125, -2.88262939453125, -2.7608642578125, -2.63909912109375, -2.517333984375, -2.39556884765625, -2.2738037109375, -2.15203857421875, -2.0302734375, -1.90850830078125, -1.7867431640625, -1.66497802734375, -1.543212890625, -1.42144775390625, -1.2996826171875, -1.17791748046875, -1.05615234375, -0.93438720703125, -0.8126220703125, -0.69085693359375, -0.569091796875, -0.44732666015625, -0.3255615234375, -0.20379638671875, -0.08203125, 0.03973388671875, 0.1614990234375, 0.28326416015625, 0.405029296875, 0.52679443359375, 0.6485595703125, 0.77032470703125, 0.89208984375, 1.01385498046875, 1.1356201171875, 1.25738525390625, 1.379150390625, 1.50091552734375, 1.6226806640625, 1.74444580078125, 1.8662109375, 1.98797607421875, 2.1097412109375, 2.23150634765625, 2.353271484375, 2.47503662109375, 2.5968017578125, 2.71856689453125, 2.84033203125, 2.96209716796875, 3.0838623046875, 3.20562744140625, 3.327392578125, 3.44915771484375, 3.5709228515625, 3.69268798828125, 3.814453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 6.0, 7.0, 10.0, 5.0, 16.0, 18.0, 19.0, 24.0, 27.0, 19.0, 32.0, 44.0, 57.0, 60.0, 58.0, 55.0, 47.0, 79.0, 58.0, 54.0, 52.0, 36.0, 42.0, 26.0, 23.0, 21.0, 19.0, 8.0, 15.0, 10.0, 13.0, 11.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.427734375, -2.3568115234375, -2.285888671875, -2.2149658203125, -2.14404296875, -2.0731201171875, -2.002197265625, -1.9312744140625, -1.8603515625, -1.7894287109375, -1.718505859375, -1.6475830078125, -1.57666015625, -1.5057373046875, -1.434814453125, -1.3638916015625, -1.29296875, -1.2220458984375, -1.151123046875, -1.0802001953125, -1.00927734375, -0.9383544921875, -0.867431640625, -0.7965087890625, -0.7255859375, -0.6546630859375, -0.583740234375, -0.5128173828125, -0.44189453125, -0.3709716796875, -0.300048828125, -0.2291259765625, -0.158203125, -0.0872802734375, -0.016357421875, 0.0545654296875, 0.12548828125, 0.1964111328125, 0.267333984375, 0.3382568359375, 0.4091796875, 0.4801025390625, 0.551025390625, 0.6219482421875, 0.69287109375, 0.7637939453125, 0.834716796875, 0.9056396484375, 0.9765625, 1.0474853515625, 1.118408203125, 1.1893310546875, 1.26025390625, 1.3311767578125, 1.402099609375, 1.4730224609375, 1.5439453125, 1.6148681640625, 1.685791015625, 1.7567138671875, 1.82763671875, 1.8985595703125, 1.969482421875, 2.0404052734375, 2.111328125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 8.0, 16.0, 15.0, 13.0, 26.0, 30.0, 33.0, 38.0, 54.0, 57.0, 60.0, 53.0, 73.0, 81.0, 51.0, 69.0, 59.0, 45.0, 31.0, 31.0, 29.0, 29.0, 24.0, 13.0, 11.0, 6.0, 10.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.687433242797852, -11.270742416381836, -10.85405158996582, -10.437360763549805, -10.020670890808105, -9.60398006439209, -9.187289237976074, -8.770598411560059, -8.35390853881836, -7.937217712402344, -7.520527362823486, -7.103836536407471, -6.687146186828613, -6.270455360412598, -5.853764533996582, -5.437073707580566, -5.020382881164551, -4.603692054748535, -4.187001705169678, -3.770310878753662, -3.3536202907562256, -2.936929702758789, -2.5202388763427734, -2.103548288345337, -1.6868577003479004, -1.2701671123504639, -0.8534764051437378, -0.4367856979370117, -0.020095109939575195, 0.39659547805786133, 0.813286304473877, 1.2299768924713135, 1.6466665267944336, 2.06335711479187, 2.4800477027893066, 2.8967385292053223, 3.313429117202759, 3.7301197052001953, 4.146810531616211, 4.563501358032227, 4.980191707611084, 5.3968825340271, 5.813572883605957, 6.230263710021973, 6.646954536437988, 7.063644886016846, 7.480335712432861, 7.897026062011719, 8.313716888427734, 8.73040771484375, 9.147098541259766, 9.563789367675781, 9.98047924041748, 10.397170066833496, 10.813860893249512, 11.230551719665527, 11.647241592407227, 12.063932418823242, 12.480623245239258, 12.897314071655273, 13.314003944396973, 13.730694770812988, 14.147385597229004, 14.56407642364502, 14.980767250061035]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 10.0, 6.0, 8.0, 8.0, 8.0, 9.0, 11.0, 20.0, 20.0, 21.0, 18.0, 17.0, 29.0, 28.0, 27.0, 34.0, 36.0, 26.0, 25.0, 48.0, 33.0, 39.0, 40.0, 45.0, 37.0, 47.0, 35.0, 49.0, 35.0, 41.0, 22.0, 28.0, 27.0, 19.0, 15.0, 15.0, 9.0, 9.0, 8.0, 4.0, 5.0, 6.0, 4.0, 2.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.270035743713379, -12.80976390838623, -12.349493026733398, -11.88922119140625, -11.428949356079102, -10.96867847442627, -10.508406639099121, -10.048135757446289, -9.58786392211914, -9.127592086791992, -8.66732120513916, -8.207049369812012, -7.7467780113220215, -7.286506652832031, -6.826234817504883, -6.365963459014893, -5.905692100524902, -5.445420742034912, -4.985149383544922, -4.524877548217773, -4.064606189727783, -3.604334831237793, -3.1440632343292236, -2.6837916374206543, -2.223520278930664, -1.7632488012313843, -1.3029773235321045, -0.8427058458328247, -0.3824343681335449, 0.07783699035644531, 0.5381085872650146, 0.998380184173584, 1.4586505889892578, 1.9189220666885376, 2.3791935443878174, 2.8394651412963867, 3.299736499786377, 3.760007858276367, 4.220279693603516, 4.680551052093506, 5.140822410583496, 5.601093769073486, 6.061365127563477, 6.521636962890625, 6.981908321380615, 7.4421796798706055, 7.902451515197754, 8.362722396850586, 8.822994232177734, 9.283266067504883, 9.743536949157715, 10.203808784484863, 10.664079666137695, 11.124351501464844, 11.584623336791992, 12.04489517211914, 12.505166053771973, 12.965437889099121, 13.425708770751953, 13.885980606079102, 14.34625244140625, 14.806523323059082, 15.26679515838623, 15.727066040039062, 16.18733787536621]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 11.0, 15.0, 23.0, 34.0, 64.0, 98.0, 145.0, 276.0, 417.0, 660.0, 1135.0, 1927.0, 3145.0, 5392.0, 9103.0, 16168.0, 28773.0, 53293.0, 97339.0, 181516.0, 339502.0, 597556.0, 857951.0, 819443.0, 535898.0, 297737.0, 157887.0, 83841.0, 45313.0, 25183.0, 14037.0, 8163.0, 4729.0, 2847.0, 1712.0, 1110.0, 663.0, 417.0, 266.0, 173.0, 105.0, 66.0, 45.0, 26.0, 21.0, 18.0, 18.0, 5.0, 6.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.171875, -10.7982177734375, -10.424560546875, -10.0509033203125, -9.67724609375, -9.3035888671875, -8.929931640625, -8.5562744140625, -8.1826171875, -7.8089599609375, -7.435302734375, -7.0616455078125, -6.68798828125, -6.3143310546875, -5.940673828125, -5.5670166015625, -5.193359375, -4.8197021484375, -4.446044921875, -4.0723876953125, -3.69873046875, -3.3250732421875, -2.951416015625, -2.5777587890625, -2.2041015625, -1.8304443359375, -1.456787109375, -1.0831298828125, -0.70947265625, -0.3358154296875, 0.037841796875, 0.4114990234375, 0.78515625, 1.1588134765625, 1.532470703125, 1.9061279296875, 2.27978515625, 2.6534423828125, 3.027099609375, 3.4007568359375, 3.7744140625, 4.1480712890625, 4.521728515625, 4.8953857421875, 5.26904296875, 5.6427001953125, 6.016357421875, 6.3900146484375, 6.763671875, 7.1373291015625, 7.510986328125, 7.8846435546875, 8.25830078125, 8.6319580078125, 9.005615234375, 9.3792724609375, 9.7529296875, 10.1265869140625, 10.500244140625, 10.8739013671875, 11.24755859375, 11.6212158203125, 11.994873046875, 12.3685302734375, 12.7421875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 3.0, 7.0, 6.0, 4.0, 9.0, 8.0, 12.0, 6.0, 15.0, 15.0, 17.0, 10.0, 15.0, 22.0, 16.0, 30.0, 26.0, 19.0, 39.0, 24.0, 30.0, 36.0, 32.0, 33.0, 39.0, 40.0, 36.0, 42.0, 30.0, 37.0, 38.0, 44.0, 30.0, 32.0, 25.0, 31.0, 24.0, 17.0, 19.0, 14.0, 12.0, 12.0, 4.0, 6.0, 3.0, 9.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.953125, -7.674072265625, -7.39501953125, -7.115966796875, -6.8369140625, -6.557861328125, -6.27880859375, -5.999755859375, -5.720703125, -5.441650390625, -5.16259765625, -4.883544921875, -4.6044921875, -4.325439453125, -4.04638671875, -3.767333984375, -3.48828125, -3.209228515625, -2.93017578125, -2.651123046875, -2.3720703125, -2.093017578125, -1.81396484375, -1.534912109375, -1.255859375, -0.976806640625, -0.69775390625, -0.418701171875, -0.1396484375, 0.139404296875, 0.41845703125, 0.697509765625, 0.9765625, 1.255615234375, 1.53466796875, 1.813720703125, 2.0927734375, 2.371826171875, 2.65087890625, 2.929931640625, 3.208984375, 3.488037109375, 3.76708984375, 4.046142578125, 4.3251953125, 4.604248046875, 4.88330078125, 5.162353515625, 5.44140625, 5.720458984375, 5.99951171875, 6.278564453125, 6.5576171875, 6.836669921875, 7.11572265625, 7.394775390625, 7.673828125, 7.952880859375, 8.23193359375, 8.510986328125, 8.7900390625, 9.069091796875, 9.34814453125, 9.627197265625, 9.90625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 8.0, 15.0, 31.0, 29.0, 30.0, 70.0, 118.0, 161.0, 251.0, 393.0, 583.0, 907.0, 1494.0, 2379.0, 3746.0, 6345.0, 10143.0, 16589.0, 27843.0, 46364.0, 77842.0, 130891.0, 217215.0, 347154.0, 510283.0, 646134.0, 655911.0, 534722.0, 368108.0, 235580.0, 141508.0, 84723.0, 50026.0, 29970.0, 18087.0, 10966.0, 6700.0, 4172.0, 2498.0, 1597.0, 983.0, 631.0, 390.0, 264.0, 144.0, 107.0, 69.0, 53.0, 28.0, 17.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-9.0078125, -8.7354736328125, -8.463134765625, -8.1907958984375, -7.91845703125, -7.6461181640625, -7.373779296875, -7.1014404296875, -6.8291015625, -6.5567626953125, -6.284423828125, -6.0120849609375, -5.73974609375, -5.4674072265625, -5.195068359375, -4.9227294921875, -4.650390625, -4.3780517578125, -4.105712890625, -3.8333740234375, -3.56103515625, -3.2886962890625, -3.016357421875, -2.7440185546875, -2.4716796875, -2.1993408203125, -1.927001953125, -1.6546630859375, -1.38232421875, -1.1099853515625, -0.837646484375, -0.5653076171875, -0.29296875, -0.0206298828125, 0.251708984375, 0.5240478515625, 0.79638671875, 1.0687255859375, 1.341064453125, 1.6134033203125, 1.8857421875, 2.1580810546875, 2.430419921875, 2.7027587890625, 2.97509765625, 3.2474365234375, 3.519775390625, 3.7921142578125, 4.064453125, 4.3367919921875, 4.609130859375, 4.8814697265625, 5.15380859375, 5.4261474609375, 5.698486328125, 5.9708251953125, 6.2431640625, 6.5155029296875, 6.787841796875, 7.0601806640625, 7.33251953125, 7.6048583984375, 7.877197265625, 8.1495361328125, 8.421875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 1.0, 4.0, 6.0, 11.0, 10.0, 8.0, 16.0, 19.0, 20.0, 41.0, 44.0, 54.0, 53.0, 78.0, 95.0, 103.0, 124.0, 143.0, 151.0, 166.0, 186.0, 177.0, 220.0, 196.0, 197.0, 202.0, 190.0, 192.0, 185.0, 170.0, 169.0, 127.0, 121.0, 100.0, 107.0, 83.0, 60.0, 46.0, 43.0, 37.0, 21.0, 25.0, 23.0, 19.0, 9.0, 9.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.34765625, -4.20654296875, -4.0654296875, -3.92431640625, -3.783203125, -3.64208984375, -3.5009765625, -3.35986328125, -3.21875, -3.07763671875, -2.9365234375, -2.79541015625, -2.654296875, -2.51318359375, -2.3720703125, -2.23095703125, -2.08984375, -1.94873046875, -1.8076171875, -1.66650390625, -1.525390625, -1.38427734375, -1.2431640625, -1.10205078125, -0.9609375, -0.81982421875, -0.6787109375, -0.53759765625, -0.396484375, -0.25537109375, -0.1142578125, 0.02685546875, 0.16796875, 0.30908203125, 0.4501953125, 0.59130859375, 0.732421875, 0.87353515625, 1.0146484375, 1.15576171875, 1.296875, 1.43798828125, 1.5791015625, 1.72021484375, 1.861328125, 2.00244140625, 2.1435546875, 2.28466796875, 2.42578125, 2.56689453125, 2.7080078125, 2.84912109375, 2.990234375, 3.13134765625, 3.2724609375, 3.41357421875, 3.5546875, 3.69580078125, 3.8369140625, 3.97802734375, 4.119140625, 4.26025390625, 4.4013671875, 4.54248046875, 4.68359375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 6.0, 2.0, 8.0, 5.0, 6.0, 12.0, 24.0, 18.0, 23.0, 26.0, 31.0, 49.0, 47.0, 50.0, 59.0, 62.0, 67.0, 71.0, 60.0, 54.0, 60.0, 42.0, 40.0, 37.0, 21.0, 23.0, 23.0, 12.0, 14.0, 11.0, 6.0, 6.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.399839401245117, -9.041983604431152, -8.684126853942871, -8.326271057128906, -7.968414783477783, -7.61055850982666, -7.252702713012695, -6.894846439361572, -6.536990165710449, -6.179133892059326, -5.821277618408203, -5.463421821594238, -5.105565547943115, -4.747709274291992, -4.389853477478027, -4.031997203826904, -3.6741409301757812, -3.316284656524658, -2.9584286212921143, -2.6005725860595703, -2.2427163124084473, -1.8848601579666138, -1.5270040035247803, -1.1691479682922363, -0.8112916946411133, -0.4534355401992798, -0.09557938575744629, 0.2622767686843872, 0.6201329231262207, 0.9779890775680542, 1.3358452320098877, 1.6937012672424316, 2.051558494567871, 2.409414768218994, 2.767270803451538, 3.125126838684082, 3.482983112335205, 3.840839385986328, 4.198695182800293, 4.556551456451416, 4.914407730102539, 5.272264003753662, 5.630120277404785, 5.98797607421875, 6.345832347869873, 6.703688621520996, 7.061544418334961, 7.419400691986084, 7.777256965637207, 8.135112762451172, 8.492969512939453, 8.850825309753418, 9.208681106567383, 9.566537857055664, 9.924393653869629, 10.282249450683594, 10.640106201171875, 10.99796199798584, 11.355818748474121, 11.713674545288086, 12.071531295776367, 12.429387092590332, 12.787242889404297, 13.145099639892578, 13.502955436706543]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 6.0, 5.0, 8.0, 18.0, 17.0, 22.0, 13.0, 20.0, 23.0, 21.0, 30.0, 27.0, 40.0, 23.0, 20.0, 37.0, 45.0, 34.0, 42.0, 52.0, 36.0, 44.0, 57.0, 34.0, 41.0, 35.0, 35.0, 32.0, 25.0, 15.0, 31.0, 14.0, 16.0, 13.0, 8.0, 10.0, 8.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.265180587768555, -11.859153747558594, -11.453126907348633, -11.047100067138672, -10.641073226928711, -10.23504638671875, -9.829018592834473, -9.422991752624512, -9.01696491241455, -8.61093807220459, -8.204911231994629, -7.79888391494751, -7.392857074737549, -6.986830234527588, -6.580802917480469, -6.174776077270508, -5.768749237060547, -5.362722396850586, -4.956695556640625, -4.550668239593506, -4.144641399383545, -3.738614559173584, -3.332587480545044, -2.926560401916504, -2.520533561706543, -2.114506721496582, -1.708479642868042, -1.3024526834487915, -0.896425724029541, -0.4903988838195801, -0.08437180519104004, 0.3216552734375, 0.7276830673217773, 1.1337100267410278, 1.5397369861602783, 1.9457639455795288, 2.3517909049987793, 2.7578177452087402, 3.1638448238372803, 3.5698719024658203, 3.9758987426757812, 4.381925582885742, 4.787952423095703, 5.193979740142822, 5.600006580352783, 6.006033420562744, 6.412060737609863, 6.818087577819824, 7.224114418029785, 7.630141258239746, 8.036168098449707, 8.442194938659668, 8.848222732543945, 9.254249572753906, 9.660276412963867, 10.066303253173828, 10.472330093383789, 10.87835693359375, 11.284383773803711, 11.690410614013672, 12.096437454223633, 12.502464294433594, 12.908492088317871, 13.314518928527832, 13.720545768737793]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 7.0, 7.0, 8.0, 18.0, 17.0, 26.0, 32.0, 33.0, 57.0, 71.0, 103.0, 108.0, 141.0, 188.0, 229.0, 306.0, 402.0, 570.0, 830.0, 1386.0, 2784.0, 7077.0, 22855.0, 90310.0, 406937.0, 391823.0, 85966.0, 21876.0, 6992.0, 2878.0, 1427.0, 807.0, 546.0, 413.0, 334.0, 201.0, 168.0, 130.0, 119.0, 100.0, 65.0, 56.0, 37.0, 30.0, 24.0, 19.0, 9.0, 5.0, 10.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-6.5390625, -6.3408203125, -6.142578125, -5.9443359375, -5.74609375, -5.5478515625, -5.349609375, -5.1513671875, -4.953125, -4.7548828125, -4.556640625, -4.3583984375, -4.16015625, -3.9619140625, -3.763671875, -3.5654296875, -3.3671875, -3.1689453125, -2.970703125, -2.7724609375, -2.57421875, -2.3759765625, -2.177734375, -1.9794921875, -1.78125, -1.5830078125, -1.384765625, -1.1865234375, -0.98828125, -0.7900390625, -0.591796875, -0.3935546875, -0.1953125, 0.0029296875, 0.201171875, 0.3994140625, 0.59765625, 0.7958984375, 0.994140625, 1.1923828125, 1.390625, 1.5888671875, 1.787109375, 1.9853515625, 2.18359375, 2.3818359375, 2.580078125, 2.7783203125, 2.9765625, 3.1748046875, 3.373046875, 3.5712890625, 3.76953125, 3.9677734375, 4.166015625, 4.3642578125, 4.5625, 4.7607421875, 4.958984375, 5.1572265625, 5.35546875, 5.5537109375, 5.751953125, 5.9501953125, 6.1484375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 6.0, 6.0, 9.0, 11.0, 12.0, 15.0, 13.0, 15.0, 20.0, 24.0, 23.0, 27.0, 26.0, 29.0, 26.0, 32.0, 38.0, 32.0, 43.0, 41.0, 38.0, 52.0, 47.0, 38.0, 59.0, 42.0, 38.0, 28.0, 24.0, 27.0, 25.0, 29.0, 17.0, 17.0, 13.0, 15.0, 6.0, 6.0, 6.0, 10.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.3515625, -11.9339599609375, -11.516357421875, -11.0987548828125, -10.68115234375, -10.2635498046875, -9.845947265625, -9.4283447265625, -9.0107421875, -8.5931396484375, -8.175537109375, -7.7579345703125, -7.34033203125, -6.9227294921875, -6.505126953125, -6.0875244140625, -5.669921875, -5.2523193359375, -4.834716796875, -4.4171142578125, -3.99951171875, -3.5819091796875, -3.164306640625, -2.7467041015625, -2.3291015625, -1.9114990234375, -1.493896484375, -1.0762939453125, -0.65869140625, -0.2410888671875, 0.176513671875, 0.5941162109375, 1.01171875, 1.4293212890625, 1.846923828125, 2.2645263671875, 2.68212890625, 3.0997314453125, 3.517333984375, 3.9349365234375, 4.3525390625, 4.7701416015625, 5.187744140625, 5.6053466796875, 6.02294921875, 6.4405517578125, 6.858154296875, 7.2757568359375, 7.693359375, 8.1109619140625, 8.528564453125, 8.9461669921875, 9.36376953125, 9.7813720703125, 10.198974609375, 10.6165771484375, 11.0341796875, 11.4517822265625, 11.869384765625, 12.2869873046875, 12.70458984375, 13.1221923828125, 13.539794921875, 13.9573974609375, 14.375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 10.0, 15.0, 17.0, 20.0, 33.0, 44.0, 53.0, 98.0, 129.0, 161.0, 290.0, 407.0, 666.0, 1270.0, 3222.0, 12608.0, 81532.0, 577986.0, 317655.0, 40017.0, 7430.0, 2197.0, 1009.0, 556.0, 357.0, 215.0, 155.0, 124.0, 84.0, 55.0, 37.0, 23.0, 14.0, 23.0, 10.0, 8.0, 9.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.5078125, -8.26348876953125, -8.0191650390625, -7.77484130859375, -7.530517578125, -7.28619384765625, -7.0418701171875, -6.79754638671875, -6.55322265625, -6.30889892578125, -6.0645751953125, -5.82025146484375, -5.575927734375, -5.33160400390625, -5.0872802734375, -4.84295654296875, -4.5986328125, -4.35430908203125, -4.1099853515625, -3.86566162109375, -3.621337890625, -3.37701416015625, -3.1326904296875, -2.88836669921875, -2.64404296875, -2.39971923828125, -2.1553955078125, -1.91107177734375, -1.666748046875, -1.42242431640625, -1.1781005859375, -0.93377685546875, -0.689453125, -0.44512939453125, -0.2008056640625, 0.04351806640625, 0.287841796875, 0.53216552734375, 0.7764892578125, 1.02081298828125, 1.26513671875, 1.50946044921875, 1.7537841796875, 1.99810791015625, 2.242431640625, 2.48675537109375, 2.7310791015625, 2.97540283203125, 3.2197265625, 3.46405029296875, 3.7083740234375, 3.95269775390625, 4.197021484375, 4.44134521484375, 4.6856689453125, 4.92999267578125, 5.17431640625, 5.41864013671875, 5.6629638671875, 5.90728759765625, 6.151611328125, 6.39593505859375, 6.6402587890625, 6.88458251953125, 7.12890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 8.0, 9.0, 8.0, 6.0, 13.0, 16.0, 17.0, 18.0, 27.0, 30.0, 19.0, 22.0, 46.0, 38.0, 31.0, 37.0, 42.0, 46.0, 43.0, 47.0, 42.0, 45.0, 46.0, 34.0, 39.0, 38.0, 22.0, 32.0, 25.0, 33.0, 18.0, 19.0, 11.0, 13.0, 12.0, 6.0, 3.0, 9.0, 4.0, 4.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6640625, -8.3734130859375, -8.082763671875, -7.7921142578125, -7.50146484375, -7.2108154296875, -6.920166015625, -6.6295166015625, -6.3388671875, -6.0482177734375, -5.757568359375, -5.4669189453125, -5.17626953125, -4.8856201171875, -4.594970703125, -4.3043212890625, -4.013671875, -3.7230224609375, -3.432373046875, -3.1417236328125, -2.85107421875, -2.5604248046875, -2.269775390625, -1.9791259765625, -1.6884765625, -1.3978271484375, -1.107177734375, -0.8165283203125, -0.52587890625, -0.2352294921875, 0.055419921875, 0.3460693359375, 0.63671875, 0.9273681640625, 1.218017578125, 1.5086669921875, 1.79931640625, 2.0899658203125, 2.380615234375, 2.6712646484375, 2.9619140625, 3.2525634765625, 3.543212890625, 3.8338623046875, 4.12451171875, 4.4151611328125, 4.705810546875, 4.9964599609375, 5.287109375, 5.5777587890625, 5.868408203125, 6.1590576171875, 6.44970703125, 6.7403564453125, 7.031005859375, 7.3216552734375, 7.6123046875, 7.9029541015625, 8.193603515625, 8.4842529296875, 8.77490234375, 9.0655517578125, 9.356201171875, 9.6468505859375, 9.9375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 6.0, 17.0, 14.0, 27.0, 37.0, 43.0, 88.0, 102.0, 138.0, 212.0, 346.0, 492.0, 875.0, 1441.0, 2922.0, 6630.0, 19605.0, 97086.0, 688054.0, 185100.0, 28287.0, 8829.0, 3672.0, 1794.0, 1004.0, 582.0, 362.0, 259.0, 144.0, 119.0, 67.0, 41.0, 38.0, 36.0, 19.0, 16.0, 11.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8287582397460938, -0.7976531982421875, -0.7665481567382812, -0.735443115234375, -0.7043380737304688, -0.6732330322265625, -0.6421279907226562, -0.61102294921875, -0.5799179077148438, -0.5488128662109375, -0.5177078247070312, -0.486602783203125, -0.45549774169921875, -0.4243927001953125, -0.39328765869140625, -0.3621826171875, -0.33107757568359375, -0.2999725341796875, -0.26886749267578125, -0.237762451171875, -0.20665740966796875, -0.1755523681640625, -0.14444732666015625, -0.11334228515625, -0.08223724365234375, -0.0511322021484375, -0.02002716064453125, 0.011077880859375, 0.04218292236328125, 0.0732879638671875, 0.10439300537109375, 0.135498046875, 0.16660308837890625, 0.1977081298828125, 0.22881317138671875, 0.259918212890625, 0.29102325439453125, 0.3221282958984375, 0.35323333740234375, 0.38433837890625, 0.41544342041015625, 0.4465484619140625, 0.47765350341796875, 0.508758544921875, 0.5398635864257812, 0.5709686279296875, 0.6020736694335938, 0.6331787109375, 0.6642837524414062, 0.6953887939453125, 0.7264938354492188, 0.757598876953125, 0.7887039184570312, 0.8198089599609375, 0.8509140014648438, 0.88201904296875, 0.9131240844726562, 0.9442291259765625, 0.9753341674804688, 1.006439208984375, 1.0375442504882812, 1.0686492919921875, 1.0997543334960938, 1.130859375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 15.0, 18.0, 20.0, 43.0, 61.0, 93.0, 89.0, 121.0, 117.0, 110.0, 84.0, 67.0, 45.0, 30.0, 28.0, 21.0, 9.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.685754776000977e-05, -9.425915777683258e-05, -9.16607677936554e-05, -8.906237781047821e-05, -8.646398782730103e-05, -8.386559784412384e-05, -8.126720786094666e-05, -7.866881787776947e-05, -7.607042789459229e-05, -7.34720379114151e-05, -7.087364792823792e-05, -6.827525794506073e-05, -6.567686796188354e-05, -6.307847797870636e-05, -6.0480087995529175e-05, -5.788169801235199e-05, -5.5283308029174805e-05, -5.268491804599762e-05, -5.0086528062820435e-05, -4.748813807964325e-05, -4.4889748096466064e-05, -4.229135811328888e-05, -3.9692968130111694e-05, -3.709457814693451e-05, -3.4496188163757324e-05, -3.189779818058014e-05, -2.9299408197402954e-05, -2.670101821422577e-05, -2.4102628231048584e-05, -2.15042382478714e-05, -1.8905848264694214e-05, -1.630745828151703e-05, -1.3709068298339844e-05, -1.1110678315162659e-05, -8.512288331985474e-06, -5.9138983488082886e-06, -3.3155083656311035e-06, -7.171183824539185e-07, 1.8812716007232666e-06, 4.479661583900452e-06, 7.078051567077637e-06, 9.676441550254822e-06, 1.2274831533432007e-05, 1.4873221516609192e-05, 1.7471611499786377e-05, 2.0070001482963562e-05, 2.2668391466140747e-05, 2.5266781449317932e-05, 2.7865171432495117e-05, 3.0463561415672302e-05, 3.306195139884949e-05, 3.566034138202667e-05, 3.825873136520386e-05, 4.085712134838104e-05, 4.345551133155823e-05, 4.605390131473541e-05, 4.86522912979126e-05, 5.125068128108978e-05, 5.384907126426697e-05, 5.644746124744415e-05, 5.904585123062134e-05, 6.164424121379852e-05, 6.424263119697571e-05, 6.684102118015289e-05, 6.943941116333008e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 9.0, 10.0, 8.0, 11.0, 23.0, 31.0, 37.0, 59.0, 55.0, 108.0, 149.0, 196.0, 257.0, 425.0, 617.0, 898.0, 1486.0, 2344.0, 3883.0, 7189.0, 13435.0, 27239.0, 60061.0, 144313.0, 344616.0, 252086.0, 100510.0, 43101.0, 20490.0, 10421.0, 5679.0, 3179.0, 1898.0, 1184.0, 795.0, 506.0, 372.0, 258.0, 183.0, 118.0, 92.0, 66.0, 43.0, 35.0, 24.0, 15.0, 18.0, 8.0, 6.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 4.0], "bins": [-0.93994140625, -0.911285400390625, -0.88262939453125, -0.853973388671875, -0.8253173828125, -0.796661376953125, -0.76800537109375, -0.739349365234375, -0.710693359375, -0.682037353515625, -0.65338134765625, -0.624725341796875, -0.5960693359375, -0.567413330078125, -0.53875732421875, -0.510101318359375, -0.4814453125, -0.452789306640625, -0.42413330078125, -0.395477294921875, -0.3668212890625, -0.338165283203125, -0.30950927734375, -0.280853271484375, -0.252197265625, -0.223541259765625, -0.19488525390625, -0.166229248046875, -0.1375732421875, -0.108917236328125, -0.08026123046875, -0.051605224609375, -0.02294921875, 0.005706787109375, 0.03436279296875, 0.063018798828125, 0.0916748046875, 0.120330810546875, 0.14898681640625, 0.177642822265625, 0.206298828125, 0.234954833984375, 0.26361083984375, 0.292266845703125, 0.3209228515625, 0.349578857421875, 0.37823486328125, 0.406890869140625, 0.435546875, 0.464202880859375, 0.49285888671875, 0.521514892578125, 0.5501708984375, 0.578826904296875, 0.60748291015625, 0.636138916015625, 0.664794921875, 0.693450927734375, 0.72210693359375, 0.750762939453125, 0.7794189453125, 0.808074951171875, 0.83673095703125, 0.865386962890625, 0.89404296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 5.0, 5.0, 10.0, 6.0, 17.0, 12.0, 17.0, 16.0, 13.0, 24.0, 25.0, 26.0, 26.0, 33.0, 22.0, 21.0, 31.0, 42.0, 27.0, 35.0, 36.0, 34.0, 48.0, 24.0, 30.0, 32.0, 47.0, 26.0, 34.0, 40.0, 36.0, 25.0, 32.0, 19.0, 22.0, 12.0, 17.0, 7.0, 15.0, 9.0, 4.0, 4.0, 5.0, 5.0, 3.0, 8.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.30029296875, -0.291229248046875, -0.28216552734375, -0.273101806640625, -0.2640380859375, -0.254974365234375, -0.24591064453125, -0.236846923828125, -0.227783203125, -0.218719482421875, -0.20965576171875, -0.200592041015625, -0.1915283203125, -0.182464599609375, -0.17340087890625, -0.164337158203125, -0.1552734375, -0.146209716796875, -0.13714599609375, -0.128082275390625, -0.1190185546875, -0.109954833984375, -0.10089111328125, -0.091827392578125, -0.082763671875, -0.073699951171875, -0.06463623046875, -0.055572509765625, -0.0465087890625, -0.037445068359375, -0.02838134765625, -0.019317626953125, -0.01025390625, -0.001190185546875, 0.00787353515625, 0.016937255859375, 0.0260009765625, 0.035064697265625, 0.04412841796875, 0.053192138671875, 0.062255859375, 0.071319580078125, 0.08038330078125, 0.089447021484375, 0.0985107421875, 0.107574462890625, 0.11663818359375, 0.125701904296875, 0.134765625, 0.143829345703125, 0.15289306640625, 0.161956787109375, 0.1710205078125, 0.180084228515625, 0.18914794921875, 0.198211669921875, 0.207275390625, 0.216339111328125, 0.22540283203125, 0.234466552734375, 0.2435302734375, 0.252593994140625, 0.26165771484375, 0.270721435546875, 0.27978515625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 6.0, 8.0, 12.0, 15.0, 24.0, 17.0, 29.0, 35.0, 43.0, 45.0, 56.0, 56.0, 58.0, 69.0, 73.0, 66.0, 59.0, 50.0, 37.0, 40.0, 41.0, 24.0, 21.0, 23.0, 10.0, 16.0, 12.0, 6.0, 9.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.63278579711914, -8.277523040771484, -7.922260761260986, -7.566998481750488, -7.211735725402832, -6.856473445892334, -6.501211166381836, -6.14594841003418, -5.790686130523682, -5.435423851013184, -5.080161094665527, -4.724898815155029, -4.369636535644531, -4.014373779296875, -3.659111499786377, -3.3038489818573, -2.9485864639282227, -2.5933239459991455, -2.2380614280700684, -1.8827991485595703, -1.5275366306304932, -1.172274112701416, -0.817011833190918, -0.4617493152618408, -0.10648679733276367, 0.2487756609916687, 0.6040381193161011, 0.9593005180358887, 1.3145630359649658, 1.669825553894043, 2.025087833404541, 2.380350351333618, 2.7356138229370117, 3.090876340866089, 3.446138858795166, 3.801401138305664, 4.15666389465332, 4.511926174163818, 4.867188453674316, 5.222451210021973, 5.577713489532471, 5.932975769042969, 6.288238525390625, 6.643500804901123, 6.998763084411621, 7.354025840759277, 7.709288120269775, 8.064550399780273, 8.41981315612793, 8.775075912475586, 9.130337715148926, 9.485600471496582, 9.840863227844238, 10.196125030517578, 10.551387786865234, 10.90665054321289, 11.261913299560547, 11.617176055908203, 11.972437858581543, 12.3277006149292, 12.682963371276855, 13.038225173950195, 13.393487930297852, 13.748750686645508, 14.104012489318848]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 2.0, 4.0, 3.0, 8.0, 6.0, 7.0, 19.0, 15.0, 18.0, 15.0, 19.0, 23.0, 24.0, 33.0, 24.0, 28.0, 29.0, 27.0, 28.0, 43.0, 35.0, 36.0, 54.0, 32.0, 50.0, 58.0, 34.0, 37.0, 40.0, 30.0, 36.0, 26.0, 22.0, 21.0, 22.0, 17.0, 14.0, 10.0, 6.0, 12.0, 7.0, 4.0, 8.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.231788635253906, -11.830744743347168, -11.42970085144043, -11.028656005859375, -10.627612113952637, -10.226568222045898, -9.825523376464844, -9.424479484558105, -9.023435592651367, -8.622391700744629, -8.22134780883789, -7.820302963256836, -7.419259071350098, -7.018215179443359, -6.617170810699463, -6.216126441955566, -5.815082550048828, -5.41403865814209, -5.012994289398193, -4.611949920654297, -4.210906028747559, -3.809861898422241, -3.408817768096924, -3.0077736377716064, -2.606729507446289, -2.2056853771209717, -1.8046412467956543, -1.403597116470337, -1.0025529861450195, -0.6015088558197021, -0.20046472549438477, 0.20057940483093262, 0.6016244888305664, 1.0026686191558838, 1.4037127494812012, 1.8047568798065186, 2.205801010131836, 2.6068451404571533, 3.0078892707824707, 3.408933401107788, 3.8099775314331055, 4.211021423339844, 4.61206579208374, 5.013110160827637, 5.414154052734375, 5.815197944641113, 6.21624231338501, 6.617286682128906, 7.0183305740356445, 7.419374465942383, 7.820418834686279, 8.221463203430176, 8.622507095336914, 9.023550987243652, 9.42459487915039, 9.825639724731445, 10.226683616638184, 10.627727508544922, 11.028772354125977, 11.429816246032715, 11.830860137939453, 12.231904029846191, 12.63294792175293, 13.033992767333984, 13.435036659240723]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 6.0, 10.0, 19.0, 23.0, 23.0, 56.0, 68.0, 93.0, 138.0, 225.0, 304.0, 508.0, 734.0, 1216.0, 1886.0, 2889.0, 4587.0, 7366.0, 11629.0, 18232.0, 28948.0, 44167.0, 67541.0, 96018.0, 125093.0, 143494.0, 138176.0, 113388.0, 83093.0, 56814.0, 36935.0, 23377.0, 14935.0, 9590.0, 6115.0, 3873.0, 2472.0, 1597.0, 986.0, 638.0, 444.0, 306.0, 174.0, 135.0, 73.0, 44.0, 36.0, 31.0, 20.0, 7.0, 9.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-8.5703125, -8.316650390625, -8.06298828125, -7.809326171875, -7.5556640625, -7.302001953125, -7.04833984375, -6.794677734375, -6.541015625, -6.287353515625, -6.03369140625, -5.780029296875, -5.5263671875, -5.272705078125, -5.01904296875, -4.765380859375, -4.51171875, -4.258056640625, -4.00439453125, -3.750732421875, -3.4970703125, -3.243408203125, -2.98974609375, -2.736083984375, -2.482421875, -2.228759765625, -1.97509765625, -1.721435546875, -1.4677734375, -1.214111328125, -0.96044921875, -0.706787109375, -0.453125, -0.199462890625, 0.05419921875, 0.307861328125, 0.5615234375, 0.815185546875, 1.06884765625, 1.322509765625, 1.576171875, 1.829833984375, 2.08349609375, 2.337158203125, 2.5908203125, 2.844482421875, 3.09814453125, 3.351806640625, 3.60546875, 3.859130859375, 4.11279296875, 4.366455078125, 4.6201171875, 4.873779296875, 5.12744140625, 5.381103515625, 5.634765625, 5.888427734375, 6.14208984375, 6.395751953125, 6.6494140625, 6.903076171875, 7.15673828125, 7.410400390625, 7.6640625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 10.0, 6.0, 13.0, 15.0, 24.0, 14.0, 27.0, 22.0, 20.0, 37.0, 18.0, 27.0, 29.0, 38.0, 38.0, 36.0, 32.0, 43.0, 37.0, 51.0, 50.0, 40.0, 46.0, 37.0, 37.0, 40.0, 31.0, 23.0, 32.0, 17.0, 16.0, 14.0, 13.0, 8.0, 8.0, 8.0, 9.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.625, -12.220458984375, -11.81591796875, -11.411376953125, -11.0068359375, -10.602294921875, -10.19775390625, -9.793212890625, -9.388671875, -8.984130859375, -8.57958984375, -8.175048828125, -7.7705078125, -7.365966796875, -6.96142578125, -6.556884765625, -6.15234375, -5.747802734375, -5.34326171875, -4.938720703125, -4.5341796875, -4.129638671875, -3.72509765625, -3.320556640625, -2.916015625, -2.511474609375, -2.10693359375, -1.702392578125, -1.2978515625, -0.893310546875, -0.48876953125, -0.084228515625, 0.3203125, 0.724853515625, 1.12939453125, 1.533935546875, 1.9384765625, 2.343017578125, 2.74755859375, 3.152099609375, 3.556640625, 3.961181640625, 4.36572265625, 4.770263671875, 5.1748046875, 5.579345703125, 5.98388671875, 6.388427734375, 6.79296875, 7.197509765625, 7.60205078125, 8.006591796875, 8.4111328125, 8.815673828125, 9.22021484375, 9.624755859375, 10.029296875, 10.433837890625, 10.83837890625, 11.242919921875, 11.6474609375, 12.052001953125, 12.45654296875, 12.861083984375, 13.265625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 6.0, 12.0, 24.0, 45.0, 57.0, 95.0, 125.0, 204.0, 289.0, 469.0, 683.0, 1095.0, 1529.0, 2605.0, 3852.0, 6089.0, 9531.0, 14897.0, 22983.0, 35413.0, 53867.0, 78783.0, 107557.0, 132640.0, 140214.0, 126867.0, 99799.0, 71671.0, 47808.0, 31871.0, 20419.0, 13198.0, 8492.0, 5531.0, 3387.0, 2264.0, 1433.0, 939.0, 564.0, 403.0, 297.0, 180.0, 121.0, 85.0, 58.0, 38.0, 21.0, 8.0, 14.0, 4.0, 2.0, 7.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.7265625, -7.480224609375, -7.23388671875, -6.987548828125, -6.7412109375, -6.494873046875, -6.24853515625, -6.002197265625, -5.755859375, -5.509521484375, -5.26318359375, -5.016845703125, -4.7705078125, -4.524169921875, -4.27783203125, -4.031494140625, -3.78515625, -3.538818359375, -3.29248046875, -3.046142578125, -2.7998046875, -2.553466796875, -2.30712890625, -2.060791015625, -1.814453125, -1.568115234375, -1.32177734375, -1.075439453125, -0.8291015625, -0.582763671875, -0.33642578125, -0.090087890625, 0.15625, 0.402587890625, 0.64892578125, 0.895263671875, 1.1416015625, 1.387939453125, 1.63427734375, 1.880615234375, 2.126953125, 2.373291015625, 2.61962890625, 2.865966796875, 3.1123046875, 3.358642578125, 3.60498046875, 3.851318359375, 4.09765625, 4.343994140625, 4.59033203125, 4.836669921875, 5.0830078125, 5.329345703125, 5.57568359375, 5.822021484375, 6.068359375, 6.314697265625, 6.56103515625, 6.807373046875, 7.0537109375, 7.300048828125, 7.54638671875, 7.792724609375, 8.0390625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 7.0, 15.0, 15.0, 16.0, 19.0, 19.0, 16.0, 28.0, 29.0, 30.0, 25.0, 36.0, 42.0, 25.0, 29.0, 37.0, 42.0, 51.0, 43.0, 33.0, 40.0, 39.0, 41.0, 35.0, 36.0, 29.0, 26.0, 33.0, 19.0, 15.0, 13.0, 10.0, 7.0, 10.0, 8.0, 12.0, 9.0, 3.0, 7.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.59375, -7.3564453125, -7.119140625, -6.8818359375, -6.64453125, -6.4072265625, -6.169921875, -5.9326171875, -5.6953125, -5.4580078125, -5.220703125, -4.9833984375, -4.74609375, -4.5087890625, -4.271484375, -4.0341796875, -3.796875, -3.5595703125, -3.322265625, -3.0849609375, -2.84765625, -2.6103515625, -2.373046875, -2.1357421875, -1.8984375, -1.6611328125, -1.423828125, -1.1865234375, -0.94921875, -0.7119140625, -0.474609375, -0.2373046875, 0.0, 0.2373046875, 0.474609375, 0.7119140625, 0.94921875, 1.1865234375, 1.423828125, 1.6611328125, 1.8984375, 2.1357421875, 2.373046875, 2.6103515625, 2.84765625, 3.0849609375, 3.322265625, 3.5595703125, 3.796875, 4.0341796875, 4.271484375, 4.5087890625, 4.74609375, 4.9833984375, 5.220703125, 5.4580078125, 5.6953125, 5.9326171875, 6.169921875, 6.4072265625, 6.64453125, 6.8818359375, 7.119140625, 7.3564453125, 7.59375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 7.0, 10.0, 23.0, 29.0, 77.0, 95.0, 149.0, 231.0, 397.0, 655.0, 1147.0, 1936.0, 3130.0, 5657.0, 9913.0, 17990.0, 32938.0, 60274.0, 107334.0, 172108.0, 212422.0, 174888.0, 109305.0, 61413.0, 33842.0, 18382.0, 10159.0, 5856.0, 3352.0, 1974.0, 1111.0, 657.0, 400.0, 280.0, 139.0, 89.0, 49.0, 53.0, 22.0, 16.0, 16.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.38848876953125, -4.2535400390625, -4.11859130859375, -3.983642578125, -3.84869384765625, -3.7137451171875, -3.57879638671875, -3.44384765625, -3.30889892578125, -3.1739501953125, -3.03900146484375, -2.904052734375, -2.76910400390625, -2.6341552734375, -2.49920654296875, -2.3642578125, -2.22930908203125, -2.0943603515625, -1.95941162109375, -1.824462890625, -1.68951416015625, -1.5545654296875, -1.41961669921875, -1.28466796875, -1.14971923828125, -1.0147705078125, -0.87982177734375, -0.744873046875, -0.60992431640625, -0.4749755859375, -0.34002685546875, -0.205078125, -0.07012939453125, 0.0648193359375, 0.19976806640625, 0.334716796875, 0.46966552734375, 0.6046142578125, 0.73956298828125, 0.87451171875, 1.00946044921875, 1.1444091796875, 1.27935791015625, 1.414306640625, 1.54925537109375, 1.6842041015625, 1.81915283203125, 1.9541015625, 2.08905029296875, 2.2239990234375, 2.35894775390625, 2.493896484375, 2.62884521484375, 2.7637939453125, 2.89874267578125, 3.03369140625, 3.16864013671875, 3.3035888671875, 3.43853759765625, 3.573486328125, 3.70843505859375, 3.8433837890625, 3.97833251953125, 4.11328125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 12.0, 15.0, 23.0, 26.0, 38.0, 39.0, 69.0, 80.0, 53.0, 66.0, 82.0, 80.0, 80.0, 67.0, 58.0, 43.0, 40.0, 28.0, 18.0, 17.0, 14.0, 9.0, 12.0, 11.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003864765167236328, -0.00037537142634391785, -0.0003642663359642029, -0.0003531612455844879, -0.00034205615520477295, -0.000330951064825058, -0.000319845974445343, -0.00030874088406562805, -0.0002976357936859131, -0.0002865307033061981, -0.00027542561292648315, -0.0002643205225467682, -0.0002532154321670532, -0.00024211034178733826, -0.0002310052514076233, -0.00021990016102790833, -0.00020879507064819336, -0.0001976899802684784, -0.00018658488988876343, -0.00017547979950904846, -0.0001643747091293335, -0.00015326961874961853, -0.00014216452836990356, -0.0001310594379901886, -0.00011995434761047363, -0.00010884925723075867, -9.77441668510437e-05, -8.663907647132874e-05, -7.553398609161377e-05, -6.44288957118988e-05, -5.332380533218384e-05, -4.221871495246887e-05, -3.1113624572753906e-05, -2.000853419303894e-05, -8.903443813323975e-06, 2.201646566390991e-06, 1.3306736946105957e-05, 2.4411827325820923e-05, 3.551691770553589e-05, 4.6622008085250854e-05, 5.772709846496582e-05, 6.883218884468079e-05, 7.993727922439575e-05, 9.104236960411072e-05, 0.00010214745998382568, 0.00011325255036354065, 0.00012435764074325562, 0.00013546273112297058, 0.00014656782150268555, 0.0001576729118824005, 0.00016877800226211548, 0.00017988309264183044, 0.0001909881830215454, 0.00020209327340126038, 0.00021319836378097534, 0.0002243034541606903, 0.00023540854454040527, 0.00024651363492012024, 0.0002576187252998352, 0.00026872381567955017, 0.00027982890605926514, 0.0002909339964389801, 0.00030203908681869507, 0.00031314417719841003, 0.000324249267578125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 13.0, 22.0, 25.0, 50.0, 75.0, 99.0, 185.0, 291.0, 466.0, 824.0, 1402.0, 2639.0, 4826.0, 9277.0, 17496.0, 34011.0, 65324.0, 121098.0, 198400.0, 226910.0, 165558.0, 95091.0, 49806.0, 25859.0, 13240.0, 6891.0, 3751.0, 2081.0, 1129.0, 631.0, 389.0, 242.0, 157.0, 100.0, 57.0, 32.0, 27.0, 19.0, 10.0, 11.0, 4.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.76171875, -4.6142578125, -4.466796875, -4.3193359375, -4.171875, -4.0244140625, -3.876953125, -3.7294921875, -3.58203125, -3.4345703125, -3.287109375, -3.1396484375, -2.9921875, -2.8447265625, -2.697265625, -2.5498046875, -2.40234375, -2.2548828125, -2.107421875, -1.9599609375, -1.8125, -1.6650390625, -1.517578125, -1.3701171875, -1.22265625, -1.0751953125, -0.927734375, -0.7802734375, -0.6328125, -0.4853515625, -0.337890625, -0.1904296875, -0.04296875, 0.1044921875, 0.251953125, 0.3994140625, 0.546875, 0.6943359375, 0.841796875, 0.9892578125, 1.13671875, 1.2841796875, 1.431640625, 1.5791015625, 1.7265625, 1.8740234375, 2.021484375, 2.1689453125, 2.31640625, 2.4638671875, 2.611328125, 2.7587890625, 2.90625, 3.0537109375, 3.201171875, 3.3486328125, 3.49609375, 3.6435546875, 3.791015625, 3.9384765625, 4.0859375, 4.2333984375, 4.380859375, 4.5283203125, 4.67578125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 13.0, 15.0, 20.0, 23.0, 25.0, 45.0, 36.0, 47.0, 54.0, 51.0, 61.0, 71.0, 63.0, 55.0, 53.0, 56.0, 42.0, 44.0, 36.0, 43.0, 33.0, 19.0, 17.0, 13.0, 8.0, 7.0, 6.0, 5.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7109375, -1.644317626953125, -1.57769775390625, -1.511077880859375, -1.4444580078125, -1.377838134765625, -1.31121826171875, -1.244598388671875, -1.177978515625, -1.111358642578125, -1.04473876953125, -0.978118896484375, -0.9114990234375, -0.844879150390625, -0.77825927734375, -0.711639404296875, -0.64501953125, -0.578399658203125, -0.51177978515625, -0.445159912109375, -0.3785400390625, -0.311920166015625, -0.24530029296875, -0.178680419921875, -0.112060546875, -0.045440673828125, 0.02117919921875, 0.087799072265625, 0.1544189453125, 0.221038818359375, 0.28765869140625, 0.354278564453125, 0.4208984375, 0.487518310546875, 0.55413818359375, 0.620758056640625, 0.6873779296875, 0.753997802734375, 0.82061767578125, 0.887237548828125, 0.953857421875, 1.020477294921875, 1.08709716796875, 1.153717041015625, 1.2203369140625, 1.286956787109375, 1.35357666015625, 1.420196533203125, 1.48681640625, 1.553436279296875, 1.62005615234375, 1.686676025390625, 1.7532958984375, 1.819915771484375, 1.88653564453125, 1.953155517578125, 2.019775390625, 2.086395263671875, 2.15301513671875, 2.219635009765625, 2.2862548828125, 2.352874755859375, 2.41949462890625, 2.486114501953125, 2.552734375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 5.0, 4.0, 2.0, 7.0, 7.0, 9.0, 14.0, 20.0, 25.0, 37.0, 39.0, 47.0, 40.0, 49.0, 47.0, 76.0, 66.0, 76.0, 65.0, 59.0, 48.0, 45.0, 38.0, 47.0, 26.0, 20.0, 25.0, 9.0, 3.0, 8.0, 6.0, 10.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.361170768737793, -9.978911399841309, -9.59665298461914, -9.214393615722656, -8.832134246826172, -8.449875831604004, -8.06761646270752, -7.685357570648193, -7.303098678588867, -6.920839786529541, -6.538580894470215, -6.1563215255737305, -5.774062633514404, -5.391803741455078, -5.009544372558594, -4.627285480499268, -4.245026588439941, -3.8627676963806152, -3.48050856590271, -3.0982494354248047, -2.7159905433654785, -2.3337316513061523, -1.951472520828247, -1.5692133903503418, -1.1869544982910156, -0.8046954870223999, -0.4224364757537842, -0.04017746448516846, 0.34208154678344727, 0.724340558052063, 1.1065995693206787, 1.488858699798584, 1.8711166381835938, 2.25337553024292, 2.635634660720825, 3.0178937911987305, 3.4001526832580566, 3.782411575317383, 4.164670944213867, 4.546929836273193, 4.9291887283325195, 5.311447620391846, 5.693706512451172, 6.075965881347656, 6.458224773406982, 6.840483665466309, 7.222743034362793, 7.605001926422119, 7.987260818481445, 8.36952018737793, 8.751778602600098, 9.134037971496582, 9.51629638671875, 9.898555755615234, 10.280815124511719, 10.663074493408203, 11.045332908630371, 11.427592277526855, 11.809850692749023, 12.192110061645508, 12.574369430541992, 12.95662784576416, 13.338887214660645, 13.721145629882812, 14.103404998779297]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 5.0, 7.0, 6.0, 8.0, 12.0, 13.0, 14.0, 11.0, 16.0, 18.0, 19.0, 15.0, 30.0, 23.0, 24.0, 31.0, 28.0, 36.0, 31.0, 37.0, 29.0, 42.0, 35.0, 44.0, 34.0, 48.0, 34.0, 40.0, 41.0, 27.0, 31.0, 32.0, 32.0, 26.0, 15.0, 12.0, 10.0, 12.0, 18.0, 13.0, 10.0, 8.0, 2.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.329523086547852, -11.938533782958984, -11.547544479370117, -11.15655517578125, -10.765565872192383, -10.374576568603516, -9.983587265014648, -9.592597961425781, -9.201608657836914, -8.810619354248047, -8.41963005065918, -8.028640747070312, -7.637651443481445, -7.246662139892578, -6.855672836303711, -6.464683532714844, -6.073694229125977, -5.682704925537109, -5.291715621948242, -4.900726318359375, -4.509737014770508, -4.118747711181641, -3.7277584075927734, -3.3367691040039062, -2.945779800415039, -2.554790496826172, -2.1638011932373047, -1.7728118896484375, -1.3818225860595703, -0.9908332824707031, -0.5998439788818359, -0.20885467529296875, 0.18213367462158203, 0.5731229782104492, 0.9641122817993164, 1.3551015853881836, 1.7460908889770508, 2.137080192565918, 2.528069496154785, 2.9190587997436523, 3.3100481033325195, 3.7010374069213867, 4.092026710510254, 4.483016014099121, 4.874005317687988, 5.2649946212768555, 5.655983924865723, 6.04697322845459, 6.437962532043457, 6.828951835632324, 7.219941139221191, 7.610930442810059, 8.001919746398926, 8.392909049987793, 8.78389835357666, 9.174887657165527, 9.565876960754395, 9.956866264343262, 10.347855567932129, 10.738844871520996, 11.129834175109863, 11.52082347869873, 11.911812782287598, 12.302802085876465, 12.693791389465332]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 8.0, 18.0, 14.0, 26.0, 48.0, 58.0, 86.0, 133.0, 195.0, 290.0, 417.0, 615.0, 1026.0, 1535.0, 2369.0, 3714.0, 5894.0, 9728.0, 16349.0, 27867.0, 47010.0, 82185.0, 147447.0, 262952.0, 460592.0, 718089.0, 833706.0, 650658.0, 398475.0, 225930.0, 126102.0, 70658.0, 40618.0, 23432.0, 13993.0, 8488.0, 5047.0, 3012.0, 1963.0, 1270.0, 746.0, 553.0, 302.0, 233.0, 154.0, 100.0, 58.0, 37.0, 22.0, 18.0, 15.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-10.0703125, -9.7591552734375, -9.447998046875, -9.1368408203125, -8.82568359375, -8.5145263671875, -8.203369140625, -7.8922119140625, -7.5810546875, -7.2698974609375, -6.958740234375, -6.6475830078125, -6.33642578125, -6.0252685546875, -5.714111328125, -5.4029541015625, -5.091796875, -4.7806396484375, -4.469482421875, -4.1583251953125, -3.84716796875, -3.5360107421875, -3.224853515625, -2.9136962890625, -2.6025390625, -2.2913818359375, -1.980224609375, -1.6690673828125, -1.35791015625, -1.0467529296875, -0.735595703125, -0.4244384765625, -0.11328125, 0.1978759765625, 0.509033203125, 0.8201904296875, 1.13134765625, 1.4425048828125, 1.753662109375, 2.0648193359375, 2.3759765625, 2.6871337890625, 2.998291015625, 3.3094482421875, 3.62060546875, 3.9317626953125, 4.242919921875, 4.5540771484375, 4.865234375, 5.1763916015625, 5.487548828125, 5.7987060546875, 6.10986328125, 6.4210205078125, 6.732177734375, 7.0433349609375, 7.3544921875, 7.6656494140625, 7.976806640625, 8.2879638671875, 8.59912109375, 8.9102783203125, 9.221435546875, 9.5325927734375, 9.84375]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 10.0, 13.0, 11.0, 11.0, 11.0, 9.0, 15.0, 18.0, 23.0, 16.0, 25.0, 19.0, 25.0, 34.0, 30.0, 30.0, 44.0, 27.0, 33.0, 40.0, 34.0, 46.0, 37.0, 48.0, 48.0, 36.0, 43.0, 29.0, 32.0, 28.0, 35.0, 19.0, 18.0, 13.0, 15.0, 14.0, 10.0, 8.0, 5.0, 10.0, 5.0, 9.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.80078125, -7.53729248046875, -7.2738037109375, -7.01031494140625, -6.746826171875, -6.48333740234375, -6.2198486328125, -5.95635986328125, -5.69287109375, -5.42938232421875, -5.1658935546875, -4.90240478515625, -4.638916015625, -4.37542724609375, -4.1119384765625, -3.84844970703125, -3.5849609375, -3.32147216796875, -3.0579833984375, -2.79449462890625, -2.531005859375, -2.26751708984375, -2.0040283203125, -1.74053955078125, -1.47705078125, -1.21356201171875, -0.9500732421875, -0.68658447265625, -0.423095703125, -0.15960693359375, 0.1038818359375, 0.36737060546875, 0.630859375, 0.89434814453125, 1.1578369140625, 1.42132568359375, 1.684814453125, 1.94830322265625, 2.2117919921875, 2.47528076171875, 2.73876953125, 3.00225830078125, 3.2657470703125, 3.52923583984375, 3.792724609375, 4.05621337890625, 4.3197021484375, 4.58319091796875, 4.8466796875, 5.11016845703125, 5.3736572265625, 5.63714599609375, 5.900634765625, 6.16412353515625, 6.4276123046875, 6.69110107421875, 6.95458984375, 7.21807861328125, 7.4815673828125, 7.74505615234375, 8.008544921875, 8.27203369140625, 8.5355224609375, 8.79901123046875, 9.0625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 11.0, 13.0, 28.0, 43.0, 71.0, 136.0, 209.0, 319.0, 523.0, 840.0, 1312.0, 2229.0, 3738.0, 6463.0, 11534.0, 20494.0, 36441.0, 66941.0, 124056.0, 226525.0, 399071.0, 633422.0, 794969.0, 722303.0, 495037.0, 290573.0, 161169.0, 87688.0, 47288.0, 26277.0, 14611.0, 8360.0, 4555.0, 2712.0, 1637.0, 1009.0, 629.0, 399.0, 242.0, 148.0, 95.0, 71.0, 38.0, 25.0, 12.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5078125, -9.2080078125, -8.908203125, -8.6083984375, -8.30859375, -8.0087890625, -7.708984375, -7.4091796875, -7.109375, -6.8095703125, -6.509765625, -6.2099609375, -5.91015625, -5.6103515625, -5.310546875, -5.0107421875, -4.7109375, -4.4111328125, -4.111328125, -3.8115234375, -3.51171875, -3.2119140625, -2.912109375, -2.6123046875, -2.3125, -2.0126953125, -1.712890625, -1.4130859375, -1.11328125, -0.8134765625, -0.513671875, -0.2138671875, 0.0859375, 0.3857421875, 0.685546875, 0.9853515625, 1.28515625, 1.5849609375, 1.884765625, 2.1845703125, 2.484375, 2.7841796875, 3.083984375, 3.3837890625, 3.68359375, 3.9833984375, 4.283203125, 4.5830078125, 4.8828125, 5.1826171875, 5.482421875, 5.7822265625, 6.08203125, 6.3818359375, 6.681640625, 6.9814453125, 7.28125, 7.5810546875, 7.880859375, 8.1806640625, 8.48046875, 8.7802734375, 9.080078125, 9.3798828125, 9.6796875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 14.0, 3.0, 15.0, 13.0, 20.0, 14.0, 32.0, 47.0, 49.0, 66.0, 77.0, 95.0, 101.0, 135.0, 145.0, 149.0, 160.0, 192.0, 187.0, 188.0, 193.0, 213.0, 208.0, 202.0, 168.0, 200.0, 188.0, 169.0, 119.0, 126.0, 105.0, 88.0, 80.0, 55.0, 65.0, 47.0, 45.0, 18.0, 13.0, 14.0, 16.0, 8.0, 7.0, 3.0, 2.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.657958984375, -3.53076171875, -3.403564453125, -3.2763671875, -3.149169921875, -3.02197265625, -2.894775390625, -2.767578125, -2.640380859375, -2.51318359375, -2.385986328125, -2.2587890625, -2.131591796875, -2.00439453125, -1.877197265625, -1.75, -1.622802734375, -1.49560546875, -1.368408203125, -1.2412109375, -1.114013671875, -0.98681640625, -0.859619140625, -0.732421875, -0.605224609375, -0.47802734375, -0.350830078125, -0.2236328125, -0.096435546875, 0.03076171875, 0.157958984375, 0.28515625, 0.412353515625, 0.53955078125, 0.666748046875, 0.7939453125, 0.921142578125, 1.04833984375, 1.175537109375, 1.302734375, 1.429931640625, 1.55712890625, 1.684326171875, 1.8115234375, 1.938720703125, 2.06591796875, 2.193115234375, 2.3203125, 2.447509765625, 2.57470703125, 2.701904296875, 2.8291015625, 2.956298828125, 3.08349609375, 3.210693359375, 3.337890625, 3.465087890625, 3.59228515625, 3.719482421875, 3.8466796875, 3.973876953125, 4.10107421875, 4.228271484375, 4.35546875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 11.0, 10.0, 20.0, 28.0, 41.0, 57.0, 45.0, 76.0, 87.0, 102.0, 84.0, 81.0, 65.0, 61.0, 47.0, 41.0, 36.0, 28.0, 15.0, 9.0, 17.0, 6.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.310401916503906, -9.852616310119629, -9.394830703735352, -8.937044143676758, -8.47925853729248, -8.021472930908203, -7.563687324523926, -7.10590124130249, -6.648115158081055, -6.190329551696777, -5.732543468475342, -5.2747578620910645, -4.816971778869629, -4.359186172485352, -3.901400327682495, -3.4436144828796387, -2.9858288764953613, -2.528043031692505, -2.0702571868896484, -1.6124714612960815, -1.154685616493225, -0.6968998908996582, -0.23911404609680176, 0.2186717987060547, 0.6764576435089111, 1.1342434883117676, 1.592029333114624, 2.0498151779174805, 2.507600784301758, 2.9653866291046143, 3.4231724739074707, 3.880958318710327, 4.338744163513184, 4.796529769897461, 5.2543158531188965, 5.712101459503174, 6.169887542724609, 6.627673149108887, 7.085458755493164, 7.5432448387146, 8.001030921936035, 8.458816528320312, 8.91660213470459, 9.374388694763184, 9.832174301147461, 10.289959907531738, 10.747745513916016, 11.20553207397461, 11.66331672668457, 12.121102333068848, 12.578887939453125, 13.036674499511719, 13.494460105895996, 13.952245712280273, 14.41003131866455, 14.867816925048828, 15.325603485107422, 15.7833890914917, 16.241174697875977, 16.69896125793457, 17.15674591064453, 17.614532470703125, 18.07231903076172, 18.53010368347168, 18.987890243530273]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 3.0, 2.0, 8.0, 14.0, 12.0, 12.0, 19.0, 12.0, 18.0, 18.0, 24.0, 22.0, 32.0, 38.0, 31.0, 32.0, 31.0, 44.0, 36.0, 34.0, 40.0, 41.0, 37.0, 35.0, 47.0, 46.0, 41.0, 30.0, 30.0, 20.0, 24.0, 30.0, 17.0, 11.0, 17.0, 21.0, 13.0, 12.0, 11.0, 9.0, 5.0, 5.0, 8.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.766721725463867, -11.40952205657959, -11.052323341369629, -10.695123672485352, -10.337924003601074, -9.980725288391113, -9.623525619506836, -9.266326904296875, -8.909127235412598, -8.55192756652832, -8.19472885131836, -7.837529182434082, -7.480329990386963, -7.123130798339844, -6.765931129455566, -6.408731937408447, -6.05153226852417, -5.694333076477051, -5.337133407592773, -4.979934215545654, -4.622735023498535, -4.265535354614258, -3.9083361625671387, -3.5511369705200195, -3.1939375400543213, -2.836738109588623, -2.479538917541504, -2.1223394870758057, -1.765140175819397, -1.4079408645629883, -1.05074143409729, -0.6935422420501709, -0.33634281158447266, 0.020856529474258423, 0.3780558705329895, 0.735255241394043, 1.0924545526504517, 1.4496538639068604, 1.8068532943725586, 2.1640524864196777, 2.521251916885376, 2.878451347351074, 3.2356505393981934, 3.5928499698638916, 3.95004940032959, 4.307248592376709, 4.664447784423828, 5.0216474533081055, 5.378846645355225, 5.736045837402344, 6.093245506286621, 6.45044469833374, 6.807643890380859, 7.164843559265137, 7.522042751312256, 7.879241943359375, 8.236441612243652, 8.59364128112793, 8.95083999633789, 9.308039665222168, 9.665239334106445, 10.022438049316406, 10.379637718200684, 10.736837387084961, 11.094036102294922]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 9.0, 18.0, 17.0, 36.0, 56.0, 66.0, 102.0, 160.0, 222.0, 345.0, 508.0, 811.0, 1143.0, 1731.0, 2536.0, 3734.0, 5616.0, 8383.0, 12688.0, 19149.0, 29294.0, 45959.0, 72357.0, 116216.0, 171552.0, 184490.0, 134654.0, 84713.0, 52792.0, 33821.0, 22014.0, 14277.0, 9374.0, 6351.0, 4358.0, 2989.0, 1990.0, 1349.0, 882.0, 607.0, 389.0, 304.0, 170.0, 93.0, 82.0, 53.0, 29.0, 23.0, 16.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0], "bins": [-1.6201171875, -1.57269287109375, -1.5252685546875, -1.47784423828125, -1.430419921875, -1.38299560546875, -1.3355712890625, -1.28814697265625, -1.24072265625, -1.19329833984375, -1.1458740234375, -1.09844970703125, -1.051025390625, -1.00360107421875, -0.9561767578125, -0.90875244140625, -0.861328125, -0.81390380859375, -0.7664794921875, -0.71905517578125, -0.671630859375, -0.62420654296875, -0.5767822265625, -0.52935791015625, -0.48193359375, -0.43450927734375, -0.3870849609375, -0.33966064453125, -0.292236328125, -0.24481201171875, -0.1973876953125, -0.14996337890625, -0.1025390625, -0.05511474609375, -0.0076904296875, 0.03973388671875, 0.087158203125, 0.13458251953125, 0.1820068359375, 0.22943115234375, 0.27685546875, 0.32427978515625, 0.3717041015625, 0.41912841796875, 0.466552734375, 0.51397705078125, 0.5614013671875, 0.60882568359375, 0.65625, 0.70367431640625, 0.7510986328125, 0.79852294921875, 0.845947265625, 0.89337158203125, 0.9407958984375, 0.98822021484375, 1.03564453125, 1.08306884765625, 1.1304931640625, 1.17791748046875, 1.225341796875, 1.27276611328125, 1.3201904296875, 1.36761474609375, 1.4150390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 7.0, 10.0, 12.0, 11.0, 17.0, 17.0, 13.0, 17.0, 23.0, 25.0, 28.0, 34.0, 38.0, 30.0, 39.0, 43.0, 46.0, 36.0, 45.0, 51.0, 35.0, 43.0, 52.0, 29.0, 32.0, 37.0, 33.0, 26.0, 24.0, 19.0, 27.0, 13.0, 21.0, 14.0, 13.0, 7.0, 11.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.03125, -12.646240234375, -12.26123046875, -11.876220703125, -11.4912109375, -11.106201171875, -10.72119140625, -10.336181640625, -9.951171875, -9.566162109375, -9.18115234375, -8.796142578125, -8.4111328125, -8.026123046875, -7.64111328125, -7.256103515625, -6.87109375, -6.486083984375, -6.10107421875, -5.716064453125, -5.3310546875, -4.946044921875, -4.56103515625, -4.176025390625, -3.791015625, -3.406005859375, -3.02099609375, -2.635986328125, -2.2509765625, -1.865966796875, -1.48095703125, -1.095947265625, -0.7109375, -0.325927734375, 0.05908203125, 0.444091796875, 0.8291015625, 1.214111328125, 1.59912109375, 1.984130859375, 2.369140625, 2.754150390625, 3.13916015625, 3.524169921875, 3.9091796875, 4.294189453125, 4.67919921875, 5.064208984375, 5.44921875, 5.834228515625, 6.21923828125, 6.604248046875, 6.9892578125, 7.374267578125, 7.75927734375, 8.144287109375, 8.529296875, 8.914306640625, 9.29931640625, 9.684326171875, 10.0693359375, 10.454345703125, 10.83935546875, 11.224365234375, 11.609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 13.0, 13.0, 32.0, 54.0, 56.0, 108.0, 140.0, 238.0, 427.0, 723.0, 1181.0, 2127.0, 3831.0, 6613.0, 12044.0, 21830.0, 40025.0, 73983.0, 134218.0, 230773.0, 227582.0, 132060.0, 72656.0, 39609.0, 21275.0, 11814.0, 6470.0, 3613.0, 2034.0, 1205.0, 670.0, 426.0, 240.0, 160.0, 98.0, 65.0, 58.0, 28.0, 23.0, 17.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.893951416015625, -1.83282470703125, -1.771697998046875, -1.7105712890625, -1.649444580078125, -1.58831787109375, -1.527191162109375, -1.466064453125, -1.404937744140625, -1.34381103515625, -1.282684326171875, -1.2215576171875, -1.160430908203125, -1.09930419921875, -1.038177490234375, -0.97705078125, -0.915924072265625, -0.85479736328125, -0.793670654296875, -0.7325439453125, -0.671417236328125, -0.61029052734375, -0.549163818359375, -0.488037109375, -0.426910400390625, -0.36578369140625, -0.304656982421875, -0.2435302734375, -0.182403564453125, -0.12127685546875, -0.060150146484375, 0.0009765625, 0.062103271484375, 0.12322998046875, 0.184356689453125, 0.2454833984375, 0.306610107421875, 0.36773681640625, 0.428863525390625, 0.489990234375, 0.551116943359375, 0.61224365234375, 0.673370361328125, 0.7344970703125, 0.795623779296875, 0.85675048828125, 0.917877197265625, 0.97900390625, 1.040130615234375, 1.10125732421875, 1.162384033203125, 1.2235107421875, 1.284637451171875, 1.34576416015625, 1.406890869140625, 1.468017578125, 1.529144287109375, 1.59027099609375, 1.651397705078125, 1.7125244140625, 1.773651123046875, 1.83477783203125, 1.895904541015625, 1.95703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 1.0, 5.0, 6.0, 1.0, 8.0, 5.0, 11.0, 17.0, 12.0, 10.0, 16.0, 20.0, 25.0, 33.0, 25.0, 33.0, 29.0, 39.0, 44.0, 44.0, 35.0, 32.0, 49.0, 50.0, 40.0, 38.0, 44.0, 38.0, 43.0, 46.0, 27.0, 31.0, 19.0, 17.0, 21.0, 19.0, 11.0, 18.0, 11.0, 8.0, 3.0, 6.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.1484375, -8.889404296875, -8.63037109375, -8.371337890625, -8.1123046875, -7.853271484375, -7.59423828125, -7.335205078125, -7.076171875, -6.817138671875, -6.55810546875, -6.299072265625, -6.0400390625, -5.781005859375, -5.52197265625, -5.262939453125, -5.00390625, -4.744873046875, -4.48583984375, -4.226806640625, -3.9677734375, -3.708740234375, -3.44970703125, -3.190673828125, -2.931640625, -2.672607421875, -2.41357421875, -2.154541015625, -1.8955078125, -1.636474609375, -1.37744140625, -1.118408203125, -0.859375, -0.600341796875, -0.34130859375, -0.082275390625, 0.1767578125, 0.435791015625, 0.69482421875, 0.953857421875, 1.212890625, 1.471923828125, 1.73095703125, 1.989990234375, 2.2490234375, 2.508056640625, 2.76708984375, 3.026123046875, 3.28515625, 3.544189453125, 3.80322265625, 4.062255859375, 4.3212890625, 4.580322265625, 4.83935546875, 5.098388671875, 5.357421875, 5.616455078125, 5.87548828125, 6.134521484375, 6.3935546875, 6.652587890625, 6.91162109375, 7.170654296875, 7.4296875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 3.0, 9.0, 7.0, 6.0, 19.0, 28.0, 30.0, 38.0, 57.0, 78.0, 113.0, 170.0, 220.0, 370.0, 517.0, 793.0, 1394.0, 2238.0, 4271.0, 8518.0, 18434.0, 45862.0, 132811.0, 387196.0, 289784.0, 92189.0, 33767.0, 14279.0, 6676.0, 3432.0, 1963.0, 1121.0, 668.0, 474.0, 314.0, 203.0, 151.0, 112.0, 56.0, 51.0, 44.0, 24.0, 13.0, 17.0, 8.0, 13.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.330322265625, -0.3202629089355469, -0.31020355224609375, -0.3001441955566406, -0.2900848388671875, -0.2800254821777344, -0.26996612548828125, -0.2599067687988281, -0.249847412109375, -0.23978805541992188, -0.22972869873046875, -0.21966934204101562, -0.2096099853515625, -0.19955062866210938, -0.18949127197265625, -0.17943191528320312, -0.16937255859375, -0.15931320190429688, -0.14925384521484375, -0.13919448852539062, -0.1291351318359375, -0.11907577514648438, -0.10901641845703125, -0.09895706176757812, -0.088897705078125, -0.07883834838867188, -0.06877899169921875, -0.058719635009765625, -0.0486602783203125, -0.038600921630859375, -0.02854156494140625, -0.018482208251953125, -0.0084228515625, 0.001636505126953125, 0.01169586181640625, 0.021755218505859375, 0.0318145751953125, 0.041873931884765625, 0.05193328857421875, 0.061992645263671875, 0.072052001953125, 0.08211135864257812, 0.09217071533203125, 0.10223007202148438, 0.1122894287109375, 0.12234878540039062, 0.13240814208984375, 0.14246749877929688, 0.15252685546875, 0.16258621215820312, 0.17264556884765625, 0.18270492553710938, 0.1927642822265625, 0.20282363891601562, 0.21288299560546875, 0.22294235229492188, 0.233001708984375, 0.24306106567382812, 0.25312042236328125, 0.2631797790527344, 0.2732391357421875, 0.2832984924316406, 0.29335784912109375, 0.3034172058105469, 0.3134765625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 6.0, 2.0, 4.0, 6.0, 14.0, 15.0, 12.0, 11.0, 20.0, 22.0, 20.0, 33.0, 26.0, 26.0, 24.0, 30.0, 44.0, 47.0, 44.0, 39.0, 45.0, 44.0, 47.0, 42.0, 49.0, 45.0, 43.0, 34.0, 27.0, 21.0, 27.0, 21.0, 11.0, 16.0, 15.0, 18.0, 12.0, 8.0, 7.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.110004425048828e-05, -2.0460225641727448e-05, -1.9820407032966614e-05, -1.918058842420578e-05, -1.8540769815444946e-05, -1.7900951206684113e-05, -1.726113259792328e-05, -1.6621313989162445e-05, -1.598149538040161e-05, -1.5341676771640778e-05, -1.4701858162879944e-05, -1.406203955411911e-05, -1.3422220945358276e-05, -1.2782402336597443e-05, -1.2142583727836609e-05, -1.1502765119075775e-05, -1.0862946510314941e-05, -1.0223127901554108e-05, -9.583309292793274e-06, -8.94349068403244e-06, -8.303672075271606e-06, -7.663853466510773e-06, -7.024034857749939e-06, -6.384216248989105e-06, -5.7443976402282715e-06, -5.104579031467438e-06, -4.464760422706604e-06, -3.82494181394577e-06, -3.1851232051849365e-06, -2.5453045964241028e-06, -1.905485987663269e-06, -1.2656673789024353e-06, -6.258487701416016e-07, 1.3969838619232178e-08, 6.537884473800659e-07, 1.2936070561408997e-06, 1.9334256649017334e-06, 2.573244273662567e-06, 3.213062882423401e-06, 3.852881491184235e-06, 4.492700099945068e-06, 5.132518708705902e-06, 5.772337317466736e-06, 6.41215592622757e-06, 7.051974534988403e-06, 7.691793143749237e-06, 8.33161175251007e-06, 8.971430361270905e-06, 9.611248970031738e-06, 1.0251067578792572e-05, 1.0890886187553406e-05, 1.153070479631424e-05, 1.2170523405075073e-05, 1.2810342013835907e-05, 1.345016062259674e-05, 1.4089979231357574e-05, 1.4729797840118408e-05, 1.5369616448879242e-05, 1.6009435057640076e-05, 1.664925366640091e-05, 1.7289072275161743e-05, 1.7928890883922577e-05, 1.856870949268341e-05, 1.9208528101444244e-05, 1.9848346710205078e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 17.0, 17.0, 46.0, 52.0, 94.0, 145.0, 202.0, 306.0, 466.0, 627.0, 999.0, 1542.0, 2332.0, 3569.0, 5399.0, 8677.0, 13366.0, 20688.0, 32687.0, 51918.0, 82220.0, 131065.0, 199576.0, 180760.0, 113973.0, 71357.0, 45921.0, 28742.0, 18429.0, 11573.0, 7557.0, 4980.0, 3149.0, 2106.0, 1348.0, 897.0, 632.0, 377.0, 236.0, 179.0, 111.0, 80.0, 53.0, 25.0, 27.0, 10.0, 9.0, 10.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30712890625, -0.29648590087890625, -0.2858428955078125, -0.27519989013671875, -0.264556884765625, -0.25391387939453125, -0.2432708740234375, -0.23262786865234375, -0.22198486328125, -0.21134185791015625, -0.2006988525390625, -0.19005584716796875, -0.179412841796875, -0.16876983642578125, -0.1581268310546875, -0.14748382568359375, -0.1368408203125, -0.12619781494140625, -0.1155548095703125, -0.10491180419921875, -0.094268798828125, -0.08362579345703125, -0.0729827880859375, -0.06233978271484375, -0.05169677734375, -0.04105377197265625, -0.0304107666015625, -0.01976776123046875, -0.009124755859375, 0.00151824951171875, 0.0121612548828125, 0.02280426025390625, 0.033447265625, 0.04409027099609375, 0.0547332763671875, 0.06537628173828125, 0.076019287109375, 0.08666229248046875, 0.0973052978515625, 0.10794830322265625, 0.11859130859375, 0.12923431396484375, 0.1398773193359375, 0.15052032470703125, 0.161163330078125, 0.17180633544921875, 0.1824493408203125, 0.19309234619140625, 0.2037353515625, 0.21437835693359375, 0.2250213623046875, 0.23566436767578125, 0.246307373046875, 0.25695037841796875, 0.2675933837890625, 0.27823638916015625, 0.28887939453125, 0.29952239990234375, 0.3101654052734375, 0.32080841064453125, 0.331451416015625, 0.34209442138671875, 0.3527374267578125, 0.36338043212890625, 0.3740234375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 6.0, 12.0, 11.0, 9.0, 9.0, 14.0, 11.0, 22.0, 12.0, 22.0, 18.0, 21.0, 23.0, 27.0, 22.0, 39.0, 33.0, 31.0, 37.0, 47.0, 38.0, 45.0, 40.0, 42.0, 43.0, 46.0, 43.0, 30.0, 34.0, 31.0, 17.0, 21.0, 17.0, 23.0, 12.0, 14.0, 14.0, 12.0, 6.0, 9.0, 8.0, 7.0, 1.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.20458984375, -0.19793319702148438, -0.19127655029296875, -0.18461990356445312, -0.1779632568359375, -0.17130661010742188, -0.16464996337890625, -0.15799331665039062, -0.151336669921875, -0.14468002319335938, -0.13802337646484375, -0.13136672973632812, -0.1247100830078125, -0.11805343627929688, -0.11139678955078125, -0.10474014282226562, -0.09808349609375, -0.09142684936523438, -0.08477020263671875, -0.07811355590820312, -0.0714569091796875, -0.06480026245117188, -0.05814361572265625, -0.051486968994140625, -0.044830322265625, -0.038173675537109375, -0.03151702880859375, -0.024860382080078125, -0.0182037353515625, -0.011547088623046875, -0.00489044189453125, 0.001766204833984375, 0.0084228515625, 0.015079498291015625, 0.02173614501953125, 0.028392791748046875, 0.0350494384765625, 0.041706085205078125, 0.04836273193359375, 0.055019378662109375, 0.061676025390625, 0.06833267211914062, 0.07498931884765625, 0.08164596557617188, 0.0883026123046875, 0.09495925903320312, 0.10161590576171875, 0.10827255249023438, 0.11492919921875, 0.12158584594726562, 0.12824249267578125, 0.13489913940429688, 0.1415557861328125, 0.14821243286132812, 0.15486907958984375, 0.16152572631835938, 0.168182373046875, 0.17483901977539062, 0.18149566650390625, 0.18815231323242188, 0.1948089599609375, 0.20146560668945312, 0.20812225341796875, 0.21477890014648438, 0.221435546875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 11.0, 9.0, 23.0, 27.0, 43.0, 50.0, 45.0, 79.0, 88.0, 102.0, 88.0, 78.0, 66.0, 66.0, 47.0, 38.0, 36.0, 27.0, 14.0, 12.0, 13.0, 8.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.871111869812012, -10.408175468444824, -9.94523811340332, -9.482301712036133, -9.019365310668945, -8.556428909301758, -8.093491554260254, -7.630555152893066, -7.167618274688721, -6.704681396484375, -6.2417449951171875, -5.778808116912842, -5.315871238708496, -4.852934837341309, -4.389997959136963, -3.9270613193511963, -3.4641246795654297, -3.001188039779663, -2.5382513999938965, -2.075314521789551, -1.6123778820037842, -1.1494412422180176, -0.6865043640136719, -0.22356772422790527, 0.23936891555786133, 0.7023056149482727, 1.165242314338684, 1.6281790733337402, 2.091115713119507, 2.5540523529052734, 3.016989231109619, 3.4799258708953857, 3.942861557006836, 4.405798435211182, 4.868734836578369, 5.331671714782715, 5.794608116149902, 6.257544994354248, 6.720481872558594, 7.183418273925781, 7.646355152130127, 8.109292030334473, 8.57222843170166, 9.035165786743164, 9.498102188110352, 9.961038589477539, 10.423974990844727, 10.88691234588623, 11.349848747253418, 11.812785148620605, 12.27572250366211, 12.738658905029297, 13.201595306396484, 13.664531707763672, 14.127469062805176, 14.590405464172363, 15.053342819213867, 15.516279220581055, 15.979216575622559, 16.442153930664062, 16.90509033203125, 17.368026733398438, 17.830963134765625, 18.293899536132812, 18.7568359375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 3.0, 6.0, 13.0, 11.0, 13.0, 16.0, 14.0, 18.0, 18.0, 15.0, 30.0, 31.0, 31.0, 35.0, 32.0, 31.0, 35.0, 39.0, 35.0, 38.0, 44.0, 39.0, 39.0, 42.0, 42.0, 45.0, 32.0, 34.0, 15.0, 22.0, 29.0, 27.0, 10.0, 16.0, 20.0, 13.0, 10.0, 17.0, 8.0, 6.0, 4.0, 8.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.883959770202637, -11.52858829498291, -11.1732177734375, -10.817846298217773, -10.462475776672363, -10.107104301452637, -9.751733779907227, -9.3963623046875, -9.04099178314209, -8.685620307922363, -8.330249786376953, -7.974878787994385, -7.619507789611816, -7.264136791229248, -6.90876579284668, -6.553394317626953, -6.198023319244385, -5.842652320861816, -5.487281322479248, -5.13191032409668, -4.776539325714111, -4.421168327331543, -4.065796852111816, -3.710426092147827, -3.355055093765259, -2.9996840953826904, -2.644313097000122, -2.2889418601989746, -1.9335709810256958, -1.5781999826431274, -1.2228288650512695, -0.8674578666687012, -0.5120868682861328, -0.15671584010124207, 0.19865518808364868, 0.5540262460708618, 0.9093972444534302, 1.2647682428359985, 1.6201393604278564, 1.9755103588104248, 2.330881357192993, 2.6862523555755615, 3.04162335395813, 3.3969945907592773, 3.7523655891418457, 4.107736587524414, 4.463107585906982, 4.818478584289551, 5.173849582672119, 5.5292205810546875, 5.884591579437256, 6.239962577819824, 6.595333576202393, 6.950704574584961, 7.3060760498046875, 7.661446571350098, 8.016818046569824, 8.37218952178955, 8.727560043334961, 9.082931518554688, 9.438302040100098, 9.793673515319824, 10.149044036865234, 10.504415512084961, 10.859786033630371]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 13.0, 19.0, 17.0, 36.0, 50.0, 58.0, 117.0, 158.0, 252.0, 428.0, 587.0, 936.0, 1410.0, 2190.0, 3463.0, 5287.0, 8197.0, 12663.0, 19722.0, 29663.0, 45442.0, 65774.0, 90727.0, 115739.0, 131013.0, 130460.0, 112014.0, 86539.0, 62233.0, 42807.0, 28119.0, 18440.0, 12102.0, 7762.0, 5000.0, 3212.0, 2042.0, 1356.0, 876.0, 579.0, 356.0, 231.0, 160.0, 101.0, 81.0, 44.0, 25.0, 24.0, 14.0, 9.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41796875, -6.21044921875, -6.0029296875, -5.79541015625, -5.587890625, -5.38037109375, -5.1728515625, -4.96533203125, -4.7578125, -4.55029296875, -4.3427734375, -4.13525390625, -3.927734375, -3.72021484375, -3.5126953125, -3.30517578125, -3.09765625, -2.89013671875, -2.6826171875, -2.47509765625, -2.267578125, -2.06005859375, -1.8525390625, -1.64501953125, -1.4375, -1.22998046875, -1.0224609375, -0.81494140625, -0.607421875, -0.39990234375, -0.1923828125, 0.01513671875, 0.22265625, 0.43017578125, 0.6376953125, 0.84521484375, 1.052734375, 1.26025390625, 1.4677734375, 1.67529296875, 1.8828125, 2.09033203125, 2.2978515625, 2.50537109375, 2.712890625, 2.92041015625, 3.1279296875, 3.33544921875, 3.54296875, 3.75048828125, 3.9580078125, 4.16552734375, 4.373046875, 4.58056640625, 4.7880859375, 4.99560546875, 5.203125, 5.41064453125, 5.6181640625, 5.82568359375, 6.033203125, 6.24072265625, 6.4482421875, 6.65576171875, 6.86328125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 5.0, 16.0, 13.0, 12.0, 18.0, 12.0, 30.0, 16.0, 25.0, 36.0, 34.0, 26.0, 39.0, 29.0, 36.0, 36.0, 52.0, 32.0, 42.0, 39.0, 38.0, 33.0, 45.0, 40.0, 28.0, 37.0, 24.0, 25.0, 23.0, 16.0, 20.0, 20.0, 15.0, 11.0, 13.0, 7.0, 8.0, 10.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0], "bins": [-11.953125, -11.6029052734375, -11.252685546875, -10.9024658203125, -10.55224609375, -10.2020263671875, -9.851806640625, -9.5015869140625, -9.1513671875, -8.8011474609375, -8.450927734375, -8.1007080078125, -7.75048828125, -7.4002685546875, -7.050048828125, -6.6998291015625, -6.349609375, -5.9993896484375, -5.649169921875, -5.2989501953125, -4.94873046875, -4.5985107421875, -4.248291015625, -3.8980712890625, -3.5478515625, -3.1976318359375, -2.847412109375, -2.4971923828125, -2.14697265625, -1.7967529296875, -1.446533203125, -1.0963134765625, -0.74609375, -0.3958740234375, -0.045654296875, 0.3045654296875, 0.65478515625, 1.0050048828125, 1.355224609375, 1.7054443359375, 2.0556640625, 2.4058837890625, 2.756103515625, 3.1063232421875, 3.45654296875, 3.8067626953125, 4.156982421875, 4.5072021484375, 4.857421875, 5.2076416015625, 5.557861328125, 5.9080810546875, 6.25830078125, 6.6085205078125, 6.958740234375, 7.3089599609375, 7.6591796875, 8.0093994140625, 8.359619140625, 8.7098388671875, 9.06005859375, 9.4102783203125, 9.760498046875, 10.1107177734375, 10.4609375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 10.0, 19.0, 38.0, 58.0, 72.0, 155.0, 206.0, 354.0, 579.0, 1005.0, 1541.0, 2757.0, 4667.0, 8195.0, 14035.0, 23975.0, 40422.0, 66244.0, 102543.0, 143605.0, 167276.0, 155515.0, 118461.0, 78226.0, 48413.0, 29098.0, 16956.0, 9803.0, 5891.0, 3395.0, 2082.0, 1183.0, 689.0, 422.0, 250.0, 145.0, 93.0, 63.0, 37.0, 19.0, 20.0, 12.0, 4.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.93359375, -7.66632080078125, -7.3990478515625, -7.13177490234375, -6.864501953125, -6.59722900390625, -6.3299560546875, -6.06268310546875, -5.79541015625, -5.52813720703125, -5.2608642578125, -4.99359130859375, -4.726318359375, -4.45904541015625, -4.1917724609375, -3.92449951171875, -3.6572265625, -3.38995361328125, -3.1226806640625, -2.85540771484375, -2.588134765625, -2.32086181640625, -2.0535888671875, -1.78631591796875, -1.51904296875, -1.25177001953125, -0.9844970703125, -0.71722412109375, -0.449951171875, -0.18267822265625, 0.0845947265625, 0.35186767578125, 0.619140625, 0.88641357421875, 1.1536865234375, 1.42095947265625, 1.688232421875, 1.95550537109375, 2.2227783203125, 2.49005126953125, 2.75732421875, 3.02459716796875, 3.2918701171875, 3.55914306640625, 3.826416015625, 4.09368896484375, 4.3609619140625, 4.62823486328125, 4.8955078125, 5.16278076171875, 5.4300537109375, 5.69732666015625, 5.964599609375, 6.23187255859375, 6.4991455078125, 6.76641845703125, 7.03369140625, 7.30096435546875, 7.5682373046875, 7.83551025390625, 8.102783203125, 8.37005615234375, 8.6373291015625, 8.90460205078125, 9.171875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 2.0, 5.0, 10.0, 6.0, 12.0, 19.0, 16.0, 21.0, 18.0, 14.0, 23.0, 32.0, 29.0, 32.0, 35.0, 43.0, 43.0, 50.0, 33.0, 44.0, 38.0, 43.0, 48.0, 35.0, 40.0, 42.0, 35.0, 35.0, 32.0, 23.0, 24.0, 16.0, 20.0, 17.0, 14.0, 13.0, 9.0, 10.0, 6.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.015625, -6.7685546875, -6.521484375, -6.2744140625, -6.02734375, -5.7802734375, -5.533203125, -5.2861328125, -5.0390625, -4.7919921875, -4.544921875, -4.2978515625, -4.05078125, -3.8037109375, -3.556640625, -3.3095703125, -3.0625, -2.8154296875, -2.568359375, -2.3212890625, -2.07421875, -1.8271484375, -1.580078125, -1.3330078125, -1.0859375, -0.8388671875, -0.591796875, -0.3447265625, -0.09765625, 0.1494140625, 0.396484375, 0.6435546875, 0.890625, 1.1376953125, 1.384765625, 1.6318359375, 1.87890625, 2.1259765625, 2.373046875, 2.6201171875, 2.8671875, 3.1142578125, 3.361328125, 3.6083984375, 3.85546875, 4.1025390625, 4.349609375, 4.5966796875, 4.84375, 5.0908203125, 5.337890625, 5.5849609375, 5.83203125, 6.0791015625, 6.326171875, 6.5732421875, 6.8203125, 7.0673828125, 7.314453125, 7.5615234375, 7.80859375, 8.0556640625, 8.302734375, 8.5498046875, 8.796875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 14.0, 18.0, 28.0, 41.0, 57.0, 71.0, 146.0, 195.0, 287.0, 429.0, 636.0, 979.0, 1462.0, 2326.0, 3754.0, 5706.0, 9400.0, 15603.0, 26056.0, 44905.0, 76235.0, 125592.0, 180687.0, 190084.0, 143296.0, 89217.0, 52703.0, 30915.0, 18345.0, 10946.0, 6750.0, 4114.0, 2629.0, 1688.0, 1070.0, 733.0, 435.0, 329.0, 194.0, 164.0, 100.0, 60.0, 37.0, 34.0, 23.0, 16.0, 15.0, 10.0, 2.0, 6.0], "bins": [-3.9453125, -3.839111328125, -3.73291015625, -3.626708984375, -3.5205078125, -3.414306640625, -3.30810546875, -3.201904296875, -3.095703125, -2.989501953125, -2.88330078125, -2.777099609375, -2.6708984375, -2.564697265625, -2.45849609375, -2.352294921875, -2.24609375, -2.139892578125, -2.03369140625, -1.927490234375, -1.8212890625, -1.715087890625, -1.60888671875, -1.502685546875, -1.396484375, -1.290283203125, -1.18408203125, -1.077880859375, -0.9716796875, -0.865478515625, -0.75927734375, -0.653076171875, -0.546875, -0.440673828125, -0.33447265625, -0.228271484375, -0.1220703125, -0.015869140625, 0.09033203125, 0.196533203125, 0.302734375, 0.408935546875, 0.51513671875, 0.621337890625, 0.7275390625, 0.833740234375, 0.93994140625, 1.046142578125, 1.15234375, 1.258544921875, 1.36474609375, 1.470947265625, 1.5771484375, 1.683349609375, 1.78955078125, 1.895751953125, 2.001953125, 2.108154296875, 2.21435546875, 2.320556640625, 2.4267578125, 2.532958984375, 2.63916015625, 2.745361328125, 2.8515625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 3.0, 8.0, 9.0, 13.0, 16.0, 18.0, 25.0, 27.0, 35.0, 33.0, 58.0, 49.0, 59.0, 53.0, 57.0, 74.0, 62.0, 81.0, 69.0, 47.0, 45.0, 32.0, 33.0, 28.0, 14.0, 12.0, 16.0, 11.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024271011352539062, -0.0002351328730583191, -0.00022755563259124756, -0.00021997839212417603, -0.0002124011516571045, -0.00020482391119003296, -0.00019724667072296143, -0.0001896694302558899, -0.00018209218978881836, -0.00017451494932174683, -0.0001669377088546753, -0.00015936046838760376, -0.00015178322792053223, -0.0001442059874534607, -0.00013662874698638916, -0.00012905150651931763, -0.0001214742660522461, -0.00011389702558517456, -0.00010631978511810303, -9.87425446510315e-05, -9.116530418395996e-05, -8.358806371688843e-05, -7.60108232498169e-05, -6.843358278274536e-05, -6.085634231567383e-05, -5.3279101848602295e-05, -4.570186138153076e-05, -3.812462091445923e-05, -3.0547380447387695e-05, -2.2970139980316162e-05, -1.539289951324463e-05, -7.815659046173096e-06, -2.384185791015625e-07, 7.338821887969971e-06, 1.4916062355041504e-05, 2.2493302822113037e-05, 3.007054328918457e-05, 3.7647783756256104e-05, 4.522502422332764e-05, 5.280226469039917e-05, 6.03795051574707e-05, 6.795674562454224e-05, 7.553398609161377e-05, 8.31112265586853e-05, 9.068846702575684e-05, 9.826570749282837e-05, 0.0001058429479598999, 0.00011342018842697144, 0.00012099742889404297, 0.0001285746693611145, 0.00013615190982818604, 0.00014372915029525757, 0.0001513063907623291, 0.00015888363122940063, 0.00016646087169647217, 0.0001740381121635437, 0.00018161535263061523, 0.00018919259309768677, 0.0001967698335647583, 0.00020434707403182983, 0.00021192431449890137, 0.0002195015549659729, 0.00022707879543304443, 0.00023465603590011597, 0.0002422332763671875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 11.0, 7.0, 9.0, 22.0, 29.0, 57.0, 71.0, 102.0, 138.0, 223.0, 319.0, 511.0, 766.0, 1171.0, 1844.0, 3128.0, 5243.0, 9018.0, 15739.0, 27891.0, 49025.0, 84376.0, 136089.0, 184672.0, 186216.0, 137314.0, 86201.0, 50583.0, 28709.0, 16054.0, 9015.0, 5352.0, 3143.0, 2008.0, 1236.0, 772.0, 486.0, 312.0, 227.0, 136.0, 85.0, 69.0, 61.0, 38.0, 30.0, 18.0, 14.0, 7.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.54296875, -3.4356689453125, -3.328369140625, -3.2210693359375, -3.11376953125, -3.0064697265625, -2.899169921875, -2.7918701171875, -2.6845703125, -2.5772705078125, -2.469970703125, -2.3626708984375, -2.25537109375, -2.1480712890625, -2.040771484375, -1.9334716796875, -1.826171875, -1.7188720703125, -1.611572265625, -1.5042724609375, -1.39697265625, -1.2896728515625, -1.182373046875, -1.0750732421875, -0.9677734375, -0.8604736328125, -0.753173828125, -0.6458740234375, -0.53857421875, -0.4312744140625, -0.323974609375, -0.2166748046875, -0.109375, -0.0020751953125, 0.105224609375, 0.2125244140625, 0.31982421875, 0.4271240234375, 0.534423828125, 0.6417236328125, 0.7490234375, 0.8563232421875, 0.963623046875, 1.0709228515625, 1.17822265625, 1.2855224609375, 1.392822265625, 1.5001220703125, 1.607421875, 1.7147216796875, 1.822021484375, 1.9293212890625, 2.03662109375, 2.1439208984375, 2.251220703125, 2.3585205078125, 2.4658203125, 2.5731201171875, 2.680419921875, 2.7877197265625, 2.89501953125, 3.0023193359375, 3.109619140625, 3.2169189453125, 3.32421875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 1.0, 4.0, 8.0, 7.0, 12.0, 16.0, 14.0, 22.0, 24.0, 31.0, 29.0, 50.0, 32.0, 53.0, 55.0, 52.0, 54.0, 46.0, 48.0, 62.0, 49.0, 41.0, 36.0, 40.0, 30.0, 34.0, 22.0, 27.0, 17.0, 13.0, 13.0, 7.0, 6.0, 4.0, 1.0, 7.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.46484375, -1.4170989990234375, -1.369354248046875, -1.3216094970703125, -1.27386474609375, -1.2261199951171875, -1.178375244140625, -1.1306304931640625, -1.0828857421875, -1.0351409912109375, -0.987396240234375, -0.9396514892578125, -0.89190673828125, -0.8441619873046875, -0.796417236328125, -0.7486724853515625, -0.700927734375, -0.6531829833984375, -0.605438232421875, -0.5576934814453125, -0.50994873046875, -0.4622039794921875, -0.414459228515625, -0.3667144775390625, -0.3189697265625, -0.2712249755859375, -0.223480224609375, -0.1757354736328125, -0.12799072265625, -0.0802459716796875, -0.032501220703125, 0.0152435302734375, 0.06298828125, 0.1107330322265625, 0.158477783203125, 0.2062225341796875, 0.25396728515625, 0.3017120361328125, 0.349456787109375, 0.3972015380859375, 0.4449462890625, 0.4926910400390625, 0.540435791015625, 0.5881805419921875, 0.63592529296875, 0.6836700439453125, 0.731414794921875, 0.7791595458984375, 0.826904296875, 0.8746490478515625, 0.922393798828125, 0.9701385498046875, 1.01788330078125, 1.0656280517578125, 1.113372802734375, 1.1611175537109375, 1.2088623046875, 1.2566070556640625, 1.304351806640625, 1.3520965576171875, 1.39984130859375, 1.4475860595703125, 1.495330810546875, 1.5430755615234375, 1.5908203125]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 6.0, 4.0, 10.0, 17.0, 25.0, 24.0, 37.0, 67.0, 73.0, 66.0, 81.0, 106.0, 102.0, 83.0, 62.0, 46.0, 46.0, 28.0, 28.0, 25.0, 27.0, 6.0, 10.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.169316291809082, -10.684086799621582, -10.198858261108398, -9.713628768920898, -9.228399276733398, -8.743170738220215, -8.257941246032715, -7.772712230682373, -7.287483215332031, -6.8022541999816895, -6.317025184631348, -5.831795692443848, -5.346566677093506, -4.861337661743164, -4.376108169555664, -3.8908791542053223, -3.4056501388549805, -2.9204211235046387, -2.4351918697357178, -1.9499627351760864, -1.464733600616455, -0.9795045852661133, -0.4942753314971924, -0.009046077728271484, 0.4761829376220703, 0.9614120721817017, 1.446641206741333, 1.9318703413009644, 2.4170994758605957, 2.9023284912109375, 3.3875577449798584, 3.8727869987487793, 4.3580169677734375, 4.843245983123779, 5.328474998474121, 5.813704490661621, 6.298933506011963, 6.784162521362305, 7.269392013549805, 7.7546210289001465, 8.239850044250488, 8.725079536437988, 9.210308074951172, 9.695537567138672, 10.180767059326172, 10.665995597839355, 11.151225090026855, 11.636453628540039, 12.121683120727539, 12.606912612915039, 13.092141151428223, 13.577370643615723, 14.062599182128906, 14.547828674316406, 15.033058166503906, 15.518287658691406, 16.003517150878906, 16.488746643066406, 16.973976135253906, 17.459203720092773, 17.944433212280273, 18.429662704467773, 18.914892196655273, 19.400121688842773, 19.88534927368164]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 7.0, 7.0, 6.0, 10.0, 10.0, 7.0, 13.0, 19.0, 20.0, 15.0, 26.0, 31.0, 39.0, 18.0, 29.0, 38.0, 46.0, 45.0, 35.0, 27.0, 44.0, 39.0, 48.0, 33.0, 34.0, 29.0, 38.0, 41.0, 34.0, 19.0, 22.0, 19.0, 25.0, 19.0, 18.0, 11.0, 18.0, 10.0, 7.0, 5.0, 4.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-11.458518028259277, -11.097037315368652, -10.735557556152344, -10.374076843261719, -10.012596130371094, -9.651115417480469, -9.28963565826416, -8.928154945373535, -8.56667423248291, -8.205193519592285, -7.843713283538818, -7.482233047485352, -7.120752334594727, -6.75927209854126, -6.397791862487793, -6.036311149597168, -5.674830913543701, -5.313350677490234, -4.951869964599609, -4.590389728546143, -4.228909015655518, -3.867428779602051, -3.505948305130005, -3.144467830657959, -2.782987356185913, -2.421506881713867, -2.0600264072418213, -1.698546051979065, -1.337065577507019, -0.9755851030349731, -0.6141047477722168, -0.2526242733001709, 0.108856201171875, 0.4703366458415985, 0.831817090511322, 1.1932975053787231, 1.554777979850769, 1.916258454322815, 2.2777388095855713, 2.639219284057617, 3.000699758529663, 3.362180233001709, 3.723660707473755, 4.085141181945801, 4.446621417999268, 4.808102130889893, 5.169582366943359, 5.531063079833984, 5.892543315887451, 6.254023551940918, 6.615504264831543, 6.97698450088501, 7.338465213775635, 7.699945449829102, 8.061426162719727, 8.422906875610352, 8.78438663482666, 9.145867347717285, 9.507347106933594, 9.868827819824219, 10.230308532714844, 10.591789245605469, 10.953269004821777, 11.314749717712402, 11.676230430603027]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 11.0, 17.0, 33.0, 35.0, 60.0, 60.0, 114.0, 160.0, 207.0, 366.0, 495.0, 716.0, 1051.0, 1602.0, 2511.0, 3860.0, 6075.0, 9683.0, 15785.0, 26356.0, 45396.0, 79044.0, 140763.0, 250911.0, 438741.0, 693338.0, 835387.0, 674083.0, 416631.0, 235798.0, 131606.0, 74671.0, 42783.0, 25424.0, 15156.0, 9398.0, 5750.0, 3680.0, 2265.0, 1465.0, 979.0, 637.0, 377.0, 276.0, 202.0, 104.0, 68.0, 65.0, 39.0, 26.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-9.7734375, -9.48974609375, -9.2060546875, -8.92236328125, -8.638671875, -8.35498046875, -8.0712890625, -7.78759765625, -7.50390625, -7.22021484375, -6.9365234375, -6.65283203125, -6.369140625, -6.08544921875, -5.8017578125, -5.51806640625, -5.234375, -4.95068359375, -4.6669921875, -4.38330078125, -4.099609375, -3.81591796875, -3.5322265625, -3.24853515625, -2.96484375, -2.68115234375, -2.3974609375, -2.11376953125, -1.830078125, -1.54638671875, -1.2626953125, -0.97900390625, -0.6953125, -0.41162109375, -0.1279296875, 0.15576171875, 0.439453125, 0.72314453125, 1.0068359375, 1.29052734375, 1.57421875, 1.85791015625, 2.1416015625, 2.42529296875, 2.708984375, 2.99267578125, 3.2763671875, 3.56005859375, 3.84375, 4.12744140625, 4.4111328125, 4.69482421875, 4.978515625, 5.26220703125, 5.5458984375, 5.82958984375, 6.11328125, 6.39697265625, 6.6806640625, 6.96435546875, 7.248046875, 7.53173828125, 7.8154296875, 8.09912109375, 8.3828125]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 4.0, 3.0, 8.0, 7.0, 6.0, 13.0, 11.0, 14.0, 13.0, 17.0, 28.0, 31.0, 27.0, 30.0, 23.0, 39.0, 43.0, 42.0, 47.0, 27.0, 33.0, 48.0, 40.0, 46.0, 37.0, 37.0, 30.0, 35.0, 43.0, 23.0, 26.0, 27.0, 23.0, 13.0, 16.0, 19.0, 9.0, 10.0, 9.0, 9.0, 8.0, 10.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.6640625, -7.41961669921875, -7.1751708984375, -6.93072509765625, -6.686279296875, -6.44183349609375, -6.1973876953125, -5.95294189453125, -5.70849609375, -5.46405029296875, -5.2196044921875, -4.97515869140625, -4.730712890625, -4.48626708984375, -4.2418212890625, -3.99737548828125, -3.7529296875, -3.50848388671875, -3.2640380859375, -3.01959228515625, -2.775146484375, -2.53070068359375, -2.2862548828125, -2.04180908203125, -1.79736328125, -1.55291748046875, -1.3084716796875, -1.06402587890625, -0.819580078125, -0.57513427734375, -0.3306884765625, -0.08624267578125, 0.158203125, 0.40264892578125, 0.6470947265625, 0.89154052734375, 1.135986328125, 1.38043212890625, 1.6248779296875, 1.86932373046875, 2.11376953125, 2.35821533203125, 2.6026611328125, 2.84710693359375, 3.091552734375, 3.33599853515625, 3.5804443359375, 3.82489013671875, 4.0693359375, 4.31378173828125, 4.5582275390625, 4.80267333984375, 5.047119140625, 5.29156494140625, 5.5360107421875, 5.78045654296875, 6.02490234375, 6.26934814453125, 6.5137939453125, 6.75823974609375, 7.002685546875, 7.24713134765625, 7.4915771484375, 7.73602294921875, 7.98046875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 6.0, 3.0, 10.0, 5.0, 15.0, 20.0, 32.0, 46.0, 95.0, 130.0, 176.0, 280.0, 436.0, 649.0, 946.0, 1474.0, 2317.0, 3601.0, 5826.0, 9546.0, 15576.0, 25520.0, 42107.0, 70551.0, 118819.0, 197651.0, 325757.0, 501640.0, 669404.0, 696069.0, 556717.0, 372353.0, 230893.0, 137932.0, 82041.0, 48842.0, 29680.0, 17906.0, 10753.0, 6805.0, 4259.0, 2592.0, 1638.0, 1136.0, 683.0, 439.0, 314.0, 198.0, 148.0, 67.0, 62.0, 55.0, 28.0, 21.0, 9.0, 3.0, 10.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.3046875, -7.0623779296875, -6.820068359375, -6.5777587890625, -6.33544921875, -6.0931396484375, -5.850830078125, -5.6085205078125, -5.3662109375, -5.1239013671875, -4.881591796875, -4.6392822265625, -4.39697265625, -4.1546630859375, -3.912353515625, -3.6700439453125, -3.427734375, -3.1854248046875, -2.943115234375, -2.7008056640625, -2.45849609375, -2.2161865234375, -1.973876953125, -1.7315673828125, -1.4892578125, -1.2469482421875, -1.004638671875, -0.7623291015625, -0.52001953125, -0.2777099609375, -0.035400390625, 0.2069091796875, 0.44921875, 0.6915283203125, 0.933837890625, 1.1761474609375, 1.41845703125, 1.6607666015625, 1.903076171875, 2.1453857421875, 2.3876953125, 2.6300048828125, 2.872314453125, 3.1146240234375, 3.35693359375, 3.5992431640625, 3.841552734375, 4.0838623046875, 4.326171875, 4.5684814453125, 4.810791015625, 5.0531005859375, 5.29541015625, 5.5377197265625, 5.780029296875, 6.0223388671875, 6.2646484375, 6.5069580078125, 6.749267578125, 6.9915771484375, 7.23388671875, 7.4761962890625, 7.718505859375, 7.9608154296875, 8.203125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 2.0, 8.0, 7.0, 3.0, 12.0, 5.0, 7.0, 14.0, 19.0, 30.0, 33.0, 37.0, 49.0, 69.0, 72.0, 93.0, 111.0, 142.0, 124.0, 174.0, 190.0, 177.0, 224.0, 212.0, 223.0, 253.0, 212.0, 205.0, 166.0, 174.0, 148.0, 137.0, 125.0, 98.0, 112.0, 87.0, 67.0, 55.0, 41.0, 49.0, 30.0, 25.0, 16.0, 6.0, 8.0, 12.0, 3.0, 4.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4453125, -3.3275146484375, -3.209716796875, -3.0919189453125, -2.97412109375, -2.8563232421875, -2.738525390625, -2.6207275390625, -2.5029296875, -2.3851318359375, -2.267333984375, -2.1495361328125, -2.03173828125, -1.9139404296875, -1.796142578125, -1.6783447265625, -1.560546875, -1.4427490234375, -1.324951171875, -1.2071533203125, -1.08935546875, -0.9715576171875, -0.853759765625, -0.7359619140625, -0.6181640625, -0.5003662109375, -0.382568359375, -0.2647705078125, -0.14697265625, -0.0291748046875, 0.088623046875, 0.2064208984375, 0.32421875, 0.4420166015625, 0.559814453125, 0.6776123046875, 0.79541015625, 0.9132080078125, 1.031005859375, 1.1488037109375, 1.2666015625, 1.3843994140625, 1.502197265625, 1.6199951171875, 1.73779296875, 1.8555908203125, 1.973388671875, 2.0911865234375, 2.208984375, 2.3267822265625, 2.444580078125, 2.5623779296875, 2.68017578125, 2.7979736328125, 2.915771484375, 3.0335693359375, 3.1513671875, 3.2691650390625, 3.386962890625, 3.5047607421875, 3.62255859375, 3.7403564453125, 3.858154296875, 3.9759521484375, 4.09375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 9.0, 11.0, 16.0, 16.0, 17.0, 19.0, 16.0, 29.0, 48.0, 48.0, 69.0, 67.0, 79.0, 91.0, 72.0, 71.0, 59.0, 61.0, 32.0, 30.0, 25.0, 21.0, 23.0, 26.0, 11.0, 9.0, 6.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.526385307312012, -10.148177146911621, -9.76996898651123, -9.39176082611084, -9.01355266571045, -8.635344505310059, -8.257135391235352, -7.878927707672119, -7.5007195472717285, -7.122511386871338, -6.744303226470947, -6.366094589233398, -5.987886428833008, -5.609678268432617, -5.231470108032227, -4.853261947631836, -4.475053787231445, -4.096845626831055, -3.718637466430664, -3.3404290676116943, -2.9622209072113037, -2.584012746810913, -2.2058043479919434, -1.8275961875915527, -1.449388027191162, -1.0711798667907715, -0.6929715871810913, -0.31476330757141113, 0.06344485282897949, 0.4416530132293701, 0.8198614120483398, 1.1980695724487305, 1.5762767791748047, 1.9544849395751953, 2.332693099975586, 2.7109014987945557, 3.0891096591949463, 3.467317819595337, 3.8455262184143066, 4.223734378814697, 4.601942539215088, 4.9801506996154785, 5.358358860015869, 5.736567497253418, 6.114775657653809, 6.492983818054199, 6.87119197845459, 7.2494001388549805, 7.627608299255371, 8.005816459655762, 8.384024620056152, 8.762232780456543, 9.140440940856934, 9.518649101257324, 9.896858215332031, 10.275066375732422, 10.653274536132812, 11.031482696533203, 11.409690856933594, 11.787899017333984, 12.166107177734375, 12.544315338134766, 12.922523498535156, 13.300731658935547, 13.678939819335938]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 0.0, 4.0, 7.0, 7.0, 8.0, 9.0, 12.0, 8.0, 15.0, 15.0, 25.0, 13.0, 22.0, 20.0, 29.0, 14.0, 25.0, 37.0, 44.0, 43.0, 35.0, 37.0, 38.0, 41.0, 54.0, 29.0, 40.0, 26.0, 40.0, 32.0, 32.0, 22.0, 30.0, 34.0, 19.0, 25.0, 17.0, 9.0, 16.0, 16.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 5.0], "bins": [-10.697165489196777, -10.378005981445312, -10.058845520019531, -9.739686012268066, -9.420526504516602, -9.10136604309082, -8.782206535339355, -8.46304702758789, -8.14388656616211, -7.824726581573486, -7.505566596984863, -7.186407089233398, -6.867247104644775, -6.548087120056152, -6.2289276123046875, -5.9097676277160645, -5.590607643127441, -5.271447658538818, -4.952287673950195, -4.6331281661987305, -4.313968181610107, -3.9948081970214844, -3.6756484508514404, -3.3564887046813965, -3.0373287200927734, -2.7181687355041504, -2.3990089893341064, -2.0798492431640625, -1.7606892585754395, -1.441529393196106, -1.1223695278167725, -0.8032097816467285, -0.4840507507324219, -0.16489088535308838, 0.15426898002624512, 0.4734288454055786, 0.7925887107849121, 1.1117485761642456, 1.430908441543579, 1.750068187713623, 2.069228172302246, 2.388388156890869, 2.707547903060913, 3.026707649230957, 3.34586763381958, 3.665027618408203, 3.984187364578247, 4.303347110748291, 4.622507095336914, 4.941667079925537, 5.26082706451416, 5.579986572265625, 5.899146556854248, 6.218306541442871, 6.537466049194336, 6.856626033782959, 7.175786018371582, 7.494946002960205, 7.814105987548828, 8.133265495300293, 8.452425003051758, 8.771585464477539, 9.090744972229004, 9.409904479980469, 9.72906494140625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 7.0, 8.0, 7.0, 23.0, 14.0, 30.0, 44.0, 63.0, 85.0, 120.0, 170.0, 281.0, 446.0, 620.0, 968.0, 1420.0, 2165.0, 3283.0, 5048.0, 7870.0, 12256.0, 19137.0, 30826.0, 49883.0, 80911.0, 128606.0, 184504.0, 182832.0, 125872.0, 79307.0, 48913.0, 29962.0, 18964.0, 11926.0, 7417.0, 4797.0, 3275.0, 2138.0, 1348.0, 973.0, 616.0, 432.0, 328.0, 217.0, 164.0, 86.0, 71.0, 52.0, 24.0, 21.0, 16.0, 9.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.33203125, -1.290374755859375, -1.24871826171875, -1.207061767578125, -1.1654052734375, -1.123748779296875, -1.08209228515625, -1.040435791015625, -0.998779296875, -0.957122802734375, -0.91546630859375, -0.873809814453125, -0.8321533203125, -0.790496826171875, -0.74884033203125, -0.707183837890625, -0.66552734375, -0.623870849609375, -0.58221435546875, -0.540557861328125, -0.4989013671875, -0.457244873046875, -0.41558837890625, -0.373931884765625, -0.332275390625, -0.290618896484375, -0.24896240234375, -0.207305908203125, -0.1656494140625, -0.123992919921875, -0.08233642578125, -0.040679931640625, 0.0009765625, 0.042633056640625, 0.08428955078125, 0.125946044921875, 0.1676025390625, 0.209259033203125, 0.25091552734375, 0.292572021484375, 0.334228515625, 0.375885009765625, 0.41754150390625, 0.459197998046875, 0.5008544921875, 0.542510986328125, 0.58416748046875, 0.625823974609375, 0.66748046875, 0.709136962890625, 0.75079345703125, 0.792449951171875, 0.8341064453125, 0.875762939453125, 0.91741943359375, 0.959075927734375, 1.000732421875, 1.042388916015625, 1.08404541015625, 1.125701904296875, 1.1673583984375, 1.209014892578125, 1.25067138671875, 1.292327880859375, 1.333984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 11.0, 8.0, 7.0, 7.0, 7.0, 17.0, 17.0, 21.0, 18.0, 17.0, 16.0, 21.0, 30.0, 38.0, 31.0, 30.0, 46.0, 41.0, 43.0, 43.0, 35.0, 41.0, 55.0, 35.0, 30.0, 32.0, 40.0, 44.0, 23.0, 28.0, 25.0, 16.0, 16.0, 18.0, 21.0, 8.0, 11.0, 10.0, 9.0, 3.0, 6.0, 6.0, 6.0, 4.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0], "bins": [-11.3984375, -11.058349609375, -10.71826171875, -10.378173828125, -10.0380859375, -9.697998046875, -9.35791015625, -9.017822265625, -8.677734375, -8.337646484375, -7.99755859375, -7.657470703125, -7.3173828125, -6.977294921875, -6.63720703125, -6.297119140625, -5.95703125, -5.616943359375, -5.27685546875, -4.936767578125, -4.5966796875, -4.256591796875, -3.91650390625, -3.576416015625, -3.236328125, -2.896240234375, -2.55615234375, -2.216064453125, -1.8759765625, -1.535888671875, -1.19580078125, -0.855712890625, -0.515625, -0.175537109375, 0.16455078125, 0.504638671875, 0.8447265625, 1.184814453125, 1.52490234375, 1.864990234375, 2.205078125, 2.545166015625, 2.88525390625, 3.225341796875, 3.5654296875, 3.905517578125, 4.24560546875, 4.585693359375, 4.92578125, 5.265869140625, 5.60595703125, 5.946044921875, 6.2861328125, 6.626220703125, 6.96630859375, 7.306396484375, 7.646484375, 7.986572265625, 8.32666015625, 8.666748046875, 9.0068359375, 9.346923828125, 9.68701171875, 10.027099609375, 10.3671875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 20.0, 32.0, 40.0, 73.0, 109.0, 175.0, 299.0, 540.0, 995.0, 1824.0, 3079.0, 5694.0, 10762.0, 19705.0, 37718.0, 70893.0, 134138.0, 239351.0, 238936.0, 133096.0, 70911.0, 37334.0, 19691.0, 10358.0, 5759.0, 3004.0, 1698.0, 958.0, 533.0, 321.0, 198.0, 102.0, 68.0, 33.0, 30.0, 25.0, 13.0, 8.0, 8.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7451171875, -1.688812255859375, -1.63250732421875, -1.576202392578125, -1.5198974609375, -1.463592529296875, -1.40728759765625, -1.350982666015625, -1.294677734375, -1.238372802734375, -1.18206787109375, -1.125762939453125, -1.0694580078125, -1.013153076171875, -0.95684814453125, -0.900543212890625, -0.84423828125, -0.787933349609375, -0.73162841796875, -0.675323486328125, -0.6190185546875, -0.562713623046875, -0.50640869140625, -0.450103759765625, -0.393798828125, -0.337493896484375, -0.28118896484375, -0.224884033203125, -0.1685791015625, -0.112274169921875, -0.05596923828125, 0.000335693359375, 0.056640625, 0.112945556640625, 0.16925048828125, 0.225555419921875, 0.2818603515625, 0.338165283203125, 0.39447021484375, 0.450775146484375, 0.507080078125, 0.563385009765625, 0.61968994140625, 0.675994873046875, 0.7322998046875, 0.788604736328125, 0.84490966796875, 0.901214599609375, 0.95751953125, 1.013824462890625, 1.07012939453125, 1.126434326171875, 1.1827392578125, 1.239044189453125, 1.29534912109375, 1.351654052734375, 1.407958984375, 1.464263916015625, 1.52056884765625, 1.576873779296875, 1.6331787109375, 1.689483642578125, 1.74578857421875, 1.802093505859375, 1.8583984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 6.0, 10.0, 10.0, 12.0, 6.0, 16.0, 15.0, 27.0, 21.0, 22.0, 20.0, 40.0, 27.0, 37.0, 21.0, 41.0, 46.0, 47.0, 48.0, 46.0, 36.0, 48.0, 37.0, 39.0, 43.0, 37.0, 29.0, 33.0, 27.0, 30.0, 20.0, 22.0, 17.0, 8.0, 9.0, 9.0, 10.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.234375, -7.991455078125, -7.74853515625, -7.505615234375, -7.2626953125, -7.019775390625, -6.77685546875, -6.533935546875, -6.291015625, -6.048095703125, -5.80517578125, -5.562255859375, -5.3193359375, -5.076416015625, -4.83349609375, -4.590576171875, -4.34765625, -4.104736328125, -3.86181640625, -3.618896484375, -3.3759765625, -3.133056640625, -2.89013671875, -2.647216796875, -2.404296875, -2.161376953125, -1.91845703125, -1.675537109375, -1.4326171875, -1.189697265625, -0.94677734375, -0.703857421875, -0.4609375, -0.218017578125, 0.02490234375, 0.267822265625, 0.5107421875, 0.753662109375, 0.99658203125, 1.239501953125, 1.482421875, 1.725341796875, 1.96826171875, 2.211181640625, 2.4541015625, 2.697021484375, 2.93994140625, 3.182861328125, 3.42578125, 3.668701171875, 3.91162109375, 4.154541015625, 4.3974609375, 4.640380859375, 4.88330078125, 5.126220703125, 5.369140625, 5.612060546875, 5.85498046875, 6.097900390625, 6.3408203125, 6.583740234375, 6.82666015625, 7.069580078125, 7.3125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 11.0, 4.0, 12.0, 13.0, 37.0, 37.0, 55.0, 82.0, 94.0, 183.0, 248.0, 375.0, 587.0, 923.0, 1510.0, 2479.0, 4408.0, 8384.0, 17429.0, 41758.0, 125056.0, 413713.0, 288634.0, 82969.0, 30170.0, 13418.0, 6695.0, 3623.0, 2110.0, 1207.0, 795.0, 515.0, 338.0, 207.0, 142.0, 108.0, 65.0, 42.0, 39.0, 32.0, 15.0, 7.0, 12.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.314208984375, -0.3054389953613281, -0.29666900634765625, -0.2878990173339844, -0.2791290283203125, -0.2703590393066406, -0.26158905029296875, -0.2528190612792969, -0.244049072265625, -0.23527908325195312, -0.22650909423828125, -0.21773910522460938, -0.2089691162109375, -0.20019912719726562, -0.19142913818359375, -0.18265914916992188, -0.17388916015625, -0.16511917114257812, -0.15634918212890625, -0.14757919311523438, -0.1388092041015625, -0.13003921508789062, -0.12126922607421875, -0.11249923706054688, -0.103729248046875, -0.09495925903320312, -0.08618927001953125, -0.07741928100585938, -0.0686492919921875, -0.059879302978515625, -0.05110931396484375, -0.042339324951171875, -0.0335693359375, -0.024799346923828125, -0.01602935791015625, -0.007259368896484375, 0.0015106201171875, 0.010280609130859375, 0.01905059814453125, 0.027820587158203125, 0.036590576171875, 0.045360565185546875, 0.05413055419921875, 0.06290054321289062, 0.0716705322265625, 0.08044052124023438, 0.08921051025390625, 0.09798049926757812, 0.10675048828125, 0.11552047729492188, 0.12429046630859375, 0.13306045532226562, 0.1418304443359375, 0.15060043334960938, 0.15937042236328125, 0.16814041137695312, 0.176910400390625, 0.18568038940429688, 0.19445037841796875, 0.20322036743164062, 0.2119903564453125, 0.22076034545898438, 0.22953033447265625, 0.23830032348632812, 0.2470703125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 5.0, 8.0, 15.0, 16.0, 19.0, 20.0, 35.0, 31.0, 29.0, 49.0, 57.0, 56.0, 47.0, 75.0, 61.0, 56.0, 56.0, 60.0, 48.0, 50.0, 34.0, 32.0, 21.0, 25.0, 24.0, 13.0, 10.0, 9.0, 3.0, 7.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.800060272216797e-05, -1.737195998430252e-05, -1.6743317246437073e-05, -1.6114674508571625e-05, -1.5486031770706177e-05, -1.4857389032840729e-05, -1.422874629497528e-05, -1.3600103557109833e-05, -1.2971460819244385e-05, -1.2342818081378937e-05, -1.1714175343513489e-05, -1.108553260564804e-05, -1.0456889867782593e-05, -9.828247129917145e-06, -9.199604392051697e-06, -8.570961654186249e-06, -7.9423189163208e-06, -7.313676178455353e-06, -6.685033440589905e-06, -6.056390702724457e-06, -5.427747964859009e-06, -4.799105226993561e-06, -4.170462489128113e-06, -3.541819751262665e-06, -2.913177013397217e-06, -2.284534275531769e-06, -1.6558915376663208e-06, -1.0272487998008728e-06, -3.986060619354248e-07, 2.300366759300232e-07, 8.586794137954712e-07, 1.4873221516609192e-06, 2.115964889526367e-06, 2.744607627391815e-06, 3.373250365257263e-06, 4.001893103122711e-06, 4.630535840988159e-06, 5.259178578853607e-06, 5.887821316719055e-06, 6.516464054584503e-06, 7.145106792449951e-06, 7.7737495303154e-06, 8.402392268180847e-06, 9.031035006046295e-06, 9.659677743911743e-06, 1.0288320481777191e-05, 1.091696321964264e-05, 1.1545605957508087e-05, 1.2174248695373535e-05, 1.2802891433238983e-05, 1.3431534171104431e-05, 1.4060176908969879e-05, 1.4688819646835327e-05, 1.5317462384700775e-05, 1.5946105122566223e-05, 1.657474786043167e-05, 1.720339059829712e-05, 1.7832033336162567e-05, 1.8460676074028015e-05, 1.9089318811893463e-05, 1.971796154975891e-05, 2.034660428762436e-05, 2.0975247025489807e-05, 2.1603889763355255e-05, 2.2232532501220703e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 14.0, 17.0, 9.0, 31.0, 46.0, 62.0, 70.0, 112.0, 122.0, 174.0, 271.0, 391.0, 518.0, 729.0, 1150.0, 1785.0, 2756.0, 4572.0, 7585.0, 13213.0, 23650.0, 45250.0, 88215.0, 185339.0, 308632.0, 178716.0, 85141.0, 43703.0, 23184.0, 12978.0, 7500.0, 4398.0, 2684.0, 1737.0, 1150.0, 765.0, 562.0, 367.0, 274.0, 188.0, 137.0, 114.0, 74.0, 48.0, 38.0, 22.0, 20.0, 16.0, 13.0, 4.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.345947265625, -0.3349571228027344, -0.32396697998046875, -0.3129768371582031, -0.3019866943359375, -0.2909965515136719, -0.28000640869140625, -0.2690162658691406, -0.258026123046875, -0.24703598022460938, -0.23604583740234375, -0.22505569458007812, -0.2140655517578125, -0.20307540893554688, -0.19208526611328125, -0.18109512329101562, -0.17010498046875, -0.15911483764648438, -0.14812469482421875, -0.13713455200195312, -0.1261444091796875, -0.11515426635742188, -0.10416412353515625, -0.09317398071289062, -0.082183837890625, -0.07119369506835938, -0.06020355224609375, -0.049213409423828125, -0.0382232666015625, -0.027233123779296875, -0.01624298095703125, -0.005252838134765625, 0.0057373046875, 0.016727447509765625, 0.02771759033203125, 0.038707733154296875, 0.0496978759765625, 0.060688018798828125, 0.07167816162109375, 0.08266830444335938, 0.093658447265625, 0.10464859008789062, 0.11563873291015625, 0.12662887573242188, 0.1376190185546875, 0.14860916137695312, 0.15959930419921875, 0.17058944702148438, 0.18157958984375, 0.19256973266601562, 0.20355987548828125, 0.21455001831054688, 0.2255401611328125, 0.23653030395507812, 0.24752044677734375, 0.2585105895996094, 0.269500732421875, 0.2804908752441406, 0.29148101806640625, 0.3024711608886719, 0.3134613037109375, 0.3244514465332031, 0.33544158935546875, 0.3464317321777344, 0.357421875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 1.0, 12.0, 7.0, 10.0, 19.0, 19.0, 24.0, 29.0, 43.0, 60.0, 53.0, 69.0, 48.0, 56.0, 69.0, 48.0, 67.0, 59.0, 56.0, 47.0, 43.0, 35.0, 25.0, 22.0, 19.0, 7.0, 12.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20654296875, -0.19952774047851562, -0.19251251220703125, -0.18549728393554688, -0.1784820556640625, -0.17146682739257812, -0.16445159912109375, -0.15743637084960938, -0.150421142578125, -0.14340591430664062, -0.13639068603515625, -0.12937545776367188, -0.1223602294921875, -0.11534500122070312, -0.10832977294921875, -0.10131454467773438, -0.09429931640625, -0.08728408813476562, -0.08026885986328125, -0.07325363159179688, -0.0662384033203125, -0.059223175048828125, -0.05220794677734375, -0.045192718505859375, -0.038177490234375, -0.031162261962890625, -0.02414703369140625, -0.017131805419921875, -0.0101165771484375, -0.003101348876953125, 0.00391387939453125, 0.010929107666015625, 0.0179443359375, 0.024959564208984375, 0.03197479248046875, 0.038990020751953125, 0.0460052490234375, 0.053020477294921875, 0.06003570556640625, 0.06705093383789062, 0.074066162109375, 0.08108139038085938, 0.08809661865234375, 0.09511184692382812, 0.1021270751953125, 0.10914230346679688, 0.11615753173828125, 0.12317276000976562, 0.13018798828125, 0.13720321655273438, 0.14421844482421875, 0.15123367309570312, 0.1582489013671875, 0.16526412963867188, 0.17227935791015625, 0.17929458618164062, 0.186309814453125, 0.19332504272460938, 0.20034027099609375, 0.20735549926757812, 0.2143707275390625, 0.22138595581054688, 0.22840118408203125, 0.23541641235351562, 0.242431640625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 13.0, 14.0, 16.0, 12.0, 22.0, 19.0, 31.0, 45.0, 55.0, 59.0, 69.0, 86.0, 84.0, 80.0, 69.0, 65.0, 49.0, 33.0, 33.0, 28.0, 22.0, 20.0, 23.0, 11.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.547654151916504, -10.168135643005371, -9.788617134094238, -9.409098625183105, -9.029579162597656, -8.650060653686523, -8.27054214477539, -7.891023635864258, -7.511505126953125, -7.131986618041992, -6.752468109130859, -6.372949123382568, -5.9934306144714355, -5.613912105560303, -5.234393119812012, -4.854874610900879, -4.475356101989746, -4.095837593078613, -3.7163188457489014, -3.3368000984191895, -2.9572815895080566, -2.577763080596924, -2.198244333267212, -1.8187255859375, -1.4392070770263672, -1.0596884489059448, -0.6801698207855225, -0.3006511926651001, 0.07886743545532227, 0.45838606357574463, 0.837904691696167, 1.217423439025879, 1.5969429016113281, 1.9764615297317505, 2.355980157852173, 2.7354989051818848, 3.1150174140930176, 3.4945359230041504, 3.8740546703338623, 4.253573417663574, 4.633091926574707, 5.01261043548584, 5.392128944396973, 5.771647930145264, 6.1511664390563965, 6.530684947967529, 6.91020393371582, 7.289722442626953, 7.669240951538086, 8.048759460449219, 8.428277969360352, 8.807796478271484, 9.187314987182617, 9.566834449768066, 9.9463529586792, 10.325871467590332, 10.705389976501465, 11.084908485412598, 11.46442699432373, 11.843945503234863, 12.223464965820312, 12.602983474731445, 12.982501983642578, 13.362020492553711, 13.741539001464844]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 0.0, 5.0, 7.0, 7.0, 9.0, 8.0, 11.0, 11.0, 13.0, 17.0, 23.0, 17.0, 19.0, 27.0, 19.0, 21.0, 26.0, 38.0, 43.0, 41.0, 38.0, 34.0, 35.0, 47.0, 48.0, 31.0, 36.0, 27.0, 37.0, 34.0, 30.0, 24.0, 31.0, 29.0, 24.0, 23.0, 17.0, 13.0, 15.0, 15.0, 9.0, 6.0, 4.0, 4.0, 7.0, 0.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0], "bins": [-10.605825424194336, -10.289403915405273, -9.972981452941895, -9.656559944152832, -9.34013843536377, -9.02371597290039, -8.707294464111328, -8.390872955322266, -8.074451446533203, -7.758029460906982, -7.44160795211792, -7.125185966491699, -6.808764457702637, -6.492342472076416, -6.175920486450195, -5.859498977661133, -5.543076515197754, -5.226654529571533, -4.910233020782471, -4.59381103515625, -4.2773895263671875, -3.960967540740967, -3.644545555114746, -3.3281238079071045, -3.011702060699463, -2.6952803134918213, -2.3788585662841797, -2.062436580657959, -1.7460148334503174, -1.4295930862426758, -1.1131712198257446, -0.7967493534088135, -0.4803276062011719, -0.1639057993888855, 0.15251600742340088, 0.46893781423568726, 0.7853596210479736, 1.1017813682556152, 1.4182032346725464, 1.7346251010894775, 2.051046848297119, 2.3674685955047607, 2.6838903427124023, 3.000312328338623, 3.3167340755462646, 3.6331558227539062, 3.949577808380127, 4.265999794006348, 4.58242130279541, 4.898843288421631, 5.215264797210693, 5.531686782836914, 5.848108291625977, 6.164530277252197, 6.480952262878418, 6.7973737716674805, 7.113795757293701, 7.430217742919922, 7.746639251708984, 8.063060760498047, 8.379483222961426, 8.695904731750488, 9.01232624053955, 9.32874870300293, 9.645170211791992]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 4.0, 24.0, 23.0, 33.0, 63.0, 96.0, 145.0, 203.0, 355.0, 535.0, 838.0, 1350.0, 2144.0, 3260.0, 5288.0, 8593.0, 14191.0, 23818.0, 38830.0, 62252.0, 96005.0, 133198.0, 158318.0, 152935.0, 121616.0, 84411.0, 53890.0, 33435.0, 20194.0, 12478.0, 7574.0, 4572.0, 2874.0, 1816.0, 1160.0, 758.0, 439.0, 289.0, 183.0, 126.0, 73.0, 50.0, 38.0, 24.0, 14.0, 13.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.203125, -7.96771240234375, -7.7322998046875, -7.49688720703125, -7.261474609375, -7.02606201171875, -6.7906494140625, -6.55523681640625, -6.31982421875, -6.08441162109375, -5.8489990234375, -5.61358642578125, -5.378173828125, -5.14276123046875, -4.9073486328125, -4.67193603515625, -4.4365234375, -4.20111083984375, -3.9656982421875, -3.73028564453125, -3.494873046875, -3.25946044921875, -3.0240478515625, -2.78863525390625, -2.55322265625, -2.31781005859375, -2.0823974609375, -1.84698486328125, -1.611572265625, -1.37615966796875, -1.1407470703125, -0.90533447265625, -0.669921875, -0.43450927734375, -0.1990966796875, 0.03631591796875, 0.271728515625, 0.50714111328125, 0.7425537109375, 0.97796630859375, 1.21337890625, 1.44879150390625, 1.6842041015625, 1.91961669921875, 2.155029296875, 2.39044189453125, 2.6258544921875, 2.86126708984375, 3.0966796875, 3.33209228515625, 3.5675048828125, 3.80291748046875, 4.038330078125, 4.27374267578125, 4.5091552734375, 4.74456787109375, 4.97998046875, 5.21539306640625, 5.4508056640625, 5.68621826171875, 5.921630859375, 6.15704345703125, 6.3924560546875, 6.62786865234375, 6.86328125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 18.0, 7.0, 16.0, 16.0, 18.0, 21.0, 21.0, 16.0, 24.0, 30.0, 28.0, 28.0, 42.0, 34.0, 37.0, 33.0, 53.0, 48.0, 42.0, 36.0, 41.0, 38.0, 28.0, 33.0, 35.0, 22.0, 22.0, 30.0, 21.0, 20.0, 26.0, 12.0, 13.0, 12.0, 10.0, 8.0, 5.0, 7.0, 5.0, 6.0, 1.0, 2.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-10.8671875, -10.545654296875, -10.22412109375, -9.902587890625, -9.5810546875, -9.259521484375, -8.93798828125, -8.616455078125, -8.294921875, -7.973388671875, -7.65185546875, -7.330322265625, -7.0087890625, -6.687255859375, -6.36572265625, -6.044189453125, -5.72265625, -5.401123046875, -5.07958984375, -4.758056640625, -4.4365234375, -4.114990234375, -3.79345703125, -3.471923828125, -3.150390625, -2.828857421875, -2.50732421875, -2.185791015625, -1.8642578125, -1.542724609375, -1.22119140625, -0.899658203125, -0.578125, -0.256591796875, 0.06494140625, 0.386474609375, 0.7080078125, 1.029541015625, 1.35107421875, 1.672607421875, 1.994140625, 2.315673828125, 2.63720703125, 2.958740234375, 3.2802734375, 3.601806640625, 3.92333984375, 4.244873046875, 4.56640625, 4.887939453125, 5.20947265625, 5.531005859375, 5.8525390625, 6.174072265625, 6.49560546875, 6.817138671875, 7.138671875, 7.460205078125, 7.78173828125, 8.103271484375, 8.4248046875, 8.746337890625, 9.06787109375, 9.389404296875, 9.7109375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 6.0, 13.0, 30.0, 30.0, 60.0, 107.0, 137.0, 218.0, 375.0, 559.0, 942.0, 1442.0, 2177.0, 3493.0, 5462.0, 8363.0, 12458.0, 19489.0, 28945.0, 43342.0, 62049.0, 86835.0, 112118.0, 130437.0, 130229.0, 113620.0, 89010.0, 64686.0, 44421.0, 30527.0, 19766.0, 13126.0, 8548.0, 5592.0, 3552.0, 2402.0, 1443.0, 961.0, 576.0, 369.0, 229.0, 163.0, 99.0, 51.0, 37.0, 31.0, 9.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0], "bins": [-6.75, -6.557373046875, -6.36474609375, -6.172119140625, -5.9794921875, -5.786865234375, -5.59423828125, -5.401611328125, -5.208984375, -5.016357421875, -4.82373046875, -4.631103515625, -4.4384765625, -4.245849609375, -4.05322265625, -3.860595703125, -3.66796875, -3.475341796875, -3.28271484375, -3.090087890625, -2.8974609375, -2.704833984375, -2.51220703125, -2.319580078125, -2.126953125, -1.934326171875, -1.74169921875, -1.549072265625, -1.3564453125, -1.163818359375, -0.97119140625, -0.778564453125, -0.5859375, -0.393310546875, -0.20068359375, -0.008056640625, 0.1845703125, 0.377197265625, 0.56982421875, 0.762451171875, 0.955078125, 1.147705078125, 1.34033203125, 1.532958984375, 1.7255859375, 1.918212890625, 2.11083984375, 2.303466796875, 2.49609375, 2.688720703125, 2.88134765625, 3.073974609375, 3.2666015625, 3.459228515625, 3.65185546875, 3.844482421875, 4.037109375, 4.229736328125, 4.42236328125, 4.614990234375, 4.8076171875, 5.000244140625, 5.19287109375, 5.385498046875, 5.578125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 7.0, 11.0, 9.0, 14.0, 14.0, 11.0, 15.0, 11.0, 20.0, 26.0, 30.0, 37.0, 21.0, 27.0, 36.0, 27.0, 35.0, 43.0, 34.0, 36.0, 45.0, 42.0, 41.0, 47.0, 28.0, 29.0, 41.0, 31.0, 31.0, 27.0, 28.0, 22.0, 10.0, 18.0, 16.0, 10.0, 7.0, 13.0, 4.0, 17.0, 5.0, 8.0, 3.0, 5.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.60546875, -5.41937255859375, -5.2332763671875, -5.04718017578125, -4.861083984375, -4.67498779296875, -4.4888916015625, -4.30279541015625, -4.11669921875, -3.93060302734375, -3.7445068359375, -3.55841064453125, -3.372314453125, -3.18621826171875, -3.0001220703125, -2.81402587890625, -2.6279296875, -2.44183349609375, -2.2557373046875, -2.06964111328125, -1.883544921875, -1.69744873046875, -1.5113525390625, -1.32525634765625, -1.13916015625, -0.95306396484375, -0.7669677734375, -0.58087158203125, -0.394775390625, -0.20867919921875, -0.0225830078125, 0.16351318359375, 0.349609375, 0.53570556640625, 0.7218017578125, 0.90789794921875, 1.093994140625, 1.28009033203125, 1.4661865234375, 1.65228271484375, 1.83837890625, 2.02447509765625, 2.2105712890625, 2.39666748046875, 2.582763671875, 2.76885986328125, 2.9549560546875, 3.14105224609375, 3.3271484375, 3.51324462890625, 3.6993408203125, 3.88543701171875, 4.071533203125, 4.25762939453125, 4.4437255859375, 4.62982177734375, 4.81591796875, 5.00201416015625, 5.1881103515625, 5.37420654296875, 5.560302734375, 5.74639892578125, 5.9324951171875, 6.11859130859375, 6.3046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 11.0, 17.0, 18.0, 33.0, 39.0, 37.0, 87.0, 114.0, 175.0, 291.0, 423.0, 706.0, 1181.0, 1953.0, 3532.0, 6386.0, 12384.0, 24039.0, 48388.0, 96330.0, 177000.0, 241325.0, 199550.0, 114678.0, 58698.0, 28744.0, 14703.0, 7689.0, 4250.0, 2286.0, 1304.0, 800.0, 480.0, 292.0, 208.0, 120.0, 86.0, 65.0, 35.0, 31.0, 19.0, 12.0, 9.0, 6.0, 5.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.943359375, -3.82611083984375, -3.7088623046875, -3.59161376953125, -3.474365234375, -3.35711669921875, -3.2398681640625, -3.12261962890625, -3.00537109375, -2.88812255859375, -2.7708740234375, -2.65362548828125, -2.536376953125, -2.41912841796875, -2.3018798828125, -2.18463134765625, -2.0673828125, -1.95013427734375, -1.8328857421875, -1.71563720703125, -1.598388671875, -1.48114013671875, -1.3638916015625, -1.24664306640625, -1.12939453125, -1.01214599609375, -0.8948974609375, -0.77764892578125, -0.660400390625, -0.54315185546875, -0.4259033203125, -0.30865478515625, -0.19140625, -0.07415771484375, 0.0430908203125, 0.16033935546875, 0.277587890625, 0.39483642578125, 0.5120849609375, 0.62933349609375, 0.74658203125, 0.86383056640625, 0.9810791015625, 1.09832763671875, 1.215576171875, 1.33282470703125, 1.4500732421875, 1.56732177734375, 1.6845703125, 1.80181884765625, 1.9190673828125, 2.03631591796875, 2.153564453125, 2.27081298828125, 2.3880615234375, 2.50531005859375, 2.62255859375, 2.73980712890625, 2.8570556640625, 2.97430419921875, 3.091552734375, 3.20880126953125, 3.3260498046875, 3.44329833984375, 3.560546875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 7.0, 6.0, 7.0, 5.0, 5.0, 9.0, 21.0, 13.0, 17.0, 18.0, 27.0, 36.0, 28.0, 43.0, 46.0, 38.0, 42.0, 36.0, 62.0, 52.0, 53.0, 39.0, 54.0, 38.0, 32.0, 32.0, 44.0, 31.0, 20.0, 35.0, 22.0, 18.0, 14.0, 5.0, 8.0, 11.0, 7.0, 7.0, 5.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001424551010131836, -0.00013708136975765228, -0.00013170763850212097, -0.00012633390724658966, -0.00012096017599105835, -0.00011558644473552704, -0.00011021271347999573, -0.00010483898222446442, -9.94652509689331e-05, -9.40915197134018e-05, -8.871778845787048e-05, -8.334405720233917e-05, -7.797032594680786e-05, -7.259659469127655e-05, -6.722286343574524e-05, -6.184913218021393e-05, -5.647540092468262e-05, -5.1101669669151306e-05, -4.5727938413619995e-05, -4.0354207158088684e-05, -3.498047590255737e-05, -2.9606744647026062e-05, -2.423301339149475e-05, -1.885928213596344e-05, -1.3485550880432129e-05, -8.111819624900818e-06, -2.738088369369507e-06, 2.635642886161804e-06, 8.009374141693115e-06, 1.3383105397224426e-05, 1.8756836652755737e-05, 2.413056790828705e-05, 2.950429916381836e-05, 3.487803041934967e-05, 4.025176167488098e-05, 4.562549293041229e-05, 5.0999224185943604e-05, 5.6372955441474915e-05, 6.174668669700623e-05, 6.712041795253754e-05, 7.249414920806885e-05, 7.786788046360016e-05, 8.324161171913147e-05, 8.861534297466278e-05, 9.398907423019409e-05, 9.93628054857254e-05, 0.00010473653674125671, 0.00011011026799678802, 0.00011548399925231934, 0.00012085773050785065, 0.00012623146176338196, 0.00013160519301891327, 0.00013697892427444458, 0.0001423526555299759, 0.0001477263867855072, 0.0001531001180410385, 0.00015847384929656982, 0.00016384758055210114, 0.00016922131180763245, 0.00017459504306316376, 0.00017996877431869507, 0.00018534250557422638, 0.0001907162368297577, 0.000196089968085289, 0.0002014636993408203]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 6.0, 11.0, 11.0, 42.0, 54.0, 71.0, 109.0, 157.0, 222.0, 340.0, 474.0, 759.0, 1064.0, 1526.0, 2314.0, 3432.0, 5357.0, 8194.0, 12475.0, 19668.0, 30793.0, 48332.0, 74044.0, 108514.0, 142528.0, 156666.0, 137148.0, 101852.0, 68318.0, 43866.0, 28496.0, 17992.0, 11391.0, 7331.0, 4893.0, 3294.0, 2235.0, 1495.0, 974.0, 674.0, 460.0, 316.0, 224.0, 123.0, 100.0, 80.0, 42.0, 33.0, 20.0, 13.0, 10.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.31640625, -2.242645263671875, -2.16888427734375, -2.095123291015625, -2.0213623046875, -1.947601318359375, -1.87384033203125, -1.800079345703125, -1.726318359375, -1.652557373046875, -1.57879638671875, -1.505035400390625, -1.4312744140625, -1.357513427734375, -1.28375244140625, -1.209991455078125, -1.13623046875, -1.062469482421875, -0.98870849609375, -0.914947509765625, -0.8411865234375, -0.767425537109375, -0.69366455078125, -0.619903564453125, -0.546142578125, -0.472381591796875, -0.39862060546875, -0.324859619140625, -0.2510986328125, -0.177337646484375, -0.10357666015625, -0.029815673828125, 0.0439453125, 0.117706298828125, 0.19146728515625, 0.265228271484375, 0.3389892578125, 0.412750244140625, 0.48651123046875, 0.560272216796875, 0.634033203125, 0.707794189453125, 0.78155517578125, 0.855316162109375, 0.9290771484375, 1.002838134765625, 1.07659912109375, 1.150360107421875, 1.22412109375, 1.297882080078125, 1.37164306640625, 1.445404052734375, 1.5191650390625, 1.592926025390625, 1.66668701171875, 1.740447998046875, 1.814208984375, 1.887969970703125, 1.96173095703125, 2.035491943359375, 2.1092529296875, 2.183013916015625, 2.25677490234375, 2.330535888671875, 2.404296875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 7.0, 18.0, 14.0, 18.0, 26.0, 24.0, 35.0, 58.0, 39.0, 47.0, 47.0, 61.0, 62.0, 51.0, 67.0, 44.0, 49.0, 45.0, 42.0, 43.0, 36.0, 26.0, 29.0, 25.0, 13.0, 18.0, 5.0, 8.0, 4.0, 5.0, 6.0, 1.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0159149169921875, -0.979095458984375, -0.9422760009765625, -0.90545654296875, -0.8686370849609375, -0.831817626953125, -0.7949981689453125, -0.7581787109375, -0.7213592529296875, -0.684539794921875, -0.6477203369140625, -0.61090087890625, -0.5740814208984375, -0.537261962890625, -0.5004425048828125, -0.463623046875, -0.4268035888671875, -0.389984130859375, -0.3531646728515625, -0.31634521484375, -0.2795257568359375, -0.242706298828125, -0.2058868408203125, -0.1690673828125, -0.1322479248046875, -0.095428466796875, -0.0586090087890625, -0.02178955078125, 0.0150299072265625, 0.051849365234375, 0.0886688232421875, 0.12548828125, 0.1623077392578125, 0.199127197265625, 0.2359466552734375, 0.27276611328125, 0.3095855712890625, 0.346405029296875, 0.3832244873046875, 0.4200439453125, 0.4568634033203125, 0.493682861328125, 0.5305023193359375, 0.56732177734375, 0.6041412353515625, 0.640960693359375, 0.6777801513671875, 0.714599609375, 0.7514190673828125, 0.788238525390625, 0.8250579833984375, 0.86187744140625, 0.8986968994140625, 0.935516357421875, 0.9723358154296875, 1.0091552734375, 1.0459747314453125, 1.082794189453125, 1.1196136474609375, 1.15643310546875, 1.1932525634765625, 1.230072021484375, 1.2668914794921875, 1.3037109375]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 9.0, 16.0, 13.0, 21.0, 19.0, 24.0, 35.0, 39.0, 45.0, 63.0, 55.0, 85.0, 84.0, 59.0, 87.0, 65.0, 41.0, 39.0, 35.0, 36.0, 23.0, 18.0, 17.0, 17.0, 12.0, 6.0, 2.0, 5.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-11.081822395324707, -10.724729537963867, -10.367636680603027, -10.010543823242188, -9.653450965881348, -9.296358108520508, -8.939264297485352, -8.582172393798828, -8.225078582763672, -7.867985725402832, -7.510892868041992, -7.153800010681152, -6.7967071533203125, -6.439614295959473, -6.082520961761475, -5.725428104400635, -5.368335723876953, -5.011242866516113, -4.654150009155273, -4.297057151794434, -3.9399640560150146, -3.582871198654175, -3.225778102874756, -2.868685245513916, -2.511592388153076, -2.1544995307922363, -1.797406554222107, -1.4403135776519775, -1.0832207202911377, -0.7261278629302979, -0.3690347671508789, -0.011941909790039062, 0.3451519012451172, 0.7022448182106018, 1.0593377351760864, 1.4164307117462158, 1.7735235691070557, 2.1306164264678955, 2.4877095222473145, 2.8448023796081543, 3.201895236968994, 3.558988094329834, 3.916080951690674, 4.273174285888672, 4.630267143249512, 4.987360000610352, 5.344452857971191, 5.701545715332031, 6.058638572692871, 6.415731430053711, 6.772824287414551, 7.129917144775391, 7.4870100021362305, 7.84410285949707, 8.201196670532227, 8.55828857421875, 8.915382385253906, 9.272475242614746, 9.629568099975586, 9.986660957336426, 10.343753814697266, 10.700846672058105, 11.057939529418945, 11.415033340454102, 11.772125244140625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 14.0, 7.0, 5.0, 11.0, 11.0, 15.0, 18.0, 17.0, 27.0, 19.0, 24.0, 23.0, 36.0, 39.0, 34.0, 40.0, 38.0, 39.0, 48.0, 46.0, 33.0, 27.0, 51.0, 37.0, 37.0, 35.0, 27.0, 29.0, 29.0, 26.0, 26.0, 16.0, 18.0, 13.0, 15.0, 15.0, 9.0, 11.0, 6.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.22400188446045, -10.891515731811523, -10.559028625488281, -10.226542472839355, -9.894055366516113, -9.561569213867188, -9.229082107543945, -8.89659595489502, -8.564109802246094, -8.231623649597168, -7.899136543273926, -7.566650390625, -7.234163761138916, -6.901677131652832, -6.569190502166748, -6.236703872680664, -5.90421724319458, -5.571730613708496, -5.239243984222412, -4.906757354736328, -4.574271202087402, -4.241784572601318, -3.9092979431152344, -3.5768115520477295, -3.2443249225616455, -2.9118382930755615, -2.5793519020080566, -2.2468652725219727, -1.9143787622451782, -1.5818922519683838, -1.2494056224822998, -0.9169192314147949, -0.5844326019287109, -0.2519460618495941, 0.0805404782295227, 0.4130270481109619, 0.7455135583877563, 1.0780000686645508, 1.4104866981506348, 1.7429730892181396, 2.0754597187042236, 2.4079463481903076, 2.7404327392578125, 3.0729193687438965, 3.4054059982299805, 3.7378923892974854, 4.070379257202148, 4.402865409851074, 4.735352039337158, 5.067838668823242, 5.400325298309326, 5.73281192779541, 6.065298080444336, 6.39778470993042, 6.730271339416504, 7.06275749206543, 7.395244598388672, 7.727731227874756, 8.06021785736084, 8.392704010009766, 8.725191116333008, 9.057677268981934, 9.39016342163086, 9.722650527954102, 10.055136680603027]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 6.0, 15.0, 20.0, 21.0, 50.0, 46.0, 95.0, 153.0, 201.0, 329.0, 418.0, 665.0, 934.0, 1490.0, 2306.0, 3320.0, 5111.0, 7567.0, 12006.0, 19203.0, 31083.0, 52066.0, 88844.0, 156101.0, 273336.0, 465255.0, 710238.0, 808793.0, 626886.0, 390116.0, 225204.0, 127813.0, 73528.0, 42505.0, 25722.0, 15255.0, 9538.0, 6104.0, 3948.0, 2523.0, 1691.0, 1205.0, 814.0, 506.0, 381.0, 274.0, 187.0, 148.0, 83.0, 51.0, 51.0, 36.0, 16.0, 13.0, 9.0, 3.0, 8.0, 1.0, 2.0, 0.0, 3.0], "bins": [-7.89453125, -7.63421630859375, -7.3739013671875, -7.11358642578125, -6.853271484375, -6.59295654296875, -6.3326416015625, -6.07232666015625, -5.81201171875, -5.55169677734375, -5.2913818359375, -5.03106689453125, -4.770751953125, -4.51043701171875, -4.2501220703125, -3.98980712890625, -3.7294921875, -3.46917724609375, -3.2088623046875, -2.94854736328125, -2.688232421875, -2.42791748046875, -2.1676025390625, -1.90728759765625, -1.64697265625, -1.38665771484375, -1.1263427734375, -0.86602783203125, -0.605712890625, -0.34539794921875, -0.0850830078125, 0.17523193359375, 0.435546875, 0.69586181640625, 0.9561767578125, 1.21649169921875, 1.476806640625, 1.73712158203125, 1.9974365234375, 2.25775146484375, 2.51806640625, 2.77838134765625, 3.0386962890625, 3.29901123046875, 3.559326171875, 3.81964111328125, 4.0799560546875, 4.34027099609375, 4.6005859375, 4.86090087890625, 5.1212158203125, 5.38153076171875, 5.641845703125, 5.90216064453125, 6.1624755859375, 6.42279052734375, 6.68310546875, 6.94342041015625, 7.2037353515625, 7.46405029296875, 7.724365234375, 7.98468017578125, 8.2449951171875, 8.50531005859375, 8.765625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 6.0, 4.0, 8.0, 9.0, 8.0, 13.0, 9.0, 14.0, 14.0, 21.0, 16.0, 23.0, 34.0, 27.0, 27.0, 23.0, 28.0, 45.0, 43.0, 37.0, 36.0, 45.0, 41.0, 30.0, 32.0, 44.0, 45.0, 42.0, 22.0, 23.0, 28.0, 26.0, 34.0, 18.0, 16.0, 18.0, 18.0, 16.0, 10.0, 8.0, 10.0, 5.0, 6.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.3046875, -7.09173583984375, -6.8787841796875, -6.66583251953125, -6.452880859375, -6.23992919921875, -6.0269775390625, -5.81402587890625, -5.60107421875, -5.38812255859375, -5.1751708984375, -4.96221923828125, -4.749267578125, -4.53631591796875, -4.3233642578125, -4.11041259765625, -3.8974609375, -3.68450927734375, -3.4715576171875, -3.25860595703125, -3.045654296875, -2.83270263671875, -2.6197509765625, -2.40679931640625, -2.19384765625, -1.98089599609375, -1.7679443359375, -1.55499267578125, -1.342041015625, -1.12908935546875, -0.9161376953125, -0.70318603515625, -0.490234375, -0.27728271484375, -0.0643310546875, 0.14862060546875, 0.361572265625, 0.57452392578125, 0.7874755859375, 1.00042724609375, 1.21337890625, 1.42633056640625, 1.6392822265625, 1.85223388671875, 2.065185546875, 2.27813720703125, 2.4910888671875, 2.70404052734375, 2.9169921875, 3.12994384765625, 3.3428955078125, 3.55584716796875, 3.768798828125, 3.98175048828125, 4.1947021484375, 4.40765380859375, 4.62060546875, 4.83355712890625, 5.0465087890625, 5.25946044921875, 5.472412109375, 5.68536376953125, 5.8983154296875, 6.11126708984375, 6.32421875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 12.0, 15.0, 22.0, 38.0, 57.0, 95.0, 158.0, 243.0, 379.0, 625.0, 1031.0, 1758.0, 2932.0, 5163.0, 8974.0, 15686.0, 27726.0, 49737.0, 90216.0, 162717.0, 289507.0, 488551.0, 714847.0, 789462.0, 627758.0, 399100.0, 228724.0, 126916.0, 70722.0, 39228.0, 21749.0, 12501.0, 7327.0, 4201.0, 2491.0, 1461.0, 801.0, 511.0, 330.0, 187.0, 125.0, 73.0, 65.0, 20.0, 18.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.84375, -8.578125, -8.3125, -8.046875, -7.78125, -7.515625, -7.25, -6.984375, -6.71875, -6.453125, -6.1875, -5.921875, -5.65625, -5.390625, -5.125, -4.859375, -4.59375, -4.328125, -4.0625, -3.796875, -3.53125, -3.265625, -3.0, -2.734375, -2.46875, -2.203125, -1.9375, -1.671875, -1.40625, -1.140625, -0.875, -0.609375, -0.34375, -0.078125, 0.1875, 0.453125, 0.71875, 0.984375, 1.25, 1.515625, 1.78125, 2.046875, 2.3125, 2.578125, 2.84375, 3.109375, 3.375, 3.640625, 3.90625, 4.171875, 4.4375, 4.703125, 4.96875, 5.234375, 5.5, 5.765625, 6.03125, 6.296875, 6.5625, 6.828125, 7.09375, 7.359375, 7.625, 7.890625, 8.15625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 8.0, 2.0, 10.0, 9.0, 16.0, 34.0, 32.0, 32.0, 50.0, 82.0, 93.0, 104.0, 157.0, 148.0, 170.0, 214.0, 235.0, 264.0, 251.0, 276.0, 258.0, 241.0, 205.0, 210.0, 179.0, 164.0, 132.0, 92.0, 82.0, 80.0, 53.0, 44.0, 34.0, 36.0, 27.0, 21.0, 11.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -4.00286865234375, -3.8729248046875, -3.74298095703125, -3.613037109375, -3.48309326171875, -3.3531494140625, -3.22320556640625, -3.09326171875, -2.96331787109375, -2.8333740234375, -2.70343017578125, -2.573486328125, -2.44354248046875, -2.3135986328125, -2.18365478515625, -2.0537109375, -1.92376708984375, -1.7938232421875, -1.66387939453125, -1.533935546875, -1.40399169921875, -1.2740478515625, -1.14410400390625, -1.01416015625, -0.88421630859375, -0.7542724609375, -0.62432861328125, -0.494384765625, -0.36444091796875, -0.2344970703125, -0.10455322265625, 0.025390625, 0.15533447265625, 0.2852783203125, 0.41522216796875, 0.545166015625, 0.67510986328125, 0.8050537109375, 0.93499755859375, 1.06494140625, 1.19488525390625, 1.3248291015625, 1.45477294921875, 1.584716796875, 1.71466064453125, 1.8446044921875, 1.97454833984375, 2.1044921875, 2.23443603515625, 2.3643798828125, 2.49432373046875, 2.624267578125, 2.75421142578125, 2.8841552734375, 3.01409912109375, 3.14404296875, 3.27398681640625, 3.4039306640625, 3.53387451171875, 3.663818359375, 3.79376220703125, 3.9237060546875, 4.05364990234375, 4.18359375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 6.0, 8.0, 12.0, 19.0, 16.0, 23.0, 26.0, 42.0, 42.0, 53.0, 57.0, 77.0, 67.0, 75.0, 78.0, 68.0, 52.0, 41.0, 36.0, 31.0, 31.0, 23.0, 24.0, 18.0, 11.0, 10.0, 8.0, 9.0, 7.0, 1.0, 6.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.856438636779785, -10.503210067749023, -10.149981498718262, -9.7967529296875, -9.443523406982422, -9.09029483795166, -8.737066268920898, -8.383837699890137, -8.030609130859375, -7.677380561828613, -7.324151515960693, -6.970922946929932, -6.617693901062012, -6.26446533203125, -5.911236763000488, -5.558008193969727, -5.204778671264648, -4.851550102233887, -4.498321056365967, -4.145092487335205, -3.7918636798858643, -3.4386348724365234, -3.0854063034057617, -2.732177495956421, -2.37894868850708, -2.0257198810577393, -1.672491192817688, -1.3192625045776367, -0.9660336971282959, -0.6128048896789551, -0.25957632064819336, 0.09365248680114746, 0.4468812942504883, 0.8001100420951843, 1.1533387899398804, 1.5065674781799316, 1.8597962856292725, 2.2130250930786133, 2.566253662109375, 2.919482469558716, 3.2727112770080566, 3.6259400844573975, 3.9791688919067383, 4.3323974609375, 4.685626029968262, 5.038855075836182, 5.392083644866943, 5.745312690734863, 6.098541259765625, 6.451769828796387, 6.804998874664307, 7.158227443695068, 7.511456489562988, 7.86468505859375, 8.217913627624512, 8.571142196655273, 8.924371719360352, 9.277600288391113, 9.630828857421875, 9.984058380126953, 10.337286949157715, 10.690515518188477, 11.043744087219238, 11.39697265625, 11.750201225280762]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 7.0, 8.0, 9.0, 8.0, 9.0, 16.0, 16.0, 13.0, 26.0, 22.0, 24.0, 27.0, 28.0, 26.0, 35.0, 31.0, 33.0, 48.0, 43.0, 28.0, 39.0, 46.0, 34.0, 48.0, 44.0, 43.0, 45.0, 21.0, 28.0, 25.0, 34.0, 17.0, 15.0, 19.0, 13.0, 11.0, 9.0, 17.0, 7.0, 6.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.68309497833252, -9.377996444702148, -9.072898864746094, -8.767800331115723, -8.462702751159668, -8.157604217529297, -7.852506160736084, -7.547408103942871, -7.242310047149658, -6.937211990356445, -6.632113933563232, -6.3270158767700195, -6.021917343139648, -5.716819763183594, -5.411721229553223, -5.10662317276001, -4.801525115966797, -4.496427059173584, -4.191329002380371, -3.886230707168579, -3.581132650375366, -3.2760345935821533, -2.9709362983703613, -2.6658382415771484, -2.3607401847839355, -2.0556421279907227, -1.7505439519882202, -1.4454457759857178, -1.1403477191925049, -0.835249662399292, -0.5301514863967896, -0.2250533103942871, 0.08004570007324219, 0.38514381647109985, 0.6902419328689575, 0.9953400492668152, 1.3004381656646729, 1.6055362224578857, 1.9106343984603882, 2.2157325744628906, 2.5208306312561035, 2.8259286880493164, 3.1310267448425293, 3.4361250400543213, 3.741223096847534, 4.046320915222168, 4.351419448852539, 4.656517505645752, 4.961615562438965, 5.266713619232178, 5.571811676025391, 5.8769097328186035, 6.182007789611816, 6.4871063232421875, 6.7922043800354, 7.097302436828613, 7.402400493621826, 7.707498550415039, 8.01259708404541, 8.317694664001465, 8.622793197631836, 8.92789077758789, 9.232989311218262, 9.538087844848633, 9.843185424804688]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 11.0, 9.0, 14.0, 17.0, 28.0, 65.0, 105.0, 178.0, 292.0, 462.0, 727.0, 1255.0, 2004.0, 3287.0, 5547.0, 9323.0, 16040.0, 27724.0, 48210.0, 83967.0, 145039.0, 219588.0, 197939.0, 121020.0, 70193.0, 39903.0, 22827.0, 13228.0, 7860.0, 4621.0, 2782.0, 1678.0, 1060.0, 587.0, 394.0, 219.0, 144.0, 79.0, 42.0, 37.0, 22.0, 9.0, 10.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.4599609375, -1.4180450439453125, -1.376129150390625, -1.3342132568359375, -1.29229736328125, -1.2503814697265625, -1.208465576171875, -1.1665496826171875, -1.1246337890625, -1.0827178955078125, -1.040802001953125, -0.9988861083984375, -0.95697021484375, -0.9150543212890625, -0.873138427734375, -0.8312225341796875, -0.789306640625, -0.7473907470703125, -0.705474853515625, -0.6635589599609375, -0.62164306640625, -0.5797271728515625, -0.537811279296875, -0.4958953857421875, -0.4539794921875, -0.4120635986328125, -0.370147705078125, -0.3282318115234375, -0.28631591796875, -0.2444000244140625, -0.202484130859375, -0.1605682373046875, -0.11865234375, -0.0767364501953125, -0.034820556640625, 0.0070953369140625, 0.04901123046875, 0.0909271240234375, 0.132843017578125, 0.1747589111328125, 0.2166748046875, 0.2585906982421875, 0.300506591796875, 0.3424224853515625, 0.38433837890625, 0.4262542724609375, 0.468170166015625, 0.5100860595703125, 0.552001953125, 0.5939178466796875, 0.635833740234375, 0.6777496337890625, 0.71966552734375, 0.7615814208984375, 0.803497314453125, 0.8454132080078125, 0.8873291015625, 0.9292449951171875, 0.971160888671875, 1.0130767822265625, 1.05499267578125, 1.0969085693359375, 1.138824462890625, 1.1807403564453125, 1.22265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 7.0, 8.0, 7.0, 10.0, 21.0, 13.0, 17.0, 20.0, 23.0, 21.0, 26.0, 45.0, 33.0, 27.0, 25.0, 41.0, 45.0, 52.0, 45.0, 38.0, 42.0, 33.0, 46.0, 41.0, 39.0, 37.0, 32.0, 27.0, 33.0, 21.0, 23.0, 14.0, 12.0, 10.0, 14.0, 16.0, 11.0, 4.0, 5.0, 3.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-11.0546875, -10.7337646484375, -10.412841796875, -10.0919189453125, -9.77099609375, -9.4500732421875, -9.129150390625, -8.8082275390625, -8.4873046875, -8.1663818359375, -7.845458984375, -7.5245361328125, -7.20361328125, -6.8826904296875, -6.561767578125, -6.2408447265625, -5.919921875, -5.5989990234375, -5.278076171875, -4.9571533203125, -4.63623046875, -4.3153076171875, -3.994384765625, -3.6734619140625, -3.3525390625, -3.0316162109375, -2.710693359375, -2.3897705078125, -2.06884765625, -1.7479248046875, -1.427001953125, -1.1060791015625, -0.78515625, -0.4642333984375, -0.143310546875, 0.1776123046875, 0.49853515625, 0.8194580078125, 1.140380859375, 1.4613037109375, 1.7822265625, 2.1031494140625, 2.424072265625, 2.7449951171875, 3.06591796875, 3.3868408203125, 3.707763671875, 4.0286865234375, 4.349609375, 4.6705322265625, 4.991455078125, 5.3123779296875, 5.63330078125, 5.9542236328125, 6.275146484375, 6.5960693359375, 6.9169921875, 7.2379150390625, 7.558837890625, 7.8797607421875, 8.20068359375, 8.5216064453125, 8.842529296875, 9.1634521484375, 9.484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 16.0, 22.0, 30.0, 50.0, 75.0, 85.0, 170.0, 219.0, 408.0, 672.0, 1171.0, 1902.0, 2973.0, 5463.0, 9498.0, 16348.0, 28320.0, 49604.0, 86246.0, 147697.0, 230349.0, 193806.0, 115942.0, 66554.0, 38549.0, 21985.0, 12572.0, 7296.0, 4248.0, 2509.0, 1451.0, 866.0, 552.0, 333.0, 202.0, 115.0, 75.0, 71.0, 31.0, 24.0, 20.0, 15.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.296875, -1.2533111572265625, -1.209747314453125, -1.1661834716796875, -1.12261962890625, -1.0790557861328125, -1.035491943359375, -0.9919281005859375, -0.9483642578125, -0.9048004150390625, -0.861236572265625, -0.8176727294921875, -0.77410888671875, -0.7305450439453125, -0.686981201171875, -0.6434173583984375, -0.599853515625, -0.5562896728515625, -0.512725830078125, -0.4691619873046875, -0.42559814453125, -0.3820343017578125, -0.338470458984375, -0.2949066162109375, -0.2513427734375, -0.2077789306640625, -0.164215087890625, -0.1206512451171875, -0.07708740234375, -0.0335235595703125, 0.010040283203125, 0.0536041259765625, 0.09716796875, 0.1407318115234375, 0.184295654296875, 0.2278594970703125, 0.27142333984375, 0.3149871826171875, 0.358551025390625, 0.4021148681640625, 0.4456787109375, 0.4892425537109375, 0.532806396484375, 0.5763702392578125, 0.61993408203125, 0.6634979248046875, 0.707061767578125, 0.7506256103515625, 0.794189453125, 0.8377532958984375, 0.881317138671875, 0.9248809814453125, 0.96844482421875, 1.0120086669921875, 1.055572509765625, 1.0991363525390625, 1.1427001953125, 1.1862640380859375, 1.229827880859375, 1.2733917236328125, 1.31695556640625, 1.3605194091796875, 1.404083251953125, 1.4476470947265625, 1.4912109375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 9.0, 11.0, 15.0, 9.0, 21.0, 20.0, 19.0, 21.0, 21.0, 19.0, 25.0, 34.0, 29.0, 37.0, 45.0, 41.0, 43.0, 51.0, 42.0, 40.0, 53.0, 37.0, 44.0, 31.0, 29.0, 33.0, 20.0, 26.0, 22.0, 20.0, 18.0, 15.0, 8.0, 13.0, 15.0, 16.0, 7.0, 11.0, 3.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.34765625, -6.142578125, -5.9375, -5.732421875, -5.52734375, -5.322265625, -5.1171875, -4.912109375, -4.70703125, -4.501953125, -4.296875, -4.091796875, -3.88671875, -3.681640625, -3.4765625, -3.271484375, -3.06640625, -2.861328125, -2.65625, -2.451171875, -2.24609375, -2.041015625, -1.8359375, -1.630859375, -1.42578125, -1.220703125, -1.015625, -0.810546875, -0.60546875, -0.400390625, -0.1953125, 0.009765625, 0.21484375, 0.419921875, 0.625, 0.830078125, 1.03515625, 1.240234375, 1.4453125, 1.650390625, 1.85546875, 2.060546875, 2.265625, 2.470703125, 2.67578125, 2.880859375, 3.0859375, 3.291015625, 3.49609375, 3.701171875, 3.90625, 4.111328125, 4.31640625, 4.521484375, 4.7265625, 4.931640625, 5.13671875, 5.341796875, 5.546875, 5.751953125, 5.95703125, 6.162109375, 6.3671875, 6.572265625, 6.77734375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 2.0, 12.0, 10.0, 16.0, 31.0, 25.0, 34.0, 57.0, 79.0, 137.0, 165.0, 279.0, 434.0, 742.0, 1235.0, 2277.0, 4383.0, 9960.0, 27558.0, 108758.0, 569715.0, 244847.0, 49078.0, 15252.0, 6342.0, 3020.0, 1589.0, 922.0, 536.0, 352.0, 213.0, 131.0, 114.0, 65.0, 49.0, 42.0, 26.0, 12.0, 14.0, 7.0, 6.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.397705078125, -0.38625335693359375, -0.3748016357421875, -0.36334991455078125, -0.351898193359375, -0.34044647216796875, -0.3289947509765625, -0.31754302978515625, -0.30609130859375, -0.29463958740234375, -0.2831878662109375, -0.27173614501953125, -0.260284423828125, -0.24883270263671875, -0.2373809814453125, -0.22592926025390625, -0.2144775390625, -0.20302581787109375, -0.1915740966796875, -0.18012237548828125, -0.168670654296875, -0.15721893310546875, -0.1457672119140625, -0.13431549072265625, -0.12286376953125, -0.11141204833984375, -0.0999603271484375, -0.08850860595703125, -0.077056884765625, -0.06560516357421875, -0.0541534423828125, -0.04270172119140625, -0.03125, -0.01979827880859375, -0.0083465576171875, 0.00310516357421875, 0.014556884765625, 0.02600860595703125, 0.0374603271484375, 0.04891204833984375, 0.06036376953125, 0.07181549072265625, 0.0832672119140625, 0.09471893310546875, 0.106170654296875, 0.11762237548828125, 0.1290740966796875, 0.14052581787109375, 0.1519775390625, 0.16342926025390625, 0.1748809814453125, 0.18633270263671875, 0.197784423828125, 0.20923614501953125, 0.2206878662109375, 0.23213958740234375, 0.24359130859375, 0.25504302978515625, 0.2664947509765625, 0.27794647216796875, 0.289398193359375, 0.30084991455078125, 0.3123016357421875, 0.32375335693359375, 0.335205078125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 5.0, 11.0, 25.0, 35.0, 35.0, 57.0, 63.0, 74.0, 90.0, 97.0, 77.0, 87.0, 66.0, 52.0, 54.0, 38.0, 26.0, 21.0, 15.0, 25.0, 9.0, 8.0, 9.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.586841583251953e-05, -2.512894570827484e-05, -2.438947558403015e-05, -2.365000545978546e-05, -2.291053533554077e-05, -2.217106521129608e-05, -2.143159508705139e-05, -2.06921249628067e-05, -1.9952654838562012e-05, -1.9213184714317322e-05, -1.8473714590072632e-05, -1.7734244465827942e-05, -1.6994774341583252e-05, -1.6255304217338562e-05, -1.5515834093093872e-05, -1.4776363968849182e-05, -1.4036893844604492e-05, -1.3297423720359802e-05, -1.2557953596115112e-05, -1.1818483471870422e-05, -1.1079013347625732e-05, -1.0339543223381042e-05, -9.600073099136353e-06, -8.860602974891663e-06, -8.121132850646973e-06, -7.381662726402283e-06, -6.642192602157593e-06, -5.902722477912903e-06, -5.163252353668213e-06, -4.423782229423523e-06, -3.684312105178833e-06, -2.944841980934143e-06, -2.205371856689453e-06, -1.4659017324447632e-06, -7.264316082000732e-07, 1.30385160446167e-08, 7.525086402893066e-07, 1.4919787645339966e-06, 2.2314488887786865e-06, 2.9709190130233765e-06, 3.7103891372680664e-06, 4.449859261512756e-06, 5.189329385757446e-06, 5.928799510002136e-06, 6.668269634246826e-06, 7.407739758491516e-06, 8.147209882736206e-06, 8.886680006980896e-06, 9.626150131225586e-06, 1.0365620255470276e-05, 1.1105090379714966e-05, 1.1844560503959656e-05, 1.2584030628204346e-05, 1.3323500752449036e-05, 1.4062970876693726e-05, 1.4802441000938416e-05, 1.5541911125183105e-05, 1.6281381249427795e-05, 1.7020851373672485e-05, 1.7760321497917175e-05, 1.8499791622161865e-05, 1.9239261746406555e-05, 1.9978731870651245e-05, 2.0718201994895935e-05, 2.1457672119140625e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 9.0, 10.0, 19.0, 34.0, 37.0, 56.0, 88.0, 122.0, 179.0, 247.0, 415.0, 615.0, 990.0, 1564.0, 2621.0, 4583.0, 8200.0, 14923.0, 29337.0, 59706.0, 128645.0, 287927.0, 271022.0, 120203.0, 55900.0, 27653.0, 14352.0, 7876.0, 4459.0, 2551.0, 1539.0, 935.0, 582.0, 355.0, 235.0, 179.0, 113.0, 77.0, 56.0, 37.0, 35.0, 17.0, 12.0, 11.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2745780944824219, -0.26570892333984375, -0.2568397521972656, -0.2479705810546875, -0.23910140991210938, -0.23023223876953125, -0.22136306762695312, -0.212493896484375, -0.20362472534179688, -0.19475555419921875, -0.18588638305664062, -0.1770172119140625, -0.16814804077148438, -0.15927886962890625, -0.15040969848632812, -0.14154052734375, -0.13267135620117188, -0.12380218505859375, -0.11493301391601562, -0.1060638427734375, -0.09719467163085938, -0.08832550048828125, -0.07945632934570312, -0.070587158203125, -0.061717987060546875, -0.05284881591796875, -0.043979644775390625, -0.0351104736328125, -0.026241302490234375, -0.01737213134765625, -0.008502960205078125, 0.0003662109375, 0.009235382080078125, 0.01810455322265625, 0.026973724365234375, 0.0358428955078125, 0.044712066650390625, 0.05358123779296875, 0.062450408935546875, 0.071319580078125, 0.08018875122070312, 0.08905792236328125, 0.09792709350585938, 0.1067962646484375, 0.11566543579101562, 0.12453460693359375, 0.13340377807617188, 0.14227294921875, 0.15114212036132812, 0.16001129150390625, 0.16888046264648438, 0.1777496337890625, 0.18661880493164062, 0.19548797607421875, 0.20435714721679688, 0.213226318359375, 0.22209548950195312, 0.23096466064453125, 0.23983383178710938, 0.2487030029296875, 0.2575721740722656, 0.26644134521484375, 0.2753105163574219, 0.2841796875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 6.0, 10.0, 9.0, 16.0, 14.0, 19.0, 24.0, 28.0, 30.0, 27.0, 38.0, 31.0, 42.0, 43.0, 61.0, 58.0, 45.0, 64.0, 47.0, 38.0, 40.0, 34.0, 39.0, 29.0, 31.0, 33.0, 23.0, 21.0, 10.0, 11.0, 15.0, 11.0, 7.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1259765625, -0.12221431732177734, -0.11845207214355469, -0.11468982696533203, -0.11092758178710938, -0.10716533660888672, -0.10340309143066406, -0.0996408462524414, -0.09587860107421875, -0.0921163558959961, -0.08835411071777344, -0.08459186553955078, -0.08082962036132812, -0.07706737518310547, -0.07330513000488281, -0.06954288482666016, -0.0657806396484375, -0.062018394470214844, -0.05825614929199219, -0.05449390411376953, -0.050731658935546875, -0.04696941375732422, -0.04320716857910156, -0.039444923400878906, -0.03568267822265625, -0.031920433044433594, -0.028158187866210938, -0.02439594268798828, -0.020633697509765625, -0.01687145233154297, -0.013109207153320312, -0.009346961975097656, -0.005584716796875, -0.0018224716186523438, 0.0019397735595703125, 0.005702018737792969, 0.009464263916015625, 0.013226509094238281, 0.016988754272460938, 0.020750999450683594, 0.02451324462890625, 0.028275489807128906, 0.03203773498535156, 0.03579998016357422, 0.039562225341796875, 0.04332447052001953, 0.04708671569824219, 0.050848960876464844, 0.0546112060546875, 0.058373451232910156, 0.06213569641113281, 0.06589794158935547, 0.06966018676757812, 0.07342243194580078, 0.07718467712402344, 0.0809469223022461, 0.08470916748046875, 0.0884714126586914, 0.09223365783691406, 0.09599590301513672, 0.09975814819335938, 0.10352039337158203, 0.10728263854980469, 0.11104488372802734, 0.11480712890625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 7.0, 7.0, 8.0, 8.0, 11.0, 17.0, 17.0, 22.0, 32.0, 43.0, 44.0, 48.0, 61.0, 82.0, 66.0, 70.0, 79.0, 71.0, 49.0, 44.0, 30.0, 34.0, 32.0, 18.0, 25.0, 15.0, 12.0, 7.0, 10.0, 9.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.856524467468262, -10.500720024108887, -10.144914627075195, -9.78911018371582, -9.433305740356445, -9.07750129699707, -8.721695899963379, -8.365891456604004, -8.010086059570312, -7.654281139373779, -7.298476696014404, -6.942671775817871, -6.586867332458496, -6.231062412261963, -5.87525749206543, -5.519453048706055, -5.16364860534668, -4.8078436851501465, -4.4520392417907715, -4.096234321594238, -3.740429639816284, -3.38462495803833, -3.028820037841797, -2.6730153560638428, -2.3172106742858887, -1.9614059925079346, -1.605601191520691, -1.2497963905334473, -0.8939917087554932, -0.5381870269775391, -0.18238210678100586, 0.17342257499694824, 0.5292263031005859, 0.8850310444831848, 1.2408357858657837, 1.5966405868530273, 1.9524452686309814, 2.3082499504089355, 2.6640548706054688, 3.019859552383423, 3.375664234161377, 3.731468915939331, 4.087273597717285, 4.443078517913818, 4.798883438110352, 5.154687881469727, 5.51049280166626, 5.866297721862793, 6.222102165222168, 6.577907085418701, 6.933711528778076, 7.289516448974609, 7.645320892333984, 8.00112533569336, 8.35693073272705, 8.712735176086426, 9.068540573120117, 9.424345016479492, 9.780150413513184, 10.135954856872559, 10.491759300231934, 10.847564697265625, 11.203369140625, 11.559173583984375, 11.91497802734375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 9.0, 8.0, 10.0, 17.0, 12.0, 17.0, 24.0, 25.0, 22.0, 26.0, 27.0, 29.0, 34.0, 31.0, 31.0, 49.0, 40.0, 34.0, 42.0, 40.0, 34.0, 47.0, 43.0, 50.0, 37.0, 22.0, 28.0, 25.0, 34.0, 18.0, 16.0, 18.0, 13.0, 11.0, 9.0, 17.0, 8.0, 5.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.623007774353027, -9.319469451904297, -9.01593017578125, -8.71239185333252, -8.408852577209473, -8.105314254760742, -7.8017754554748535, -7.498236656188965, -7.194698333740234, -6.891159534454346, -6.587620735168457, -6.284082412719727, -5.980543613433838, -5.677004814147949, -5.3734660148620605, -5.069927215576172, -4.766388416290283, -4.4628496170043945, -4.159310817718506, -3.8557722568511963, -3.5522336959838867, -3.248694896697998, -2.9451560974121094, -2.6416175365448, -2.338078737258911, -2.0345399379730225, -1.731001377105713, -1.4274625778198242, -1.123923897743225, -0.820385217666626, -0.5168464183807373, -0.21330785751342773, 0.09023094177246094, 0.39376965165138245, 0.697308361530304, 1.0008471012115479, 1.304385781288147, 1.607924461364746, 1.9114632606506348, 2.2150018215179443, 2.518540620803833, 2.8220794200897217, 3.1256179809570312, 3.42915678024292, 3.7326955795288086, 4.036233901977539, 4.339773178100586, 4.643311500549316, 4.946850299835205, 5.250389099121094, 5.553927898406982, 5.857466697692871, 6.161005020141602, 6.46454381942749, 6.768082618713379, 7.071620941162109, 7.375160217285156, 7.678699016571045, 7.982237815856934, 8.285776138305664, 8.589315414428711, 8.892853736877441, 9.196392059326172, 9.499931335449219, 9.80346965789795]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 5.0, 13.0, 15.0, 14.0, 35.0, 46.0, 77.0, 111.0, 153.0, 257.0, 402.0, 629.0, 986.0, 1628.0, 2414.0, 4114.0, 6658.0, 10581.0, 17127.0, 27562.0, 42696.0, 66241.0, 95939.0, 128712.0, 149760.0, 143910.0, 115304.0, 82986.0, 55168.0, 35759.0, 22305.0, 14009.0, 8597.0, 5271.0, 3473.0, 2037.0, 1277.0, 813.0, 531.0, 334.0, 240.0, 134.0, 91.0, 56.0, 33.0, 22.0, 15.0, 11.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.9921875, -6.7789306640625, -6.565673828125, -6.3524169921875, -6.13916015625, -5.9259033203125, -5.712646484375, -5.4993896484375, -5.2861328125, -5.0728759765625, -4.859619140625, -4.6463623046875, -4.43310546875, -4.2198486328125, -4.006591796875, -3.7933349609375, -3.580078125, -3.3668212890625, -3.153564453125, -2.9403076171875, -2.72705078125, -2.5137939453125, -2.300537109375, -2.0872802734375, -1.8740234375, -1.6607666015625, -1.447509765625, -1.2342529296875, -1.02099609375, -0.8077392578125, -0.594482421875, -0.3812255859375, -0.16796875, 0.0452880859375, 0.258544921875, 0.4718017578125, 0.68505859375, 0.8983154296875, 1.111572265625, 1.3248291015625, 1.5380859375, 1.7513427734375, 1.964599609375, 2.1778564453125, 2.39111328125, 2.6043701171875, 2.817626953125, 3.0308837890625, 3.244140625, 3.4573974609375, 3.670654296875, 3.8839111328125, 4.09716796875, 4.3104248046875, 4.523681640625, 4.7369384765625, 4.9501953125, 5.1634521484375, 5.376708984375, 5.5899658203125, 5.80322265625, 6.0164794921875, 6.229736328125, 6.4429931640625, 6.65625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 6.0, 11.0, 8.0, 15.0, 14.0, 16.0, 26.0, 17.0, 18.0, 25.0, 27.0, 30.0, 44.0, 30.0, 34.0, 36.0, 44.0, 39.0, 40.0, 40.0, 46.0, 41.0, 41.0, 43.0, 38.0, 23.0, 24.0, 42.0, 23.0, 17.0, 17.0, 17.0, 16.0, 11.0, 10.0, 14.0, 15.0, 9.0, 4.0, 9.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.0335693359375, -8.731201171875, -8.4288330078125, -8.12646484375, -7.8240966796875, -7.521728515625, -7.2193603515625, -6.9169921875, -6.6146240234375, -6.312255859375, -6.0098876953125, -5.70751953125, -5.4051513671875, -5.102783203125, -4.8004150390625, -4.498046875, -4.1956787109375, -3.893310546875, -3.5909423828125, -3.28857421875, -2.9862060546875, -2.683837890625, -2.3814697265625, -2.0791015625, -1.7767333984375, -1.474365234375, -1.1719970703125, -0.86962890625, -0.5672607421875, -0.264892578125, 0.0374755859375, 0.33984375, 0.6422119140625, 0.944580078125, 1.2469482421875, 1.54931640625, 1.8516845703125, 2.154052734375, 2.4564208984375, 2.7587890625, 3.0611572265625, 3.363525390625, 3.6658935546875, 3.96826171875, 4.2706298828125, 4.572998046875, 4.8753662109375, 5.177734375, 5.4801025390625, 5.782470703125, 6.0848388671875, 6.38720703125, 6.6895751953125, 6.991943359375, 7.2943115234375, 7.5966796875, 7.8990478515625, 8.201416015625, 8.5037841796875, 8.80615234375, 9.1085205078125, 9.410888671875, 9.7132568359375, 10.015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 9.0, 17.0, 24.0, 36.0, 69.0, 100.0, 156.0, 285.0, 428.0, 710.0, 1364.0, 2340.0, 3831.0, 6842.0, 12444.0, 21559.0, 37968.0, 64810.0, 103990.0, 149830.0, 177744.0, 161964.0, 119366.0, 76661.0, 45431.0, 26457.0, 14666.0, 8222.0, 4748.0, 2736.0, 1549.0, 863.0, 524.0, 313.0, 198.0, 101.0, 85.0, 42.0, 22.0, 17.0, 18.0, 8.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.9974365234375, -7.744873046875, -7.4923095703125, -7.23974609375, -6.9871826171875, -6.734619140625, -6.4820556640625, -6.2294921875, -5.9769287109375, -5.724365234375, -5.4718017578125, -5.21923828125, -4.9666748046875, -4.714111328125, -4.4615478515625, -4.208984375, -3.9564208984375, -3.703857421875, -3.4512939453125, -3.19873046875, -2.9461669921875, -2.693603515625, -2.4410400390625, -2.1884765625, -1.9359130859375, -1.683349609375, -1.4307861328125, -1.17822265625, -0.9256591796875, -0.673095703125, -0.4205322265625, -0.16796875, 0.0845947265625, 0.337158203125, 0.5897216796875, 0.84228515625, 1.0948486328125, 1.347412109375, 1.5999755859375, 1.8525390625, 2.1051025390625, 2.357666015625, 2.6102294921875, 2.86279296875, 3.1153564453125, 3.367919921875, 3.6204833984375, 3.873046875, 4.1256103515625, 4.378173828125, 4.6307373046875, 4.88330078125, 5.1358642578125, 5.388427734375, 5.6409912109375, 5.8935546875, 6.1461181640625, 6.398681640625, 6.6512451171875, 6.90380859375, 7.1563720703125, 7.408935546875, 7.6614990234375, 7.9140625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 10.0, 9.0, 18.0, 16.0, 17.0, 25.0, 19.0, 32.0, 34.0, 37.0, 38.0, 30.0, 41.0, 43.0, 40.0, 45.0, 41.0, 48.0, 41.0, 35.0, 39.0, 39.0, 47.0, 30.0, 20.0, 29.0, 41.0, 19.0, 22.0, 16.0, 8.0, 9.0, 11.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.49310302734375, -5.2947998046875, -5.09649658203125, -4.898193359375, -4.69989013671875, -4.5015869140625, -4.30328369140625, -4.10498046875, -3.90667724609375, -3.7083740234375, -3.51007080078125, -3.311767578125, -3.11346435546875, -2.9151611328125, -2.71685791015625, -2.5185546875, -2.32025146484375, -2.1219482421875, -1.92364501953125, -1.725341796875, -1.52703857421875, -1.3287353515625, -1.13043212890625, -0.93212890625, -0.73382568359375, -0.5355224609375, -0.33721923828125, -0.138916015625, 0.05938720703125, 0.2576904296875, 0.45599365234375, 0.654296875, 0.85260009765625, 1.0509033203125, 1.24920654296875, 1.447509765625, 1.64581298828125, 1.8441162109375, 2.04241943359375, 2.24072265625, 2.43902587890625, 2.6373291015625, 2.83563232421875, 3.033935546875, 3.23223876953125, 3.4305419921875, 3.62884521484375, 3.8271484375, 4.02545166015625, 4.2237548828125, 4.42205810546875, 4.620361328125, 4.81866455078125, 5.0169677734375, 5.21527099609375, 5.41357421875, 5.61187744140625, 5.8101806640625, 6.00848388671875, 6.206787109375, 6.40509033203125, 6.6033935546875, 6.80169677734375, 7.0]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 13.0, 12.0, 16.0, 24.0, 37.0, 67.0, 101.0, 162.0, 218.0, 323.0, 515.0, 828.0, 1253.0, 2066.0, 3479.0, 5850.0, 9951.0, 17370.0, 31320.0, 57398.0, 102919.0, 169329.0, 212705.0, 179045.0, 111342.0, 62153.0, 34064.0, 19148.0, 10841.0, 6224.0, 3780.0, 2152.0, 1381.0, 859.0, 547.0, 393.0, 205.0, 155.0, 96.0, 76.0, 34.0, 37.0, 19.0, 9.0, 12.0, 13.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.173828125, -3.076385498046875, -2.97894287109375, -2.881500244140625, -2.7840576171875, -2.686614990234375, -2.58917236328125, -2.491729736328125, -2.394287109375, -2.296844482421875, -2.19940185546875, -2.101959228515625, -2.0045166015625, -1.907073974609375, -1.80963134765625, -1.712188720703125, -1.61474609375, -1.517303466796875, -1.41986083984375, -1.322418212890625, -1.2249755859375, -1.127532958984375, -1.03009033203125, -0.932647705078125, -0.835205078125, -0.737762451171875, -0.64031982421875, -0.542877197265625, -0.4454345703125, -0.347991943359375, -0.25054931640625, -0.153106689453125, -0.0556640625, 0.041778564453125, 0.13922119140625, 0.236663818359375, 0.3341064453125, 0.431549072265625, 0.52899169921875, 0.626434326171875, 0.723876953125, 0.821319580078125, 0.91876220703125, 1.016204833984375, 1.1136474609375, 1.211090087890625, 1.30853271484375, 1.405975341796875, 1.50341796875, 1.600860595703125, 1.69830322265625, 1.795745849609375, 1.8931884765625, 1.990631103515625, 2.08807373046875, 2.185516357421875, 2.282958984375, 2.380401611328125, 2.47784423828125, 2.575286865234375, 2.6727294921875, 2.770172119140625, 2.86761474609375, 2.965057373046875, 3.0625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 2.0, 7.0, 3.0, 5.0, 7.0, 13.0, 12.0, 24.0, 29.0, 40.0, 36.0, 45.0, 52.0, 36.0, 57.0, 51.0, 80.0, 66.0, 56.0, 52.0, 49.0, 41.0, 35.0, 34.0, 31.0, 22.0, 25.0, 11.0, 13.0, 11.0, 14.0, 11.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001806020736694336, -0.00017494522035121918, -0.00016928836703300476, -0.00016363151371479034, -0.00015797466039657593, -0.0001523178070783615, -0.0001466609537601471, -0.00014100410044193268, -0.00013534724712371826, -0.00012969039380550385, -0.00012403354048728943, -0.00011837668716907501, -0.0001127198338508606, -0.00010706298053264618, -0.00010140612721443176, -9.574927389621735e-05, -9.009242057800293e-05, -8.443556725978851e-05, -7.87787139415741e-05, -7.312186062335968e-05, -6.746500730514526e-05, -6.180815398693085e-05, -5.615130066871643e-05, -5.0494447350502014e-05, -4.48375940322876e-05, -3.918074071407318e-05, -3.3523887395858765e-05, -2.7867034077644348e-05, -2.221018075942993e-05, -1.6553327441215515e-05, -1.0896474123001099e-05, -5.239620804786682e-06, 4.172325134277344e-07, 6.074085831642151e-06, 1.1730939149856567e-05, 1.7387792468070984e-05, 2.30446457862854e-05, 2.8701499104499817e-05, 3.4358352422714233e-05, 4.001520574092865e-05, 4.5672059059143066e-05, 5.132891237735748e-05, 5.69857656955719e-05, 6.264261901378632e-05, 6.829947233200073e-05, 7.395632565021515e-05, 7.961317896842957e-05, 8.527003228664398e-05, 9.09268856048584e-05, 9.658373892307281e-05, 0.00010224059224128723, 0.00010789744555950165, 0.00011355429887771606, 0.00011921115219593048, 0.0001248680055141449, 0.00013052485883235931, 0.00013618171215057373, 0.00014183856546878815, 0.00014749541878700256, 0.00015315227210521698, 0.0001588091254234314, 0.0001644659787416458, 0.00017012283205986023, 0.00017577968537807465, 0.00018143653869628906]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 9.0, 3.0, 9.0, 10.0, 16.0, 22.0, 21.0, 42.0, 59.0, 82.0, 135.0, 162.0, 255.0, 331.0, 506.0, 857.0, 1233.0, 2018.0, 3010.0, 4660.0, 7216.0, 11505.0, 18058.0, 28834.0, 45840.0, 70522.0, 105848.0, 143271.0, 160445.0, 142939.0, 105726.0, 70794.0, 45557.0, 28694.0, 18045.0, 11202.0, 7389.0, 4625.0, 2894.0, 1938.0, 1272.0, 842.0, 521.0, 362.0, 222.0, 180.0, 122.0, 75.0, 59.0, 35.0, 34.0, 15.0, 14.0, 9.0, 10.0, 8.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.306640625, -2.23565673828125, -2.1646728515625, -2.09368896484375, -2.022705078125, -1.95172119140625, -1.8807373046875, -1.80975341796875, -1.73876953125, -1.66778564453125, -1.5968017578125, -1.52581787109375, -1.454833984375, -1.38385009765625, -1.3128662109375, -1.24188232421875, -1.1708984375, -1.09991455078125, -1.0289306640625, -0.95794677734375, -0.886962890625, -0.81597900390625, -0.7449951171875, -0.67401123046875, -0.60302734375, -0.53204345703125, -0.4610595703125, -0.39007568359375, -0.319091796875, -0.24810791015625, -0.1771240234375, -0.10614013671875, -0.03515625, 0.03582763671875, 0.1068115234375, 0.17779541015625, 0.248779296875, 0.31976318359375, 0.3907470703125, 0.46173095703125, 0.53271484375, 0.60369873046875, 0.6746826171875, 0.74566650390625, 0.816650390625, 0.88763427734375, 0.9586181640625, 1.02960205078125, 1.1005859375, 1.17156982421875, 1.2425537109375, 1.31353759765625, 1.384521484375, 1.45550537109375, 1.5264892578125, 1.59747314453125, 1.66845703125, 1.73944091796875, 1.8104248046875, 1.88140869140625, 1.952392578125, 2.02337646484375, 2.0943603515625, 2.16534423828125, 2.236328125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 11.0, 9.0, 13.0, 20.0, 21.0, 20.0, 32.0, 27.0, 47.0, 52.0, 66.0, 62.0, 52.0, 59.0, 54.0, 54.0, 68.0, 50.0, 51.0, 43.0, 32.0, 25.0, 34.0, 16.0, 16.0, 14.0, 11.0, 5.0, 8.0, 8.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.1043853759765625, -1.067169189453125, -1.0299530029296875, -0.99273681640625, -0.9555206298828125, -0.918304443359375, -0.8810882568359375, -0.8438720703125, -0.8066558837890625, -0.769439697265625, -0.7322235107421875, -0.69500732421875, -0.6577911376953125, -0.620574951171875, -0.5833587646484375, -0.546142578125, -0.5089263916015625, -0.471710205078125, -0.4344940185546875, -0.39727783203125, -0.3600616455078125, -0.322845458984375, -0.2856292724609375, -0.2484130859375, -0.2111968994140625, -0.173980712890625, -0.1367645263671875, -0.09954833984375, -0.0623321533203125, -0.025115966796875, 0.0121002197265625, 0.04931640625, 0.0865325927734375, 0.123748779296875, 0.1609649658203125, 0.19818115234375, 0.2353973388671875, 0.272613525390625, 0.3098297119140625, 0.3470458984375, 0.3842620849609375, 0.421478271484375, 0.4586944580078125, 0.49591064453125, 0.5331268310546875, 0.570343017578125, 0.6075592041015625, 0.644775390625, 0.6819915771484375, 0.719207763671875, 0.7564239501953125, 0.79364013671875, 0.8308563232421875, 0.868072509765625, 0.9052886962890625, 0.9425048828125, 0.9797210693359375, 1.016937255859375, 1.0541534423828125, 1.09136962890625, 1.1285858154296875, 1.165802001953125, 1.2030181884765625, 1.240234375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 4.0, 7.0, 10.0, 5.0, 11.0, 14.0, 23.0, 24.0, 37.0, 42.0, 46.0, 62.0, 75.0, 72.0, 76.0, 78.0, 67.0, 69.0, 54.0, 40.0, 36.0, 31.0, 14.0, 24.0, 17.0, 11.0, 13.0, 13.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.603278160095215, -11.240944862365723, -10.878612518310547, -10.516279220581055, -10.153946876525879, -9.791613578796387, -9.429281234741211, -9.066947937011719, -8.704614639282227, -8.342281341552734, -7.979948997497559, -7.617615699768066, -7.255283355712891, -6.892950057983398, -6.5306172370910645, -6.1682844161987305, -5.805952072143555, -5.443619251251221, -5.081286430358887, -4.7189531326293945, -4.356620788574219, -3.9942877292633057, -3.6319546699523926, -3.2696218490600586, -2.9072890281677246, -2.5449562072753906, -2.1826233863830566, -1.8202903270721436, -1.4579575061798096, -1.0956246852874756, -0.7332916259765625, -0.3709588050842285, -0.008626937866210938, 0.3537059426307678, 0.7160388231277466, 1.0783717632293701, 1.440704584121704, 1.803037405014038, 2.165370464324951, 2.527703285217285, 2.890036106109619, 3.252368927001953, 3.614701747894287, 3.9770348072052, 4.339367866516113, 4.701700210571289, 5.064033508300781, 5.426366329193115, 5.788699150085449, 6.151031970977783, 6.513364791870117, 6.875698089599609, 7.238030433654785, 7.600363731384277, 7.962696552276611, 8.325029373168945, 8.687362670898438, 9.04969596862793, 9.412028312683105, 9.774361610412598, 10.136693954467773, 10.499027252197266, 10.861360549926758, 11.223692893981934, 11.58602523803711]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 7.0, 8.0, 16.0, 14.0, 17.0, 23.0, 20.0, 31.0, 23.0, 33.0, 28.0, 33.0, 30.0, 49.0, 42.0, 42.0, 38.0, 39.0, 47.0, 57.0, 51.0, 44.0, 21.0, 40.0, 28.0, 30.0, 28.0, 29.0, 15.0, 24.0, 22.0, 14.0, 10.0, 13.0, 7.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.761778831481934, -10.422074317932129, -10.08237075805664, -9.742666244506836, -9.402961730957031, -9.063257217407227, -8.723553657531738, -8.383849143981934, -8.044145584106445, -7.704441547393799, -7.364737033843994, -7.025032997131348, -6.685328483581543, -6.3456244468688965, -6.00592041015625, -5.666215896606445, -5.326511383056641, -4.986807346343994, -4.6471028327941895, -4.307398796081543, -3.9676945209503174, -3.627990245819092, -3.2882862091064453, -2.9485819339752197, -2.608877658843994, -2.2691733837127686, -1.9294692277908325, -1.5897650718688965, -1.250060796737671, -0.9103565216064453, -0.5706524848937988, -0.23094820976257324, 0.10875511169433594, 0.44845932722091675, 0.7881635427474976, 1.1278676986694336, 1.4675719738006592, 1.8072762489318848, 2.1469802856445312, 2.486684560775757, 2.8263888359069824, 3.166093111038208, 3.5057973861694336, 3.84550142288208, 4.185205459594727, 4.524909973144531, 4.864614009857178, 5.204318046569824, 5.544022560119629, 5.883726596832275, 6.22343111038208, 6.563135147094727, 6.902839660644531, 7.242543697357178, 7.582247734069824, 7.921952247619629, 8.261655807495117, 8.601360321044922, 8.94106388092041, 9.280768394470215, 9.62047290802002, 9.960176467895508, 10.299880981445312, 10.639585494995117, 10.979290008544922]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 6.0, 9.0, 10.0, 13.0, 31.0, 22.0, 45.0, 85.0, 87.0, 142.0, 239.0, 338.0, 546.0, 776.0, 1324.0, 2210.0, 3397.0, 5561.0, 8984.0, 15181.0, 25998.0, 44932.0, 79391.0, 144330.0, 267455.0, 486665.0, 788649.0, 883951.0, 629815.0, 358841.0, 193940.0, 106687.0, 59482.0, 33606.0, 19912.0, 11857.0, 7236.0, 4402.0, 2862.0, 1849.0, 1168.0, 775.0, 496.0, 325.0, 217.0, 160.0, 93.0, 68.0, 37.0, 38.0, 19.0, 13.0, 8.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.625, -8.3489990234375, -8.072998046875, -7.7969970703125, -7.52099609375, -7.2449951171875, -6.968994140625, -6.6929931640625, -6.4169921875, -6.1409912109375, -5.864990234375, -5.5889892578125, -5.31298828125, -5.0369873046875, -4.760986328125, -4.4849853515625, -4.208984375, -3.9329833984375, -3.656982421875, -3.3809814453125, -3.10498046875, -2.8289794921875, -2.552978515625, -2.2769775390625, -2.0009765625, -1.7249755859375, -1.448974609375, -1.1729736328125, -0.89697265625, -0.6209716796875, -0.344970703125, -0.0689697265625, 0.20703125, 0.4830322265625, 0.759033203125, 1.0350341796875, 1.31103515625, 1.5870361328125, 1.863037109375, 2.1390380859375, 2.4150390625, 2.6910400390625, 2.967041015625, 3.2430419921875, 3.51904296875, 3.7950439453125, 4.071044921875, 4.3470458984375, 4.623046875, 4.8990478515625, 5.175048828125, 5.4510498046875, 5.72705078125, 6.0030517578125, 6.279052734375, 6.5550537109375, 6.8310546875, 7.1070556640625, 7.383056640625, 7.6590576171875, 7.93505859375, 8.2110595703125, 8.487060546875, 8.7630615234375, 9.0390625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 8.0, 11.0, 11.0, 15.0, 14.0, 21.0, 31.0, 30.0, 24.0, 23.0, 26.0, 36.0, 38.0, 39.0, 42.0, 50.0, 39.0, 42.0, 40.0, 50.0, 46.0, 45.0, 39.0, 35.0, 43.0, 32.0, 23.0, 25.0, 24.0, 16.0, 15.0, 15.0, 9.0, 9.0, 8.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.75390625, -7.52197265625, -7.2900390625, -7.05810546875, -6.826171875, -6.59423828125, -6.3623046875, -6.13037109375, -5.8984375, -5.66650390625, -5.4345703125, -5.20263671875, -4.970703125, -4.73876953125, -4.5068359375, -4.27490234375, -4.04296875, -3.81103515625, -3.5791015625, -3.34716796875, -3.115234375, -2.88330078125, -2.6513671875, -2.41943359375, -2.1875, -1.95556640625, -1.7236328125, -1.49169921875, -1.259765625, -1.02783203125, -0.7958984375, -0.56396484375, -0.33203125, -0.10009765625, 0.1318359375, 0.36376953125, 0.595703125, 0.82763671875, 1.0595703125, 1.29150390625, 1.5234375, 1.75537109375, 1.9873046875, 2.21923828125, 2.451171875, 2.68310546875, 2.9150390625, 3.14697265625, 3.37890625, 3.61083984375, 3.8427734375, 4.07470703125, 4.306640625, 4.53857421875, 4.7705078125, 5.00244140625, 5.234375, 5.46630859375, 5.6982421875, 5.93017578125, 6.162109375, 6.39404296875, 6.6259765625, 6.85791015625, 7.08984375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 10.0, 16.0, 23.0, 42.0, 57.0, 102.0, 153.0, 282.0, 472.0, 742.0, 1300.0, 2203.0, 3805.0, 6567.0, 11566.0, 21055.0, 38156.0, 69898.0, 130898.0, 241210.0, 428469.0, 677990.0, 830932.0, 706191.0, 454327.0, 258153.0, 140103.0, 76631.0, 41248.0, 22438.0, 12379.0, 7178.0, 3897.0, 2393.0, 1401.0, 760.0, 490.0, 296.0, 157.0, 118.0, 68.0, 37.0, 35.0, 15.0, 12.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.484375, -9.2176513671875, -8.950927734375, -8.6842041015625, -8.41748046875, -8.1507568359375, -7.884033203125, -7.6173095703125, -7.3505859375, -7.0838623046875, -6.817138671875, -6.5504150390625, -6.28369140625, -6.0169677734375, -5.750244140625, -5.4835205078125, -5.216796875, -4.9500732421875, -4.683349609375, -4.4166259765625, -4.14990234375, -3.8831787109375, -3.616455078125, -3.3497314453125, -3.0830078125, -2.8162841796875, -2.549560546875, -2.2828369140625, -2.01611328125, -1.7493896484375, -1.482666015625, -1.2159423828125, -0.94921875, -0.6824951171875, -0.415771484375, -0.1490478515625, 0.11767578125, 0.3843994140625, 0.651123046875, 0.9178466796875, 1.1845703125, 1.4512939453125, 1.718017578125, 1.9847412109375, 2.25146484375, 2.5181884765625, 2.784912109375, 3.0516357421875, 3.318359375, 3.5850830078125, 3.851806640625, 4.1185302734375, 4.38525390625, 4.6519775390625, 4.918701171875, 5.1854248046875, 5.4521484375, 5.7188720703125, 5.985595703125, 6.2523193359375, 6.51904296875, 6.7857666015625, 7.052490234375, 7.3192138671875, 7.5859375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 11.0, 12.0, 8.0, 12.0, 20.0, 32.0, 35.0, 49.0, 50.0, 81.0, 89.0, 102.0, 152.0, 165.0, 174.0, 207.0, 216.0, 216.0, 224.0, 250.0, 255.0, 228.0, 218.0, 219.0, 159.0, 144.0, 124.0, 111.0, 105.0, 77.0, 66.0, 52.0, 60.0, 39.0, 24.0, 20.0, 20.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.845703125, -3.731689453125, -3.61767578125, -3.503662109375, -3.3896484375, -3.275634765625, -3.16162109375, -3.047607421875, -2.93359375, -2.819580078125, -2.70556640625, -2.591552734375, -2.4775390625, -2.363525390625, -2.24951171875, -2.135498046875, -2.021484375, -1.907470703125, -1.79345703125, -1.679443359375, -1.5654296875, -1.451416015625, -1.33740234375, -1.223388671875, -1.109375, -0.995361328125, -0.88134765625, -0.767333984375, -0.6533203125, -0.539306640625, -0.42529296875, -0.311279296875, -0.197265625, -0.083251953125, 0.03076171875, 0.144775390625, 0.2587890625, 0.372802734375, 0.48681640625, 0.600830078125, 0.71484375, 0.828857421875, 0.94287109375, 1.056884765625, 1.1708984375, 1.284912109375, 1.39892578125, 1.512939453125, 1.626953125, 1.740966796875, 1.85498046875, 1.968994140625, 2.0830078125, 2.197021484375, 2.31103515625, 2.425048828125, 2.5390625, 2.653076171875, 2.76708984375, 2.881103515625, 2.9951171875, 3.109130859375, 3.22314453125, 3.337158203125, 3.451171875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 8.0, 15.0, 10.0, 19.0, 32.0, 22.0, 39.0, 45.0, 58.0, 65.0, 69.0, 71.0, 72.0, 80.0, 72.0, 61.0, 60.0, 38.0, 19.0, 30.0, 21.0, 13.0, 13.0, 12.0, 12.0, 10.0, 4.0, 12.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.427229881286621, -10.062740325927734, -9.698249816894531, -9.333759307861328, -8.969269752502441, -8.604780197143555, -8.240289688110352, -7.875799655914307, -7.511309623718262, -7.146819591522217, -6.782329559326172, -6.417839527130127, -6.053349494934082, -5.688859462738037, -5.324369430541992, -4.959879398345947, -4.595389366149902, -4.230899333953857, -3.8664093017578125, -3.5019192695617676, -3.1374292373657227, -2.7729392051696777, -2.408449172973633, -2.043959140777588, -1.679469108581543, -1.314979076385498, -0.9504890441894531, -0.5859990119934082, -0.22150897979736328, 0.14298105239868164, 0.5074710845947266, 0.8719611167907715, 1.2364501953125, 1.600940227508545, 1.9654302597045898, 2.3299202919006348, 2.6944103240966797, 3.0589003562927246, 3.4233903884887695, 3.7878804206848145, 4.152370452880859, 4.516860485076904, 4.881350517272949, 5.245840549468994, 5.610330581665039, 5.974820613861084, 6.339310646057129, 6.703800678253174, 7.068290710449219, 7.432780742645264, 7.797270774841309, 8.161760330200195, 8.526250839233398, 8.890741348266602, 9.255230903625488, 9.619720458984375, 9.984210968017578, 10.348701477050781, 10.713191032409668, 11.077680587768555, 11.442171096801758, 11.806661605834961, 12.171151161193848, 12.535640716552734, 12.900131225585938]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 10.0, 11.0, 9.0, 26.0, 18.0, 24.0, 29.0, 30.0, 32.0, 17.0, 32.0, 46.0, 37.0, 45.0, 39.0, 54.0, 42.0, 40.0, 48.0, 48.0, 42.0, 38.0, 35.0, 29.0, 32.0, 24.0, 29.0, 20.0, 17.0, 17.0, 8.0, 12.0, 7.0, 7.0, 9.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.249926567077637, -8.944991111755371, -8.640055656433105, -8.335119247436523, -8.030183792114258, -7.725248336791992, -7.420312881469727, -7.115377426147461, -6.810441970825195, -6.50550651550293, -6.200570583343506, -5.89563512802124, -5.590699672698975, -5.285763740539551, -4.980828285217285, -4.6758928298950195, -4.370956897735596, -4.06602144241333, -3.7610857486724854, -3.4561500549316406, -3.151214599609375, -2.8462789058685303, -2.5413432121276855, -2.23640775680542, -1.9314720630645752, -1.62653648853302, -1.3216009140014648, -1.0166652202606201, -0.7117296457290649, -0.40679407119750977, -0.10185837745666504, 0.20307707786560059, 0.5080127716064453, 0.8129483461380005, 1.1178839206695557, 1.4228196144104004, 1.7277551889419556, 2.0326907634735107, 2.3376264572143555, 2.642561912536621, 2.947497606277466, 3.2524333000183105, 3.557368755340576, 3.862304449081421, 4.167240142822266, 4.472175598144531, 4.777111053466797, 5.0820465087890625, 5.386982440948486, 5.691917896270752, 5.996853828430176, 6.301789283752441, 6.606724739074707, 6.911660194396973, 7.2165961265563965, 7.521531581878662, 7.826467514038086, 8.131402969360352, 8.436338424682617, 8.741273880004883, 9.046210289001465, 9.35114574432373, 9.656081199645996, 9.961016654968262, 10.265952110290527]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 8.0, 12.0, 28.0, 25.0, 46.0, 74.0, 134.0, 188.0, 313.0, 556.0, 851.0, 1397.0, 2484.0, 4212.0, 7468.0, 13228.0, 23790.0, 43075.0, 79868.0, 144852.0, 242662.0, 213770.0, 121268.0, 66115.0, 36018.0, 19911.0, 11181.0, 6174.0, 3571.0, 2135.0, 1208.0, 740.0, 427.0, 268.0, 190.0, 102.0, 73.0, 38.0, 31.0, 19.0, 11.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2274322509765625, -1.186309814453125, -1.1451873779296875, -1.10406494140625, -1.0629425048828125, -1.021820068359375, -0.9806976318359375, -0.9395751953125, -0.8984527587890625, -0.857330322265625, -0.8162078857421875, -0.77508544921875, -0.7339630126953125, -0.692840576171875, -0.6517181396484375, -0.610595703125, -0.5694732666015625, -0.528350830078125, -0.4872283935546875, -0.44610595703125, -0.4049835205078125, -0.363861083984375, -0.3227386474609375, -0.2816162109375, -0.2404937744140625, -0.199371337890625, -0.1582489013671875, -0.11712646484375, -0.0760040283203125, -0.034881591796875, 0.0062408447265625, 0.04736328125, 0.0884857177734375, 0.129608154296875, 0.1707305908203125, 0.21185302734375, 0.2529754638671875, 0.294097900390625, 0.3352203369140625, 0.3763427734375, 0.4174652099609375, 0.458587646484375, 0.4997100830078125, 0.54083251953125, 0.5819549560546875, 0.623077392578125, 0.6641998291015625, 0.705322265625, 0.7464447021484375, 0.787567138671875, 0.8286895751953125, 0.86981201171875, 0.9109344482421875, 0.952056884765625, 0.9931793212890625, 1.0343017578125, 1.0754241943359375, 1.116546630859375, 1.1576690673828125, 1.19879150390625, 1.2399139404296875, 1.281036376953125, 1.3221588134765625, 1.36328125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 2.0, 5.0, 12.0, 12.0, 15.0, 15.0, 23.0, 25.0, 28.0, 26.0, 39.0, 39.0, 42.0, 43.0, 41.0, 55.0, 51.0, 41.0, 43.0, 54.0, 50.0, 37.0, 46.0, 39.0, 29.0, 36.0, 22.0, 21.0, 29.0, 11.0, 14.0, 15.0, 9.0, 4.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.0948486328125, -9.752197265625, -9.4095458984375, -9.06689453125, -8.7242431640625, -8.381591796875, -8.0389404296875, -7.6962890625, -7.3536376953125, -7.010986328125, -6.6683349609375, -6.32568359375, -5.9830322265625, -5.640380859375, -5.2977294921875, -4.955078125, -4.6124267578125, -4.269775390625, -3.9271240234375, -3.58447265625, -3.2418212890625, -2.899169921875, -2.5565185546875, -2.2138671875, -1.8712158203125, -1.528564453125, -1.1859130859375, -0.84326171875, -0.5006103515625, -0.157958984375, 0.1846923828125, 0.52734375, 0.8699951171875, 1.212646484375, 1.5552978515625, 1.89794921875, 2.2406005859375, 2.583251953125, 2.9259033203125, 3.2685546875, 3.6112060546875, 3.953857421875, 4.2965087890625, 4.63916015625, 4.9818115234375, 5.324462890625, 5.6671142578125, 6.009765625, 6.3524169921875, 6.695068359375, 7.0377197265625, 7.38037109375, 7.7230224609375, 8.065673828125, 8.4083251953125, 8.7509765625, 9.0936279296875, 9.436279296875, 9.7789306640625, 10.12158203125, 10.4642333984375, 10.806884765625, 11.1495361328125, 11.4921875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 11.0, 27.0, 18.0, 37.0, 53.0, 78.0, 124.0, 193.0, 293.0, 436.0, 758.0, 1278.0, 2072.0, 3659.0, 5873.0, 10348.0, 17603.0, 30294.0, 51387.0, 87839.0, 145926.0, 215639.0, 188015.0, 117743.0, 69846.0, 40843.0, 24141.0, 13833.0, 8138.0, 4799.0, 2796.0, 1718.0, 1049.0, 603.0, 377.0, 243.0, 145.0, 94.0, 72.0, 56.0, 33.0, 17.0, 12.0, 6.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.248046875, -1.2111053466796875, -1.174163818359375, -1.1372222900390625, -1.10028076171875, -1.0633392333984375, -1.026397705078125, -0.9894561767578125, -0.9525146484375, -0.9155731201171875, -0.878631591796875, -0.8416900634765625, -0.80474853515625, -0.7678070068359375, -0.730865478515625, -0.6939239501953125, -0.656982421875, -0.6200408935546875, -0.583099365234375, -0.5461578369140625, -0.50921630859375, -0.4722747802734375, -0.435333251953125, -0.3983917236328125, -0.3614501953125, -0.3245086669921875, -0.287567138671875, -0.2506256103515625, -0.21368408203125, -0.1767425537109375, -0.139801025390625, -0.1028594970703125, -0.06591796875, -0.0289764404296875, 0.007965087890625, 0.0449066162109375, 0.08184814453125, 0.1187896728515625, 0.155731201171875, 0.1926727294921875, 0.2296142578125, 0.2665557861328125, 0.303497314453125, 0.3404388427734375, 0.37738037109375, 0.4143218994140625, 0.451263427734375, 0.4882049560546875, 0.525146484375, 0.5620880126953125, 0.599029541015625, 0.6359710693359375, 0.67291259765625, 0.7098541259765625, 0.746795654296875, 0.7837371826171875, 0.8206787109375, 0.8576202392578125, 0.894561767578125, 0.9315032958984375, 0.96844482421875, 1.0053863525390625, 1.042327880859375, 1.0792694091796875, 1.1162109375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 11.0, 3.0, 10.0, 10.0, 10.0, 9.0, 15.0, 22.0, 20.0, 22.0, 31.0, 20.0, 34.0, 41.0, 33.0, 41.0, 48.0, 48.0, 47.0, 40.0, 43.0, 34.0, 42.0, 34.0, 39.0, 37.0, 49.0, 28.0, 19.0, 22.0, 26.0, 23.0, 16.0, 16.0, 10.0, 11.0, 11.0, 9.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.5899658203125, -5.394775390625, -5.1995849609375, -5.00439453125, -4.8092041015625, -4.614013671875, -4.4188232421875, -4.2236328125, -4.0284423828125, -3.833251953125, -3.6380615234375, -3.44287109375, -3.2476806640625, -3.052490234375, -2.8572998046875, -2.662109375, -2.4669189453125, -2.271728515625, -2.0765380859375, -1.88134765625, -1.6861572265625, -1.490966796875, -1.2957763671875, -1.1005859375, -0.9053955078125, -0.710205078125, -0.5150146484375, -0.31982421875, -0.1246337890625, 0.070556640625, 0.2657470703125, 0.4609375, 0.6561279296875, 0.851318359375, 1.0465087890625, 1.24169921875, 1.4368896484375, 1.632080078125, 1.8272705078125, 2.0224609375, 2.2176513671875, 2.412841796875, 2.6080322265625, 2.80322265625, 2.9984130859375, 3.193603515625, 3.3887939453125, 3.583984375, 3.7791748046875, 3.974365234375, 4.1695556640625, 4.36474609375, 4.5599365234375, 4.755126953125, 4.9503173828125, 5.1455078125, 5.3406982421875, 5.535888671875, 5.7310791015625, 5.92626953125, 6.1214599609375, 6.316650390625, 6.5118408203125, 6.70703125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 7.0, 8.0, 5.0, 3.0, 11.0, 10.0, 21.0, 27.0, 24.0, 46.0, 59.0, 80.0, 105.0, 144.0, 230.0, 341.0, 532.0, 977.0, 1761.0, 3969.0, 10983.0, 39778.0, 231414.0, 607963.0, 112894.0, 23361.0, 7273.0, 2887.0, 1468.0, 764.0, 448.0, 296.0, 181.0, 130.0, 89.0, 79.0, 43.0, 40.0, 22.0, 23.0, 17.0, 11.0, 9.0, 7.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.3525390625, -0.3425559997558594, -0.33257293701171875, -0.3225898742675781, -0.3126068115234375, -0.3026237487792969, -0.29264068603515625, -0.2826576232910156, -0.272674560546875, -0.2626914978027344, -0.25270843505859375, -0.24272537231445312, -0.2327423095703125, -0.22275924682617188, -0.21277618408203125, -0.20279312133789062, -0.19281005859375, -0.18282699584960938, -0.17284393310546875, -0.16286087036132812, -0.1528778076171875, -0.14289474487304688, -0.13291168212890625, -0.12292861938476562, -0.112945556640625, -0.10296249389648438, -0.09297943115234375, -0.08299636840820312, -0.0730133056640625, -0.06303024291992188, -0.05304718017578125, -0.043064117431640625, -0.0330810546875, -0.023097991943359375, -0.01311492919921875, -0.003131866455078125, 0.0068511962890625, 0.016834259033203125, 0.02681732177734375, 0.036800384521484375, 0.046783447265625, 0.056766510009765625, 0.06674957275390625, 0.07673263549804688, 0.0867156982421875, 0.09669876098632812, 0.10668182373046875, 0.11666488647460938, 0.12664794921875, 0.13663101196289062, 0.14661407470703125, 0.15659713745117188, 0.1665802001953125, 0.17656326293945312, 0.18654632568359375, 0.19652938842773438, 0.206512451171875, 0.21649551391601562, 0.22647857666015625, 0.23646163940429688, 0.2464447021484375, 0.2564277648925781, 0.26641082763671875, 0.2763938903808594, 0.286376953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 10.0, 18.0, 12.0, 15.0, 16.0, 29.0, 15.0, 22.0, 19.0, 31.0, 49.0, 42.0, 41.0, 46.0, 56.0, 49.0, 53.0, 41.0, 52.0, 43.0, 49.0, 31.0, 34.0, 21.0, 20.0, 22.0, 19.0, 25.0, 13.0, 17.0, 9.0, 7.0, 15.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2040138244628906e-05, -1.1674128472805023e-05, -1.130811870098114e-05, -1.0942108929157257e-05, -1.0576099157333374e-05, -1.0210089385509491e-05, -9.844079613685608e-06, -9.478069841861725e-06, -9.112060070037842e-06, -8.746050298213959e-06, -8.380040526390076e-06, -8.014030754566193e-06, -7.64802098274231e-06, -7.2820112109184265e-06, -6.9160014390945435e-06, -6.54999166727066e-06, -6.183981895446777e-06, -5.817972123622894e-06, -5.451962351799011e-06, -5.085952579975128e-06, -4.719942808151245e-06, -4.353933036327362e-06, -3.987923264503479e-06, -3.621913492679596e-06, -3.255903720855713e-06, -2.88989394903183e-06, -2.5238841772079468e-06, -2.1578744053840637e-06, -1.7918646335601807e-06, -1.4258548617362976e-06, -1.0598450899124146e-06, -6.938353180885315e-07, -3.2782554626464844e-07, 3.818422555923462e-08, 4.041939973831177e-07, 7.702037692070007e-07, 1.1362135410308838e-06, 1.5022233128547668e-06, 1.86823308467865e-06, 2.234242856502533e-06, 2.600252628326416e-06, 2.966262400150299e-06, 3.332272171974182e-06, 3.698281943798065e-06, 4.064291715621948e-06, 4.430301487445831e-06, 4.796311259269714e-06, 5.162321031093597e-06, 5.5283308029174805e-06, 5.8943405747413635e-06, 6.260350346565247e-06, 6.62636011838913e-06, 6.992369890213013e-06, 7.358379662036896e-06, 7.724389433860779e-06, 8.090399205684662e-06, 8.456408977508545e-06, 8.822418749332428e-06, 9.188428521156311e-06, 9.554438292980194e-06, 9.920448064804077e-06, 1.028645783662796e-05, 1.0652467608451843e-05, 1.1018477380275726e-05, 1.138448715209961e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 8.0, 5.0, 9.0, 11.0, 19.0, 16.0, 34.0, 49.0, 78.0, 116.0, 166.0, 232.0, 419.0, 701.0, 1161.0, 1871.0, 3406.0, 6273.0, 12281.0, 24808.0, 54106.0, 129998.0, 324508.0, 284732.0, 110820.0, 46906.0, 21678.0, 10888.0, 5660.0, 3122.0, 1719.0, 1055.0, 619.0, 402.0, 214.0, 158.0, 108.0, 60.0, 38.0, 30.0, 21.0, 14.0, 12.0, 12.0, 5.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2177734375, -0.21115684509277344, -0.20454025268554688, -0.1979236602783203, -0.19130706787109375, -0.1846904754638672, -0.17807388305664062, -0.17145729064941406, -0.1648406982421875, -0.15822410583496094, -0.15160751342773438, -0.1449909210205078, -0.13837432861328125, -0.1317577362060547, -0.12514114379882812, -0.11852455139160156, -0.111907958984375, -0.10529136657714844, -0.09867477416992188, -0.09205818176269531, -0.08544158935546875, -0.07882499694824219, -0.07220840454101562, -0.06559181213378906, -0.0589752197265625, -0.05235862731933594, -0.045742034912109375, -0.03912544250488281, -0.03250885009765625, -0.025892257690429688, -0.019275665283203125, -0.012659072875976562, -0.00604248046875, 0.0005741119384765625, 0.007190704345703125, 0.013807296752929688, 0.02042388916015625, 0.027040481567382812, 0.033657073974609375, 0.04027366638183594, 0.0468902587890625, 0.05350685119628906, 0.060123443603515625, 0.06674003601074219, 0.07335662841796875, 0.07997322082519531, 0.08658981323242188, 0.09320640563964844, 0.099822998046875, 0.10643959045410156, 0.11305618286132812, 0.11967277526855469, 0.12628936767578125, 0.1329059600830078, 0.13952255249023438, 0.14613914489746094, 0.1527557373046875, 0.15937232971191406, 0.16598892211914062, 0.1726055145263672, 0.17922210693359375, 0.1858386993408203, 0.19245529174804688, 0.19907188415527344, 0.2056884765625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 6.0, 15.0, 6.0, 12.0, 11.0, 14.0, 15.0, 28.0, 20.0, 43.0, 35.0, 49.0, 43.0, 45.0, 59.0, 74.0, 60.0, 49.0, 55.0, 49.0, 38.0, 33.0, 28.0, 25.0, 26.0, 20.0, 19.0, 16.0, 16.0, 12.0, 14.0, 9.0, 7.0, 4.0, 7.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0758056640625, -0.07328414916992188, -0.07076263427734375, -0.06824111938476562, -0.0657196044921875, -0.06319808959960938, -0.06067657470703125, -0.058155059814453125, -0.055633544921875, -0.053112030029296875, -0.05059051513671875, -0.048069000244140625, -0.0455474853515625, -0.043025970458984375, -0.04050445556640625, -0.037982940673828125, -0.03546142578125, -0.032939910888671875, -0.03041839599609375, -0.027896881103515625, -0.0253753662109375, -0.022853851318359375, -0.02033233642578125, -0.017810821533203125, -0.015289306640625, -0.012767791748046875, -0.01024627685546875, -0.007724761962890625, -0.0052032470703125, -0.002681732177734375, -0.00016021728515625, 0.002361297607421875, 0.0048828125, 0.007404327392578125, 0.00992584228515625, 0.012447357177734375, 0.0149688720703125, 0.017490386962890625, 0.02001190185546875, 0.022533416748046875, 0.025054931640625, 0.027576446533203125, 0.03009796142578125, 0.032619476318359375, 0.0351409912109375, 0.037662506103515625, 0.04018402099609375, 0.042705535888671875, 0.04522705078125, 0.047748565673828125, 0.05027008056640625, 0.052791595458984375, 0.0553131103515625, 0.057834625244140625, 0.06035614013671875, 0.06287765502929688, 0.065399169921875, 0.06792068481445312, 0.07044219970703125, 0.07296371459960938, 0.0754852294921875, 0.07800674438476562, 0.08052825927734375, 0.08304977416992188, 0.0855712890625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 8.0, 13.0, 11.0, 22.0, 24.0, 29.0, 30.0, 44.0, 63.0, 61.0, 67.0, 70.0, 74.0, 68.0, 88.0, 60.0, 58.0, 45.0, 19.0, 32.0, 20.0, 15.0, 14.0, 11.0, 13.0, 8.0, 4.0, 11.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.198831558227539, -9.832412719726562, -9.465993881225586, -9.09957504272461, -8.733156204223633, -8.366737365722656, -8.00031852722168, -7.633899688720703, -7.267480850219727, -6.90106201171875, -6.534643173217773, -6.168224334716797, -5.80180549621582, -5.435386657714844, -5.068967819213867, -4.702548980712891, -4.336130142211914, -3.9697113037109375, -3.603292465209961, -3.2368736267089844, -2.870454788208008, -2.5040359497070312, -2.1376171112060547, -1.7711982727050781, -1.4047794342041016, -1.038360595703125, -0.6719417572021484, -0.3055229187011719, 0.06089591979980469, 0.42731475830078125, 0.7937335968017578, 1.1601524353027344, 1.5265722274780273, 1.892991065979004, 2.2594099044799805, 2.625828742980957, 2.9922475814819336, 3.35866641998291, 3.7250852584838867, 4.091504096984863, 4.45792293548584, 4.824341773986816, 5.190760612487793, 5.5571794509887695, 5.923598289489746, 6.290017127990723, 6.656435966491699, 7.022854804992676, 7.389273643493652, 7.755692481994629, 8.122111320495605, 8.488530158996582, 8.854948997497559, 9.221367835998535, 9.587786674499512, 9.954205513000488, 10.320624351501465, 10.687043190002441, 11.053462028503418, 11.419880867004395, 11.786299705505371, 12.152718544006348, 12.519137382507324, 12.8855562210083, 13.251975059509277]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 11.0, 8.0, 12.0, 11.0, 24.0, 18.0, 25.0, 28.0, 31.0, 29.0, 18.0, 35.0, 44.0, 38.0, 45.0, 41.0, 50.0, 43.0, 41.0, 47.0, 50.0, 42.0, 37.0, 34.0, 31.0, 32.0, 23.0, 29.0, 21.0, 15.0, 18.0, 8.0, 13.0, 7.0, 6.0, 9.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.239545822143555, -8.934578895568848, -8.629611015319824, -8.324644088745117, -8.01967716217041, -7.714709758758545, -7.40974235534668, -7.104775428771973, -6.799808025360107, -6.494840621948242, -6.189873695373535, -5.88490629196167, -5.579938888549805, -5.274971961975098, -4.970004558563232, -4.665037155151367, -4.36007022857666, -4.055102825164795, -3.750135898590088, -3.4451684951782227, -3.1402013301849365, -2.8352341651916504, -2.530266761779785, -2.225299596786499, -1.920332431793213, -1.6153652667999268, -1.310397982597351, -1.0054306983947754, -0.7004635334014893, -0.3954963684082031, -0.09052908420562744, 0.21443819999694824, 0.5194063186645508, 0.8243735432624817, 1.1293407678604126, 1.4343080520629883, 1.7392752170562744, 2.0442423820495605, 2.349209785461426, 2.654176950454712, 2.959144115447998, 3.264111280441284, 3.5690784454345703, 3.8740458488464355, 4.179013252258301, 4.483980178833008, 4.788947582244873, 5.093914985656738, 5.398881912231445, 5.7038493156433105, 6.008816242218018, 6.313783645629883, 6.61875057220459, 6.923717975616455, 7.22868537902832, 7.533652305603027, 7.838619709014893, 8.143587112426758, 8.448554039001465, 8.753520965576172, 9.058488845825195, 9.363455772399902, 9.66842269897461, 9.973390579223633, 10.27835750579834]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 5.0, 7.0, 11.0, 23.0, 28.0, 57.0, 68.0, 113.0, 166.0, 277.0, 432.0, 670.0, 1076.0, 1681.0, 2660.0, 4422.0, 7184.0, 11774.0, 19247.0, 31074.0, 49253.0, 77201.0, 111982.0, 146393.0, 158887.0, 138644.0, 102257.0, 68252.0, 43607.0, 27352.0, 16929.0, 10285.0, 6385.0, 3761.0, 2411.0, 1435.0, 927.0, 561.0, 395.0, 236.0, 159.0, 100.0, 69.0, 33.0, 29.0, 13.0, 15.0, 8.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7734375, -6.56414794921875, -6.3548583984375, -6.14556884765625, -5.936279296875, -5.72698974609375, -5.5177001953125, -5.30841064453125, -5.09912109375, -4.88983154296875, -4.6805419921875, -4.47125244140625, -4.261962890625, -4.05267333984375, -3.8433837890625, -3.63409423828125, -3.4248046875, -3.21551513671875, -3.0062255859375, -2.79693603515625, -2.587646484375, -2.37835693359375, -2.1690673828125, -1.95977783203125, -1.75048828125, -1.54119873046875, -1.3319091796875, -1.12261962890625, -0.913330078125, -0.70404052734375, -0.4947509765625, -0.28546142578125, -0.076171875, 0.13311767578125, 0.3424072265625, 0.55169677734375, 0.760986328125, 0.97027587890625, 1.1795654296875, 1.38885498046875, 1.59814453125, 1.80743408203125, 2.0167236328125, 2.22601318359375, 2.435302734375, 2.64459228515625, 2.8538818359375, 3.06317138671875, 3.2724609375, 3.48175048828125, 3.6910400390625, 3.90032958984375, 4.109619140625, 4.31890869140625, 4.5281982421875, 4.73748779296875, 4.94677734375, 5.15606689453125, 5.3653564453125, 5.57464599609375, 5.783935546875, 5.99322509765625, 6.2025146484375, 6.41180419921875, 6.62109375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 9.0, 5.0, 9.0, 11.0, 6.0, 10.0, 24.0, 15.0, 26.0, 38.0, 33.0, 30.0, 26.0, 27.0, 42.0, 34.0, 52.0, 36.0, 49.0, 49.0, 43.0, 58.0, 35.0, 45.0, 38.0, 37.0, 31.0, 27.0, 26.0, 25.0, 17.0, 15.0, 13.0, 12.0, 12.0, 7.0, 5.0, 10.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.9168701171875, -9.607177734375, -9.2974853515625, -8.98779296875, -8.6781005859375, -8.368408203125, -8.0587158203125, -7.7490234375, -7.4393310546875, -7.129638671875, -6.8199462890625, -6.51025390625, -6.2005615234375, -5.890869140625, -5.5811767578125, -5.271484375, -4.9617919921875, -4.652099609375, -4.3424072265625, -4.03271484375, -3.7230224609375, -3.413330078125, -3.1036376953125, -2.7939453125, -2.4842529296875, -2.174560546875, -1.8648681640625, -1.55517578125, -1.2454833984375, -0.935791015625, -0.6260986328125, -0.31640625, -0.0067138671875, 0.302978515625, 0.6126708984375, 0.92236328125, 1.2320556640625, 1.541748046875, 1.8514404296875, 2.1611328125, 2.4708251953125, 2.780517578125, 3.0902099609375, 3.39990234375, 3.7095947265625, 4.019287109375, 4.3289794921875, 4.638671875, 4.9483642578125, 5.258056640625, 5.5677490234375, 5.87744140625, 6.1871337890625, 6.496826171875, 6.8065185546875, 7.1162109375, 7.4259033203125, 7.735595703125, 8.0452880859375, 8.35498046875, 8.6646728515625, 8.974365234375, 9.2840576171875, 9.59375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 11.0, 17.0, 22.0, 28.0, 33.0, 57.0, 94.0, 108.0, 165.0, 256.0, 397.0, 563.0, 857.0, 1232.0, 1952.0, 3077.0, 4763.0, 7309.0, 11330.0, 17464.0, 26245.0, 39415.0, 58160.0, 81319.0, 106324.0, 126681.0, 131507.0, 118839.0, 95488.0, 70316.0, 48833.0, 32944.0, 21815.0, 14429.0, 9267.0, 6135.0, 3741.0, 2486.0, 1591.0, 1075.0, 727.0, 448.0, 328.0, 245.0, 132.0, 99.0, 68.0, 51.0, 32.0, 29.0, 23.0, 12.0, 1.0, 9.0, 2.0, 3.0, 2.0, 3.0], "bins": [-5.74609375, -5.56805419921875, -5.3900146484375, -5.21197509765625, -5.033935546875, -4.85589599609375, -4.6778564453125, -4.49981689453125, -4.32177734375, -4.14373779296875, -3.9656982421875, -3.78765869140625, -3.609619140625, -3.43157958984375, -3.2535400390625, -3.07550048828125, -2.8974609375, -2.71942138671875, -2.5413818359375, -2.36334228515625, -2.185302734375, -2.00726318359375, -1.8292236328125, -1.65118408203125, -1.47314453125, -1.29510498046875, -1.1170654296875, -0.93902587890625, -0.760986328125, -0.58294677734375, -0.4049072265625, -0.22686767578125, -0.048828125, 0.12921142578125, 0.3072509765625, 0.48529052734375, 0.663330078125, 0.84136962890625, 1.0194091796875, 1.19744873046875, 1.37548828125, 1.55352783203125, 1.7315673828125, 1.90960693359375, 2.087646484375, 2.26568603515625, 2.4437255859375, 2.62176513671875, 2.7998046875, 2.97784423828125, 3.1558837890625, 3.33392333984375, 3.511962890625, 3.69000244140625, 3.8680419921875, 4.04608154296875, 4.22412109375, 4.40216064453125, 4.5802001953125, 4.75823974609375, 4.936279296875, 5.11431884765625, 5.2923583984375, 5.47039794921875, 5.6484375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 8.0, 14.0, 11.0, 15.0, 9.0, 18.0, 21.0, 24.0, 24.0, 24.0, 31.0, 28.0, 39.0, 37.0, 45.0, 43.0, 42.0, 39.0, 23.0, 40.0, 51.0, 38.0, 30.0, 33.0, 36.0, 30.0, 30.0, 20.0, 30.0, 28.0, 20.0, 13.0, 20.0, 16.0, 13.0, 8.0, 8.0, 6.0, 10.0, 1.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.41796875, -5.24993896484375, -5.0819091796875, -4.91387939453125, -4.745849609375, -4.57781982421875, -4.4097900390625, -4.24176025390625, -4.07373046875, -3.90570068359375, -3.7376708984375, -3.56964111328125, -3.401611328125, -3.23358154296875, -3.0655517578125, -2.89752197265625, -2.7294921875, -2.56146240234375, -2.3934326171875, -2.22540283203125, -2.057373046875, -1.88934326171875, -1.7213134765625, -1.55328369140625, -1.38525390625, -1.21722412109375, -1.0491943359375, -0.88116455078125, -0.713134765625, -0.54510498046875, -0.3770751953125, -0.20904541015625, -0.041015625, 0.12701416015625, 0.2950439453125, 0.46307373046875, 0.631103515625, 0.79913330078125, 0.9671630859375, 1.13519287109375, 1.30322265625, 1.47125244140625, 1.6392822265625, 1.80731201171875, 1.975341796875, 2.14337158203125, 2.3114013671875, 2.47943115234375, 2.6474609375, 2.81549072265625, 2.9835205078125, 3.15155029296875, 3.319580078125, 3.48760986328125, 3.6556396484375, 3.82366943359375, 3.99169921875, 4.15972900390625, 4.3277587890625, 4.49578857421875, 4.663818359375, 4.83184814453125, 4.9998779296875, 5.16790771484375, 5.3359375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 11.0, 14.0, 19.0, 22.0, 45.0, 64.0, 100.0, 101.0, 185.0, 281.0, 416.0, 603.0, 897.0, 1384.0, 2041.0, 3297.0, 5227.0, 8316.0, 13588.0, 22682.0, 37163.0, 62985.0, 100425.0, 148693.0, 178956.0, 161008.0, 115517.0, 72437.0, 43451.0, 26427.0, 15774.0, 9606.0, 6126.0, 3602.0, 2481.0, 1507.0, 987.0, 665.0, 450.0, 300.0, 227.0, 156.0, 95.0, 79.0, 51.0, 23.0, 25.0, 15.0, 13.0, 7.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.306640625, -2.235992431640625, -2.16534423828125, -2.094696044921875, -2.0240478515625, -1.953399658203125, -1.88275146484375, -1.812103271484375, -1.741455078125, -1.670806884765625, -1.60015869140625, -1.529510498046875, -1.4588623046875, -1.388214111328125, -1.31756591796875, -1.246917724609375, -1.17626953125, -1.105621337890625, -1.03497314453125, -0.964324951171875, -0.8936767578125, -0.823028564453125, -0.75238037109375, -0.681732177734375, -0.611083984375, -0.540435791015625, -0.46978759765625, -0.399139404296875, -0.3284912109375, -0.257843017578125, -0.18719482421875, -0.116546630859375, -0.0458984375, 0.024749755859375, 0.09539794921875, 0.166046142578125, 0.2366943359375, 0.307342529296875, 0.37799072265625, 0.448638916015625, 0.519287109375, 0.589935302734375, 0.66058349609375, 0.731231689453125, 0.8018798828125, 0.872528076171875, 0.94317626953125, 1.013824462890625, 1.08447265625, 1.155120849609375, 1.22576904296875, 1.296417236328125, 1.3670654296875, 1.437713623046875, 1.50836181640625, 1.579010009765625, 1.649658203125, 1.720306396484375, 1.79095458984375, 1.861602783203125, 1.9322509765625, 2.002899169921875, 2.07354736328125, 2.144195556640625, 2.21484375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 10.0, 10.0, 10.0, 10.0, 16.0, 18.0, 22.0, 31.0, 19.0, 40.0, 43.0, 43.0, 50.0, 57.0, 68.0, 61.0, 51.0, 48.0, 60.0, 41.0, 41.0, 45.0, 32.0, 19.0, 27.0, 25.0, 21.0, 21.0, 12.0, 3.0, 9.0, 7.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014591217041015625, -0.00014131143689155579, -0.00013671070337295532, -0.00013210996985435486, -0.0001275092363357544, -0.00012290850281715393, -0.00011830776929855347, -0.000113707035779953, -0.00010910630226135254, -0.00010450556874275208, -9.990483522415161e-05, -9.530410170555115e-05, -9.070336818695068e-05, -8.610263466835022e-05, -8.150190114974976e-05, -7.690116763114929e-05, -7.230043411254883e-05, -6.769970059394836e-05, -6.30989670753479e-05, -5.8498233556747437e-05, -5.389750003814697e-05, -4.929676651954651e-05, -4.4696033000946045e-05, -4.009529948234558e-05, -3.549456596374512e-05, -3.089383244514465e-05, -2.629309892654419e-05, -2.1692365407943726e-05, -1.7091631889343262e-05, -1.2490898370742798e-05, -7.890164852142334e-06, -3.28943133354187e-06, 1.3113021850585938e-06, 5.912035703659058e-06, 1.0512769222259521e-05, 1.5113502740859985e-05, 1.971423625946045e-05, 2.4314969778060913e-05, 2.8915703296661377e-05, 3.351643681526184e-05, 3.8117170333862305e-05, 4.271790385246277e-05, 4.731863737106323e-05, 5.1919370889663696e-05, 5.652010440826416e-05, 6.112083792686462e-05, 6.572157144546509e-05, 7.032230496406555e-05, 7.492303848266602e-05, 7.952377200126648e-05, 8.412450551986694e-05, 8.872523903846741e-05, 9.332597255706787e-05, 9.792670607566833e-05, 0.0001025274395942688, 0.00010712817311286926, 0.00011172890663146973, 0.00011632964015007019, 0.00012093037366867065, 0.00012553110718727112, 0.00013013184070587158, 0.00013473257422447205, 0.0001393333077430725, 0.00014393404126167297, 0.00014853477478027344]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 7.0, 12.0, 18.0, 28.0, 54.0, 71.0, 110.0, 143.0, 187.0, 300.0, 476.0, 716.0, 1122.0, 1767.0, 2706.0, 4416.0, 6800.0, 11186.0, 18028.0, 29320.0, 46566.0, 74206.0, 113356.0, 153450.0, 167372.0, 142591.0, 99790.0, 65473.0, 41292.0, 25096.0, 15717.0, 9564.0, 5992.0, 3774.0, 2371.0, 1533.0, 957.0, 677.0, 418.0, 293.0, 214.0, 121.0, 97.0, 57.0, 35.0, 25.0, 16.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.173828125, -2.1044921875, -2.03515625, -1.9658203125, -1.896484375, -1.8271484375, -1.7578125, -1.6884765625, -1.619140625, -1.5498046875, -1.48046875, -1.4111328125, -1.341796875, -1.2724609375, -1.203125, -1.1337890625, -1.064453125, -0.9951171875, -0.92578125, -0.8564453125, -0.787109375, -0.7177734375, -0.6484375, -0.5791015625, -0.509765625, -0.4404296875, -0.37109375, -0.3017578125, -0.232421875, -0.1630859375, -0.09375, -0.0244140625, 0.044921875, 0.1142578125, 0.18359375, 0.2529296875, 0.322265625, 0.3916015625, 0.4609375, 0.5302734375, 0.599609375, 0.6689453125, 0.73828125, 0.8076171875, 0.876953125, 0.9462890625, 1.015625, 1.0849609375, 1.154296875, 1.2236328125, 1.29296875, 1.3623046875, 1.431640625, 1.5009765625, 1.5703125, 1.6396484375, 1.708984375, 1.7783203125, 1.84765625, 1.9169921875, 1.986328125, 2.0556640625, 2.125, 2.1943359375, 2.263671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 0.0, 1.0, 7.0, 2.0, 11.0, 8.0, 14.0, 13.0, 13.0, 17.0, 29.0, 24.0, 31.0, 31.0, 48.0, 49.0, 39.0, 63.0, 67.0, 54.0, 56.0, 56.0, 52.0, 44.0, 43.0, 42.0, 22.0, 29.0, 17.0, 23.0, 11.0, 11.0, 17.0, 11.0, 12.0, 8.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.92822265625, -0.9004287719726562, -0.8726348876953125, -0.8448410034179688, -0.817047119140625, -0.7892532348632812, -0.7614593505859375, -0.7336654663085938, -0.70587158203125, -0.6780776977539062, -0.6502838134765625, -0.6224899291992188, -0.594696044921875, -0.5669021606445312, -0.5391082763671875, -0.5113143920898438, -0.4835205078125, -0.45572662353515625, -0.4279327392578125, -0.40013885498046875, -0.372344970703125, -0.34455108642578125, -0.3167572021484375, -0.28896331787109375, -0.26116943359375, -0.23337554931640625, -0.2055816650390625, -0.17778778076171875, -0.149993896484375, -0.12220001220703125, -0.0944061279296875, -0.06661224365234375, -0.038818359375, -0.01102447509765625, 0.0167694091796875, 0.04456329345703125, 0.072357177734375, 0.10015106201171875, 0.1279449462890625, 0.15573883056640625, 0.18353271484375, 0.21132659912109375, 0.2391204833984375, 0.26691436767578125, 0.294708251953125, 0.32250213623046875, 0.3502960205078125, 0.37808990478515625, 0.4058837890625, 0.43367767333984375, 0.4614715576171875, 0.48926544189453125, 0.517059326171875, 0.5448532104492188, 0.5726470947265625, 0.6004409790039062, 0.62823486328125, 0.6560287475585938, 0.6838226318359375, 0.7116165161132812, 0.739410400390625, 0.7672042846679688, 0.7949981689453125, 0.8227920532226562, 0.8505859375]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 9.0, 7.0, 9.0, 10.0, 9.0, 18.0, 18.0, 35.0, 28.0, 34.0, 58.0, 58.0, 61.0, 68.0, 60.0, 74.0, 56.0, 79.0, 47.0, 43.0, 38.0, 26.0, 31.0, 24.0, 17.0, 19.0, 8.0, 9.0, 11.0, 9.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.696889877319336, -9.367292404174805, -9.037694931030273, -8.708097457885742, -8.378499984741211, -8.04890251159668, -7.719305038452148, -7.389707565307617, -7.060110092163086, -6.730512619018555, -6.400915145874023, -6.071317672729492, -5.741720199584961, -5.41212272644043, -5.082525253295898, -4.752927780151367, -4.423329830169678, -4.0937323570251465, -3.7641348838806152, -3.434537410736084, -3.1049399375915527, -2.7753424644470215, -2.445744752883911, -2.11614727973938, -1.7865498065948486, -1.4569523334503174, -1.1273548603057861, -0.7977572679519653, -0.4681597948074341, -0.13856232166290283, 0.19103527069091797, 0.5206327438354492, 0.8502302169799805, 1.1798276901245117, 1.509425163269043, 1.8390227556228638, 2.1686201095581055, 2.4982175827026367, 2.827815294265747, 3.1574127674102783, 3.4870102405548096, 3.816607713699341, 4.146205425262451, 4.475802898406982, 4.805400371551514, 5.134997844696045, 5.464595317840576, 5.794192790985107, 6.123790264129639, 6.45338773727417, 6.782985210418701, 7.112582683563232, 7.442180156707764, 7.771777629852295, 8.101375579833984, 8.430973052978516, 8.760570526123047, 9.090167999267578, 9.41976547241211, 9.74936294555664, 10.078960418701172, 10.408557891845703, 10.738155364990234, 11.067752838134766, 11.397350311279297]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 0.0, 3.0, 6.0, 6.0, 4.0, 6.0, 7.0, 5.0, 10.0, 14.0, 23.0, 18.0, 19.0, 13.0, 24.0, 23.0, 25.0, 28.0, 30.0, 35.0, 35.0, 29.0, 35.0, 39.0, 35.0, 26.0, 45.0, 42.0, 45.0, 29.0, 28.0, 38.0, 38.0, 31.0, 30.0, 20.0, 21.0, 16.0, 22.0, 17.0, 10.0, 8.0, 9.0, 18.0, 7.0, 10.0, 4.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 6.0], "bins": [-9.287074089050293, -9.02124309539795, -8.755411148071289, -8.489580154418945, -8.223749160766602, -7.957917213439941, -7.692086219787598, -7.426254749298096, -7.160423278808594, -6.894591808319092, -6.628760814666748, -6.362929344177246, -6.097097873687744, -5.831266403198242, -5.565435409545898, -5.2996039390563965, -5.033772945404053, -4.767941474914551, -4.502110481262207, -4.236279010772705, -3.970447540283203, -3.7046163082122803, -3.4387850761413574, -3.1729536056518555, -2.9071223735809326, -2.6412911415100098, -2.375459671020508, -2.109628438949585, -1.8437970876693726, -1.5779657363891602, -1.3121345043182373, -1.046303153038025, -0.7804718017578125, -0.5146404504776001, -0.24880915880203247, 0.017022132873535156, 0.28285348415374756, 0.54868483543396, 0.8145160675048828, 1.0803474187850952, 1.3461787700653076, 1.61201012134552, 1.8778414726257324, 2.1436727046966553, 2.409503936767578, 2.67533540725708, 2.941166639328003, 3.206997871398926, 3.4728293418884277, 3.7386605739593506, 4.004491806030273, 4.270323276519775, 4.536154747009277, 4.801985740661621, 5.067817211151123, 5.333648681640625, 5.599479675292969, 5.865311145782471, 6.1311421394348145, 6.396973609924316, 6.662805080413818, 6.92863655090332, 7.194467544555664, 7.460299015045166, 7.726130485534668]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 6.0, 8.0, 12.0, 16.0, 31.0, 49.0, 69.0, 95.0, 113.0, 173.0, 273.0, 430.0, 596.0, 970.0, 1412.0, 2094.0, 3162.0, 4844.0, 7786.0, 11960.0, 19517.0, 32053.0, 53248.0, 90616.0, 155930.0, 274137.0, 470673.0, 722376.0, 813362.0, 621755.0, 377513.0, 217108.0, 123769.0, 72753.0, 42873.0, 26406.0, 16284.0, 10016.0, 6603.0, 4335.0, 2855.0, 1883.0, 1308.0, 825.0, 608.0, 392.0, 304.0, 198.0, 153.0, 118.0, 76.0, 40.0, 31.0, 31.0, 19.0, 11.0, 2.0, 5.0, 5.0, 2.0, 4.0], "bins": [-7.484375, -7.2452392578125, -7.006103515625, -6.7669677734375, -6.52783203125, -6.2886962890625, -6.049560546875, -5.8104248046875, -5.5712890625, -5.3321533203125, -5.093017578125, -4.8538818359375, -4.61474609375, -4.3756103515625, -4.136474609375, -3.8973388671875, -3.658203125, -3.4190673828125, -3.179931640625, -2.9407958984375, -2.70166015625, -2.4625244140625, -2.223388671875, -1.9842529296875, -1.7451171875, -1.5059814453125, -1.266845703125, -1.0277099609375, -0.78857421875, -0.5494384765625, -0.310302734375, -0.0711669921875, 0.16796875, 0.4071044921875, 0.646240234375, 0.8853759765625, 1.12451171875, 1.3636474609375, 1.602783203125, 1.8419189453125, 2.0810546875, 2.3201904296875, 2.559326171875, 2.7984619140625, 3.03759765625, 3.2767333984375, 3.515869140625, 3.7550048828125, 3.994140625, 4.2332763671875, 4.472412109375, 4.7115478515625, 4.95068359375, 5.1898193359375, 5.428955078125, 5.6680908203125, 5.9072265625, 6.1463623046875, 6.385498046875, 6.6246337890625, 6.86376953125, 7.1029052734375, 7.342041015625, 7.5811767578125, 7.8203125]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 0.0, 2.0, 3.0, 8.0, 5.0, 4.0, 2.0, 11.0, 10.0, 13.0, 12.0, 13.0, 20.0, 13.0, 30.0, 21.0, 22.0, 24.0, 30.0, 27.0, 26.0, 41.0, 32.0, 38.0, 31.0, 44.0, 26.0, 41.0, 43.0, 36.0, 31.0, 30.0, 38.0, 28.0, 32.0, 25.0, 33.0, 19.0, 25.0, 20.0, 15.0, 9.0, 10.0, 6.0, 14.0, 6.0, 5.0, 7.0, 7.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-5.7109375, -5.53497314453125, -5.3590087890625, -5.18304443359375, -5.007080078125, -4.83111572265625, -4.6551513671875, -4.47918701171875, -4.30322265625, -4.12725830078125, -3.9512939453125, -3.77532958984375, -3.599365234375, -3.42340087890625, -3.2474365234375, -3.07147216796875, -2.8955078125, -2.71954345703125, -2.5435791015625, -2.36761474609375, -2.191650390625, -2.01568603515625, -1.8397216796875, -1.66375732421875, -1.48779296875, -1.31182861328125, -1.1358642578125, -0.95989990234375, -0.783935546875, -0.60797119140625, -0.4320068359375, -0.25604248046875, -0.080078125, 0.09588623046875, 0.2718505859375, 0.44781494140625, 0.623779296875, 0.79974365234375, 0.9757080078125, 1.15167236328125, 1.32763671875, 1.50360107421875, 1.6795654296875, 1.85552978515625, 2.031494140625, 2.20745849609375, 2.3834228515625, 2.55938720703125, 2.7353515625, 2.91131591796875, 3.0872802734375, 3.26324462890625, 3.439208984375, 3.61517333984375, 3.7911376953125, 3.96710205078125, 4.14306640625, 4.31903076171875, 4.4949951171875, 4.67095947265625, 4.846923828125, 5.02288818359375, 5.1988525390625, 5.37481689453125, 5.55078125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 14.0, 20.0, 36.0, 54.0, 74.0, 133.0, 212.0, 352.0, 561.0, 877.0, 1401.0, 2368.0, 3897.0, 6500.0, 11274.0, 19996.0, 34619.0, 62752.0, 114045.0, 205737.0, 362213.0, 587608.0, 782429.0, 747744.0, 528161.0, 316996.0, 178713.0, 98218.0, 54606.0, 30425.0, 17326.0, 10136.0, 6021.0, 3493.0, 2079.0, 1203.0, 746.0, 463.0, 298.0, 182.0, 112.0, 74.0, 47.0, 24.0, 14.0, 16.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.82171630859375, -6.5770263671875, -6.33233642578125, -6.087646484375, -5.84295654296875, -5.5982666015625, -5.35357666015625, -5.10888671875, -4.86419677734375, -4.6195068359375, -4.37481689453125, -4.130126953125, -3.88543701171875, -3.6407470703125, -3.39605712890625, -3.1513671875, -2.90667724609375, -2.6619873046875, -2.41729736328125, -2.172607421875, -1.92791748046875, -1.6832275390625, -1.43853759765625, -1.19384765625, -0.94915771484375, -0.7044677734375, -0.45977783203125, -0.215087890625, 0.02960205078125, 0.2742919921875, 0.51898193359375, 0.763671875, 1.00836181640625, 1.2530517578125, 1.49774169921875, 1.742431640625, 1.98712158203125, 2.2318115234375, 2.47650146484375, 2.72119140625, 2.96588134765625, 3.2105712890625, 3.45526123046875, 3.699951171875, 3.94464111328125, 4.1893310546875, 4.43402099609375, 4.6787109375, 4.92340087890625, 5.1680908203125, 5.41278076171875, 5.657470703125, 5.90216064453125, 6.1468505859375, 6.39154052734375, 6.63623046875, 6.88092041015625, 7.1256103515625, 7.37030029296875, 7.614990234375, 7.85968017578125, 8.1043701171875, 8.34906005859375, 8.59375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 5.0, 9.0, 11.0, 18.0, 18.0, 28.0, 41.0, 49.0, 58.0, 68.0, 78.0, 102.0, 117.0, 122.0, 148.0, 165.0, 194.0, 201.0, 226.0, 219.0, 227.0, 235.0, 199.0, 231.0, 196.0, 157.0, 163.0, 149.0, 103.0, 86.0, 87.0, 59.0, 49.0, 52.0, 39.0, 30.0, 42.0, 17.0, 17.0, 8.0, 9.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.951171875, -2.855316162109375, -2.75946044921875, -2.663604736328125, -2.5677490234375, -2.471893310546875, -2.37603759765625, -2.280181884765625, -2.184326171875, -2.088470458984375, -1.99261474609375, -1.896759033203125, -1.8009033203125, -1.705047607421875, -1.60919189453125, -1.513336181640625, -1.41748046875, -1.321624755859375, -1.22576904296875, -1.129913330078125, -1.0340576171875, -0.938201904296875, -0.84234619140625, -0.746490478515625, -0.650634765625, -0.554779052734375, -0.45892333984375, -0.363067626953125, -0.2672119140625, -0.171356201171875, -0.07550048828125, 0.020355224609375, 0.1162109375, 0.212066650390625, 0.30792236328125, 0.403778076171875, 0.4996337890625, 0.595489501953125, 0.69134521484375, 0.787200927734375, 0.883056640625, 0.978912353515625, 1.07476806640625, 1.170623779296875, 1.2664794921875, 1.362335205078125, 1.45819091796875, 1.554046630859375, 1.64990234375, 1.745758056640625, 1.84161376953125, 1.937469482421875, 2.0333251953125, 2.129180908203125, 2.22503662109375, 2.320892333984375, 2.416748046875, 2.512603759765625, 2.60845947265625, 2.704315185546875, 2.8001708984375, 2.896026611328125, 2.99188232421875, 3.087738037109375, 3.18359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 10.0, 3.0, 11.0, 14.0, 5.0, 11.0, 22.0, 22.0, 43.0, 44.0, 56.0, 70.0, 70.0, 87.0, 88.0, 81.0, 79.0, 53.0, 47.0, 46.0, 34.0, 22.0, 20.0, 12.0, 11.0, 9.0, 10.0, 9.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.693763732910156, -12.303945541381836, -11.914127349853516, -11.524309158325195, -11.134490966796875, -10.744671821594238, -10.354853630065918, -9.965035438537598, -9.575217247009277, -9.185399055480957, -8.795580863952637, -8.405762672424316, -8.01594352722168, -7.626125812530518, -7.236307144165039, -6.846488952636719, -6.456670761108398, -6.066852569580078, -5.677034378051758, -5.287215709686279, -4.897397518157959, -4.507579326629639, -4.11776065826416, -3.72794246673584, -3.3381242752075195, -2.948306083679199, -2.5584876537323, -2.1686692237854004, -1.77885103225708, -1.3890327215194702, -0.9992144107818604, -0.6093959808349609, -0.21957778930664062, 0.17024052143096924, 0.5600588321685791, 0.949877142906189, 1.3396954536437988, 1.7295137643814087, 2.1193320751190186, 2.509150505065918, 2.8989686965942383, 3.2887868881225586, 3.678605318069458, 4.068423748016357, 4.458241939544678, 4.848060131072998, 5.237878799438477, 5.627696990966797, 6.017515182495117, 6.4073333740234375, 6.797151565551758, 7.186970233917236, 7.576788425445557, 7.966606616973877, 8.356425285339355, 8.746243476867676, 9.136061668395996, 9.525879859924316, 9.915698051452637, 10.305516242980957, 10.695335388183594, 11.085153579711914, 11.474971771240234, 11.864789962768555, 12.254608154296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 1.0, 7.0, 9.0, 6.0, 6.0, 12.0, 11.0, 21.0, 12.0, 24.0, 28.0, 13.0, 19.0, 27.0, 31.0, 26.0, 25.0, 40.0, 36.0, 37.0, 42.0, 41.0, 30.0, 39.0, 39.0, 38.0, 33.0, 35.0, 27.0, 42.0, 31.0, 22.0, 26.0, 25.0, 27.0, 15.0, 11.0, 16.0, 15.0, 9.0, 10.0, 6.0, 4.0, 6.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0], "bins": [-8.295062065124512, -8.04754638671875, -7.80003023147583, -7.55251407623291, -7.30499792098999, -7.05748176574707, -6.809966087341309, -6.562449932098389, -6.314933776855469, -6.067417621612549, -5.819901943206787, -5.572385787963867, -5.324869632720947, -5.077353477478027, -4.829837799072266, -4.582321643829346, -4.334805965423584, -4.087289810180664, -3.8397738933563232, -3.5922579765319824, -3.3447418212890625, -3.0972259044647217, -2.849709987640381, -2.602193832397461, -2.35467791557312, -2.1071619987487793, -1.8596458435058594, -1.6121299266815186, -1.3646138906478882, -1.1170978546142578, -0.869581937789917, -0.6220659017562866, -0.37455034255981445, -0.12703433632850647, 0.12048166990280151, 0.3679976463317871, 0.6155136823654175, 0.8630297183990479, 1.1105456352233887, 1.358061671257019, 1.6055777072906494, 1.8530937433242798, 2.10060977935791, 2.348125696182251, 2.595641613006592, 2.8431577682495117, 3.0906736850738525, 3.3381896018981934, 3.5857057571411133, 3.833221673965454, 4.080737590789795, 4.328253746032715, 4.575769901275635, 4.823286056518555, 5.070801734924316, 5.318317890167236, 5.565834045410156, 5.813350200653076, 6.060865879058838, 6.308382034301758, 6.555898189544678, 6.803414344787598, 7.050930023193359, 7.298446178436279, 7.545961856842041]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 13.0, 14.0, 11.0, 21.0, 38.0, 47.0, 77.0, 109.0, 152.0, 207.0, 267.0, 430.0, 667.0, 899.0, 1349.0, 1942.0, 2822.0, 4205.0, 6068.0, 9166.0, 14088.0, 20913.0, 31434.0, 47680.0, 71184.0, 106455.0, 149272.0, 169524.0, 133568.0, 92355.0, 61165.0, 40903.0, 27156.0, 17743.0, 11890.0, 7994.0, 5304.0, 3619.0, 2445.0, 1695.0, 1131.0, 763.0, 561.0, 358.0, 271.0, 162.0, 128.0, 91.0, 69.0, 45.0, 34.0, 20.0, 14.0, 11.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.77880859375, -0.753936767578125, -0.72906494140625, -0.704193115234375, -0.6793212890625, -0.654449462890625, -0.62957763671875, -0.604705810546875, -0.579833984375, -0.554962158203125, -0.53009033203125, -0.505218505859375, -0.4803466796875, -0.455474853515625, -0.43060302734375, -0.405731201171875, -0.380859375, -0.355987548828125, -0.33111572265625, -0.306243896484375, -0.2813720703125, -0.256500244140625, -0.23162841796875, -0.206756591796875, -0.181884765625, -0.157012939453125, -0.13214111328125, -0.107269287109375, -0.0823974609375, -0.057525634765625, -0.03265380859375, -0.007781982421875, 0.01708984375, 0.041961669921875, 0.06683349609375, 0.091705322265625, 0.1165771484375, 0.141448974609375, 0.16632080078125, 0.191192626953125, 0.216064453125, 0.240936279296875, 0.26580810546875, 0.290679931640625, 0.3155517578125, 0.340423583984375, 0.36529541015625, 0.390167236328125, 0.4150390625, 0.439910888671875, 0.46478271484375, 0.489654541015625, 0.5145263671875, 0.539398193359375, 0.56427001953125, 0.589141845703125, 0.614013671875, 0.638885498046875, 0.66375732421875, 0.688629150390625, 0.7135009765625, 0.738372802734375, 0.76324462890625, 0.788116455078125, 0.81298828125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 2.0, 8.0, 7.0, 12.0, 19.0, 15.0, 21.0, 19.0, 20.0, 24.0, 30.0, 28.0, 26.0, 29.0, 30.0, 43.0, 36.0, 58.0, 39.0, 37.0, 42.0, 45.0, 51.0, 42.0, 25.0, 42.0, 29.0, 30.0, 26.0, 29.0, 37.0, 18.0, 12.0, 14.0, 3.0, 6.0, 11.0, 2.0, 10.0, 2.0, 4.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.5, -9.217041015625, -8.93408203125, -8.651123046875, -8.3681640625, -8.085205078125, -7.80224609375, -7.519287109375, -7.236328125, -6.953369140625, -6.67041015625, -6.387451171875, -6.1044921875, -5.821533203125, -5.53857421875, -5.255615234375, -4.97265625, -4.689697265625, -4.40673828125, -4.123779296875, -3.8408203125, -3.557861328125, -3.27490234375, -2.991943359375, -2.708984375, -2.426025390625, -2.14306640625, -1.860107421875, -1.5771484375, -1.294189453125, -1.01123046875, -0.728271484375, -0.4453125, -0.162353515625, 0.12060546875, 0.403564453125, 0.6865234375, 0.969482421875, 1.25244140625, 1.535400390625, 1.818359375, 2.101318359375, 2.38427734375, 2.667236328125, 2.9501953125, 3.233154296875, 3.51611328125, 3.799072265625, 4.08203125, 4.364990234375, 4.64794921875, 4.930908203125, 5.2138671875, 5.496826171875, 5.77978515625, 6.062744140625, 6.345703125, 6.628662109375, 6.91162109375, 7.194580078125, 7.4775390625, 7.760498046875, 8.04345703125, 8.326416015625, 8.609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 10.0, 16.0, 19.0, 37.0, 45.0, 72.0, 97.0, 149.0, 214.0, 381.0, 584.0, 1014.0, 1585.0, 2542.0, 4231.0, 7040.0, 11794.0, 20206.0, 34907.0, 59545.0, 99710.0, 160465.0, 218721.0, 167744.0, 104499.0, 62671.0, 37019.0, 21492.0, 12801.0, 7346.0, 4519.0, 2637.0, 1685.0, 1029.0, 652.0, 366.0, 251.0, 174.0, 109.0, 57.0, 41.0, 28.0, 14.0, 11.0, 8.0, 7.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.1005859375, -1.0667724609375, -1.032958984375, -0.9991455078125, -0.96533203125, -0.9315185546875, -0.897705078125, -0.8638916015625, -0.830078125, -0.7962646484375, -0.762451171875, -0.7286376953125, -0.69482421875, -0.6610107421875, -0.627197265625, -0.5933837890625, -0.5595703125, -0.5257568359375, -0.491943359375, -0.4581298828125, -0.42431640625, -0.3905029296875, -0.356689453125, -0.3228759765625, -0.2890625, -0.2552490234375, -0.221435546875, -0.1876220703125, -0.15380859375, -0.1199951171875, -0.086181640625, -0.0523681640625, -0.0185546875, 0.0152587890625, 0.049072265625, 0.0828857421875, 0.11669921875, 0.1505126953125, 0.184326171875, 0.2181396484375, 0.251953125, 0.2857666015625, 0.319580078125, 0.3533935546875, 0.38720703125, 0.4210205078125, 0.454833984375, 0.4886474609375, 0.5224609375, 0.5562744140625, 0.590087890625, 0.6239013671875, 0.65771484375, 0.6915283203125, 0.725341796875, 0.7591552734375, 0.79296875, 0.8267822265625, 0.860595703125, 0.8944091796875, 0.92822265625, 0.9620361328125, 0.995849609375, 1.0296630859375, 1.0634765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 13.0, 8.0, 17.0, 15.0, 14.0, 20.0, 17.0, 22.0, 36.0, 35.0, 36.0, 42.0, 33.0, 27.0, 28.0, 41.0, 33.0, 38.0, 49.0, 33.0, 32.0, 36.0, 37.0, 30.0, 42.0, 23.0, 32.0, 26.0, 23.0, 22.0, 9.0, 17.0, 12.0, 14.0, 16.0, 10.0, 10.0, 3.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.37890625, -5.2161865234375, -5.053466796875, -4.8907470703125, -4.72802734375, -4.5653076171875, -4.402587890625, -4.2398681640625, -4.0771484375, -3.9144287109375, -3.751708984375, -3.5889892578125, -3.42626953125, -3.2635498046875, -3.100830078125, -2.9381103515625, -2.775390625, -2.6126708984375, -2.449951171875, -2.2872314453125, -2.12451171875, -1.9617919921875, -1.799072265625, -1.6363525390625, -1.4736328125, -1.3109130859375, -1.148193359375, -0.9854736328125, -0.82275390625, -0.6600341796875, -0.497314453125, -0.3345947265625, -0.171875, -0.0091552734375, 0.153564453125, 0.3162841796875, 0.47900390625, 0.6417236328125, 0.804443359375, 0.9671630859375, 1.1298828125, 1.2926025390625, 1.455322265625, 1.6180419921875, 1.78076171875, 1.9434814453125, 2.106201171875, 2.2689208984375, 2.431640625, 2.5943603515625, 2.757080078125, 2.9197998046875, 3.08251953125, 3.2452392578125, 3.407958984375, 3.5706787109375, 3.7333984375, 3.8961181640625, 4.058837890625, 4.2215576171875, 4.38427734375, 4.5469970703125, 4.709716796875, 4.8724365234375, 5.03515625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 5.0, 6.0, 15.0, 23.0, 22.0, 25.0, 28.0, 59.0, 67.0, 109.0, 170.0, 213.0, 299.0, 449.0, 707.0, 1081.0, 1824.0, 3409.0, 7265.0, 18778.0, 68900.0, 407760.0, 430077.0, 71689.0, 19435.0, 7433.0, 3515.0, 1885.0, 1105.0, 685.0, 450.0, 336.0, 183.0, 149.0, 96.0, 78.0, 60.0, 49.0, 33.0, 20.0, 17.0, 14.0, 10.0, 5.0, 5.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.28564453125, -0.27748680114746094, -0.2693290710449219, -0.2611713409423828, -0.25301361083984375, -0.2448558807373047, -0.23669815063476562, -0.22854042053222656, -0.2203826904296875, -0.21222496032714844, -0.20406723022460938, -0.1959095001220703, -0.18775177001953125, -0.1795940399169922, -0.17143630981445312, -0.16327857971191406, -0.155120849609375, -0.14696311950683594, -0.13880538940429688, -0.1306476593017578, -0.12248992919921875, -0.11433219909667969, -0.10617446899414062, -0.09801673889160156, -0.0898590087890625, -0.08170127868652344, -0.07354354858398438, -0.06538581848144531, -0.05722808837890625, -0.04907035827636719, -0.040912628173828125, -0.03275489807128906, -0.02459716796875, -0.016439437866210938, -0.008281707763671875, -0.0001239776611328125, 0.00803375244140625, 0.016191482543945312, 0.024349212646484375, 0.03250694274902344, 0.0406646728515625, 0.04882240295410156, 0.056980133056640625, 0.06513786315917969, 0.07329559326171875, 0.08145332336425781, 0.08961105346679688, 0.09776878356933594, 0.105926513671875, 0.11408424377441406, 0.12224197387695312, 0.1303997039794922, 0.13855743408203125, 0.1467151641845703, 0.15487289428710938, 0.16303062438964844, 0.1711883544921875, 0.17934608459472656, 0.18750381469726562, 0.1956615447998047, 0.20381927490234375, 0.2119770050048828, 0.22013473510742188, 0.22829246520996094, 0.2364501953125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 5.0, 7.0, 13.0, 18.0, 12.0, 21.0, 25.0, 23.0, 29.0, 34.0, 45.0, 53.0, 48.0, 52.0, 73.0, 58.0, 58.0, 64.0, 62.0, 49.0, 31.0, 37.0, 24.0, 36.0, 24.0, 18.0, 8.0, 11.0, 15.0, 9.0, 10.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2040138244628906e-05, -1.1633150279521942e-05, -1.1226162314414978e-05, -1.0819174349308014e-05, -1.041218638420105e-05, -1.0005198419094086e-05, -9.598210453987122e-06, -9.191222488880157e-06, -8.784234523773193e-06, -8.37724655866623e-06, -7.970258593559265e-06, -7.563270628452301e-06, -7.156282663345337e-06, -6.749294698238373e-06, -6.342306733131409e-06, -5.935318768024445e-06, -5.5283308029174805e-06, -5.121342837810516e-06, -4.714354872703552e-06, -4.307366907596588e-06, -3.900378942489624e-06, -3.49339097738266e-06, -3.086403012275696e-06, -2.6794150471687317e-06, -2.2724270820617676e-06, -1.8654391169548035e-06, -1.4584511518478394e-06, -1.0514631867408752e-06, -6.444752216339111e-07, -2.3748725652694702e-07, 1.695007085800171e-07, 5.764886736869812e-07, 9.834766387939453e-07, 1.3904646039009094e-06, 1.7974525690078735e-06, 2.2044405341148376e-06, 2.6114284992218018e-06, 3.018416464328766e-06, 3.42540442943573e-06, 3.832392394542694e-06, 4.239380359649658e-06, 4.646368324756622e-06, 5.0533562898635864e-06, 5.4603442549705505e-06, 5.867332220077515e-06, 6.274320185184479e-06, 6.681308150291443e-06, 7.088296115398407e-06, 7.495284080505371e-06, 7.902272045612335e-06, 8.3092600107193e-06, 8.716247975826263e-06, 9.123235940933228e-06, 9.530223906040192e-06, 9.937211871147156e-06, 1.034419983625412e-05, 1.0751187801361084e-05, 1.1158175766468048e-05, 1.1565163731575012e-05, 1.1972151696681976e-05, 1.237913966178894e-05, 1.2786127626895905e-05, 1.3193115592002869e-05, 1.3600103557109833e-05, 1.4007091522216797e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 9.0, 9.0, 13.0, 13.0, 25.0, 26.0, 22.0, 47.0, 59.0, 72.0, 94.0, 121.0, 198.0, 273.0, 424.0, 592.0, 876.0, 1376.0, 2340.0, 4325.0, 8700.0, 20532.0, 60380.0, 211939.0, 478202.0, 171878.0, 50276.0, 17982.0, 7609.0, 3867.0, 2266.0, 1318.0, 816.0, 563.0, 377.0, 260.0, 193.0, 109.0, 97.0, 81.0, 46.0, 44.0, 30.0, 20.0, 7.0, 18.0, 6.0, 10.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.296630859375, -0.2880134582519531, -0.27939605712890625, -0.2707786560058594, -0.2621612548828125, -0.2535438537597656, -0.24492645263671875, -0.23630905151367188, -0.227691650390625, -0.21907424926757812, -0.21045684814453125, -0.20183944702148438, -0.1932220458984375, -0.18460464477539062, -0.17598724365234375, -0.16736984252929688, -0.15875244140625, -0.15013504028320312, -0.14151763916015625, -0.13290023803710938, -0.1242828369140625, -0.11566543579101562, -0.10704803466796875, -0.09843063354492188, -0.089813232421875, -0.08119583129882812, -0.07257843017578125, -0.06396102905273438, -0.0553436279296875, -0.046726226806640625, -0.03810882568359375, -0.029491424560546875, -0.0208740234375, -0.012256622314453125, -0.00363922119140625, 0.004978179931640625, 0.0135955810546875, 0.022212982177734375, 0.03083038330078125, 0.039447784423828125, 0.048065185546875, 0.056682586669921875, 0.06529998779296875, 0.07391738891601562, 0.0825347900390625, 0.09115219116210938, 0.09976959228515625, 0.10838699340820312, 0.11700439453125, 0.12562179565429688, 0.13423919677734375, 0.14285659790039062, 0.1514739990234375, 0.16009140014648438, 0.16870880126953125, 0.17732620239257812, 0.185943603515625, 0.19456100463867188, 0.20317840576171875, 0.21179580688476562, 0.2204132080078125, 0.22903060913085938, 0.23764801025390625, 0.24626541137695312, 0.2548828125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 9.0, 5.0, 7.0, 13.0, 15.0, 16.0, 27.0, 43.0, 43.0, 69.0, 81.0, 112.0, 93.0, 124.0, 97.0, 47.0, 56.0, 44.0, 30.0, 19.0, 15.0, 8.0, 5.0, 12.0, 3.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08038330078125, -0.07708072662353516, -0.07377815246582031, -0.07047557830810547, -0.06717300415039062, -0.06387042999267578, -0.06056785583496094, -0.057265281677246094, -0.05396270751953125, -0.050660133361816406, -0.04735755920410156, -0.04405498504638672, -0.040752410888671875, -0.03744983673095703, -0.03414726257324219, -0.030844688415527344, -0.0275421142578125, -0.024239540100097656, -0.020936965942382812, -0.01763439178466797, -0.014331817626953125, -0.011029243469238281, -0.0077266693115234375, -0.004424095153808594, -0.00112152099609375, 0.0021810531616210938, 0.0054836273193359375, 0.008786201477050781, 0.012088775634765625, 0.015391349792480469, 0.018693923950195312, 0.021996498107910156, 0.025299072265625, 0.028601646423339844, 0.03190422058105469, 0.03520679473876953, 0.038509368896484375, 0.04181194305419922, 0.04511451721191406, 0.048417091369628906, 0.05171966552734375, 0.055022239685058594, 0.05832481384277344, 0.06162738800048828, 0.06492996215820312, 0.06823253631591797, 0.07153511047363281, 0.07483768463134766, 0.0781402587890625, 0.08144283294677734, 0.08474540710449219, 0.08804798126220703, 0.09135055541992188, 0.09465312957763672, 0.09795570373535156, 0.1012582778930664, 0.10456085205078125, 0.1078634262084961, 0.11116600036621094, 0.11446857452392578, 0.11777114868164062, 0.12107372283935547, 0.12437629699707031, 0.12767887115478516, 0.1309814453125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 9.0, 4.0, 12.0, 13.0, 6.0, 9.0, 21.0, 26.0, 41.0, 37.0, 61.0, 70.0, 79.0, 78.0, 88.0, 91.0, 70.0, 57.0, 40.0, 48.0, 35.0, 21.0, 21.0, 12.0, 11.0, 10.0, 10.0, 9.0, 2.0, 2.0, 4.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.704233169555664, -12.314088821411133, -11.923943519592285, -11.533798217773438, -11.143653869628906, -10.753509521484375, -10.363364219665527, -9.97321891784668, -9.583074569702148, -9.192930221557617, -8.80278491973877, -8.412639617919922, -8.02249526977539, -7.632350444793701, -7.242205619812012, -6.852060794830322, -6.461915969848633, -6.071771144866943, -5.681626319885254, -5.2914814949035645, -4.901336669921875, -4.5111918449401855, -4.121047019958496, -3.7309021949768066, -3.340757369995117, -2.9506125450134277, -2.5604677200317383, -2.170322895050049, -1.7801780700683594, -1.39003324508667, -0.9998884201049805, -0.609743595123291, -0.21959781646728516, 0.1705470085144043, 0.5606918334960938, 0.9508366584777832, 1.3409814834594727, 1.731126308441162, 2.1212711334228516, 2.511415958404541, 2.9015607833862305, 3.29170560836792, 3.6818504333496094, 4.071995258331299, 4.462140083312988, 4.852284908294678, 5.242429733276367, 5.632574558258057, 6.022719383239746, 6.4128642082214355, 6.803009033203125, 7.1931538581848145, 7.583298683166504, 7.973443508148193, 8.363588333129883, 8.753732681274414, 9.143877983093262, 9.53402328491211, 9.92416763305664, 10.314311981201172, 10.70445728302002, 11.094602584838867, 11.484746932983398, 11.87489128112793, 12.265036582946777]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 1.0, 9.0, 7.0, 6.0, 6.0, 13.0, 10.0, 21.0, 12.0, 26.0, 26.0, 15.0, 17.0, 29.0, 29.0, 27.0, 27.0, 39.0, 36.0, 36.0, 43.0, 41.0, 30.0, 38.0, 40.0, 39.0, 32.0, 34.0, 30.0, 39.0, 29.0, 23.0, 27.0, 26.0, 25.0, 14.0, 14.0, 14.0, 16.0, 9.0, 9.0, 6.0, 3.0, 7.0, 4.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-8.295742988586426, -8.048453330993652, -7.801163673400879, -7.5538740158081055, -7.306584358215332, -7.059294700622559, -6.812004566192627, -6.5647149085998535, -6.31742525100708, -6.070135593414307, -5.822845935821533, -5.57555627822876, -5.328266143798828, -5.080976486206055, -4.833686828613281, -4.586397171020508, -4.339107513427734, -4.091817855834961, -3.8445281982421875, -3.597238302230835, -3.3499486446380615, -3.102658987045288, -2.8553690910339355, -2.608079433441162, -2.3607897758483887, -2.1135001182556152, -1.8662103414535522, -1.6189205646514893, -1.3716309070587158, -1.1243412494659424, -0.8770514726638794, -0.6297616958618164, -0.38247203826904297, -0.13518232107162476, 0.11210739612579346, 0.35939711332321167, 0.6066868305206299, 0.8539764881134033, 1.1012662649154663, 1.3485560417175293, 1.5958456993103027, 1.8431353569030762, 2.0904250144958496, 2.337714910507202, 2.5850045680999756, 2.832294225692749, 3.0795841217041016, 3.326873779296875, 3.5741634368896484, 3.821453094482422, 4.068742752075195, 4.316032409667969, 4.563322067260742, 4.810611724853516, 5.057901859283447, 5.305191516876221, 5.552481174468994, 5.799770832061768, 6.047060489654541, 6.2943501472473145, 6.541640281677246, 6.7889299392700195, 7.036219596862793, 7.283509254455566, 7.53079891204834]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 10.0, 9.0, 14.0, 26.0, 43.0, 66.0, 101.0, 133.0, 203.0, 317.0, 450.0, 686.0, 1018.0, 1637.0, 2477.0, 3839.0, 6009.0, 9308.0, 14894.0, 23083.0, 36171.0, 55292.0, 80891.0, 111020.0, 137037.0, 143160.0, 126563.0, 97798.0, 68448.0, 45444.0, 29603.0, 18898.0, 12059.0, 7780.0, 5039.0, 3143.0, 2030.0, 1312.0, 871.0, 559.0, 366.0, 251.0, 155.0, 108.0, 78.0, 62.0, 32.0, 27.0, 16.0, 12.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.6484375, -5.46783447265625, -5.2872314453125, -5.10662841796875, -4.926025390625, -4.74542236328125, -4.5648193359375, -4.38421630859375, -4.20361328125, -4.02301025390625, -3.8424072265625, -3.66180419921875, -3.481201171875, -3.30059814453125, -3.1199951171875, -2.93939208984375, -2.7587890625, -2.57818603515625, -2.3975830078125, -2.21697998046875, -2.036376953125, -1.85577392578125, -1.6751708984375, -1.49456787109375, -1.31396484375, -1.13336181640625, -0.9527587890625, -0.77215576171875, -0.591552734375, -0.41094970703125, -0.2303466796875, -0.04974365234375, 0.130859375, 0.31146240234375, 0.4920654296875, 0.67266845703125, 0.853271484375, 1.03387451171875, 1.2144775390625, 1.39508056640625, 1.57568359375, 1.75628662109375, 1.9368896484375, 2.11749267578125, 2.298095703125, 2.47869873046875, 2.6593017578125, 2.83990478515625, 3.0205078125, 3.20111083984375, 3.3817138671875, 3.56231689453125, 3.742919921875, 3.92352294921875, 4.1041259765625, 4.28472900390625, 4.46533203125, 4.64593505859375, 4.8265380859375, 5.00714111328125, 5.187744140625, 5.36834716796875, 5.5489501953125, 5.72955322265625, 5.91015625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 12.0, 7.0, 7.0, 10.0, 10.0, 8.0, 18.0, 19.0, 23.0, 20.0, 31.0, 30.0, 32.0, 33.0, 28.0, 35.0, 45.0, 42.0, 47.0, 45.0, 44.0, 41.0, 38.0, 41.0, 48.0, 31.0, 31.0, 30.0, 33.0, 30.0, 23.0, 14.0, 16.0, 16.0, 12.0, 6.0, 10.0, 14.0, 5.0, 3.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.3671875, -9.08984375, -8.8125, -8.53515625, -8.2578125, -7.98046875, -7.703125, -7.42578125, -7.1484375, -6.87109375, -6.59375, -6.31640625, -6.0390625, -5.76171875, -5.484375, -5.20703125, -4.9296875, -4.65234375, -4.375, -4.09765625, -3.8203125, -3.54296875, -3.265625, -2.98828125, -2.7109375, -2.43359375, -2.15625, -1.87890625, -1.6015625, -1.32421875, -1.046875, -0.76953125, -0.4921875, -0.21484375, 0.0625, 0.33984375, 0.6171875, 0.89453125, 1.171875, 1.44921875, 1.7265625, 2.00390625, 2.28125, 2.55859375, 2.8359375, 3.11328125, 3.390625, 3.66796875, 3.9453125, 4.22265625, 4.5, 4.77734375, 5.0546875, 5.33203125, 5.609375, 5.88671875, 6.1640625, 6.44140625, 6.71875, 6.99609375, 7.2734375, 7.55078125, 7.828125, 8.10546875, 8.3828125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 9.0, 11.0, 26.0, 34.0, 56.0, 77.0, 122.0, 184.0, 299.0, 431.0, 672.0, 1067.0, 1685.0, 2801.0, 4208.0, 6903.0, 10936.0, 16879.0, 26862.0, 41234.0, 61430.0, 86822.0, 115164.0, 134812.0, 136496.0, 118903.0, 91947.0, 65685.0, 43945.0, 28562.0, 18511.0, 11817.0, 7397.0, 4563.0, 2936.0, 1814.0, 1134.0, 737.0, 477.0, 337.0, 215.0, 112.0, 88.0, 59.0, 32.0, 23.0, 18.0, 14.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.90625, -5.72772216796875, -5.5491943359375, -5.37066650390625, -5.192138671875, -5.01361083984375, -4.8350830078125, -4.65655517578125, -4.47802734375, -4.29949951171875, -4.1209716796875, -3.94244384765625, -3.763916015625, -3.58538818359375, -3.4068603515625, -3.22833251953125, -3.0498046875, -2.87127685546875, -2.6927490234375, -2.51422119140625, -2.335693359375, -2.15716552734375, -1.9786376953125, -1.80010986328125, -1.62158203125, -1.44305419921875, -1.2645263671875, -1.08599853515625, -0.907470703125, -0.72894287109375, -0.5504150390625, -0.37188720703125, -0.193359375, -0.01483154296875, 0.1636962890625, 0.34222412109375, 0.520751953125, 0.69927978515625, 0.8778076171875, 1.05633544921875, 1.23486328125, 1.41339111328125, 1.5919189453125, 1.77044677734375, 1.948974609375, 2.12750244140625, 2.3060302734375, 2.48455810546875, 2.6630859375, 2.84161376953125, 3.0201416015625, 3.19866943359375, 3.377197265625, 3.55572509765625, 3.7342529296875, 3.91278076171875, 4.09130859375, 4.26983642578125, 4.4483642578125, 4.62689208984375, 4.805419921875, 4.98394775390625, 5.1624755859375, 5.34100341796875, 5.51953125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 9.0, 7.0, 14.0, 15.0, 19.0, 18.0, 28.0, 25.0, 30.0, 22.0, 34.0, 40.0, 32.0, 43.0, 44.0, 41.0, 46.0, 24.0, 47.0, 42.0, 42.0, 42.0, 45.0, 35.0, 32.0, 25.0, 30.0, 25.0, 26.0, 24.0, 21.0, 19.0, 7.0, 5.0, 9.0, 7.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.296875, -5.12371826171875, -4.9505615234375, -4.77740478515625, -4.604248046875, -4.43109130859375, -4.2579345703125, -4.08477783203125, -3.91162109375, -3.73846435546875, -3.5653076171875, -3.39215087890625, -3.218994140625, -3.04583740234375, -2.8726806640625, -2.69952392578125, -2.5263671875, -2.35321044921875, -2.1800537109375, -2.00689697265625, -1.833740234375, -1.66058349609375, -1.4874267578125, -1.31427001953125, -1.14111328125, -0.96795654296875, -0.7947998046875, -0.62164306640625, -0.448486328125, -0.27532958984375, -0.1021728515625, 0.07098388671875, 0.244140625, 0.41729736328125, 0.5904541015625, 0.76361083984375, 0.936767578125, 1.10992431640625, 1.2830810546875, 1.45623779296875, 1.62939453125, 1.80255126953125, 1.9757080078125, 2.14886474609375, 2.322021484375, 2.49517822265625, 2.6683349609375, 2.84149169921875, 3.0146484375, 3.18780517578125, 3.3609619140625, 3.53411865234375, 3.707275390625, 3.88043212890625, 4.0535888671875, 4.22674560546875, 4.39990234375, 4.57305908203125, 4.7462158203125, 4.91937255859375, 5.092529296875, 5.26568603515625, 5.4388427734375, 5.61199951171875, 5.78515625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 14.0, 14.0, 30.0, 40.0, 56.0, 82.0, 129.0, 168.0, 246.0, 361.0, 534.0, 747.0, 1107.0, 1638.0, 2483.0, 3638.0, 5379.0, 8266.0, 12719.0, 19932.0, 31044.0, 48962.0, 76701.0, 114436.0, 152229.0, 162284.0, 135571.0, 95628.0, 62264.0, 39406.0, 25074.0, 16082.0, 10318.0, 6822.0, 4608.0, 3039.0, 2054.0, 1377.0, 1000.0, 645.0, 464.0, 331.0, 215.0, 129.0, 86.0, 63.0, 48.0, 30.0, 22.0, 21.0, 9.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.01171875, -1.949371337890625, -1.88702392578125, -1.824676513671875, -1.7623291015625, -1.699981689453125, -1.63763427734375, -1.575286865234375, -1.512939453125, -1.450592041015625, -1.38824462890625, -1.325897216796875, -1.2635498046875, -1.201202392578125, -1.13885498046875, -1.076507568359375, -1.01416015625, -0.951812744140625, -0.88946533203125, -0.827117919921875, -0.7647705078125, -0.702423095703125, -0.64007568359375, -0.577728271484375, -0.515380859375, -0.453033447265625, -0.39068603515625, -0.328338623046875, -0.2659912109375, -0.203643798828125, -0.14129638671875, -0.078948974609375, -0.0166015625, 0.045745849609375, 0.10809326171875, 0.170440673828125, 0.2327880859375, 0.295135498046875, 0.35748291015625, 0.419830322265625, 0.482177734375, 0.544525146484375, 0.60687255859375, 0.669219970703125, 0.7315673828125, 0.793914794921875, 0.85626220703125, 0.918609619140625, 0.98095703125, 1.043304443359375, 1.10565185546875, 1.167999267578125, 1.2303466796875, 1.292694091796875, 1.35504150390625, 1.417388916015625, 1.479736328125, 1.542083740234375, 1.60443115234375, 1.666778564453125, 1.7291259765625, 1.791473388671875, 1.85382080078125, 1.916168212890625, 1.978515625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 7.0, 5.0, 5.0, 14.0, 14.0, 16.0, 17.0, 15.0, 28.0, 29.0, 28.0, 43.0, 35.0, 48.0, 49.0, 61.0, 65.0, 54.0, 59.0, 65.0, 47.0, 47.0, 24.0, 39.0, 30.0, 31.0, 26.0, 21.0, 17.0, 5.0, 6.0, 13.0, 8.0, 5.0, 7.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013697147369384766, -0.0001321006566286087, -0.00012722983956336975, -0.0001223590224981308, -0.00011748820543289185, -0.00011261738836765289, -0.00010774657130241394, -0.00010287575423717499, -9.800493717193604e-05, -9.313412010669708e-05, -8.826330304145813e-05, -8.339248597621918e-05, -7.852166891098022e-05, -7.365085184574127e-05, -6.878003478050232e-05, -6.390921771526337e-05, -5.9038400650024414e-05, -5.416758358478546e-05, -4.929676651954651e-05, -4.4425949454307556e-05, -3.9555132389068604e-05, -3.468431532382965e-05, -2.9813498258590698e-05, -2.4942681193351746e-05, -2.0071864128112793e-05, -1.520104706287384e-05, -1.0330229997634888e-05, -5.459412932395935e-06, -5.885958671569824e-07, 4.28222119808197e-06, 9.153038263320923e-06, 1.4023855328559875e-05, 1.8894672393798828e-05, 2.376548945903778e-05, 2.8636306524276733e-05, 3.3507123589515686e-05, 3.837794065475464e-05, 4.324875771999359e-05, 4.8119574785232544e-05, 5.2990391850471497e-05, 5.786120891571045e-05, 6.27320259809494e-05, 6.760284304618835e-05, 7.247366011142731e-05, 7.734447717666626e-05, 8.221529424190521e-05, 8.708611130714417e-05, 9.195692837238312e-05, 9.682774543762207e-05, 0.00010169856250286102, 0.00010656937956809998, 0.00011144019663333893, 0.00011631101369857788, 0.00012118183076381683, 0.00012605264782905579, 0.00013092346489429474, 0.0001357942819595337, 0.00014066509902477264, 0.0001455359160900116, 0.00015040673315525055, 0.0001552775502204895, 0.00016014836728572845, 0.0001650191843509674, 0.00016989000141620636, 0.0001747608184814453]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 12.0, 7.0, 20.0, 14.0, 20.0, 40.0, 46.0, 48.0, 92.0, 141.0, 201.0, 267.0, 391.0, 637.0, 1022.0, 1486.0, 2345.0, 3992.0, 6566.0, 11352.0, 19930.0, 36134.0, 66140.0, 117384.0, 185085.0, 213768.0, 162105.0, 96541.0, 53201.0, 29370.0, 16301.0, 9320.0, 5450.0, 3308.0, 2046.0, 1244.0, 839.0, 545.0, 343.0, 259.0, 158.0, 110.0, 79.0, 54.0, 38.0, 25.0, 27.0, 11.0, 9.0, 11.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.634765625, -2.553253173828125, -2.47174072265625, -2.390228271484375, -2.3087158203125, -2.227203369140625, -2.14569091796875, -2.064178466796875, -1.982666015625, -1.901153564453125, -1.81964111328125, -1.738128662109375, -1.6566162109375, -1.575103759765625, -1.49359130859375, -1.412078857421875, -1.33056640625, -1.249053955078125, -1.16754150390625, -1.086029052734375, -1.0045166015625, -0.923004150390625, -0.84149169921875, -0.759979248046875, -0.678466796875, -0.596954345703125, -0.51544189453125, -0.433929443359375, -0.3524169921875, -0.270904541015625, -0.18939208984375, -0.107879638671875, -0.0263671875, 0.055145263671875, 0.13665771484375, 0.218170166015625, 0.2996826171875, 0.381195068359375, 0.46270751953125, 0.544219970703125, 0.625732421875, 0.707244873046875, 0.78875732421875, 0.870269775390625, 0.9517822265625, 1.033294677734375, 1.11480712890625, 1.196319580078125, 1.27783203125, 1.359344482421875, 1.44085693359375, 1.522369384765625, 1.6038818359375, 1.685394287109375, 1.76690673828125, 1.848419189453125, 1.929931640625, 2.011444091796875, 2.09295654296875, 2.174468994140625, 2.2559814453125, 2.337493896484375, 2.41900634765625, 2.500518798828125, 2.58203125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 5.0, 9.0, 17.0, 14.0, 23.0, 14.0, 35.0, 37.0, 47.0, 47.0, 55.0, 59.0, 71.0, 69.0, 67.0, 62.0, 60.0, 51.0, 54.0, 34.0, 44.0, 24.0, 21.0, 12.0, 17.0, 10.0, 13.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.158203125, -1.1215972900390625, -1.084991455078125, -1.0483856201171875, -1.01177978515625, -0.9751739501953125, -0.938568115234375, -0.9019622802734375, -0.8653564453125, -0.8287506103515625, -0.792144775390625, -0.7555389404296875, -0.71893310546875, -0.6823272705078125, -0.645721435546875, -0.6091156005859375, -0.572509765625, -0.5359039306640625, -0.499298095703125, -0.4626922607421875, -0.42608642578125, -0.3894805908203125, -0.352874755859375, -0.3162689208984375, -0.2796630859375, -0.2430572509765625, -0.206451416015625, -0.1698455810546875, -0.13323974609375, -0.0966339111328125, -0.060028076171875, -0.0234222412109375, 0.01318359375, 0.0497894287109375, 0.086395263671875, 0.1230010986328125, 0.15960693359375, 0.1962127685546875, 0.232818603515625, 0.2694244384765625, 0.3060302734375, 0.3426361083984375, 0.379241943359375, 0.4158477783203125, 0.45245361328125, 0.4890594482421875, 0.525665283203125, 0.5622711181640625, 0.598876953125, 0.6354827880859375, 0.672088623046875, 0.7086944580078125, 0.74530029296875, 0.7819061279296875, 0.818511962890625, 0.8551177978515625, 0.8917236328125, 0.9283294677734375, 0.964935302734375, 1.0015411376953125, 1.03814697265625, 1.0747528076171875, 1.111358642578125, 1.1479644775390625, 1.1845703125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 4.0, 6.0, 9.0, 15.0, 21.0, 23.0, 30.0, 32.0, 44.0, 48.0, 74.0, 80.0, 72.0, 77.0, 81.0, 71.0, 62.0, 46.0, 34.0, 32.0, 31.0, 16.0, 21.0, 9.0, 11.0, 6.0, 6.0, 8.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.472892761230469, -11.109395027160645, -10.745896339416504, -10.38239860534668, -10.018900871276855, -9.655403137207031, -9.29190444946289, -8.928406715393066, -8.564908981323242, -8.201411247253418, -7.8379130363464355, -7.474414825439453, -7.110917091369629, -6.7474188804626465, -6.383920669555664, -6.02042293548584, -5.656924247741699, -5.293426036834717, -4.929928302764893, -4.56643009185791, -4.202932357788086, -3.8394341468811035, -3.475935935974121, -3.1124379634857178, -2.7489399909973145, -2.385442018508911, -2.021944046020508, -1.6584458351135254, -1.294947862625122, -0.9314498901367188, -0.5679516792297363, -0.204453706741333, 0.1590442657470703, 0.5225422978401184, 0.8860403299331665, 1.2495384216308594, 1.6130363941192627, 1.976534366607666, 2.3400325775146484, 2.7035305500030518, 3.067028522491455, 3.4305264949798584, 3.7940244674682617, 4.157522678375244, 4.521020889282227, 4.884518623352051, 5.248016834259033, 5.611515045166016, 5.97501277923584, 6.338510990142822, 6.7020087242126465, 7.065506935119629, 7.429004669189453, 7.7925028800964355, 8.156001091003418, 8.519498825073242, 8.882997512817383, 9.246495246887207, 9.609993934631348, 9.973491668701172, 10.336989402770996, 10.70048713684082, 11.063985824584961, 11.427483558654785, 11.79098129272461]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 3.0, 5.0, 13.0, 7.0, 16.0, 21.0, 19.0, 19.0, 23.0, 19.0, 29.0, 30.0, 33.0, 24.0, 40.0, 32.0, 50.0, 43.0, 44.0, 47.0, 36.0, 45.0, 51.0, 35.0, 30.0, 34.0, 26.0, 33.0, 33.0, 19.0, 17.0, 14.0, 18.0, 18.0, 14.0, 11.0, 7.0, 3.0, 14.0, 5.0, 3.0, 4.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.947351455688477, -8.6700439453125, -8.39273738861084, -8.115429878234863, -7.838123321533203, -7.560815811157227, -7.283508777618408, -7.00620174407959, -6.7288947105407715, -6.451587677001953, -6.174280643463135, -5.896973609924316, -5.61966609954834, -5.34235954284668, -5.065052032470703, -4.787744998931885, -4.510437965393066, -4.233130931854248, -3.9558238983154297, -3.6785166263580322, -3.401209592819214, -3.1239025592803955, -2.846595287322998, -2.5692882537841797, -2.2919812202453613, -2.014674186706543, -1.737367033958435, -1.4600598812103271, -1.1827528476715088, -0.9054458141326904, -0.6281386613845825, -0.3508315086364746, -0.07352542877197266, 0.20378166437149048, 0.4810887575149536, 0.7583958506584167, 1.0357029438018799, 1.3130099773406982, 1.5903171300888062, 1.867624282836914, 2.1449313163757324, 2.422238349914551, 2.699545383453369, 2.9768526554107666, 3.254159688949585, 3.5314667224884033, 3.808773994445801, 4.086081027984619, 4.3633880615234375, 4.640695095062256, 4.918002128601074, 5.195309162139893, 5.472616195678711, 5.7499237060546875, 6.027230739593506, 6.304537773132324, 6.581844806671143, 6.859151840209961, 7.136458873748779, 7.413765907287598, 7.691073417663574, 7.968379974365234, 8.245687484741211, 8.522994995117188, 8.800301551818848]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 16.0, 19.0, 21.0, 35.0, 36.0, 73.0, 123.0, 133.0, 226.0, 354.0, 521.0, 810.0, 1271.0, 1943.0, 3178.0, 5134.0, 8659.0, 14856.0, 25792.0, 45307.0, 81431.0, 151042.0, 285708.0, 526557.0, 834624.0, 883968.0, 599361.0, 331232.0, 175748.0, 93172.0, 51346.0, 29228.0, 16545.0, 9807.0, 5984.0, 3627.0, 2208.0, 1406.0, 946.0, 616.0, 393.0, 263.0, 178.0, 109.0, 74.0, 63.0, 39.0, 38.0, 21.0, 11.0, 6.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-8.1171875, -7.8563232421875, -7.595458984375, -7.3345947265625, -7.07373046875, -6.8128662109375, -6.552001953125, -6.2911376953125, -6.0302734375, -5.7694091796875, -5.508544921875, -5.2476806640625, -4.98681640625, -4.7259521484375, -4.465087890625, -4.2042236328125, -3.943359375, -3.6824951171875, -3.421630859375, -3.1607666015625, -2.89990234375, -2.6390380859375, -2.378173828125, -2.1173095703125, -1.8564453125, -1.5955810546875, -1.334716796875, -1.0738525390625, -0.81298828125, -0.5521240234375, -0.291259765625, -0.0303955078125, 0.23046875, 0.4913330078125, 0.752197265625, 1.0130615234375, 1.27392578125, 1.5347900390625, 1.795654296875, 2.0565185546875, 2.3173828125, 2.5782470703125, 2.839111328125, 3.0999755859375, 3.36083984375, 3.6217041015625, 3.882568359375, 4.1434326171875, 4.404296875, 4.6651611328125, 4.926025390625, 5.1868896484375, 5.44775390625, 5.7086181640625, 5.969482421875, 6.2303466796875, 6.4912109375, 6.7520751953125, 7.012939453125, 7.2738037109375, 7.53466796875, 7.7955322265625, 8.056396484375, 8.3172607421875, 8.578125]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 3.0, 5.0, 9.0, 8.0, 17.0, 10.0, 14.0, 22.0, 13.0, 27.0, 15.0, 22.0, 35.0, 35.0, 26.0, 32.0, 39.0, 32.0, 47.0, 38.0, 38.0, 56.0, 45.0, 35.0, 31.0, 37.0, 37.0, 32.0, 31.0, 27.0, 27.0, 23.0, 12.0, 19.0, 15.0, 13.0, 10.0, 11.0, 11.0, 6.0, 5.0, 8.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.98046875, -5.798583984375, -5.61669921875, -5.434814453125, -5.2529296875, -5.071044921875, -4.88916015625, -4.707275390625, -4.525390625, -4.343505859375, -4.16162109375, -3.979736328125, -3.7978515625, -3.615966796875, -3.43408203125, -3.252197265625, -3.0703125, -2.888427734375, -2.70654296875, -2.524658203125, -2.3427734375, -2.160888671875, -1.97900390625, -1.797119140625, -1.615234375, -1.433349609375, -1.25146484375, -1.069580078125, -0.8876953125, -0.705810546875, -0.52392578125, -0.342041015625, -0.16015625, 0.021728515625, 0.20361328125, 0.385498046875, 0.5673828125, 0.749267578125, 0.93115234375, 1.113037109375, 1.294921875, 1.476806640625, 1.65869140625, 1.840576171875, 2.0224609375, 2.204345703125, 2.38623046875, 2.568115234375, 2.75, 2.931884765625, 3.11376953125, 3.295654296875, 3.4775390625, 3.659423828125, 3.84130859375, 4.023193359375, 4.205078125, 4.386962890625, 4.56884765625, 4.750732421875, 4.9326171875, 5.114501953125, 5.29638671875, 5.478271484375, 5.66015625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 6.0, 12.0, 18.0, 35.0, 45.0, 82.0, 123.0, 183.0, 317.0, 457.0, 760.0, 1222.0, 2074.0, 3354.0, 5687.0, 9923.0, 17138.0, 29823.0, 52964.0, 92569.0, 166296.0, 291307.0, 485164.0, 702137.0, 777748.0, 619215.0, 396634.0, 233051.0, 131949.0, 74164.0, 42280.0, 24205.0, 13618.0, 7976.0, 4669.0, 2715.0, 1666.0, 965.0, 663.0, 420.0, 243.0, 147.0, 70.0, 67.0, 49.0, 21.0, 15.0, 13.0, 9.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.6171875, -7.38134765625, -7.1455078125, -6.90966796875, -6.673828125, -6.43798828125, -6.2021484375, -5.96630859375, -5.73046875, -5.49462890625, -5.2587890625, -5.02294921875, -4.787109375, -4.55126953125, -4.3154296875, -4.07958984375, -3.84375, -3.60791015625, -3.3720703125, -3.13623046875, -2.900390625, -2.66455078125, -2.4287109375, -2.19287109375, -1.95703125, -1.72119140625, -1.4853515625, -1.24951171875, -1.013671875, -0.77783203125, -0.5419921875, -0.30615234375, -0.0703125, 0.16552734375, 0.4013671875, 0.63720703125, 0.873046875, 1.10888671875, 1.3447265625, 1.58056640625, 1.81640625, 2.05224609375, 2.2880859375, 2.52392578125, 2.759765625, 2.99560546875, 3.2314453125, 3.46728515625, 3.703125, 3.93896484375, 4.1748046875, 4.41064453125, 4.646484375, 4.88232421875, 5.1181640625, 5.35400390625, 5.58984375, 5.82568359375, 6.0615234375, 6.29736328125, 6.533203125, 6.76904296875, 7.0048828125, 7.24072265625, 7.4765625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 13.0, 9.0, 17.0, 23.0, 34.0, 37.0, 56.0, 70.0, 90.0, 121.0, 148.0, 171.0, 187.0, 191.0, 241.0, 276.0, 274.0, 272.0, 275.0, 232.0, 241.0, 197.0, 158.0, 148.0, 116.0, 111.0, 78.0, 64.0, 48.0, 42.0, 38.0, 28.0, 16.0, 8.0, 8.0, 13.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.380859375, -3.269683837890625, -3.15850830078125, -3.047332763671875, -2.9361572265625, -2.824981689453125, -2.71380615234375, -2.602630615234375, -2.491455078125, -2.380279541015625, -2.26910400390625, -2.157928466796875, -2.0467529296875, -1.935577392578125, -1.82440185546875, -1.713226318359375, -1.60205078125, -1.490875244140625, -1.37969970703125, -1.268524169921875, -1.1573486328125, -1.046173095703125, -0.93499755859375, -0.823822021484375, -0.712646484375, -0.601470947265625, -0.49029541015625, -0.379119873046875, -0.2679443359375, -0.156768798828125, -0.04559326171875, 0.065582275390625, 0.1767578125, 0.287933349609375, 0.39910888671875, 0.510284423828125, 0.6214599609375, 0.732635498046875, 0.84381103515625, 0.954986572265625, 1.066162109375, 1.177337646484375, 1.28851318359375, 1.399688720703125, 1.5108642578125, 1.622039794921875, 1.73321533203125, 1.844390869140625, 1.95556640625, 2.066741943359375, 2.17791748046875, 2.289093017578125, 2.4002685546875, 2.511444091796875, 2.62261962890625, 2.733795166015625, 2.844970703125, 2.956146240234375, 3.06732177734375, 3.178497314453125, 3.2896728515625, 3.400848388671875, 3.51202392578125, 3.623199462890625, 3.734375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 1.0, 4.0, 10.0, 6.0, 11.0, 12.0, 20.0, 11.0, 29.0, 28.0, 41.0, 33.0, 59.0, 51.0, 75.0, 70.0, 71.0, 85.0, 65.0, 61.0, 53.0, 40.0, 24.0, 25.0, 19.0, 22.0, 18.0, 11.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.416095733642578, -7.088052272796631, -6.760008811950684, -6.431965351104736, -6.103921890258789, -5.775878429412842, -5.4478349685668945, -5.1197919845581055, -4.791748046875, -4.463704586029053, -4.1356611251831055, -3.807617664337158, -3.479574203491211, -3.1515307426452637, -2.8234875202178955, -2.4954440593719482, -2.16740083694458, -1.8393573760986328, -1.5113139152526855, -1.1832705736160278, -0.8552271127700806, -0.5271836519241333, -0.19914031028747559, 0.12890315055847168, 0.45694661140441895, 0.7849900722503662, 1.1130335330963135, 1.4410768747329712, 1.7691203355789185, 2.097163677215576, 2.4252071380615234, 2.7532505989074707, 3.081294059753418, 3.4093375205993652, 3.7373809814453125, 4.06542444229126, 4.393467903137207, 4.721511363983154, 5.049554824829102, 5.377597808837891, 5.705641746520996, 6.033685207366943, 6.361728668212891, 6.689772129058838, 7.017815589904785, 7.345859050750732, 7.67390251159668, 8.001945495605469, 8.329988479614258, 8.658031463623047, 8.986075401306152, 9.314118385314941, 9.642162322998047, 9.970205307006836, 10.298249244689941, 10.62629222869873, 10.954336166381836, 11.282379150390625, 11.61042308807373, 11.93846607208252, 12.266510009765625, 12.594552993774414, 12.92259693145752, 13.250639915466309, 13.578683853149414]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 4.0, 13.0, 10.0, 15.0, 13.0, 17.0, 18.0, 21.0, 27.0, 29.0, 26.0, 31.0, 35.0, 25.0, 37.0, 48.0, 45.0, 46.0, 54.0, 39.0, 42.0, 38.0, 35.0, 34.0, 33.0, 33.0, 26.0, 31.0, 25.0, 20.0, 19.0, 27.0, 9.0, 16.0, 10.0, 7.0, 12.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.387712478637695, -8.123156547546387, -7.858600616455078, -7.594045162200928, -7.329489231109619, -7.0649333000183105, -6.80037784576416, -6.535821914672852, -6.271265983581543, -6.006710052490234, -5.742154121398926, -5.477598667144775, -5.213042736053467, -4.948486804962158, -4.683931350708008, -4.419375419616699, -4.154819488525391, -3.890263557434082, -3.6257078647613525, -3.361152172088623, -3.0965962409973145, -2.832040309906006, -2.5674846172332764, -2.302928924560547, -2.0383729934692383, -1.7738171815872192, -1.5092613697052002, -1.2447055578231812, -0.9801497459411621, -0.7155939340591431, -0.451038122177124, -0.18648231029510498, 0.07807350158691406, 0.3426293134689331, 0.6071851253509521, 0.8717409372329712, 1.1362967491149902, 1.4008525609970093, 1.6654083728790283, 1.9299641847610474, 2.1945199966430664, 2.459075927734375, 2.7236316204071045, 2.988187313079834, 3.2527432441711426, 3.517299175262451, 3.7818548679351807, 4.04641056060791, 4.310966491699219, 4.575522422790527, 4.840078353881836, 5.104633808135986, 5.369189739227295, 5.6337456703186035, 5.898301124572754, 6.1628570556640625, 6.427412986755371, 6.69196891784668, 6.956524848937988, 7.221080303192139, 7.485636234283447, 7.750192165374756, 8.014747619628906, 8.279303550720215, 8.543859481811523]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 9.0, 14.0, 13.0, 32.0, 41.0, 83.0, 107.0, 184.0, 280.0, 464.0, 695.0, 1167.0, 1711.0, 2821.0, 4474.0, 6966.0, 11334.0, 18042.0, 29531.0, 48019.0, 77046.0, 124524.0, 188047.0, 192368.0, 129754.0, 80337.0, 49376.0, 30796.0, 19065.0, 11573.0, 7329.0, 4571.0, 2808.0, 1864.0, 1117.0, 708.0, 461.0, 307.0, 190.0, 125.0, 66.0, 49.0, 27.0, 24.0, 19.0, 9.0, 1.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8482284545898438, -0.8199920654296875, -0.7917556762695312, -0.763519287109375, -0.7352828979492188, -0.7070465087890625, -0.6788101196289062, -0.65057373046875, -0.6223373413085938, -0.5941009521484375, -0.5658645629882812, -0.537628173828125, -0.5093917846679688, -0.4811553955078125, -0.45291900634765625, -0.4246826171875, -0.39644622802734375, -0.3682098388671875, -0.33997344970703125, -0.311737060546875, -0.28350067138671875, -0.2552642822265625, -0.22702789306640625, -0.19879150390625, -0.17055511474609375, -0.1423187255859375, -0.11408233642578125, -0.085845947265625, -0.05760955810546875, -0.0293731689453125, -0.00113677978515625, 0.027099609375, 0.05533599853515625, 0.0835723876953125, 0.11180877685546875, 0.140045166015625, 0.16828155517578125, 0.1965179443359375, 0.22475433349609375, 0.25299072265625, 0.28122711181640625, 0.3094635009765625, 0.33769989013671875, 0.365936279296875, 0.39417266845703125, 0.4224090576171875, 0.45064544677734375, 0.4788818359375, 0.5071182250976562, 0.5353546142578125, 0.5635910034179688, 0.591827392578125, 0.6200637817382812, 0.6483001708984375, 0.6765365600585938, 0.70477294921875, 0.7330093383789062, 0.7612457275390625, 0.7894821166992188, 0.817718505859375, 0.8459548950195312, 0.8741912841796875, 0.9024276733398438, 0.9306640625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 13.0, 9.0, 16.0, 12.0, 15.0, 23.0, 26.0, 30.0, 31.0, 24.0, 23.0, 30.0, 35.0, 50.0, 42.0, 43.0, 51.0, 47.0, 46.0, 37.0, 35.0, 38.0, 39.0, 31.0, 29.0, 25.0, 32.0, 12.0, 25.0, 22.0, 18.0, 14.0, 15.0, 8.0, 7.0, 11.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4140625, -8.144287109375, -7.87451171875, -7.604736328125, -7.3349609375, -7.065185546875, -6.79541015625, -6.525634765625, -6.255859375, -5.986083984375, -5.71630859375, -5.446533203125, -5.1767578125, -4.906982421875, -4.63720703125, -4.367431640625, -4.09765625, -3.827880859375, -3.55810546875, -3.288330078125, -3.0185546875, -2.748779296875, -2.47900390625, -2.209228515625, -1.939453125, -1.669677734375, -1.39990234375, -1.130126953125, -0.8603515625, -0.590576171875, -0.32080078125, -0.051025390625, 0.21875, 0.488525390625, 0.75830078125, 1.028076171875, 1.2978515625, 1.567626953125, 1.83740234375, 2.107177734375, 2.376953125, 2.646728515625, 2.91650390625, 3.186279296875, 3.4560546875, 3.725830078125, 3.99560546875, 4.265380859375, 4.53515625, 4.804931640625, 5.07470703125, 5.344482421875, 5.6142578125, 5.884033203125, 6.15380859375, 6.423583984375, 6.693359375, 6.963134765625, 7.23291015625, 7.502685546875, 7.7724609375, 8.042236328125, 8.31201171875, 8.581787109375, 8.8515625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 10.0, 24.0, 37.0, 42.0, 92.0, 145.0, 218.0, 445.0, 720.0, 1227.0, 2101.0, 3671.0, 6422.0, 11345.0, 19875.0, 34519.0, 60471.0, 106047.0, 184348.0, 239485.0, 161882.0, 91957.0, 53022.0, 30096.0, 17328.0, 9905.0, 5582.0, 3208.0, 1733.0, 1099.0, 620.0, 367.0, 191.0, 112.0, 89.0, 34.0, 42.0, 20.0, 7.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0009765625, -0.9669036865234375, -0.932830810546875, -0.8987579345703125, -0.86468505859375, -0.8306121826171875, -0.796539306640625, -0.7624664306640625, -0.7283935546875, -0.6943206787109375, -0.660247802734375, -0.6261749267578125, -0.59210205078125, -0.5580291748046875, -0.523956298828125, -0.4898834228515625, -0.455810546875, -0.4217376708984375, -0.387664794921875, -0.3535919189453125, -0.31951904296875, -0.2854461669921875, -0.251373291015625, -0.2173004150390625, -0.1832275390625, -0.1491546630859375, -0.115081787109375, -0.0810089111328125, -0.04693603515625, -0.0128631591796875, 0.021209716796875, 0.0552825927734375, 0.08935546875, 0.1234283447265625, 0.157501220703125, 0.1915740966796875, 0.22564697265625, 0.2597198486328125, 0.293792724609375, 0.3278656005859375, 0.3619384765625, 0.3960113525390625, 0.430084228515625, 0.4641571044921875, 0.49822998046875, 0.5323028564453125, 0.566375732421875, 0.6004486083984375, 0.634521484375, 0.6685943603515625, 0.702667236328125, 0.7367401123046875, 0.77081298828125, 0.8048858642578125, 0.838958740234375, 0.8730316162109375, 0.9071044921875, 0.9411773681640625, 0.975250244140625, 1.0093231201171875, 1.04339599609375, 1.0774688720703125, 1.111541748046875, 1.1456146240234375, 1.1796875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 3.0, 4.0, 11.0, 6.0, 13.0, 11.0, 13.0, 11.0, 19.0, 19.0, 22.0, 31.0, 27.0, 42.0, 31.0, 35.0, 43.0, 34.0, 49.0, 41.0, 35.0, 47.0, 36.0, 32.0, 42.0, 39.0, 42.0, 24.0, 31.0, 28.0, 26.0, 25.0, 28.0, 19.0, 17.0, 13.0, 9.0, 8.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.55859375, -5.39483642578125, -5.2310791015625, -5.06732177734375, -4.903564453125, -4.73980712890625, -4.5760498046875, -4.41229248046875, -4.24853515625, -4.08477783203125, -3.9210205078125, -3.75726318359375, -3.593505859375, -3.42974853515625, -3.2659912109375, -3.10223388671875, -2.9384765625, -2.77471923828125, -2.6109619140625, -2.44720458984375, -2.283447265625, -2.11968994140625, -1.9559326171875, -1.79217529296875, -1.62841796875, -1.46466064453125, -1.3009033203125, -1.13714599609375, -0.973388671875, -0.80963134765625, -0.6458740234375, -0.48211669921875, -0.318359375, -0.15460205078125, 0.0091552734375, 0.17291259765625, 0.336669921875, 0.50042724609375, 0.6641845703125, 0.82794189453125, 0.99169921875, 1.15545654296875, 1.3192138671875, 1.48297119140625, 1.646728515625, 1.81048583984375, 1.9742431640625, 2.13800048828125, 2.3017578125, 2.46551513671875, 2.6292724609375, 2.79302978515625, 2.956787109375, 3.12054443359375, 3.2843017578125, 3.44805908203125, 3.61181640625, 3.77557373046875, 3.9393310546875, 4.10308837890625, 4.266845703125, 4.43060302734375, 4.5943603515625, 4.75811767578125, 4.921875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 7.0, 8.0, 7.0, 18.0, 16.0, 29.0, 36.0, 38.0, 74.0, 103.0, 133.0, 189.0, 294.0, 524.0, 804.0, 1524.0, 2871.0, 6129.0, 15955.0, 58865.0, 414002.0, 453498.0, 63324.0, 16916.0, 6352.0, 2991.0, 1530.0, 769.0, 528.0, 317.0, 210.0, 132.0, 100.0, 72.0, 59.0, 22.0, 28.0, 24.0, 13.0, 12.0, 9.0, 7.0, 1.0, 4.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.344970703125, -0.3338508605957031, -0.32273101806640625, -0.3116111755371094, -0.3004913330078125, -0.2893714904785156, -0.27825164794921875, -0.2671318054199219, -0.256011962890625, -0.24489212036132812, -0.23377227783203125, -0.22265243530273438, -0.2115325927734375, -0.20041275024414062, -0.18929290771484375, -0.17817306518554688, -0.16705322265625, -0.15593338012695312, -0.14481353759765625, -0.13369369506835938, -0.1225738525390625, -0.11145401000976562, -0.10033416748046875, -0.08921432495117188, -0.078094482421875, -0.06697463989257812, -0.05585479736328125, -0.044734954833984375, -0.0336151123046875, -0.022495269775390625, -0.01137542724609375, -0.000255584716796875, 0.0108642578125, 0.021984100341796875, 0.03310394287109375, 0.044223785400390625, 0.0553436279296875, 0.06646347045898438, 0.07758331298828125, 0.08870315551757812, 0.099822998046875, 0.11094284057617188, 0.12206268310546875, 0.13318252563476562, 0.1443023681640625, 0.15542221069335938, 0.16654205322265625, 0.17766189575195312, 0.18878173828125, 0.19990158081054688, 0.21102142333984375, 0.22214126586914062, 0.2332611083984375, 0.24438095092773438, 0.25550079345703125, 0.2666206359863281, 0.277740478515625, 0.2888603210449219, 0.29998016357421875, 0.3111000061035156, 0.3222198486328125, 0.3333396911621094, 0.34445953369140625, 0.3555793762207031, 0.36669921875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 6.0, 12.0, 14.0, 19.0, 21.0, 24.0, 36.0, 48.0, 44.0, 37.0, 40.0, 69.0, 52.0, 46.0, 48.0, 73.0, 65.0, 51.0, 36.0, 43.0, 37.0, 23.0, 28.0, 22.0, 19.0, 22.0, 11.0, 6.0, 6.0, 6.0, 4.0, 5.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0907649993896484e-05, -1.0477378964424133e-05, -1.0047107934951782e-05, -9.616836905479431e-06, -9.18656587600708e-06, -8.756294846534729e-06, -8.326023817062378e-06, -7.895752787590027e-06, -7.465481758117676e-06, -7.035210728645325e-06, -6.604939699172974e-06, -6.1746686697006226e-06, -5.7443976402282715e-06, -5.31412661075592e-06, -4.883855581283569e-06, -4.453584551811218e-06, -4.023313522338867e-06, -3.593042492866516e-06, -3.162771463394165e-06, -2.732500433921814e-06, -2.302229404449463e-06, -1.8719583749771118e-06, -1.4416873455047607e-06, -1.0114163160324097e-06, -5.811452865600586e-07, -1.5087425708770752e-07, 2.7939677238464355e-07, 7.096678018569946e-07, 1.1399388313293457e-06, 1.5702098608016968e-06, 2.000480890274048e-06, 2.430751919746399e-06, 2.86102294921875e-06, 3.291293978691101e-06, 3.721565008163452e-06, 4.151836037635803e-06, 4.582107067108154e-06, 5.012378096580505e-06, 5.4426491260528564e-06, 5.8729201555252075e-06, 6.303191184997559e-06, 6.73346221446991e-06, 7.163733243942261e-06, 7.594004273414612e-06, 8.024275302886963e-06, 8.454546332359314e-06, 8.884817361831665e-06, 9.315088391304016e-06, 9.745359420776367e-06, 1.0175630450248718e-05, 1.060590147972107e-05, 1.103617250919342e-05, 1.1466443538665771e-05, 1.1896714568138123e-05, 1.2326985597610474e-05, 1.2757256627082825e-05, 1.3187527656555176e-05, 1.3617798686027527e-05, 1.4048069715499878e-05, 1.4478340744972229e-05, 1.490861177444458e-05, 1.533888280391693e-05, 1.5769153833389282e-05, 1.6199424862861633e-05, 1.6629695892333984e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 11.0, 11.0, 20.0, 19.0, 30.0, 32.0, 52.0, 56.0, 94.0, 98.0, 158.0, 199.0, 242.0, 399.0, 575.0, 843.0, 1271.0, 2050.0, 3645.0, 6297.0, 12019.0, 24542.0, 56689.0, 155052.0, 412134.0, 227268.0, 78093.0, 32550.0, 14891.0, 7707.0, 4237.0, 2494.0, 1534.0, 989.0, 656.0, 431.0, 278.0, 229.0, 160.0, 113.0, 108.0, 67.0, 52.0, 35.0, 36.0, 32.0, 15.0, 12.0, 13.0, 6.0, 2.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.245361328125, -0.23761367797851562, -0.22986602783203125, -0.22211837768554688, -0.2143707275390625, -0.20662307739257812, -0.19887542724609375, -0.19112777709960938, -0.183380126953125, -0.17563247680664062, -0.16788482666015625, -0.16013717651367188, -0.1523895263671875, -0.14464187622070312, -0.13689422607421875, -0.12914657592773438, -0.12139892578125, -0.11365127563476562, -0.10590362548828125, -0.09815597534179688, -0.0904083251953125, -0.08266067504882812, -0.07491302490234375, -0.06716537475585938, -0.059417724609375, -0.051670074462890625, -0.04392242431640625, -0.036174774169921875, -0.0284271240234375, -0.020679473876953125, -0.01293182373046875, -0.005184173583984375, 0.0025634765625, 0.010311126708984375, 0.01805877685546875, 0.025806427001953125, 0.0335540771484375, 0.041301727294921875, 0.04904937744140625, 0.056797027587890625, 0.064544677734375, 0.07229232788085938, 0.08003997802734375, 0.08778762817382812, 0.0955352783203125, 0.10328292846679688, 0.11103057861328125, 0.11877822875976562, 0.12652587890625, 0.13427352905273438, 0.14202117919921875, 0.14976882934570312, 0.1575164794921875, 0.16526412963867188, 0.17301177978515625, 0.18075942993164062, 0.188507080078125, 0.19625473022460938, 0.20400238037109375, 0.21175003051757812, 0.2194976806640625, 0.22724533081054688, 0.23499298095703125, 0.24274063110351562, 0.25048828125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 2.0, 5.0, 7.0, 8.0, 10.0, 17.0, 16.0, 26.0, 32.0, 44.0, 72.0, 104.0, 141.0, 134.0, 102.0, 82.0, 61.0, 36.0, 21.0, 27.0, 11.0, 9.0, 13.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1044921875, -0.1011343002319336, -0.09777641296386719, -0.09441852569580078, -0.09106063842773438, -0.08770275115966797, -0.08434486389160156, -0.08098697662353516, -0.07762908935546875, -0.07427120208740234, -0.07091331481933594, -0.06755542755126953, -0.06419754028320312, -0.06083965301513672, -0.05748176574707031, -0.054123878479003906, -0.0507659912109375, -0.047408103942871094, -0.04405021667480469, -0.04069232940673828, -0.037334442138671875, -0.03397655487060547, -0.030618667602539062, -0.027260780334472656, -0.02390289306640625, -0.020545005798339844, -0.017187118530273438, -0.013829231262207031, -0.010471343994140625, -0.007113456726074219, -0.0037555694580078125, -0.00039768218994140625, 0.002960205078125, 0.006318092346191406, 0.009675979614257812, 0.013033866882324219, 0.016391754150390625, 0.01974964141845703, 0.023107528686523438, 0.026465415954589844, 0.02982330322265625, 0.033181190490722656, 0.03653907775878906, 0.03989696502685547, 0.043254852294921875, 0.04661273956298828, 0.04997062683105469, 0.053328514099121094, 0.0566864013671875, 0.060044288635253906, 0.06340217590332031, 0.06676006317138672, 0.07011795043945312, 0.07347583770751953, 0.07683372497558594, 0.08019161224365234, 0.08354949951171875, 0.08690738677978516, 0.09026527404785156, 0.09362316131591797, 0.09698104858398438, 0.10033893585205078, 0.10369682312011719, 0.1070547103881836, 0.11041259765625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 0.0, 8.0, 8.0, 9.0, 12.0, 18.0, 17.0, 20.0, 24.0, 43.0, 32.0, 53.0, 54.0, 67.0, 72.0, 70.0, 82.0, 70.0, 68.0, 51.0, 43.0, 30.0, 25.0, 23.0, 17.0, 22.0, 13.0, 14.0, 5.0, 8.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.568352699279785, -7.23896598815918, -6.909578800201416, -6.580191612243652, -6.250804901123047, -5.921418190002441, -5.592031002044678, -5.262643814086914, -4.933257102966309, -4.603870391845703, -4.2744832038879395, -3.945096254348755, -3.6157093048095703, -3.2863223552703857, -2.956935405731201, -2.6275484561920166, -2.298161506652832, -1.9687745571136475, -1.639387607574463, -1.3100006580352783, -0.9806137084960938, -0.6512267589569092, -0.3218398094177246, 0.007547140121459961, 0.33693408966064453, 0.6663210391998291, 0.9957079887390137, 1.3250949382781982, 1.6544818878173828, 1.9838688373565674, 2.313255786895752, 2.6426427364349365, 2.9720306396484375, 3.301417589187622, 3.6308045387268066, 3.960191488265991, 4.289578437805176, 4.618965148925781, 4.948352336883545, 5.277739524841309, 5.607126235961914, 5.9365129470825195, 6.265900135040283, 6.595287322998047, 6.924674034118652, 7.254060745239258, 7.5834479331970215, 7.912835121154785, 8.24222183227539, 8.571608543395996, 8.900995254516602, 9.230382919311523, 9.559769630432129, 9.889156341552734, 10.218544006347656, 10.547930717468262, 10.877317428588867, 11.206704139709473, 11.536090850830078, 11.865478515625, 12.194865226745605, 12.524251937866211, 12.853639602661133, 13.183026313781738, 13.512413024902344]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 13.0, 11.0, 14.0, 11.0, 18.0, 21.0, 19.0, 28.0, 28.0, 25.0, 33.0, 32.0, 27.0, 37.0, 48.0, 46.0, 43.0, 55.0, 39.0, 43.0, 38.0, 37.0, 32.0, 33.0, 33.0, 25.0, 32.0, 25.0, 20.0, 19.0, 24.0, 12.0, 16.0, 10.0, 8.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.398783683776855, -8.134746551513672, -7.870710372924805, -7.606673240661621, -7.342636585235596, -7.07859992980957, -6.814562797546387, -6.550526142120361, -6.286489486694336, -6.0224528312683105, -5.758416175842285, -5.494379043579102, -5.230342388153076, -4.966305732727051, -4.702268600463867, -4.438231945037842, -4.174195289611816, -3.910158634185791, -3.6461217403411865, -3.382084846496582, -3.1180481910705566, -2.8540115356445312, -2.5899746417999268, -2.3259377479553223, -2.061901092529297, -1.797864317893982, -1.533827543258667, -1.269790768623352, -1.005753993988037, -0.7417172193527222, -0.4776804447174072, -0.21364367008209229, 0.050393104553222656, 0.3144298791885376, 0.5784666538238525, 0.8425034284591675, 1.1065402030944824, 1.3705769777297974, 1.6346137523651123, 1.8986505270004272, 2.162687301635742, 2.4267239570617676, 2.690760850906372, 2.9547977447509766, 3.218834400177002, 3.4828710556030273, 3.746907949447632, 4.010944843292236, 4.274981498718262, 4.539018154144287, 4.8030548095703125, 5.067091941833496, 5.3311285972595215, 5.595165252685547, 5.8592023849487305, 6.123239040374756, 6.387275695800781, 6.651312351226807, 6.915349006652832, 7.179386138916016, 7.443422794342041, 7.707459449768066, 7.97149658203125, 8.235532760620117, 8.4995698928833]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 10.0, 21.0, 30.0, 41.0, 74.0, 127.0, 175.0, 294.0, 461.0, 712.0, 1202.0, 1900.0, 2978.0, 4960.0, 7861.0, 12460.0, 19707.0, 31207.0, 48297.0, 72992.0, 104037.0, 132492.0, 146085.0, 135483.0, 107088.0, 76932.0, 51128.0, 33325.0, 21107.0, 13284.0, 8357.0, 5161.0, 3150.0, 1991.0, 1260.0, 779.0, 543.0, 306.0, 204.0, 115.0, 75.0, 54.0, 28.0, 22.0, 17.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.78125, -5.6090087890625, -5.436767578125, -5.2645263671875, -5.09228515625, -4.9200439453125, -4.747802734375, -4.5755615234375, -4.4033203125, -4.2310791015625, -4.058837890625, -3.8865966796875, -3.71435546875, -3.5421142578125, -3.369873046875, -3.1976318359375, -3.025390625, -2.8531494140625, -2.680908203125, -2.5086669921875, -2.33642578125, -2.1641845703125, -1.991943359375, -1.8197021484375, -1.6474609375, -1.4752197265625, -1.302978515625, -1.1307373046875, -0.95849609375, -0.7862548828125, -0.614013671875, -0.4417724609375, -0.26953125, -0.0972900390625, 0.074951171875, 0.2471923828125, 0.41943359375, 0.5916748046875, 0.763916015625, 0.9361572265625, 1.1083984375, 1.2806396484375, 1.452880859375, 1.6251220703125, 1.79736328125, 1.9696044921875, 2.141845703125, 2.3140869140625, 2.486328125, 2.6585693359375, 2.830810546875, 3.0030517578125, 3.17529296875, 3.3475341796875, 3.519775390625, 3.6920166015625, 3.8642578125, 4.0364990234375, 4.208740234375, 4.3809814453125, 4.55322265625, 4.7254638671875, 4.897705078125, 5.0699462890625, 5.2421875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 10.0, 9.0, 6.0, 16.0, 17.0, 22.0, 24.0, 26.0, 36.0, 29.0, 31.0, 44.0, 44.0, 33.0, 41.0, 58.0, 54.0, 57.0, 49.0, 38.0, 34.0, 41.0, 38.0, 35.0, 25.0, 38.0, 21.0, 24.0, 21.0, 20.0, 16.0, 11.0, 4.0, 11.0, 2.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.7449951171875, -8.443115234375, -8.1412353515625, -7.83935546875, -7.5374755859375, -7.235595703125, -6.9337158203125, -6.6318359375, -6.3299560546875, -6.028076171875, -5.7261962890625, -5.42431640625, -5.1224365234375, -4.820556640625, -4.5186767578125, -4.216796875, -3.9149169921875, -3.613037109375, -3.3111572265625, -3.00927734375, -2.7073974609375, -2.405517578125, -2.1036376953125, -1.8017578125, -1.4998779296875, -1.197998046875, -0.8961181640625, -0.59423828125, -0.2923583984375, 0.009521484375, 0.3114013671875, 0.61328125, 0.9151611328125, 1.217041015625, 1.5189208984375, 1.82080078125, 2.1226806640625, 2.424560546875, 2.7264404296875, 3.0283203125, 3.3302001953125, 3.632080078125, 3.9339599609375, 4.23583984375, 4.5377197265625, 4.839599609375, 5.1414794921875, 5.443359375, 5.7452392578125, 6.047119140625, 6.3489990234375, 6.65087890625, 6.9527587890625, 7.254638671875, 7.5565185546875, 7.8583984375, 8.1602783203125, 8.462158203125, 8.7640380859375, 9.06591796875, 9.3677978515625, 9.669677734375, 9.9715576171875, 10.2734375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 5.0, 5.0, 11.0, 2.0, 11.0, 16.0, 32.0, 54.0, 50.0, 95.0, 135.0, 202.0, 275.0, 434.0, 631.0, 955.0, 1342.0, 1911.0, 2973.0, 4143.0, 6158.0, 8929.0, 13350.0, 19095.0, 27185.0, 39497.0, 54545.0, 73626.0, 93474.0, 109479.0, 116881.0, 111546.0, 95429.0, 75857.0, 56765.0, 41118.0, 28919.0, 19881.0, 13966.0, 9340.0, 6188.0, 4423.0, 3077.0, 2070.0, 1409.0, 1014.0, 667.0, 429.0, 328.0, 211.0, 142.0, 89.0, 79.0, 41.0, 28.0, 26.0, 11.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0], "bins": [-4.36328125, -4.22503662109375, -4.0867919921875, -3.94854736328125, -3.810302734375, -3.67205810546875, -3.5338134765625, -3.39556884765625, -3.25732421875, -3.11907958984375, -2.9808349609375, -2.84259033203125, -2.704345703125, -2.56610107421875, -2.4278564453125, -2.28961181640625, -2.1513671875, -2.01312255859375, -1.8748779296875, -1.73663330078125, -1.598388671875, -1.46014404296875, -1.3218994140625, -1.18365478515625, -1.04541015625, -0.90716552734375, -0.7689208984375, -0.63067626953125, -0.492431640625, -0.35418701171875, -0.2159423828125, -0.07769775390625, 0.060546875, 0.19879150390625, 0.3370361328125, 0.47528076171875, 0.613525390625, 0.75177001953125, 0.8900146484375, 1.02825927734375, 1.16650390625, 1.30474853515625, 1.4429931640625, 1.58123779296875, 1.719482421875, 1.85772705078125, 1.9959716796875, 2.13421630859375, 2.2724609375, 2.41070556640625, 2.5489501953125, 2.68719482421875, 2.825439453125, 2.96368408203125, 3.1019287109375, 3.24017333984375, 3.37841796875, 3.51666259765625, 3.6549072265625, 3.79315185546875, 3.931396484375, 4.06964111328125, 4.2078857421875, 4.34613037109375, 4.484375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 10.0, 3.0, 8.0, 9.0, 13.0, 11.0, 17.0, 16.0, 20.0, 18.0, 28.0, 30.0, 25.0, 32.0, 34.0, 31.0, 39.0, 36.0, 42.0, 44.0, 31.0, 39.0, 41.0, 41.0, 37.0, 35.0, 28.0, 33.0, 23.0, 22.0, 25.0, 26.0, 18.0, 22.0, 12.0, 20.0, 13.0, 8.0, 10.0, 4.0, 10.0, 10.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-4.70703125, -4.55908203125, -4.4111328125, -4.26318359375, -4.115234375, -3.96728515625, -3.8193359375, -3.67138671875, -3.5234375, -3.37548828125, -3.2275390625, -3.07958984375, -2.931640625, -2.78369140625, -2.6357421875, -2.48779296875, -2.33984375, -2.19189453125, -2.0439453125, -1.89599609375, -1.748046875, -1.60009765625, -1.4521484375, -1.30419921875, -1.15625, -1.00830078125, -0.8603515625, -0.71240234375, -0.564453125, -0.41650390625, -0.2685546875, -0.12060546875, 0.02734375, 0.17529296875, 0.3232421875, 0.47119140625, 0.619140625, 0.76708984375, 0.9150390625, 1.06298828125, 1.2109375, 1.35888671875, 1.5068359375, 1.65478515625, 1.802734375, 1.95068359375, 2.0986328125, 2.24658203125, 2.39453125, 2.54248046875, 2.6904296875, 2.83837890625, 2.986328125, 3.13427734375, 3.2822265625, 3.43017578125, 3.578125, 3.72607421875, 3.8740234375, 4.02197265625, 4.169921875, 4.31787109375, 4.4658203125, 4.61376953125, 4.76171875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 7.0, 9.0, 17.0, 24.0, 33.0, 47.0, 71.0, 98.0, 134.0, 212.0, 295.0, 451.0, 688.0, 1122.0, 1498.0, 2316.0, 3577.0, 5627.0, 8480.0, 13307.0, 20977.0, 32834.0, 50750.0, 77239.0, 111637.0, 144498.0, 154085.0, 133418.0, 98248.0, 65939.0, 43231.0, 27322.0, 17736.0, 11386.0, 7302.0, 4755.0, 3142.0, 1994.0, 1366.0, 861.0, 580.0, 399.0, 254.0, 195.0, 120.0, 81.0, 55.0, 49.0, 20.0, 18.0, 12.0, 17.0, 7.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.671875, -1.614837646484375, -1.55780029296875, -1.500762939453125, -1.4437255859375, -1.386688232421875, -1.32965087890625, -1.272613525390625, -1.215576171875, -1.158538818359375, -1.10150146484375, -1.044464111328125, -0.9874267578125, -0.930389404296875, -0.87335205078125, -0.816314697265625, -0.75927734375, -0.702239990234375, -0.64520263671875, -0.588165283203125, -0.5311279296875, -0.474090576171875, -0.41705322265625, -0.360015869140625, -0.302978515625, -0.245941162109375, -0.18890380859375, -0.131866455078125, -0.0748291015625, -0.017791748046875, 0.03924560546875, 0.096282958984375, 0.1533203125, 0.210357666015625, 0.26739501953125, 0.324432373046875, 0.3814697265625, 0.438507080078125, 0.49554443359375, 0.552581787109375, 0.609619140625, 0.666656494140625, 0.72369384765625, 0.780731201171875, 0.8377685546875, 0.894805908203125, 0.95184326171875, 1.008880615234375, 1.06591796875, 1.122955322265625, 1.17999267578125, 1.237030029296875, 1.2940673828125, 1.351104736328125, 1.40814208984375, 1.465179443359375, 1.522216796875, 1.579254150390625, 1.63629150390625, 1.693328857421875, 1.7503662109375, 1.807403564453125, 1.86444091796875, 1.921478271484375, 1.978515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 10.0, 8.0, 15.0, 14.0, 30.0, 34.0, 27.0, 45.0, 44.0, 36.0, 47.0, 60.0, 51.0, 55.0, 62.0, 53.0, 63.0, 62.0, 43.0, 48.0, 41.0, 32.0, 32.0, 19.0, 15.0, 18.0, 8.0, 11.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002124309539794922, -0.00020698830485343933, -0.00020154565572738647, -0.00019610300660133362, -0.00019066035747528076, -0.0001852177083492279, -0.00017977505922317505, -0.0001743324100971222, -0.00016888976097106934, -0.00016344711184501648, -0.00015800446271896362, -0.00015256181359291077, -0.0001471191644668579, -0.00014167651534080505, -0.0001362338662147522, -0.00013079121708869934, -0.00012534856796264648, -0.00011990591883659363, -0.00011446326971054077, -0.00010902062058448792, -0.00010357797145843506, -9.81353223323822e-05, -9.269267320632935e-05, -8.725002408027649e-05, -8.180737495422363e-05, -7.636472582817078e-05, -7.092207670211792e-05, -6.547942757606506e-05, -6.003677845001221e-05, -5.459412932395935e-05, -4.9151480197906494e-05, -4.370883107185364e-05, -3.826618194580078e-05, -3.2823532819747925e-05, -2.738088369369507e-05, -2.1938234567642212e-05, -1.6495585441589355e-05, -1.1052936315536499e-05, -5.610287189483643e-06, -1.6763806343078613e-07, 5.27501106262207e-06, 1.0717660188674927e-05, 1.6160309314727783e-05, 2.160295844078064e-05, 2.7045607566833496e-05, 3.248825669288635e-05, 3.793090581893921e-05, 4.3373554944992065e-05, 4.881620407104492e-05, 5.425885319709778e-05, 5.9701502323150635e-05, 6.514415144920349e-05, 7.058680057525635e-05, 7.60294497013092e-05, 8.147209882736206e-05, 8.691474795341492e-05, 9.235739707946777e-05, 9.780004620552063e-05, 0.00010324269533157349, 0.00010868534445762634, 0.0001141279935836792, 0.00011957064270973206, 0.0001250132918357849, 0.00013045594096183777, 0.00013589859008789062]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 7.0, 16.0, 15.0, 29.0, 28.0, 48.0, 90.0, 126.0, 214.0, 308.0, 483.0, 785.0, 1298.0, 2120.0, 3572.0, 6046.0, 10581.0, 17889.0, 30184.0, 51431.0, 85402.0, 131460.0, 173598.0, 176235.0, 136126.0, 88715.0, 54254.0, 31593.0, 18657.0, 10979.0, 6402.0, 3816.0, 2319.0, 1376.0, 864.0, 543.0, 335.0, 199.0, 143.0, 97.0, 59.0, 32.0, 27.0, 10.0, 15.0, 10.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.25, -2.181915283203125, -2.11383056640625, -2.045745849609375, -1.9776611328125, -1.909576416015625, -1.84149169921875, -1.773406982421875, -1.705322265625, -1.637237548828125, -1.56915283203125, -1.501068115234375, -1.4329833984375, -1.364898681640625, -1.29681396484375, -1.228729248046875, -1.16064453125, -1.092559814453125, -1.02447509765625, -0.956390380859375, -0.8883056640625, -0.820220947265625, -0.75213623046875, -0.684051513671875, -0.615966796875, -0.547882080078125, -0.47979736328125, -0.411712646484375, -0.3436279296875, -0.275543212890625, -0.20745849609375, -0.139373779296875, -0.0712890625, -0.003204345703125, 0.06488037109375, 0.132965087890625, 0.2010498046875, 0.269134521484375, 0.33721923828125, 0.405303955078125, 0.473388671875, 0.541473388671875, 0.60955810546875, 0.677642822265625, 0.7457275390625, 0.813812255859375, 0.88189697265625, 0.949981689453125, 1.01806640625, 1.086151123046875, 1.15423583984375, 1.222320556640625, 1.2904052734375, 1.358489990234375, 1.42657470703125, 1.494659423828125, 1.562744140625, 1.630828857421875, 1.69891357421875, 1.766998291015625, 1.8350830078125, 1.903167724609375, 1.97125244140625, 2.039337158203125, 2.107421875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 8.0, 15.0, 9.0, 11.0, 20.0, 25.0, 28.0, 29.0, 27.0, 33.0, 58.0, 61.0, 57.0, 71.0, 71.0, 55.0, 59.0, 56.0, 53.0, 45.0, 30.0, 25.0, 37.0, 24.0, 17.0, 15.0, 11.0, 17.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98828125, -0.9580535888671875, -0.927825927734375, -0.8975982666015625, -0.86737060546875, -0.8371429443359375, -0.806915283203125, -0.7766876220703125, -0.7464599609375, -0.7162322998046875, -0.686004638671875, -0.6557769775390625, -0.62554931640625, -0.5953216552734375, -0.565093994140625, -0.5348663330078125, -0.504638671875, -0.4744110107421875, -0.444183349609375, -0.4139556884765625, -0.38372802734375, -0.3535003662109375, -0.323272705078125, -0.2930450439453125, -0.2628173828125, -0.2325897216796875, -0.202362060546875, -0.1721343994140625, -0.14190673828125, -0.1116790771484375, -0.081451416015625, -0.0512237548828125, -0.02099609375, 0.0092315673828125, 0.039459228515625, 0.0696868896484375, 0.09991455078125, 0.1301422119140625, 0.160369873046875, 0.1905975341796875, 0.2208251953125, 0.2510528564453125, 0.281280517578125, 0.3115081787109375, 0.34173583984375, 0.3719635009765625, 0.402191162109375, 0.4324188232421875, 0.462646484375, 0.4928741455078125, 0.523101806640625, 0.5533294677734375, 0.58355712890625, 0.6137847900390625, 0.644012451171875, 0.6742401123046875, 0.7044677734375, 0.7346954345703125, 0.764923095703125, 0.7951507568359375, 0.82537841796875, 0.8556060791015625, 0.885833740234375, 0.9160614013671875, 0.9462890625]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 10.0, 12.0, 19.0, 13.0, 19.0, 25.0, 24.0, 39.0, 51.0, 59.0, 58.0, 74.0, 64.0, 68.0, 78.0, 86.0, 45.0, 53.0, 29.0, 27.0, 25.0, 28.0, 17.0, 18.0, 14.0, 13.0, 4.0, 3.0, 1.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.159231185913086, -7.824673652648926, -7.490115642547607, -7.155557632446289, -6.821000099182129, -6.486442565917969, -6.15188455581665, -5.817326545715332, -5.482769012451172, -5.148211479187012, -4.813653469085693, -4.479095458984375, -4.144537925720215, -3.8099801540374756, -3.4754223823547363, -3.140864610671997, -2.806306838989258, -2.4717490673065186, -2.1371912956237793, -1.80263352394104, -1.4680757522583008, -1.1335179805755615, -0.7989602088928223, -0.464402437210083, -0.12984466552734375, 0.2047131061553955, 0.5392708778381348, 0.873828649520874, 1.2083864212036133, 1.5429441928863525, 1.8775019645690918, 2.212059736251831, 2.546616554260254, 2.881174325942993, 3.2157320976257324, 3.5502898693084717, 3.884847640991211, 4.219405174255371, 4.5539631843566895, 4.888521194458008, 5.223078727722168, 5.557636260986328, 5.8921942710876465, 6.226752281188965, 6.561309814453125, 6.895867347717285, 7.2304253578186035, 7.564983367919922, 7.899540901184082, 8.234098434448242, 8.568656921386719, 8.903214454650879, 9.237771987915039, 9.5723295211792, 9.90688705444336, 10.241445541381836, 10.576003074645996, 10.910560607910156, 11.245119094848633, 11.579676628112793, 11.914234161376953, 12.248791694641113, 12.583349227905273, 12.91790771484375, 13.25246524810791]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 9.0, 15.0, 8.0, 15.0, 12.0, 17.0, 15.0, 22.0, 26.0, 28.0, 27.0, 36.0, 29.0, 35.0, 33.0, 37.0, 42.0, 43.0, 40.0, 40.0, 38.0, 40.0, 50.0, 35.0, 35.0, 30.0, 27.0, 32.0, 24.0, 23.0, 21.0, 16.0, 21.0, 8.0, 14.0, 10.0, 10.0, 9.0, 10.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 5.0, 2.0, 1.0], "bins": [-9.387768745422363, -9.122356414794922, -8.856943130493164, -8.591530799865723, -8.326118469238281, -8.060705184936523, -7.795292854309082, -7.529880046844482, -7.264467239379883, -6.999054431915283, -6.733642101287842, -6.468229293823242, -6.202816486358643, -5.937403678894043, -5.671991348266602, -5.406578540802002, -5.1411662101745605, -4.875753402709961, -4.6103410720825195, -4.34492826461792, -4.07951545715332, -3.8141028881073, -3.5486903190612793, -3.2832775115966797, -3.017864942550659, -2.7524523735046387, -2.487039566040039, -2.2216269969940186, -1.9562143087387085, -1.6908016204833984, -1.425389051437378, -1.1599763631820679, -0.8945636749267578, -0.6291509866714478, -0.36373835802078247, -0.09832572937011719, 0.16708695888519287, 0.43249964714050293, 0.6979122161865234, 0.9633249044418335, 1.2287375926971436, 1.4941502809524536, 1.7595629692077637, 2.024975538253784, 2.2903881072998047, 2.5558009147644043, 2.821213483810425, 3.0866260528564453, 3.352038860321045, 3.6174514293670654, 3.882864236831665, 4.1482768058776855, 4.413689613342285, 4.679101943969727, 4.944514751434326, 5.209927558898926, 5.475339889526367, 5.740752696990967, 6.006165027618408, 6.271577835083008, 6.536990642547607, 6.802403450012207, 7.067815780639648, 7.333228588104248, 7.598641395568848]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 8.0, 7.0, 11.0, 14.0, 25.0, 35.0, 49.0, 74.0, 106.0, 151.0, 241.0, 380.0, 649.0, 1052.0, 1831.0, 3076.0, 5163.0, 9234.0, 16249.0, 29482.0, 54776.0, 103030.0, 199482.0, 386182.0, 700388.0, 958463.0, 780347.0, 448020.0, 232023.0, 120499.0, 63065.0, 34420.0, 18949.0, 10683.0, 6328.0, 3763.0, 2256.0, 1416.0, 827.0, 559.0, 338.0, 236.0, 138.0, 99.0, 69.0, 24.0, 27.0, 17.0, 12.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.6407470703125, -8.367431640625, -8.0941162109375, -7.82080078125, -7.5474853515625, -7.274169921875, -7.0008544921875, -6.7275390625, -6.4542236328125, -6.180908203125, -5.9075927734375, -5.63427734375, -5.3609619140625, -5.087646484375, -4.8143310546875, -4.541015625, -4.2677001953125, -3.994384765625, -3.7210693359375, -3.44775390625, -3.1744384765625, -2.901123046875, -2.6278076171875, -2.3544921875, -2.0811767578125, -1.807861328125, -1.5345458984375, -1.26123046875, -0.9879150390625, -0.714599609375, -0.4412841796875, -0.16796875, 0.1053466796875, 0.378662109375, 0.6519775390625, 0.92529296875, 1.1986083984375, 1.471923828125, 1.7452392578125, 2.0185546875, 2.2918701171875, 2.565185546875, 2.8385009765625, 3.11181640625, 3.3851318359375, 3.658447265625, 3.9317626953125, 4.205078125, 4.4783935546875, 4.751708984375, 5.0250244140625, 5.29833984375, 5.5716552734375, 5.844970703125, 6.1182861328125, 6.3916015625, 6.6649169921875, 6.938232421875, 7.2115478515625, 7.48486328125, 7.7581787109375, 8.031494140625, 8.3048095703125, 8.578125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 6.0, 15.0, 6.0, 12.0, 21.0, 16.0, 17.0, 16.0, 28.0, 31.0, 34.0, 36.0, 32.0, 32.0, 41.0, 35.0, 39.0, 41.0, 41.0, 38.0, 48.0, 45.0, 33.0, 33.0, 39.0, 31.0, 29.0, 27.0, 30.0, 23.0, 19.0, 12.0, 14.0, 13.0, 11.0, 7.0, 9.0, 12.0, 7.0, 5.0, 2.0, 4.0, 1.0, 4.0, 0.0, 3.0, 2.0], "bins": [-6.5078125, -6.325439453125, -6.14306640625, -5.960693359375, -5.7783203125, -5.595947265625, -5.41357421875, -5.231201171875, -5.048828125, -4.866455078125, -4.68408203125, -4.501708984375, -4.3193359375, -4.136962890625, -3.95458984375, -3.772216796875, -3.58984375, -3.407470703125, -3.22509765625, -3.042724609375, -2.8603515625, -2.677978515625, -2.49560546875, -2.313232421875, -2.130859375, -1.948486328125, -1.76611328125, -1.583740234375, -1.4013671875, -1.218994140625, -1.03662109375, -0.854248046875, -0.671875, -0.489501953125, -0.30712890625, -0.124755859375, 0.0576171875, 0.239990234375, 0.42236328125, 0.604736328125, 0.787109375, 0.969482421875, 1.15185546875, 1.334228515625, 1.5166015625, 1.698974609375, 1.88134765625, 2.063720703125, 2.24609375, 2.428466796875, 2.61083984375, 2.793212890625, 2.9755859375, 3.157958984375, 3.34033203125, 3.522705078125, 3.705078125, 3.887451171875, 4.06982421875, 4.252197265625, 4.4345703125, 4.616943359375, 4.79931640625, 4.981689453125, 5.1640625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 14.0, 16.0, 29.0, 29.0, 77.0, 111.0, 190.0, 297.0, 499.0, 833.0, 1351.0, 2170.0, 3693.0, 6221.0, 10787.0, 18068.0, 31468.0, 55890.0, 98754.0, 171282.0, 292582.0, 474813.0, 668589.0, 740892.0, 613656.0, 412530.0, 249657.0, 144065.0, 83112.0, 47556.0, 26710.0, 15637.0, 8968.0, 5470.0, 3293.0, 1928.0, 1196.0, 681.0, 411.0, 272.0, 154.0, 110.0, 76.0, 53.0, 26.0, 23.0, 20.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.046875, -6.82208251953125, -6.5972900390625, -6.37249755859375, -6.147705078125, -5.92291259765625, -5.6981201171875, -5.47332763671875, -5.24853515625, -5.02374267578125, -4.7989501953125, -4.57415771484375, -4.349365234375, -4.12457275390625, -3.8997802734375, -3.67498779296875, -3.4501953125, -3.22540283203125, -3.0006103515625, -2.77581787109375, -2.551025390625, -2.32623291015625, -2.1014404296875, -1.87664794921875, -1.65185546875, -1.42706298828125, -1.2022705078125, -0.97747802734375, -0.752685546875, -0.52789306640625, -0.3031005859375, -0.07830810546875, 0.146484375, 0.37127685546875, 0.5960693359375, 0.82086181640625, 1.045654296875, 1.27044677734375, 1.4952392578125, 1.72003173828125, 1.94482421875, 2.16961669921875, 2.3944091796875, 2.61920166015625, 2.843994140625, 3.06878662109375, 3.2935791015625, 3.51837158203125, 3.7431640625, 3.96795654296875, 4.1927490234375, 4.41754150390625, 4.642333984375, 4.86712646484375, 5.0919189453125, 5.31671142578125, 5.54150390625, 5.76629638671875, 5.9910888671875, 6.21588134765625, 6.440673828125, 6.66546630859375, 6.8902587890625, 7.11505126953125, 7.33984375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 11.0, 10.0, 15.0, 24.0, 16.0, 26.0, 36.0, 44.0, 64.0, 75.0, 94.0, 99.0, 113.0, 144.0, 155.0, 162.0, 193.0, 215.0, 236.0, 197.0, 190.0, 229.0, 216.0, 204.0, 186.0, 166.0, 142.0, 127.0, 105.0, 94.0, 84.0, 68.0, 56.0, 46.0, 44.0, 42.0, 33.0, 33.0, 16.0, 12.0, 9.0, 9.0, 9.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.701171875, -2.613372802734375, -2.52557373046875, -2.437774658203125, -2.3499755859375, -2.262176513671875, -2.17437744140625, -2.086578369140625, -1.998779296875, -1.910980224609375, -1.82318115234375, -1.735382080078125, -1.6475830078125, -1.559783935546875, -1.47198486328125, -1.384185791015625, -1.29638671875, -1.208587646484375, -1.12078857421875, -1.032989501953125, -0.9451904296875, -0.857391357421875, -0.76959228515625, -0.681793212890625, -0.593994140625, -0.506195068359375, -0.41839599609375, -0.330596923828125, -0.2427978515625, -0.154998779296875, -0.06719970703125, 0.020599365234375, 0.1083984375, 0.196197509765625, 0.28399658203125, 0.371795654296875, 0.4595947265625, 0.547393798828125, 0.63519287109375, 0.722991943359375, 0.810791015625, 0.898590087890625, 0.98638916015625, 1.074188232421875, 1.1619873046875, 1.249786376953125, 1.33758544921875, 1.425384521484375, 1.51318359375, 1.600982666015625, 1.68878173828125, 1.776580810546875, 1.8643798828125, 1.952178955078125, 2.03997802734375, 2.127777099609375, 2.215576171875, 2.303375244140625, 2.39117431640625, 2.478973388671875, 2.5667724609375, 2.654571533203125, 2.74237060546875, 2.830169677734375, 2.91796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 5.0, 7.0, 8.0, 9.0, 13.0, 17.0, 24.0, 26.0, 44.0, 51.0, 53.0, 56.0, 76.0, 78.0, 89.0, 83.0, 54.0, 52.0, 49.0, 28.0, 31.0, 31.0, 24.0, 13.0, 13.0, 14.0, 8.0, 7.0, 7.0, 1.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.138949394226074, -8.816730499267578, -8.494511604309082, -8.172292709350586, -7.850073337554932, -7.5278544425964355, -7.205635070800781, -6.883416175842285, -6.561197280883789, -6.238978385925293, -5.916759490966797, -5.594540119171143, -5.2723212242126465, -4.95010232925415, -4.627882957458496, -4.3056640625, -3.983445167541504, -3.661226272583008, -3.3390071392059326, -3.0167880058288574, -2.6945691108703613, -2.3723502159118652, -2.05013108253479, -1.7279119491577148, -1.4056930541992188, -1.083474040031433, -0.7612550258636475, -0.4390360116958618, -0.11681699752807617, 0.20540201663970947, 0.5276210308074951, 0.8498401641845703, 1.17205810546875, 1.4942771196365356, 1.8164961338043213, 2.1387152671813965, 2.4609341621398926, 2.7831530570983887, 3.105372190475464, 3.427591323852539, 3.749810218811035, 4.072029113769531, 4.394248008728027, 4.716467380523682, 5.038686275482178, 5.360905170440674, 5.683124542236328, 6.005343437194824, 6.32756233215332, 6.649781227111816, 6.9720001220703125, 7.294219493865967, 7.616438388824463, 7.938657283782959, 8.260876655578613, 8.58309555053711, 8.905314445495605, 9.227533340454102, 9.549752235412598, 9.871971130371094, 10.194190979003906, 10.516409873962402, 10.838628768920898, 11.160847663879395, 11.48306655883789]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 12.0, 10.0, 15.0, 17.0, 21.0, 20.0, 26.0, 13.0, 29.0, 25.0, 42.0, 33.0, 36.0, 41.0, 26.0, 46.0, 47.0, 49.0, 37.0, 42.0, 39.0, 43.0, 41.0, 37.0, 26.0, 27.0, 29.0, 22.0, 18.0, 23.0, 11.0, 11.0, 13.0, 19.0, 9.0, 10.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0], "bins": [-8.888531684875488, -8.632902145385742, -8.37727165222168, -8.121642112731934, -7.866012096405029, -7.610382080078125, -7.354752540588379, -7.099122524261475, -6.84349250793457, -6.587862491607666, -6.332232475280762, -6.076602935791016, -5.820972919464111, -5.565342903137207, -5.309713363647461, -5.054083347320557, -4.798453330993652, -4.542823314666748, -4.287193298339844, -4.031563758850098, -3.7759337425231934, -3.520303726196289, -3.264673948287964, -3.0090441703796387, -2.7534141540527344, -2.49778413772583, -2.242154359817505, -1.9865244626998901, -1.7308945655822754, -1.4752646684646606, -1.219634771347046, -0.9640048742294312, -0.7083749771118164, -0.45274507999420166, -0.19711518287658691, 0.05851471424102783, 0.3141446113586426, 0.5697745084762573, 0.8254044055938721, 1.0810343027114868, 1.3366641998291016, 1.5922940969467163, 1.847923994064331, 2.1035537719726562, 2.3591837882995605, 2.614813804626465, 2.87044358253479, 3.1260733604431152, 3.3817033767700195, 3.637333393096924, 3.892963171005249, 4.148592948913574, 4.4042229652404785, 4.659852981567383, 4.915482521057129, 5.171112537384033, 5.4267425537109375, 5.682372570037842, 5.938002586364746, 6.193632125854492, 6.4492621421813965, 6.704892158508301, 6.960521697998047, 7.216151714324951, 7.4717817306518555]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 6.0, 8.0, 12.0, 18.0, 24.0, 35.0, 43.0, 62.0, 101.0, 117.0, 195.0, 293.0, 405.0, 576.0, 846.0, 1259.0, 1923.0, 2809.0, 4215.0, 6353.0, 9654.0, 14800.0, 23014.0, 35694.0, 55564.0, 87063.0, 133732.0, 183561.0, 166622.0, 112651.0, 73601.0, 46858.0, 30071.0, 19355.0, 12590.0, 8144.0, 5269.0, 3630.0, 2401.0, 1534.0, 1095.0, 715.0, 499.0, 346.0, 208.0, 165.0, 115.0, 88.0, 76.0, 43.0, 27.0, 17.0, 22.0, 11.0, 8.0, 9.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.8154296875, -0.7889556884765625, -0.762481689453125, -0.7360076904296875, -0.70953369140625, -0.6830596923828125, -0.656585693359375, -0.6301116943359375, -0.6036376953125, -0.5771636962890625, -0.550689697265625, -0.5242156982421875, -0.49774169921875, -0.4712677001953125, -0.444793701171875, -0.4183197021484375, -0.391845703125, -0.3653717041015625, -0.338897705078125, -0.3124237060546875, -0.28594970703125, -0.2594757080078125, -0.233001708984375, -0.2065277099609375, -0.1800537109375, -0.1535797119140625, -0.127105712890625, -0.1006317138671875, -0.07415771484375, -0.0476837158203125, -0.021209716796875, 0.0052642822265625, 0.03173828125, 0.0582122802734375, 0.084686279296875, 0.1111602783203125, 0.13763427734375, 0.1641082763671875, 0.190582275390625, 0.2170562744140625, 0.2435302734375, 0.2700042724609375, 0.296478271484375, 0.3229522705078125, 0.34942626953125, 0.3759002685546875, 0.402374267578125, 0.4288482666015625, 0.455322265625, 0.4817962646484375, 0.508270263671875, 0.5347442626953125, 0.56121826171875, 0.5876922607421875, 0.614166259765625, 0.6406402587890625, 0.6671142578125, 0.6935882568359375, 0.720062255859375, 0.7465362548828125, 0.77301025390625, 0.7994842529296875, 0.825958251953125, 0.8524322509765625, 0.87890625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 9.0, 7.0, 10.0, 29.0, 21.0, 17.0, 24.0, 24.0, 23.0, 32.0, 33.0, 37.0, 42.0, 35.0, 43.0, 50.0, 51.0, 37.0, 41.0, 46.0, 39.0, 52.0, 38.0, 26.0, 29.0, 35.0, 16.0, 19.0, 21.0, 19.0, 14.0, 9.0, 17.0, 14.0, 7.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.3031005859375, -8.028076171875, -7.7530517578125, -7.47802734375, -7.2030029296875, -6.927978515625, -6.6529541015625, -6.3779296875, -6.1029052734375, -5.827880859375, -5.5528564453125, -5.27783203125, -5.0028076171875, -4.727783203125, -4.4527587890625, -4.177734375, -3.9027099609375, -3.627685546875, -3.3526611328125, -3.07763671875, -2.8026123046875, -2.527587890625, -2.2525634765625, -1.9775390625, -1.7025146484375, -1.427490234375, -1.1524658203125, -0.87744140625, -0.6024169921875, -0.327392578125, -0.0523681640625, 0.22265625, 0.4976806640625, 0.772705078125, 1.0477294921875, 1.32275390625, 1.5977783203125, 1.872802734375, 2.1478271484375, 2.4228515625, 2.6978759765625, 2.972900390625, 3.2479248046875, 3.52294921875, 3.7979736328125, 4.072998046875, 4.3480224609375, 4.623046875, 4.8980712890625, 5.173095703125, 5.4481201171875, 5.72314453125, 5.9981689453125, 6.273193359375, 6.5482177734375, 6.8232421875, 7.0982666015625, 7.373291015625, 7.6483154296875, 7.92333984375, 8.1983642578125, 8.473388671875, 8.7484130859375, 9.0234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 15.0, 18.0, 40.0, 37.0, 61.0, 100.0, 146.0, 213.0, 357.0, 634.0, 1031.0, 1716.0, 3147.0, 5479.0, 9746.0, 17696.0, 31977.0, 58409.0, 104784.0, 182456.0, 244104.0, 169366.0, 96825.0, 53509.0, 29464.0, 16324.0, 8862.0, 5081.0, 2806.0, 1612.0, 1013.0, 557.0, 353.0, 209.0, 130.0, 93.0, 53.0, 35.0, 26.0, 13.0, 19.0, 4.0, 6.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1147308349609375, -1.078094482421875, -1.0414581298828125, -1.00482177734375, -0.9681854248046875, -0.931549072265625, -0.8949127197265625, -0.8582763671875, -0.8216400146484375, -0.785003662109375, -0.7483673095703125, -0.71173095703125, -0.6750946044921875, -0.638458251953125, -0.6018218994140625, -0.565185546875, -0.5285491943359375, -0.491912841796875, -0.4552764892578125, -0.41864013671875, -0.3820037841796875, -0.345367431640625, -0.3087310791015625, -0.2720947265625, -0.2354583740234375, -0.198822021484375, -0.1621856689453125, -0.12554931640625, -0.0889129638671875, -0.052276611328125, -0.0156402587890625, 0.02099609375, 0.0576324462890625, 0.094268798828125, 0.1309051513671875, 0.16754150390625, 0.2041778564453125, 0.240814208984375, 0.2774505615234375, 0.3140869140625, 0.3507232666015625, 0.387359619140625, 0.4239959716796875, 0.46063232421875, 0.4972686767578125, 0.533905029296875, 0.5705413818359375, 0.607177734375, 0.6438140869140625, 0.680450439453125, 0.7170867919921875, 0.75372314453125, 0.7903594970703125, 0.826995849609375, 0.8636322021484375, 0.9002685546875, 0.9369049072265625, 0.973541259765625, 1.0101776123046875, 1.04681396484375, 1.0834503173828125, 1.120086669921875, 1.1567230224609375, 1.193359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 4.0, 11.0, 14.0, 14.0, 17.0, 18.0, 18.0, 27.0, 34.0, 26.0, 23.0, 37.0, 39.0, 27.0, 36.0, 35.0, 43.0, 59.0, 51.0, 37.0, 48.0, 39.0, 34.0, 36.0, 30.0, 29.0, 38.0, 24.0, 24.0, 24.0, 14.0, 14.0, 12.0, 10.0, 11.0, 6.0, 4.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.11328125, -4.94696044921875, -4.7806396484375, -4.61431884765625, -4.447998046875, -4.28167724609375, -4.1153564453125, -3.94903564453125, -3.78271484375, -3.61639404296875, -3.4500732421875, -3.28375244140625, -3.117431640625, -2.95111083984375, -2.7847900390625, -2.61846923828125, -2.4521484375, -2.28582763671875, -2.1195068359375, -1.95318603515625, -1.786865234375, -1.62054443359375, -1.4542236328125, -1.28790283203125, -1.12158203125, -0.95526123046875, -0.7889404296875, -0.62261962890625, -0.456298828125, -0.28997802734375, -0.1236572265625, 0.04266357421875, 0.208984375, 0.37530517578125, 0.5416259765625, 0.70794677734375, 0.874267578125, 1.04058837890625, 1.2069091796875, 1.37322998046875, 1.53955078125, 1.70587158203125, 1.8721923828125, 2.03851318359375, 2.204833984375, 2.37115478515625, 2.5374755859375, 2.70379638671875, 2.8701171875, 3.03643798828125, 3.2027587890625, 3.36907958984375, 3.535400390625, 3.70172119140625, 3.8680419921875, 4.03436279296875, 4.20068359375, 4.36700439453125, 4.5333251953125, 4.69964599609375, 4.865966796875, 5.03228759765625, 5.1986083984375, 5.36492919921875, 5.53125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 18.0, 31.0, 28.0, 45.0, 66.0, 113.0, 208.0, 336.0, 515.0, 988.0, 1834.0, 3918.0, 8985.0, 23239.0, 80656.0, 424179.0, 390537.0, 74605.0, 21972.0, 8448.0, 3660.0, 1825.0, 982.0, 551.0, 288.0, 177.0, 111.0, 71.0, 47.0, 28.0, 26.0, 24.0, 7.0, 1.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.287353515625, -0.27936553955078125, -0.2713775634765625, -0.26338958740234375, -0.255401611328125, -0.24741363525390625, -0.2394256591796875, -0.23143768310546875, -0.22344970703125, -0.21546173095703125, -0.2074737548828125, -0.19948577880859375, -0.191497802734375, -0.18350982666015625, -0.1755218505859375, -0.16753387451171875, -0.1595458984375, -0.15155792236328125, -0.1435699462890625, -0.13558197021484375, -0.127593994140625, -0.11960601806640625, -0.1116180419921875, -0.10363006591796875, -0.09564208984375, -0.08765411376953125, -0.0796661376953125, -0.07167816162109375, -0.063690185546875, -0.05570220947265625, -0.0477142333984375, -0.03972625732421875, -0.03173828125, -0.02375030517578125, -0.0157623291015625, -0.00777435302734375, 0.000213623046875, 0.00820159912109375, 0.0161895751953125, 0.02417755126953125, 0.03216552734375, 0.04015350341796875, 0.0481414794921875, 0.05612945556640625, 0.064117431640625, 0.07210540771484375, 0.0800933837890625, 0.08808135986328125, 0.0960693359375, 0.10405731201171875, 0.1120452880859375, 0.12003326416015625, 0.128021240234375, 0.13600921630859375, 0.1439971923828125, 0.15198516845703125, 0.15997314453125, 0.16796112060546875, 0.1759490966796875, 0.18393707275390625, 0.191925048828125, 0.19991302490234375, 0.2079010009765625, 0.21588897705078125, 0.223876953125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 10.0, 6.0, 8.0, 12.0, 5.0, 17.0, 12.0, 18.0, 32.0, 34.0, 29.0, 39.0, 46.0, 46.0, 52.0, 61.0, 54.0, 71.0, 54.0, 65.0, 51.0, 42.0, 43.0, 40.0, 24.0, 28.0, 28.0, 13.0, 17.0, 11.0, 6.0, 5.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.9252300262451172e-05, -1.8773600459098816e-05, -1.829490065574646e-05, -1.7816200852394104e-05, -1.7337501049041748e-05, -1.6858801245689392e-05, -1.6380101442337036e-05, -1.590140163898468e-05, -1.5422701835632324e-05, -1.4944002032279968e-05, -1.4465302228927612e-05, -1.3986602425575256e-05, -1.35079026222229e-05, -1.3029202818870544e-05, -1.2550503015518188e-05, -1.2071803212165833e-05, -1.1593103408813477e-05, -1.111440360546112e-05, -1.0635703802108765e-05, -1.0157003998756409e-05, -9.678304195404053e-06, -9.199604392051697e-06, -8.72090458869934e-06, -8.242204785346985e-06, -7.763504981994629e-06, -7.284805178642273e-06, -6.806105375289917e-06, -6.327405571937561e-06, -5.848705768585205e-06, -5.370005965232849e-06, -4.891306161880493e-06, -4.412606358528137e-06, -3.933906555175781e-06, -3.4552067518234253e-06, -2.9765069484710693e-06, -2.4978071451187134e-06, -2.0191073417663574e-06, -1.5404075384140015e-06, -1.0617077350616455e-06, -5.830079317092896e-07, -1.043081283569336e-07, 3.7439167499542236e-07, 8.530914783477783e-07, 1.3317912817001343e-06, 1.8104910850524902e-06, 2.289190888404846e-06, 2.767890691757202e-06, 3.246590495109558e-06, 3.725290298461914e-06, 4.20399010181427e-06, 4.682689905166626e-06, 5.161389708518982e-06, 5.640089511871338e-06, 6.118789315223694e-06, 6.59748911857605e-06, 7.076188921928406e-06, 7.554888725280762e-06, 8.033588528633118e-06, 8.512288331985474e-06, 8.99098813533783e-06, 9.469687938690186e-06, 9.948387742042542e-06, 1.0427087545394897e-05, 1.0905787348747253e-05, 1.138448715209961e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 6.0, 18.0, 19.0, 34.0, 47.0, 87.0, 123.0, 137.0, 213.0, 314.0, 450.0, 642.0, 948.0, 1425.0, 2022.0, 3160.0, 4784.0, 7426.0, 12454.0, 21235.0, 36967.0, 67729.0, 134695.0, 266294.0, 233365.0, 113947.0, 58400.0, 32107.0, 18652.0, 11111.0, 6914.0, 4297.0, 2693.0, 1785.0, 1282.0, 814.0, 613.0, 391.0, 276.0, 195.0, 142.0, 94.0, 79.0, 53.0, 44.0, 25.0, 13.0, 10.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.135986328125, -0.13143539428710938, -0.12688446044921875, -0.12233352661132812, -0.1177825927734375, -0.11323165893554688, -0.10868072509765625, -0.10412979125976562, -0.099578857421875, -0.09502792358398438, -0.09047698974609375, -0.08592605590820312, -0.0813751220703125, -0.07682418823242188, -0.07227325439453125, -0.06772232055664062, -0.06317138671875, -0.058620452880859375, -0.05406951904296875, -0.049518585205078125, -0.0449676513671875, -0.040416717529296875, -0.03586578369140625, -0.031314849853515625, -0.026763916015625, -0.022212982177734375, -0.01766204833984375, -0.013111114501953125, -0.0085601806640625, -0.004009246826171875, 0.00054168701171875, 0.005092620849609375, 0.0096435546875, 0.014194488525390625, 0.01874542236328125, 0.023296356201171875, 0.0278472900390625, 0.032398223876953125, 0.03694915771484375, 0.041500091552734375, 0.046051025390625, 0.050601959228515625, 0.05515289306640625, 0.059703826904296875, 0.0642547607421875, 0.06880569458007812, 0.07335662841796875, 0.07790756225585938, 0.08245849609375, 0.08700942993164062, 0.09156036376953125, 0.09611129760742188, 0.1006622314453125, 0.10521316528320312, 0.10976409912109375, 0.11431503295898438, 0.118865966796875, 0.12341690063476562, 0.12796783447265625, 0.13251876831054688, 0.1370697021484375, 0.14162063598632812, 0.14617156982421875, 0.15072250366210938, 0.1552734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 7.0, 12.0, 15.0, 18.0, 10.0, 21.0, 28.0, 25.0, 35.0, 49.0, 42.0, 80.0, 76.0, 83.0, 96.0, 62.0, 50.0, 59.0, 41.0, 25.0, 18.0, 21.0, 19.0, 20.0, 13.0, 15.0, 9.0, 9.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.038665771484375, -0.0372166633605957, -0.035767555236816406, -0.03431844711303711, -0.03286933898925781, -0.031420230865478516, -0.02997112274169922, -0.028522014617919922, -0.027072906494140625, -0.025623798370361328, -0.02417469024658203, -0.022725582122802734, -0.021276473999023438, -0.01982736587524414, -0.018378257751464844, -0.016929149627685547, -0.01548004150390625, -0.014030933380126953, -0.012581825256347656, -0.01113271713256836, -0.009683609008789062, -0.008234500885009766, -0.006785392761230469, -0.005336284637451172, -0.003887176513671875, -0.002438068389892578, -0.0009889602661132812, 0.0004601478576660156, 0.0019092559814453125, 0.0033583641052246094, 0.004807472229003906, 0.006256580352783203, 0.0077056884765625, 0.009154796600341797, 0.010603904724121094, 0.01205301284790039, 0.013502120971679688, 0.014951229095458984, 0.01640033721923828, 0.017849445343017578, 0.019298553466796875, 0.020747661590576172, 0.02219676971435547, 0.023645877838134766, 0.025094985961914062, 0.02654409408569336, 0.027993202209472656, 0.029442310333251953, 0.03089141845703125, 0.03234052658081055, 0.033789634704589844, 0.03523874282836914, 0.03668785095214844, 0.038136959075927734, 0.03958606719970703, 0.04103517532348633, 0.042484283447265625, 0.04393339157104492, 0.04538249969482422, 0.046831607818603516, 0.04828071594238281, 0.04972982406616211, 0.051178932189941406, 0.0526280403137207, 0.0540771484375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 3.0, 6.0, 9.0, 9.0, 10.0, 15.0, 21.0, 29.0, 35.0, 50.0, 60.0, 50.0, 73.0, 68.0, 90.0, 87.0, 65.0, 53.0, 47.0, 34.0, 30.0, 35.0, 23.0, 14.0, 20.0, 8.0, 10.0, 6.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.202949523925781, -8.881631851196289, -8.560314178466797, -8.238996505737305, -7.917679309844971, -7.5963616371154785, -7.275043964385986, -6.953726768493652, -6.63240909576416, -6.311091423034668, -5.989773750305176, -5.668456077575684, -5.34713888168335, -5.025821208953857, -4.704503536224365, -4.383186340332031, -4.061868190765381, -3.7405505180358887, -3.4192330837249756, -3.0979154109954834, -2.7765979766845703, -2.455280303955078, -2.133962631225586, -1.8126451969146729, -1.4913275241851807, -1.170009970664978, -0.8486923575401306, -0.5273747444152832, -0.20605719089508057, 0.11526036262512207, 0.43657803535461426, 0.7578954696655273, 1.0792131423950195, 1.4005306959152222, 1.7218482494354248, 2.043165922164917, 2.36448335647583, 2.6858010292053223, 3.0071187019348145, 3.3284361362457275, 3.6497538089752197, 3.971071481704712, 4.292388916015625, 4.613706588745117, 4.935024261474609, 5.256341934204102, 5.577659606933594, 5.898976802825928, 6.22029447555542, 6.541612148284912, 6.862929821014404, 7.184247016906738, 7.5055646896362305, 7.826882362365723, 8.148200035095215, 8.469517707824707, 8.7908353805542, 9.112153053283691, 9.433470726013184, 9.754788398742676, 10.076106071472168, 10.397422790527344, 10.718740463256836, 11.040058135986328, 11.36137580871582]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 8.0, 13.0, 10.0, 15.0, 19.0, 19.0, 20.0, 25.0, 15.0, 28.0, 26.0, 43.0, 32.0, 35.0, 39.0, 30.0, 46.0, 47.0, 48.0, 37.0, 41.0, 40.0, 42.0, 42.0, 36.0, 26.0, 27.0, 30.0, 21.0, 19.0, 23.0, 10.0, 11.0, 14.0, 19.0, 9.0, 9.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0], "bins": [-8.821856498718262, -8.56679630279541, -8.311736106872559, -8.056675910949707, -7.801616191864014, -7.546555995941162, -7.291496276855469, -7.036436080932617, -6.781375885009766, -6.526315689086914, -6.2712554931640625, -6.016195774078369, -5.761135578155518, -5.506075382232666, -5.251015663146973, -4.995955467224121, -4.7408952713012695, -4.485835075378418, -4.230774879455566, -3.975715160369873, -3.7206549644470215, -3.46559476852417, -3.2105348110198975, -2.955474853515625, -2.7004146575927734, -2.445354461669922, -2.1902945041656494, -1.9352344274520874, -1.6801743507385254, -1.4251142740249634, -1.1700541973114014, -0.9149941205978394, -0.6599335670471191, -0.40487349033355713, -0.14981341361999512, 0.1052466630935669, 0.3603067398071289, 0.6153668165206909, 0.8704268932342529, 1.125486969947815, 1.380547046661377, 1.635607123374939, 1.890667200088501, 2.1457271575927734, 2.400787353515625, 2.6558475494384766, 2.910907506942749, 3.1659674644470215, 3.421027660369873, 3.6760878562927246, 3.931147813796997, 4.1862077713012695, 4.441267967224121, 4.696328163146973, 4.951388359069824, 5.206448078155518, 5.461508274078369, 5.716568470001221, 5.971628189086914, 6.226688385009766, 6.481748580932617, 6.736808776855469, 6.99186897277832, 7.246928691864014, 7.501988887786865]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 14.0, 9.0, 19.0, 13.0, 34.0, 48.0, 78.0, 166.0, 240.0, 358.0, 577.0, 979.0, 1536.0, 2395.0, 3749.0, 6005.0, 9141.0, 14322.0, 21761.0, 33061.0, 48949.0, 69894.0, 94316.0, 118404.0, 132585.0, 127467.0, 106831.0, 81873.0, 58253.0, 39936.0, 26540.0, 17643.0, 11194.0, 7287.0, 4643.0, 3004.0, 1883.0, 1213.0, 788.0, 495.0, 322.0, 204.0, 108.0, 78.0, 51.0, 31.0, 24.0, 23.0, 14.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.26171875, -5.10577392578125, -4.9498291015625, -4.79388427734375, -4.637939453125, -4.48199462890625, -4.3260498046875, -4.17010498046875, -4.01416015625, -3.85821533203125, -3.7022705078125, -3.54632568359375, -3.390380859375, -3.23443603515625, -3.0784912109375, -2.92254638671875, -2.7666015625, -2.61065673828125, -2.4547119140625, -2.29876708984375, -2.142822265625, -1.98687744140625, -1.8309326171875, -1.67498779296875, -1.51904296875, -1.36309814453125, -1.2071533203125, -1.05120849609375, -0.895263671875, -0.73931884765625, -0.5833740234375, -0.42742919921875, -0.271484375, -0.11553955078125, 0.0404052734375, 0.19635009765625, 0.352294921875, 0.50823974609375, 0.6641845703125, 0.82012939453125, 0.97607421875, 1.13201904296875, 1.2879638671875, 1.44390869140625, 1.599853515625, 1.75579833984375, 1.9117431640625, 2.06768798828125, 2.2236328125, 2.37957763671875, 2.5355224609375, 2.69146728515625, 2.847412109375, 3.00335693359375, 3.1593017578125, 3.31524658203125, 3.47119140625, 3.62713623046875, 3.7830810546875, 3.93902587890625, 4.094970703125, 4.25091552734375, 4.4068603515625, 4.56280517578125, 4.71875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 9.0, 14.0, 7.0, 23.0, 24.0, 29.0, 16.0, 25.0, 24.0, 38.0, 32.0, 40.0, 42.0, 42.0, 56.0, 42.0, 48.0, 44.0, 44.0, 53.0, 46.0, 41.0, 34.0, 28.0, 23.0, 32.0, 22.0, 26.0, 10.0, 12.0, 15.0, 12.0, 7.0, 8.0, 8.0, 9.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.6640625, -9.3831787109375, -9.102294921875, -8.8214111328125, -8.54052734375, -8.2596435546875, -7.978759765625, -7.6978759765625, -7.4169921875, -7.1361083984375, -6.855224609375, -6.5743408203125, -6.29345703125, -6.0125732421875, -5.731689453125, -5.4508056640625, -5.169921875, -4.8890380859375, -4.608154296875, -4.3272705078125, -4.04638671875, -3.7655029296875, -3.484619140625, -3.2037353515625, -2.9228515625, -2.6419677734375, -2.361083984375, -2.0802001953125, -1.79931640625, -1.5184326171875, -1.237548828125, -0.9566650390625, -0.67578125, -0.3948974609375, -0.114013671875, 0.1668701171875, 0.44775390625, 0.7286376953125, 1.009521484375, 1.2904052734375, 1.5712890625, 1.8521728515625, 2.133056640625, 2.4139404296875, 2.69482421875, 2.9757080078125, 3.256591796875, 3.5374755859375, 3.818359375, 4.0992431640625, 4.380126953125, 4.6610107421875, 4.94189453125, 5.2227783203125, 5.503662109375, 5.7845458984375, 6.0654296875, 6.3463134765625, 6.627197265625, 6.9080810546875, 7.18896484375, 7.4698486328125, 7.750732421875, 8.0316162109375, 8.3125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 18.0, 17.0, 58.0, 58.0, 90.0, 153.0, 223.0, 377.0, 605.0, 1010.0, 1592.0, 2524.0, 4022.0, 6778.0, 11296.0, 18627.0, 30186.0, 48035.0, 74488.0, 107498.0, 140917.0, 155670.0, 139972.0, 106947.0, 72881.0, 47510.0, 29692.0, 18366.0, 11197.0, 6914.0, 4188.0, 2571.0, 1520.0, 899.0, 589.0, 383.0, 239.0, 156.0, 115.0, 68.0, 30.0, 28.0, 16.0, 7.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7109375, -5.52362060546875, -5.3363037109375, -5.14898681640625, -4.961669921875, -4.77435302734375, -4.5870361328125, -4.39971923828125, -4.21240234375, -4.02508544921875, -3.8377685546875, -3.65045166015625, -3.463134765625, -3.27581787109375, -3.0885009765625, -2.90118408203125, -2.7138671875, -2.52655029296875, -2.3392333984375, -2.15191650390625, -1.964599609375, -1.77728271484375, -1.5899658203125, -1.40264892578125, -1.21533203125, -1.02801513671875, -0.8406982421875, -0.65338134765625, -0.466064453125, -0.27874755859375, -0.0914306640625, 0.09588623046875, 0.283203125, 0.47052001953125, 0.6578369140625, 0.84515380859375, 1.032470703125, 1.21978759765625, 1.4071044921875, 1.59442138671875, 1.78173828125, 1.96905517578125, 2.1563720703125, 2.34368896484375, 2.531005859375, 2.71832275390625, 2.9056396484375, 3.09295654296875, 3.2802734375, 3.46759033203125, 3.6549072265625, 3.84222412109375, 4.029541015625, 4.21685791015625, 4.4041748046875, 4.59149169921875, 4.77880859375, 4.96612548828125, 5.1534423828125, 5.34075927734375, 5.528076171875, 5.71539306640625, 5.9027099609375, 6.09002685546875, 6.27734375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 12.0, 8.0, 7.0, 9.0, 13.0, 12.0, 17.0, 30.0, 27.0, 28.0, 20.0, 19.0, 32.0, 30.0, 30.0, 41.0, 39.0, 39.0, 38.0, 34.0, 44.0, 37.0, 53.0, 36.0, 36.0, 34.0, 39.0, 22.0, 26.0, 21.0, 28.0, 17.0, 17.0, 21.0, 14.0, 13.0, 10.0, 5.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.484375, -4.32928466796875, -4.1741943359375, -4.01910400390625, -3.864013671875, -3.70892333984375, -3.5538330078125, -3.39874267578125, -3.24365234375, -3.08856201171875, -2.9334716796875, -2.77838134765625, -2.623291015625, -2.46820068359375, -2.3131103515625, -2.15802001953125, -2.0029296875, -1.84783935546875, -1.6927490234375, -1.53765869140625, -1.382568359375, -1.22747802734375, -1.0723876953125, -0.91729736328125, -0.76220703125, -0.60711669921875, -0.4520263671875, -0.29693603515625, -0.141845703125, 0.01324462890625, 0.1683349609375, 0.32342529296875, 0.478515625, 0.63360595703125, 0.7886962890625, 0.94378662109375, 1.098876953125, 1.25396728515625, 1.4090576171875, 1.56414794921875, 1.71923828125, 1.87432861328125, 2.0294189453125, 2.18450927734375, 2.339599609375, 2.49468994140625, 2.6497802734375, 2.80487060546875, 2.9599609375, 3.11505126953125, 3.2701416015625, 3.42523193359375, 3.580322265625, 3.73541259765625, 3.8905029296875, 4.04559326171875, 4.20068359375, 4.35577392578125, 4.5108642578125, 4.66595458984375, 4.821044921875, 4.97613525390625, 5.1312255859375, 5.28631591796875, 5.44140625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 1.0, 7.0, 6.0, 10.0, 17.0, 23.0, 36.0, 48.0, 64.0, 110.0, 164.0, 224.0, 359.0, 465.0, 743.0, 1163.0, 1792.0, 2913.0, 4456.0, 7683.0, 12951.0, 23072.0, 41062.0, 73353.0, 127811.0, 191199.0, 204774.0, 148967.0, 88788.0, 49378.0, 27630.0, 15527.0, 9081.0, 5492.0, 3258.0, 2054.0, 1335.0, 863.0, 536.0, 375.0, 244.0, 158.0, 112.0, 94.0, 51.0, 33.0, 20.0, 18.0, 15.0, 11.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.337890625, -2.2603759765625, -2.182861328125, -2.1053466796875, -2.02783203125, -1.9503173828125, -1.872802734375, -1.7952880859375, -1.7177734375, -1.6402587890625, -1.562744140625, -1.4852294921875, -1.40771484375, -1.3302001953125, -1.252685546875, -1.1751708984375, -1.09765625, -1.0201416015625, -0.942626953125, -0.8651123046875, -0.78759765625, -0.7100830078125, -0.632568359375, -0.5550537109375, -0.4775390625, -0.4000244140625, -0.322509765625, -0.2449951171875, -0.16748046875, -0.0899658203125, -0.012451171875, 0.0650634765625, 0.142578125, 0.2200927734375, 0.297607421875, 0.3751220703125, 0.45263671875, 0.5301513671875, 0.607666015625, 0.6851806640625, 0.7626953125, 0.8402099609375, 0.917724609375, 0.9952392578125, 1.07275390625, 1.1502685546875, 1.227783203125, 1.3052978515625, 1.3828125, 1.4603271484375, 1.537841796875, 1.6153564453125, 1.69287109375, 1.7703857421875, 1.847900390625, 1.9254150390625, 2.0029296875, 2.0804443359375, 2.157958984375, 2.2354736328125, 2.31298828125, 2.3905029296875, 2.468017578125, 2.5455322265625, 2.623046875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 10.0, 6.0, 11.0, 9.0, 14.0, 17.0, 19.0, 23.0, 30.0, 30.0, 30.0, 43.0, 39.0, 62.0, 41.0, 60.0, 52.0, 56.0, 54.0, 55.0, 48.0, 44.0, 35.0, 38.0, 29.0, 28.0, 19.0, 13.0, 17.0, 8.0, 9.0, 12.0, 4.0, 4.0, 9.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.00014829635620117188, -0.00014391914010047913, -0.00013954192399978638, -0.00013516470789909363, -0.00013078749179840088, -0.00012641027569770813, -0.00012203305959701538, -0.00011765584349632263, -0.00011327862739562988, -0.00010890141129493713, -0.00010452419519424438, -0.00010014697909355164, -9.576976299285889e-05, -9.139254689216614e-05, -8.701533079147339e-05, -8.263811469078064e-05, -7.826089859008789e-05, -7.388368248939514e-05, -6.950646638870239e-05, -6.512925028800964e-05, -6.0752034187316895e-05, -5.6374818086624146e-05, -5.1997601985931396e-05, -4.762038588523865e-05, -4.32431697845459e-05, -3.886595368385315e-05, -3.44887375831604e-05, -3.011152148246765e-05, -2.5734305381774902e-05, -2.1357089281082153e-05, -1.6979873180389404e-05, -1.2602657079696655e-05, -8.225440979003906e-06, -3.848224878311157e-06, 5.289912223815918e-07, 4.906207323074341e-06, 9.28342342376709e-06, 1.3660639524459839e-05, 1.8037855625152588e-05, 2.2415071725845337e-05, 2.6792287826538086e-05, 3.1169503927230835e-05, 3.5546720027923584e-05, 3.992393612861633e-05, 4.430115222930908e-05, 4.867836833000183e-05, 5.305558443069458e-05, 5.743280053138733e-05, 6.181001663208008e-05, 6.618723273277283e-05, 7.056444883346558e-05, 7.494166493415833e-05, 7.931888103485107e-05, 8.369609713554382e-05, 8.807331323623657e-05, 9.245052933692932e-05, 9.682774543762207e-05, 0.00010120496153831482, 0.00010558217763900757, 0.00010995939373970032, 0.00011433660984039307, 0.00011871382594108582, 0.00012309104204177856, 0.0001274682581424713, 0.00013184547424316406]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 5.0, 14.0, 17.0, 29.0, 41.0, 65.0, 129.0, 192.0, 345.0, 563.0, 990.0, 1749.0, 3134.0, 5836.0, 10958.0, 22079.0, 44798.0, 92831.0, 179010.0, 259257.0, 206205.0, 111113.0, 54268.0, 26268.0, 13211.0, 6881.0, 3641.0, 2078.0, 1144.0, 709.0, 350.0, 242.0, 134.0, 100.0, 51.0, 32.0, 23.0, 15.0, 6.0, 3.0, 10.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.419921875, -3.3211669921875, -3.222412109375, -3.1236572265625, -3.02490234375, -2.9261474609375, -2.827392578125, -2.7286376953125, -2.6298828125, -2.5311279296875, -2.432373046875, -2.3336181640625, -2.23486328125, -2.1361083984375, -2.037353515625, -1.9385986328125, -1.83984375, -1.7410888671875, -1.642333984375, -1.5435791015625, -1.44482421875, -1.3460693359375, -1.247314453125, -1.1485595703125, -1.0498046875, -0.9510498046875, -0.852294921875, -0.7535400390625, -0.65478515625, -0.5560302734375, -0.457275390625, -0.3585205078125, -0.259765625, -0.1610107421875, -0.062255859375, 0.0364990234375, 0.13525390625, 0.2340087890625, 0.332763671875, 0.4315185546875, 0.5302734375, 0.6290283203125, 0.727783203125, 0.8265380859375, 0.92529296875, 1.0240478515625, 1.122802734375, 1.2215576171875, 1.3203125, 1.4190673828125, 1.517822265625, 1.6165771484375, 1.71533203125, 1.8140869140625, 1.912841796875, 2.0115966796875, 2.1103515625, 2.2091064453125, 2.307861328125, 2.4066162109375, 2.50537109375, 2.6041259765625, 2.702880859375, 2.8016357421875, 2.900390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 6.0, 3.0, 3.0, 7.0, 11.0, 11.0, 7.0, 11.0, 14.0, 25.0, 33.0, 29.0, 40.0, 52.0, 38.0, 50.0, 60.0, 56.0, 57.0, 62.0, 66.0, 63.0, 53.0, 42.0, 33.0, 31.0, 36.0, 18.0, 12.0, 20.0, 14.0, 10.0, 7.0, 6.0, 2.0, 2.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0859375, -1.0537567138671875, -1.021575927734375, -0.9893951416015625, -0.95721435546875, -0.9250335693359375, -0.892852783203125, -0.8606719970703125, -0.8284912109375, -0.7963104248046875, -0.764129638671875, -0.7319488525390625, -0.69976806640625, -0.6675872802734375, -0.635406494140625, -0.6032257080078125, -0.571044921875, -0.5388641357421875, -0.506683349609375, -0.4745025634765625, -0.44232177734375, -0.4101409912109375, -0.377960205078125, -0.3457794189453125, -0.3135986328125, -0.2814178466796875, -0.249237060546875, -0.2170562744140625, -0.18487548828125, -0.1526947021484375, -0.120513916015625, -0.0883331298828125, -0.05615234375, -0.0239715576171875, 0.008209228515625, 0.0403900146484375, 0.07257080078125, 0.1047515869140625, 0.136932373046875, 0.1691131591796875, 0.2012939453125, 0.2334747314453125, 0.265655517578125, 0.2978363037109375, 0.33001708984375, 0.3621978759765625, 0.394378662109375, 0.4265594482421875, 0.458740234375, 0.4909210205078125, 0.523101806640625, 0.5552825927734375, 0.58746337890625, 0.6196441650390625, 0.651824951171875, 0.6840057373046875, 0.7161865234375, 0.7483673095703125, 0.780548095703125, 0.8127288818359375, 0.84490966796875, 0.8770904541015625, 0.909271240234375, 0.9414520263671875, 0.9736328125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 9.0, 4.0, 5.0, 4.0, 10.0, 8.0, 13.0, 15.0, 28.0, 31.0, 43.0, 44.0, 59.0, 61.0, 77.0, 81.0, 77.0, 74.0, 67.0, 52.0, 47.0, 31.0, 33.0, 28.0, 23.0, 13.0, 12.0, 9.0, 12.0, 4.0, 8.0, 1.0, 2.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.546056747436523, -9.218202590942383, -8.890349388122559, -8.562495231628418, -8.234642028808594, -7.906787872314453, -7.578934192657471, -7.251080513000488, -6.923226833343506, -6.595373153686523, -6.267519474029541, -5.939665794372559, -5.611811637878418, -5.283958435058594, -4.956104278564453, -4.628250598907471, -4.300396919250488, -3.972543239593506, -3.6446895599365234, -3.316835641860962, -2.9889819622039795, -2.661128282546997, -2.3332743644714355, -2.005420684814453, -1.6775670051574707, -1.3497133255004883, -1.0218595266342163, -0.6940057873725891, -0.3661520481109619, -0.03829836845397949, 0.2895554304122925, 0.6174092292785645, 0.9452619552612305, 1.273115634918213, 1.6009694337844849, 1.9288232326507568, 2.2566769123077393, 2.5845305919647217, 2.912384510040283, 3.2402381896972656, 3.568091869354248, 3.8959455490112305, 4.223799228668213, 4.551652908325195, 4.879507064819336, 5.20736026763916, 5.535214424133301, 5.863068103790283, 6.190921783447266, 6.518775463104248, 6.8466291427612305, 7.174482822418213, 7.502336502075195, 7.830190658569336, 8.15804386138916, 8.4858980178833, 8.813751220703125, 9.141605377197266, 9.46945858001709, 9.79731273651123, 10.125165939331055, 10.453020095825195, 10.78087329864502, 11.10872745513916, 11.4365816116333]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 10.0, 8.0, 20.0, 13.0, 11.0, 12.0, 18.0, 16.0, 22.0, 21.0, 24.0, 26.0, 31.0, 41.0, 35.0, 32.0, 39.0, 43.0, 47.0, 36.0, 33.0, 39.0, 47.0, 37.0, 36.0, 32.0, 32.0, 31.0, 34.0, 25.0, 20.0, 22.0, 8.0, 17.0, 16.0, 14.0, 10.0, 7.0, 6.0, 6.0, 8.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.305575370788574, -8.051009178161621, -7.79644250869751, -7.541875839233398, -7.287309646606445, -7.032742977142334, -6.778176307678223, -6.5236101150512695, -6.269043445587158, -6.014476776123047, -5.759910583496094, -5.505343914031982, -5.250777244567871, -4.996211051940918, -4.741644382476807, -4.487077713012695, -4.232511520385742, -3.97794508934021, -3.7233786582946777, -3.4688119888305664, -3.214245557785034, -2.959679126739502, -2.7051124572753906, -2.4505460262298584, -2.195979595184326, -1.941413164138794, -1.6868466138839722, -1.4322800636291504, -1.1777136325836182, -0.9231472015380859, -0.6685806512832642, -0.4140141010284424, -0.15944766998291016, 0.09511882066726685, 0.34968531131744385, 0.6042518019676208, 0.8588182926177979, 1.11338472366333, 1.3679512739181519, 1.6225178241729736, 1.8770842552185059, 2.131650686264038, 2.3862171173095703, 2.6407837867736816, 2.895350217819214, 3.149916648864746, 3.4044833183288574, 3.6590497493743896, 3.913616180419922, 4.168182849884033, 4.422749042510986, 4.677315711975098, 4.931881904602051, 5.186448574066162, 5.441015243530273, 5.695581436157227, 5.950148105621338, 6.204714775085449, 6.459280967712402, 6.713847637176514, 6.968414306640625, 7.222980499267578, 7.4775471687316895, 7.732113838195801, 7.986680030822754]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 22.0, 20.0, 54.0, 67.0, 120.0, 199.0, 308.0, 476.0, 818.0, 1201.0, 2165.0, 3522.0, 5879.0, 10154.0, 17166.0, 30581.0, 55396.0, 101403.0, 189489.0, 352449.0, 619580.0, 873615.0, 803103.0, 510340.0, 280616.0, 150619.0, 80774.0, 44386.0, 24683.0, 14003.0, 8239.0, 4740.0, 3001.0, 1798.0, 1165.0, 696.0, 479.0, 314.0, 190.0, 131.0, 108.0, 64.0, 32.0, 33.0, 25.0, 26.0, 11.0, 5.0, 8.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.48046875, -7.22088623046875, -6.9613037109375, -6.70172119140625, -6.442138671875, -6.18255615234375, -5.9229736328125, -5.66339111328125, -5.40380859375, -5.14422607421875, -4.8846435546875, -4.62506103515625, -4.365478515625, -4.10589599609375, -3.8463134765625, -3.58673095703125, -3.3271484375, -3.06756591796875, -2.8079833984375, -2.54840087890625, -2.288818359375, -2.02923583984375, -1.7696533203125, -1.51007080078125, -1.25048828125, -0.99090576171875, -0.7313232421875, -0.47174072265625, -0.212158203125, 0.04742431640625, 0.3070068359375, 0.56658935546875, 0.826171875, 1.08575439453125, 1.3453369140625, 1.60491943359375, 1.864501953125, 2.12408447265625, 2.3836669921875, 2.64324951171875, 2.90283203125, 3.16241455078125, 3.4219970703125, 3.68157958984375, 3.941162109375, 4.20074462890625, 4.4603271484375, 4.71990966796875, 4.9794921875, 5.23907470703125, 5.4986572265625, 5.75823974609375, 6.017822265625, 6.27740478515625, 6.5369873046875, 6.79656982421875, 7.05615234375, 7.31573486328125, 7.5753173828125, 7.83489990234375, 8.094482421875, 8.35406494140625, 8.6136474609375, 8.87322998046875, 9.1328125]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 7.0, 10.0, 18.0, 12.0, 16.0, 19.0, 20.0, 19.0, 20.0, 21.0, 28.0, 30.0, 35.0, 30.0, 32.0, 35.0, 52.0, 42.0, 42.0, 32.0, 37.0, 41.0, 46.0, 35.0, 42.0, 27.0, 30.0, 27.0, 27.0, 24.0, 18.0, 19.0, 19.0, 12.0, 15.0, 10.0, 11.0, 4.0, 4.0, 3.0, 4.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.8671875, -5.68896484375, -5.5107421875, -5.33251953125, -5.154296875, -4.97607421875, -4.7978515625, -4.61962890625, -4.44140625, -4.26318359375, -4.0849609375, -3.90673828125, -3.728515625, -3.55029296875, -3.3720703125, -3.19384765625, -3.015625, -2.83740234375, -2.6591796875, -2.48095703125, -2.302734375, -2.12451171875, -1.9462890625, -1.76806640625, -1.58984375, -1.41162109375, -1.2333984375, -1.05517578125, -0.876953125, -0.69873046875, -0.5205078125, -0.34228515625, -0.1640625, 0.01416015625, 0.1923828125, 0.37060546875, 0.548828125, 0.72705078125, 0.9052734375, 1.08349609375, 1.26171875, 1.43994140625, 1.6181640625, 1.79638671875, 1.974609375, 2.15283203125, 2.3310546875, 2.50927734375, 2.6875, 2.86572265625, 3.0439453125, 3.22216796875, 3.400390625, 3.57861328125, 3.7568359375, 3.93505859375, 4.11328125, 4.29150390625, 4.4697265625, 4.64794921875, 4.826171875, 5.00439453125, 5.1826171875, 5.36083984375, 5.5390625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 8.0, 15.0, 28.0, 43.0, 45.0, 102.0, 151.0, 260.0, 390.0, 693.0, 1090.0, 1846.0, 3152.0, 5479.0, 9493.0, 17038.0, 30791.0, 56289.0, 104025.0, 188547.0, 334319.0, 546669.0, 749096.0, 764104.0, 573064.0, 357272.0, 202210.0, 111799.0, 60166.0, 33162.0, 18394.0, 10164.0, 5971.0, 3360.0, 1967.0, 1152.0, 701.0, 439.0, 276.0, 179.0, 115.0, 78.0, 51.0, 33.0, 25.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -6.9635009765625, -6.723876953125, -6.4842529296875, -6.24462890625, -6.0050048828125, -5.765380859375, -5.5257568359375, -5.2861328125, -5.0465087890625, -4.806884765625, -4.5672607421875, -4.32763671875, -4.0880126953125, -3.848388671875, -3.6087646484375, -3.369140625, -3.1295166015625, -2.889892578125, -2.6502685546875, -2.41064453125, -2.1710205078125, -1.931396484375, -1.6917724609375, -1.4521484375, -1.2125244140625, -0.972900390625, -0.7332763671875, -0.49365234375, -0.2540283203125, -0.014404296875, 0.2252197265625, 0.46484375, 0.7044677734375, 0.944091796875, 1.1837158203125, 1.42333984375, 1.6629638671875, 1.902587890625, 2.1422119140625, 2.3818359375, 2.6214599609375, 2.861083984375, 3.1007080078125, 3.34033203125, 3.5799560546875, 3.819580078125, 4.0592041015625, 4.298828125, 4.5384521484375, 4.778076171875, 5.0177001953125, 5.25732421875, 5.4969482421875, 5.736572265625, 5.9761962890625, 6.2158203125, 6.4554443359375, 6.695068359375, 6.9346923828125, 7.17431640625, 7.4139404296875, 7.653564453125, 7.8931884765625, 8.1328125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 17.0, 28.0, 26.0, 35.0, 43.0, 55.0, 71.0, 70.0, 86.0, 125.0, 142.0, 149.0, 182.0, 195.0, 191.0, 205.0, 247.0, 214.0, 198.0, 228.0, 201.0, 183.0, 167.0, 162.0, 139.0, 126.0, 72.0, 99.0, 78.0, 50.0, 44.0, 42.0, 41.0, 31.0, 24.0, 21.0, 14.0, 16.0, 12.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.84765625, -2.7562255859375, -2.664794921875, -2.5733642578125, -2.48193359375, -2.3905029296875, -2.299072265625, -2.2076416015625, -2.1162109375, -2.0247802734375, -1.933349609375, -1.8419189453125, -1.75048828125, -1.6590576171875, -1.567626953125, -1.4761962890625, -1.384765625, -1.2933349609375, -1.201904296875, -1.1104736328125, -1.01904296875, -0.9276123046875, -0.836181640625, -0.7447509765625, -0.6533203125, -0.5618896484375, -0.470458984375, -0.3790283203125, -0.28759765625, -0.1961669921875, -0.104736328125, -0.0133056640625, 0.078125, 0.1695556640625, 0.260986328125, 0.3524169921875, 0.44384765625, 0.5352783203125, 0.626708984375, 0.7181396484375, 0.8095703125, 0.9010009765625, 0.992431640625, 1.0838623046875, 1.17529296875, 1.2667236328125, 1.358154296875, 1.4495849609375, 1.541015625, 1.6324462890625, 1.723876953125, 1.8153076171875, 1.90673828125, 1.9981689453125, 2.089599609375, 2.1810302734375, 2.2724609375, 2.3638916015625, 2.455322265625, 2.5467529296875, 2.63818359375, 2.7296142578125, 2.821044921875, 2.9124755859375, 3.00390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 13.0, 11.0, 9.0, 14.0, 23.0, 28.0, 42.0, 38.0, 49.0, 67.0, 61.0, 77.0, 72.0, 63.0, 65.0, 50.0, 57.0, 40.0, 38.0, 27.0, 21.0, 29.0, 21.0, 11.0, 11.0, 13.0, 4.0, 6.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.533435821533203, -10.231127738952637, -9.92881965637207, -9.626510620117188, -9.324202537536621, -9.021894454956055, -8.719585418701172, -8.417277336120605, -8.114969253540039, -7.812661170959473, -7.510352611541748, -7.208044052124023, -6.905735969543457, -6.603427886962891, -6.301119327545166, -5.998810768127441, -5.696502685546875, -5.394194602966309, -5.091886043548584, -4.789577484130859, -4.487269401550293, -4.184961318969727, -3.882652759552002, -3.5803444385528564, -3.278036117553711, -2.9757277965545654, -2.67341947555542, -2.3711111545562744, -2.068802833557129, -1.7664945125579834, -1.464186191558838, -1.1618778705596924, -0.8595695495605469, -0.5572612285614014, -0.25495290756225586, 0.04735541343688965, 0.34966373443603516, 0.6519720554351807, 0.9542803764343262, 1.2565886974334717, 1.5588970184326172, 1.8612053394317627, 2.163513660430908, 2.4658219814300537, 2.768130302429199, 3.0704386234283447, 3.3727469444274902, 3.6750552654266357, 3.9773635864257812, 4.279671669006348, 4.581980228424072, 4.884288787841797, 5.186596870422363, 5.48890495300293, 5.791213512420654, 6.093522071838379, 6.395830154418945, 6.698138236999512, 7.000446796417236, 7.302755355834961, 7.605063438415527, 7.907371520996094, 8.209680557250977, 8.511988639831543, 8.81429672241211]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 4.0, 5.0, 7.0, 13.0, 15.0, 14.0, 19.0, 9.0, 19.0, 20.0, 11.0, 19.0, 38.0, 29.0, 42.0, 44.0, 43.0, 52.0, 39.0, 42.0, 44.0, 41.0, 31.0, 41.0, 33.0, 38.0, 35.0, 29.0, 35.0, 22.0, 29.0, 19.0, 17.0, 19.0, 14.0, 8.0, 11.0, 9.0, 2.0, 4.0, 7.0, 4.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.2379150390625, -7.990232944488525, -7.742550849914551, -7.494868278503418, -7.247186183929443, -6.999504089355469, -6.751821517944336, -6.504139423370361, -6.256457328796387, -6.008775234222412, -5.7610931396484375, -5.513410568237305, -5.26572847366333, -5.0180463790893555, -4.770363807678223, -4.522681713104248, -4.274999618530273, -4.027317523956299, -3.779635190963745, -3.5319528579711914, -3.284270763397217, -3.036588668823242, -2.7889063358306885, -2.5412240028381348, -2.29354190826416, -2.0458598136901855, -1.7981774806976318, -1.5504952669143677, -1.3028130531311035, -1.0551308393478394, -0.8074486255645752, -0.559766411781311, -0.3120846748352051, -0.06440246105194092, 0.18327975273132324, 0.4309619665145874, 0.6786441802978516, 0.9263263940811157, 1.1740086078643799, 1.421690821647644, 1.6693730354309082, 1.9170552492141724, 2.1647374629974365, 2.4124197959899902, 2.660101890563965, 2.9077839851379395, 3.155466318130493, 3.403148651123047, 3.6508307456970215, 3.898512840270996, 4.146195411682129, 4.3938775062561035, 4.641559600830078, 4.889241695404053, 5.136923789978027, 5.38460636138916, 5.632288455963135, 5.879970550537109, 6.127653121948242, 6.375335216522217, 6.623017311096191, 6.870699405670166, 7.118381500244141, 7.366064071655273, 7.613746166229248]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 1.0, 6.0, 9.0, 10.0, 25.0, 33.0, 52.0, 60.0, 106.0, 135.0, 208.0, 345.0, 573.0, 844.0, 1362.0, 2292.0, 3598.0, 5590.0, 9434.0, 15477.0, 26027.0, 43177.0, 73329.0, 123415.0, 193372.0, 206209.0, 138249.0, 82372.0, 48882.0, 28619.0, 17216.0, 10438.0, 6463.0, 4045.0, 2437.0, 1465.0, 939.0, 620.0, 395.0, 238.0, 175.0, 104.0, 68.0, 34.0, 39.0, 20.0, 20.0, 9.0, 5.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.96826171875, -0.9390182495117188, -0.9097747802734375, -0.8805313110351562, -0.851287841796875, -0.8220443725585938, -0.7928009033203125, -0.7635574340820312, -0.73431396484375, -0.7050704956054688, -0.6758270263671875, -0.6465835571289062, -0.617340087890625, -0.5880966186523438, -0.5588531494140625, -0.5296096801757812, -0.5003662109375, -0.47112274169921875, -0.4418792724609375, -0.41263580322265625, -0.383392333984375, -0.35414886474609375, -0.3249053955078125, -0.29566192626953125, -0.26641845703125, -0.23717498779296875, -0.2079315185546875, -0.17868804931640625, -0.149444580078125, -0.12020111083984375, -0.0909576416015625, -0.06171417236328125, -0.032470703125, -0.00322723388671875, 0.0260162353515625, 0.05525970458984375, 0.084503173828125, 0.11374664306640625, 0.1429901123046875, 0.17223358154296875, 0.20147705078125, 0.23072052001953125, 0.2599639892578125, 0.28920745849609375, 0.318450927734375, 0.34769439697265625, 0.3769378662109375, 0.40618133544921875, 0.4354248046875, 0.46466827392578125, 0.4939117431640625, 0.5231552124023438, 0.552398681640625, 0.5816421508789062, 0.6108856201171875, 0.6401290893554688, 0.66937255859375, 0.6986160278320312, 0.7278594970703125, 0.7571029663085938, 0.786346435546875, 0.8155899047851562, 0.8448333740234375, 0.8740768432617188, 0.9033203125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 11.0, 13.0, 9.0, 26.0, 12.0, 16.0, 22.0, 15.0, 33.0, 36.0, 31.0, 27.0, 37.0, 54.0, 64.0, 49.0, 47.0, 42.0, 49.0, 40.0, 27.0, 33.0, 45.0, 36.0, 28.0, 27.0, 29.0, 27.0, 18.0, 11.0, 11.0, 9.0, 13.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.609375, -9.3336181640625, -9.057861328125, -8.7821044921875, -8.50634765625, -8.2305908203125, -7.954833984375, -7.6790771484375, -7.4033203125, -7.1275634765625, -6.851806640625, -6.5760498046875, -6.30029296875, -6.0245361328125, -5.748779296875, -5.4730224609375, -5.197265625, -4.9215087890625, -4.645751953125, -4.3699951171875, -4.09423828125, -3.8184814453125, -3.542724609375, -3.2669677734375, -2.9912109375, -2.7154541015625, -2.439697265625, -2.1639404296875, -1.88818359375, -1.6124267578125, -1.336669921875, -1.0609130859375, -0.78515625, -0.5093994140625, -0.233642578125, 0.0421142578125, 0.31787109375, 0.5936279296875, 0.869384765625, 1.1451416015625, 1.4208984375, 1.6966552734375, 1.972412109375, 2.2481689453125, 2.52392578125, 2.7996826171875, 3.075439453125, 3.3511962890625, 3.626953125, 3.9027099609375, 4.178466796875, 4.4542236328125, 4.72998046875, 5.0057373046875, 5.281494140625, 5.5572509765625, 5.8330078125, 6.1087646484375, 6.384521484375, 6.6602783203125, 6.93603515625, 7.2117919921875, 7.487548828125, 7.7633056640625, 8.0390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 7.0, 19.0, 20.0, 39.0, 49.0, 89.0, 116.0, 196.0, 356.0, 614.0, 1010.0, 1827.0, 3139.0, 5396.0, 9508.0, 17177.0, 30067.0, 54104.0, 93326.0, 157782.0, 222667.0, 185538.0, 113692.0, 65992.0, 37291.0, 21058.0, 11765.0, 6672.0, 3832.0, 2144.0, 1253.0, 731.0, 428.0, 236.0, 158.0, 82.0, 61.0, 44.0, 27.0, 13.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0625, -1.028961181640625, -0.99542236328125, -0.961883544921875, -0.9283447265625, -0.894805908203125, -0.86126708984375, -0.827728271484375, -0.794189453125, -0.760650634765625, -0.72711181640625, -0.693572998046875, -0.6600341796875, -0.626495361328125, -0.59295654296875, -0.559417724609375, -0.52587890625, -0.492340087890625, -0.45880126953125, -0.425262451171875, -0.3917236328125, -0.358184814453125, -0.32464599609375, -0.291107177734375, -0.257568359375, -0.224029541015625, -0.19049072265625, -0.156951904296875, -0.1234130859375, -0.089874267578125, -0.05633544921875, -0.022796630859375, 0.0107421875, 0.044281005859375, 0.07781982421875, 0.111358642578125, 0.1448974609375, 0.178436279296875, 0.21197509765625, 0.245513916015625, 0.279052734375, 0.312591552734375, 0.34613037109375, 0.379669189453125, 0.4132080078125, 0.446746826171875, 0.48028564453125, 0.513824462890625, 0.54736328125, 0.580902099609375, 0.61444091796875, 0.647979736328125, 0.6815185546875, 0.715057373046875, 0.74859619140625, 0.782135009765625, 0.815673828125, 0.849212646484375, 0.88275146484375, 0.916290283203125, 0.9498291015625, 0.983367919921875, 1.01690673828125, 1.050445556640625, 1.083984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 4.0, 10.0, 8.0, 12.0, 10.0, 12.0, 16.0, 18.0, 13.0, 20.0, 24.0, 28.0, 27.0, 44.0, 41.0, 27.0, 40.0, 41.0, 32.0, 46.0, 41.0, 40.0, 40.0, 47.0, 36.0, 31.0, 30.0, 34.0, 43.0, 23.0, 22.0, 13.0, 16.0, 19.0, 16.0, 12.0, 8.0, 12.0, 9.0, 11.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.82659912109375, -4.6649169921875, -4.50323486328125, -4.341552734375, -4.17987060546875, -4.0181884765625, -3.85650634765625, -3.69482421875, -3.53314208984375, -3.3714599609375, -3.20977783203125, -3.048095703125, -2.88641357421875, -2.7247314453125, -2.56304931640625, -2.4013671875, -2.23968505859375, -2.0780029296875, -1.91632080078125, -1.754638671875, -1.59295654296875, -1.4312744140625, -1.26959228515625, -1.10791015625, -0.94622802734375, -0.7845458984375, -0.62286376953125, -0.461181640625, -0.29949951171875, -0.1378173828125, 0.02386474609375, 0.185546875, 0.34722900390625, 0.5089111328125, 0.67059326171875, 0.832275390625, 0.99395751953125, 1.1556396484375, 1.31732177734375, 1.47900390625, 1.64068603515625, 1.8023681640625, 1.96405029296875, 2.125732421875, 2.28741455078125, 2.4490966796875, 2.61077880859375, 2.7724609375, 2.93414306640625, 3.0958251953125, 3.25750732421875, 3.419189453125, 3.58087158203125, 3.7425537109375, 3.90423583984375, 4.06591796875, 4.22760009765625, 4.3892822265625, 4.55096435546875, 4.712646484375, 4.87432861328125, 5.0360107421875, 5.19769287109375, 5.359375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 13.0, 16.0, 30.0, 34.0, 60.0, 96.0, 149.0, 252.0, 437.0, 806.0, 1657.0, 3516.0, 8674.0, 25782.0, 99948.0, 481278.0, 328056.0, 66324.0, 18837.0, 6768.0, 2801.0, 1327.0, 715.0, 372.0, 213.0, 125.0, 81.0, 55.0, 34.0, 25.0, 16.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.266357421875, -0.2589302062988281, -0.25150299072265625, -0.24407577514648438, -0.2366485595703125, -0.22922134399414062, -0.22179412841796875, -0.21436691284179688, -0.206939697265625, -0.19951248168945312, -0.19208526611328125, -0.18465805053710938, -0.1772308349609375, -0.16980361938476562, -0.16237640380859375, -0.15494918823242188, -0.14752197265625, -0.14009475708007812, -0.13266754150390625, -0.12524032592773438, -0.1178131103515625, -0.11038589477539062, -0.10295867919921875, -0.09553146362304688, -0.088104248046875, -0.08067703247070312, -0.07324981689453125, -0.06582260131835938, -0.0583953857421875, -0.050968170166015625, -0.04354095458984375, -0.036113739013671875, -0.0286865234375, -0.021259307861328125, -0.01383209228515625, -0.006404876708984375, 0.0010223388671875, 0.008449554443359375, 0.01587677001953125, 0.023303985595703125, 0.030731201171875, 0.038158416748046875, 0.04558563232421875, 0.053012847900390625, 0.0604400634765625, 0.06786727905273438, 0.07529449462890625, 0.08272171020507812, 0.09014892578125, 0.09757614135742188, 0.10500335693359375, 0.11243057250976562, 0.1198577880859375, 0.12728500366210938, 0.13471221923828125, 0.14213943481445312, 0.149566650390625, 0.15699386596679688, 0.16442108154296875, 0.17184829711914062, 0.1792755126953125, 0.18670272827148438, 0.19412994384765625, 0.20155715942382812, 0.208984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 6.0, 4.0, 4.0, 11.0, 15.0, 8.0, 14.0, 18.0, 21.0, 28.0, 34.0, 40.0, 31.0, 37.0, 34.0, 48.0, 45.0, 46.0, 43.0, 41.0, 56.0, 49.0, 63.0, 26.0, 46.0, 41.0, 35.0, 23.0, 16.0, 25.0, 23.0, 15.0, 8.0, 7.0, 7.0, 7.0, 5.0, 6.0, 7.0, 2.0, 0.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2040138244628906e-05, -1.1636875569820404e-05, -1.1233612895011902e-05, -1.08303502202034e-05, -1.0427087545394897e-05, -1.0023824870586395e-05, -9.620562195777893e-06, -9.217299520969391e-06, -8.814036846160889e-06, -8.410774171352386e-06, -8.007511496543884e-06, -7.604248821735382e-06, -7.20098614692688e-06, -6.797723472118378e-06, -6.3944607973098755e-06, -5.991198122501373e-06, -5.587935447692871e-06, -5.184672772884369e-06, -4.781410098075867e-06, -4.3781474232673645e-06, -3.974884748458862e-06, -3.57162207365036e-06, -3.168359398841858e-06, -2.7650967240333557e-06, -2.3618340492248535e-06, -1.9585713744163513e-06, -1.5553086996078491e-06, -1.152046024799347e-06, -7.487833499908447e-07, -3.4552067518234253e-07, 5.774199962615967e-08, 4.6100467443466187e-07, 8.642673492431641e-07, 1.2675300240516663e-06, 1.6707926988601685e-06, 2.0740553736686707e-06, 2.477318048477173e-06, 2.880580723285675e-06, 3.2838433980941772e-06, 3.6871060729026794e-06, 4.090368747711182e-06, 4.493631422519684e-06, 4.896894097328186e-06, 5.300156772136688e-06, 5.7034194469451904e-06, 6.106682121753693e-06, 6.509944796562195e-06, 6.913207471370697e-06, 7.316470146179199e-06, 7.719732820987701e-06, 8.122995495796204e-06, 8.526258170604706e-06, 8.929520845413208e-06, 9.33278352022171e-06, 9.736046195030212e-06, 1.0139308869838715e-05, 1.0542571544647217e-05, 1.0945834219455719e-05, 1.1349096894264221e-05, 1.1752359569072723e-05, 1.2155622243881226e-05, 1.2558884918689728e-05, 1.296214759349823e-05, 1.3365410268306732e-05, 1.3768672943115234e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 11.0, 5.0, 7.0, 13.0, 16.0, 28.0, 31.0, 51.0, 67.0, 97.0, 142.0, 186.0, 261.0, 335.0, 472.0, 646.0, 976.0, 1310.0, 2098.0, 3089.0, 4861.0, 7888.0, 13020.0, 22392.0, 39538.0, 72633.0, 138710.0, 251757.0, 222122.0, 117571.0, 62516.0, 34099.0, 19628.0, 11745.0, 6937.0, 4414.0, 2814.0, 1824.0, 1240.0, 864.0, 643.0, 427.0, 315.0, 195.0, 161.0, 104.0, 95.0, 57.0, 45.0, 29.0, 28.0, 19.0, 11.0, 10.0, 7.0, 2.0, 1.0, 2.0, 5.0, 1.0], "bins": [-0.12548828125, -0.121551513671875, -0.11761474609375, -0.113677978515625, -0.1097412109375, -0.105804443359375, -0.10186767578125, -0.097930908203125, -0.093994140625, -0.090057373046875, -0.08612060546875, -0.082183837890625, -0.0782470703125, -0.074310302734375, -0.07037353515625, -0.066436767578125, -0.0625, -0.058563232421875, -0.05462646484375, -0.050689697265625, -0.0467529296875, -0.042816162109375, -0.03887939453125, -0.034942626953125, -0.031005859375, -0.027069091796875, -0.02313232421875, -0.019195556640625, -0.0152587890625, -0.011322021484375, -0.00738525390625, -0.003448486328125, 0.00048828125, 0.004425048828125, 0.00836181640625, 0.012298583984375, 0.0162353515625, 0.020172119140625, 0.02410888671875, 0.028045654296875, 0.031982421875, 0.035919189453125, 0.03985595703125, 0.043792724609375, 0.0477294921875, 0.051666259765625, 0.05560302734375, 0.059539794921875, 0.0634765625, 0.067413330078125, 0.07135009765625, 0.075286865234375, 0.0792236328125, 0.083160400390625, 0.08709716796875, 0.091033935546875, 0.094970703125, 0.098907470703125, 0.10284423828125, 0.106781005859375, 0.1107177734375, 0.114654541015625, 0.11859130859375, 0.122528076171875, 0.12646484375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 6.0, 7.0, 9.0, 5.0, 12.0, 11.0, 19.0, 19.0, 23.0, 33.0, 52.0, 69.0, 83.0, 98.0, 99.0, 89.0, 72.0, 63.0, 50.0, 46.0, 29.0, 18.0, 16.0, 15.0, 4.0, 8.0, 6.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.050567626953125, -0.04895782470703125, -0.0473480224609375, -0.04573822021484375, -0.04412841796875, -0.04251861572265625, -0.0409088134765625, -0.03929901123046875, -0.037689208984375, -0.03607940673828125, -0.0344696044921875, -0.03285980224609375, -0.03125, -0.02964019775390625, -0.0280303955078125, -0.02642059326171875, -0.024810791015625, -0.02320098876953125, -0.0215911865234375, -0.01998138427734375, -0.01837158203125, -0.01676177978515625, -0.0151519775390625, -0.01354217529296875, -0.011932373046875, -0.01032257080078125, -0.0087127685546875, -0.00710296630859375, -0.0054931640625, -0.00388336181640625, -0.0022735595703125, -0.00066375732421875, 0.000946044921875, 0.00255584716796875, 0.0041656494140625, 0.00577545166015625, 0.00738525390625, 0.00899505615234375, 0.0106048583984375, 0.01221466064453125, 0.013824462890625, 0.01543426513671875, 0.0170440673828125, 0.01865386962890625, 0.020263671875, 0.02187347412109375, 0.0234832763671875, 0.02509307861328125, 0.026702880859375, 0.02831268310546875, 0.0299224853515625, 0.03153228759765625, 0.03314208984375, 0.03475189208984375, 0.0363616943359375, 0.03797149658203125, 0.039581298828125, 0.04119110107421875, 0.0428009033203125, 0.04441070556640625, 0.0460205078125, 0.04763031005859375, 0.0492401123046875, 0.05084991455078125, 0.052459716796875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 11.0, 10.0, 11.0, 7.0, 15.0, 28.0, 29.0, 40.0, 43.0, 46.0, 68.0, 70.0, 78.0, 66.0, 64.0, 64.0, 50.0, 52.0, 36.0, 37.0, 27.0, 24.0, 26.0, 20.0, 11.0, 12.0, 11.0, 3.0, 7.0, 7.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.441118240356445, -10.140073776245117, -9.839029312133789, -9.537984848022461, -9.236940383911133, -8.935895919799805, -8.634851455688477, -8.333806991577148, -8.03276252746582, -7.731718063354492, -7.430673599243164, -7.129629135131836, -6.828584671020508, -6.52754020690918, -6.226495742797852, -5.925451278686523, -5.624406337738037, -5.323361873626709, -5.022317409515381, -4.721272945404053, -4.420228481292725, -4.1191840171813965, -3.8181393146514893, -3.517094850540161, -3.216050386428833, -2.915005922317505, -2.6139614582061768, -2.3129167556762695, -2.0118722915649414, -1.7108279466629028, -1.4097833633422852, -1.108738899230957, -0.8076944351196289, -0.5066499710083008, -0.20560544729232788, 0.09543907642364502, 0.39648354053497314, 0.6975280046463013, 0.998572587966919, 1.299617052078247, 1.6006615161895752, 1.9017059803009033, 2.2027504444122314, 2.5037951469421387, 2.804839611053467, 3.105884075164795, 3.406928539276123, 3.707973003387451, 4.009017467498779, 4.310061931610107, 4.6111063957214355, 4.912150859832764, 5.213195323944092, 5.51423978805542, 5.815284729003906, 6.116329193115234, 6.4173736572265625, 6.718418121337891, 7.019462585449219, 7.320507049560547, 7.621551513671875, 7.922595977783203, 8.223640441894531, 8.52468490600586, 8.825729370117188]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 4.0, 4.0, 5.0, 7.0, 11.0, 17.0, 13.0, 18.0, 11.0, 19.0, 19.0, 12.0, 18.0, 36.0, 34.0, 41.0, 43.0, 42.0, 56.0, 37.0, 40.0, 44.0, 43.0, 35.0, 37.0, 33.0, 37.0, 36.0, 28.0, 35.0, 22.0, 30.0, 19.0, 17.0, 18.0, 14.0, 10.0, 10.0, 9.0, 1.0, 5.0, 6.0, 5.0, 4.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.24524974822998, -7.997048377990723, -7.748847007751465, -7.500646114349365, -7.252444744110107, -7.00424337387085, -6.75604248046875, -6.507841110229492, -6.259639739990234, -6.011438369750977, -5.763236999511719, -5.515036106109619, -5.266834735870361, -5.0186333656311035, -4.770432472229004, -4.522231101989746, -4.274029731750488, -4.0258283615112305, -3.7776272296905518, -3.529426097869873, -3.2812247276306152, -3.0330233573913574, -2.7848222255706787, -2.53662109375, -2.288419723510742, -2.0402183532714844, -1.7920172214508057, -1.5438159704208374, -1.2956147193908691, -1.0474134683609009, -0.7992122173309326, -0.5510109663009644, -0.3028101921081543, -0.054608941078186035, 0.19359230995178223, 0.4417935609817505, 0.6899948120117188, 0.938196063041687, 1.1863973140716553, 1.4345985651016235, 1.6827998161315918, 1.93100106716156, 2.1792023181915283, 2.427403450012207, 2.675604820251465, 2.9238061904907227, 3.1720073223114014, 3.42020845413208, 3.668409824371338, 3.9166111946105957, 4.164812088012695, 4.413013458251953, 4.661214828491211, 4.909416198730469, 5.157617568969727, 5.405818462371826, 5.654019832611084, 5.902221202850342, 6.150422096252441, 6.398623466491699, 6.646824836730957, 6.895026206970215, 7.143227577209473, 7.391428470611572, 7.63962984085083]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 16.0, 22.0, 24.0, 37.0, 69.0, 91.0, 147.0, 254.0, 362.0, 536.0, 860.0, 1351.0, 2165.0, 3236.0, 5142.0, 7940.0, 12750.0, 19946.0, 30586.0, 46310.0, 68964.0, 96026.0, 122555.0, 138842.0, 132765.0, 110624.0, 82289.0, 57299.0, 38155.0, 24846.0, 15912.0, 10315.0, 6573.0, 4113.0, 2659.0, 1727.0, 1077.0, 680.0, 473.0, 282.0, 207.0, 111.0, 84.0, 33.0, 38.0, 18.0, 16.0, 7.0, 8.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.8984375, -4.73919677734375, -4.5799560546875, -4.42071533203125, -4.261474609375, -4.10223388671875, -3.9429931640625, -3.78375244140625, -3.62451171875, -3.46527099609375, -3.3060302734375, -3.14678955078125, -2.987548828125, -2.82830810546875, -2.6690673828125, -2.50982666015625, -2.3505859375, -2.19134521484375, -2.0321044921875, -1.87286376953125, -1.713623046875, -1.55438232421875, -1.3951416015625, -1.23590087890625, -1.07666015625, -0.91741943359375, -0.7581787109375, -0.59893798828125, -0.439697265625, -0.28045654296875, -0.1212158203125, 0.03802490234375, 0.197265625, 0.35650634765625, 0.5157470703125, 0.67498779296875, 0.834228515625, 0.99346923828125, 1.1527099609375, 1.31195068359375, 1.47119140625, 1.63043212890625, 1.7896728515625, 1.94891357421875, 2.108154296875, 2.26739501953125, 2.4266357421875, 2.58587646484375, 2.7451171875, 2.90435791015625, 3.0635986328125, 3.22283935546875, 3.382080078125, 3.54132080078125, 3.7005615234375, 3.85980224609375, 4.01904296875, 4.17828369140625, 4.3375244140625, 4.49676513671875, 4.656005859375, 4.81524658203125, 4.9744873046875, 5.13372802734375, 5.29296875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 8.0, 8.0, 7.0, 7.0, 8.0, 8.0, 14.0, 16.0, 15.0, 19.0, 9.0, 20.0, 24.0, 24.0, 26.0, 48.0, 40.0, 45.0, 58.0, 49.0, 44.0, 41.0, 43.0, 44.0, 37.0, 47.0, 34.0, 30.0, 32.0, 31.0, 31.0, 22.0, 19.0, 19.0, 16.0, 15.0, 8.0, 5.0, 7.0, 4.0, 1.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-9.4375, -9.1700439453125, -8.902587890625, -8.6351318359375, -8.36767578125, -8.1002197265625, -7.832763671875, -7.5653076171875, -7.2978515625, -7.0303955078125, -6.762939453125, -6.4954833984375, -6.22802734375, -5.9605712890625, -5.693115234375, -5.4256591796875, -5.158203125, -4.8907470703125, -4.623291015625, -4.3558349609375, -4.08837890625, -3.8209228515625, -3.553466796875, -3.2860107421875, -3.0185546875, -2.7510986328125, -2.483642578125, -2.2161865234375, -1.94873046875, -1.6812744140625, -1.413818359375, -1.1463623046875, -0.87890625, -0.6114501953125, -0.343994140625, -0.0765380859375, 0.19091796875, 0.4583740234375, 0.725830078125, 0.9932861328125, 1.2607421875, 1.5281982421875, 1.795654296875, 2.0631103515625, 2.33056640625, 2.5980224609375, 2.865478515625, 3.1329345703125, 3.400390625, 3.6678466796875, 3.935302734375, 4.2027587890625, 4.47021484375, 4.7376708984375, 5.005126953125, 5.2725830078125, 5.5400390625, 5.8074951171875, 6.074951171875, 6.3424072265625, 6.60986328125, 6.8773193359375, 7.144775390625, 7.4122314453125, 7.6796875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 10.0, 15.0, 12.0, 29.0, 25.0, 38.0, 74.0, 95.0, 163.0, 226.0, 344.0, 530.0, 834.0, 1328.0, 1904.0, 2876.0, 4629.0, 7060.0, 10650.0, 15904.0, 24106.0, 35191.0, 50651.0, 70694.0, 94400.0, 115545.0, 126000.0, 121116.0, 102810.0, 80138.0, 58259.0, 40272.0, 27844.0, 18632.0, 12526.0, 8038.0, 5447.0, 3694.0, 2186.0, 1483.0, 961.0, 620.0, 420.0, 270.0, 166.0, 114.0, 78.0, 53.0, 29.0, 31.0, 15.0, 15.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.578125, -4.428955078125, -4.27978515625, -4.130615234375, -3.9814453125, -3.832275390625, -3.68310546875, -3.533935546875, -3.384765625, -3.235595703125, -3.08642578125, -2.937255859375, -2.7880859375, -2.638916015625, -2.48974609375, -2.340576171875, -2.19140625, -2.042236328125, -1.89306640625, -1.743896484375, -1.5947265625, -1.445556640625, -1.29638671875, -1.147216796875, -0.998046875, -0.848876953125, -0.69970703125, -0.550537109375, -0.4013671875, -0.252197265625, -0.10302734375, 0.046142578125, 0.1953125, 0.344482421875, 0.49365234375, 0.642822265625, 0.7919921875, 0.941162109375, 1.09033203125, 1.239501953125, 1.388671875, 1.537841796875, 1.68701171875, 1.836181640625, 1.9853515625, 2.134521484375, 2.28369140625, 2.432861328125, 2.58203125, 2.731201171875, 2.88037109375, 3.029541015625, 3.1787109375, 3.327880859375, 3.47705078125, 3.626220703125, 3.775390625, 3.924560546875, 4.07373046875, 4.222900390625, 4.3720703125, 4.521240234375, 4.67041015625, 4.819580078125, 4.96875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 3.0, 8.0, 11.0, 13.0, 11.0, 12.0, 21.0, 20.0, 18.0, 27.0, 35.0, 27.0, 35.0, 24.0, 33.0, 46.0, 37.0, 39.0, 48.0, 40.0, 39.0, 32.0, 31.0, 37.0, 32.0, 41.0, 33.0, 28.0, 33.0, 28.0, 20.0, 23.0, 21.0, 17.0, 15.0, 13.0, 5.0, 12.0, 13.0, 7.0, 3.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.33282470703125, -5.1734619140625, -5.01409912109375, -4.854736328125, -4.69537353515625, -4.5360107421875, -4.37664794921875, -4.21728515625, -4.05792236328125, -3.8985595703125, -3.73919677734375, -3.579833984375, -3.42047119140625, -3.2611083984375, -3.10174560546875, -2.9423828125, -2.78302001953125, -2.6236572265625, -2.46429443359375, -2.304931640625, -2.14556884765625, -1.9862060546875, -1.82684326171875, -1.66748046875, -1.50811767578125, -1.3487548828125, -1.18939208984375, -1.030029296875, -0.87066650390625, -0.7113037109375, -0.55194091796875, -0.392578125, -0.23321533203125, -0.0738525390625, 0.08551025390625, 0.244873046875, 0.40423583984375, 0.5635986328125, 0.72296142578125, 0.88232421875, 1.04168701171875, 1.2010498046875, 1.36041259765625, 1.519775390625, 1.67913818359375, 1.8385009765625, 1.99786376953125, 2.1572265625, 2.31658935546875, 2.4759521484375, 2.63531494140625, 2.794677734375, 2.95404052734375, 3.1134033203125, 3.27276611328125, 3.43212890625, 3.59149169921875, 3.7508544921875, 3.91021728515625, 4.069580078125, 4.22894287109375, 4.3883056640625, 4.54766845703125, 4.70703125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 5.0, 5.0, 11.0, 6.0, 11.0, 18.0, 29.0, 33.0, 47.0, 68.0, 100.0, 152.0, 232.0, 295.0, 499.0, 714.0, 1101.0, 1807.0, 2846.0, 4773.0, 8436.0, 15688.0, 31121.0, 62867.0, 123824.0, 206741.0, 234848.0, 167169.0, 89720.0, 44982.0, 22408.0, 11660.0, 6333.0, 3632.0, 2225.0, 1364.0, 936.0, 585.0, 401.0, 265.0, 207.0, 121.0, 93.0, 55.0, 33.0, 31.0, 22.0, 19.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.575439453125, -2.48095703125, -2.386474609375, -2.2919921875, -2.197509765625, -2.10302734375, -2.008544921875, -1.9140625, -1.819580078125, -1.72509765625, -1.630615234375, -1.5361328125, -1.441650390625, -1.34716796875, -1.252685546875, -1.158203125, -1.063720703125, -0.96923828125, -0.874755859375, -0.7802734375, -0.685791015625, -0.59130859375, -0.496826171875, -0.40234375, -0.307861328125, -0.21337890625, -0.118896484375, -0.0244140625, 0.070068359375, 0.16455078125, 0.259033203125, 0.353515625, 0.447998046875, 0.54248046875, 0.636962890625, 0.7314453125, 0.825927734375, 0.92041015625, 1.014892578125, 1.109375, 1.203857421875, 1.29833984375, 1.392822265625, 1.4873046875, 1.581787109375, 1.67626953125, 1.770751953125, 1.865234375, 1.959716796875, 2.05419921875, 2.148681640625, 2.2431640625, 2.337646484375, 2.43212890625, 2.526611328125, 2.62109375, 2.715576171875, 2.81005859375, 2.904541015625, 2.9990234375, 3.093505859375, 3.18798828125, 3.282470703125, 3.376953125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 6.0, 8.0, 14.0, 11.0, 19.0, 31.0, 40.0, 44.0, 54.0, 60.0, 79.0, 68.0, 86.0, 90.0, 70.0, 66.0, 62.0, 41.0, 35.0, 28.0, 23.0, 17.0, 13.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021266937255859375, -0.0002051927149295807, -0.00019771605730056763, -0.00019023939967155457, -0.0001827627420425415, -0.00017528608441352844, -0.00016780942678451538, -0.00016033276915550232, -0.00015285611152648926, -0.0001453794538974762, -0.00013790279626846313, -0.00013042613863945007, -0.000122949481010437, -0.00011547282338142395, -0.00010799616575241089, -0.00010051950812339783, -9.304285049438477e-05, -8.55661928653717e-05, -7.808953523635864e-05, -7.061287760734558e-05, -6.313621997833252e-05, -5.565956234931946e-05, -4.8182904720306396e-05, -4.0706247091293335e-05, -3.3229589462280273e-05, -2.5752931833267212e-05, -1.827627420425415e-05, -1.0799616575241089e-05, -3.3229589462280273e-06, 4.153698682785034e-06, 1.1630356311798096e-05, 1.9107013940811157e-05, 2.658367156982422e-05, 3.406032919883728e-05, 4.153698682785034e-05, 4.90136444568634e-05, 5.6490302085876465e-05, 6.396695971488953e-05, 7.144361734390259e-05, 7.892027497291565e-05, 8.639693260192871e-05, 9.387359023094177e-05, 0.00010135024785995483, 0.0001088269054889679, 0.00011630356311798096, 0.00012378022074699402, 0.00013125687837600708, 0.00013873353600502014, 0.0001462101936340332, 0.00015368685126304626, 0.00016116350889205933, 0.0001686401665210724, 0.00017611682415008545, 0.0001835934817790985, 0.00019107013940811157, 0.00019854679703712463, 0.0002060234546661377, 0.00021350011229515076, 0.00022097676992416382, 0.00022845342755317688, 0.00023593008518218994, 0.000243406742811203, 0.00025088340044021606, 0.0002583600580692291, 0.0002658367156982422]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 6.0, 6.0, 14.0, 12.0, 26.0, 25.0, 60.0, 102.0, 123.0, 210.0, 343.0, 656.0, 947.0, 1628.0, 2869.0, 5179.0, 9458.0, 18326.0, 36701.0, 74272.0, 146139.0, 231517.0, 228654.0, 142879.0, 73106.0, 36063.0, 17920.0, 9450.0, 4912.0, 2764.0, 1635.0, 992.0, 588.0, 357.0, 202.0, 133.0, 93.0, 65.0, 37.0, 33.0, 24.0, 9.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.041015625, -2.94287109375, -2.8447265625, -2.74658203125, -2.6484375, -2.55029296875, -2.4521484375, -2.35400390625, -2.255859375, -2.15771484375, -2.0595703125, -1.96142578125, -1.86328125, -1.76513671875, -1.6669921875, -1.56884765625, -1.470703125, -1.37255859375, -1.2744140625, -1.17626953125, -1.078125, -0.97998046875, -0.8818359375, -0.78369140625, -0.685546875, -0.58740234375, -0.4892578125, -0.39111328125, -0.29296875, -0.19482421875, -0.0966796875, 0.00146484375, 0.099609375, 0.19775390625, 0.2958984375, 0.39404296875, 0.4921875, 0.59033203125, 0.6884765625, 0.78662109375, 0.884765625, 0.98291015625, 1.0810546875, 1.17919921875, 1.27734375, 1.37548828125, 1.4736328125, 1.57177734375, 1.669921875, 1.76806640625, 1.8662109375, 1.96435546875, 2.0625, 2.16064453125, 2.2587890625, 2.35693359375, 2.455078125, 2.55322265625, 2.6513671875, 2.74951171875, 2.84765625, 2.94580078125, 3.0439453125, 3.14208984375, 3.240234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 7.0, 4.0, 10.0, 10.0, 10.0, 20.0, 15.0, 30.0, 32.0, 45.0, 37.0, 58.0, 56.0, 61.0, 87.0, 79.0, 92.0, 65.0, 40.0, 50.0, 30.0, 37.0, 22.0, 26.0, 12.0, 10.0, 10.0, 11.0, 9.0, 3.0, 2.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92138671875, -0.8914794921875, -0.861572265625, -0.8316650390625, -0.8017578125, -0.7718505859375, -0.741943359375, -0.7120361328125, -0.68212890625, -0.6522216796875, -0.622314453125, -0.5924072265625, -0.5625, -0.5325927734375, -0.502685546875, -0.4727783203125, -0.44287109375, -0.4129638671875, -0.383056640625, -0.3531494140625, -0.3232421875, -0.2933349609375, -0.263427734375, -0.2335205078125, -0.20361328125, -0.1737060546875, -0.143798828125, -0.1138916015625, -0.083984375, -0.0540771484375, -0.024169921875, 0.0057373046875, 0.03564453125, 0.0655517578125, 0.095458984375, 0.1253662109375, 0.1552734375, 0.1851806640625, 0.215087890625, 0.2449951171875, 0.27490234375, 0.3048095703125, 0.334716796875, 0.3646240234375, 0.39453125, 0.4244384765625, 0.454345703125, 0.4842529296875, 0.51416015625, 0.5440673828125, 0.573974609375, 0.6038818359375, 0.6337890625, 0.6636962890625, 0.693603515625, 0.7235107421875, 0.75341796875, 0.7833251953125, 0.813232421875, 0.8431396484375, 0.873046875, 0.9029541015625, 0.932861328125, 0.9627685546875, 0.99267578125]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 7.0, 7.0, 14.0, 12.0, 21.0, 19.0, 32.0, 44.0, 35.0, 54.0, 57.0, 71.0, 59.0, 74.0, 63.0, 69.0, 58.0, 42.0, 37.0, 33.0, 26.0, 26.0, 18.0, 26.0, 6.0, 8.0, 9.0, 11.0, 8.0, 6.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.823494911193848, -9.539056777954102, -9.254619598388672, -8.970181465148926, -8.685744285583496, -8.40130615234375, -8.11686897277832, -7.832430839538574, -7.547992706298828, -7.26355504989624, -6.979117393493652, -6.694679260253906, -6.410241603851318, -6.1258039474487305, -5.841366291046143, -5.556928634643555, -5.272490978240967, -4.988053321838379, -4.703615665435791, -4.419178009033203, -4.134739875793457, -3.850302219390869, -3.5658645629882812, -3.2814269065856934, -2.9969890117645264, -2.7125513553619385, -2.4281134605407715, -2.1436758041381836, -1.8592380285263062, -1.5748002529144287, -1.2903625965118408, -1.0059248208999634, -0.7214870452880859, -0.4370492994785309, -0.15261155366897583, 0.13182616233825684, 0.4162639379501343, 0.7007017135620117, 0.9851393699645996, 1.269577145576477, 1.5540149211883545, 1.838452696800232, 2.1228904724121094, 2.4073281288146973, 2.691765785217285, 2.976203680038452, 3.26064133644104, 3.545079231262207, 3.829516887664795, 4.113954544067383, 4.398392200469971, 4.682829856872559, 4.967267990112305, 5.251705646514893, 5.5361433029174805, 5.820580959320068, 6.105018615722656, 6.389456272125244, 6.673893928527832, 6.958332061767578, 7.242769718170166, 7.527207374572754, 7.811645030975342, 8.09608268737793, 8.380520820617676]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 9.0, 6.0, 13.0, 4.0, 14.0, 14.0, 20.0, 15.0, 11.0, 14.0, 26.0, 24.0, 35.0, 38.0, 40.0, 46.0, 44.0, 37.0, 39.0, 47.0, 41.0, 47.0, 43.0, 37.0, 27.0, 36.0, 38.0, 27.0, 34.0, 34.0, 28.0, 20.0, 11.0, 13.0, 10.0, 6.0, 6.0, 10.0, 6.0, 7.0, 3.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.62846851348877, -8.365291595458984, -8.102115631103516, -7.8389387130737305, -7.575761795043945, -7.312585353851318, -7.049408912658691, -6.786231994628906, -6.523055553436279, -6.259879112243652, -5.996702194213867, -5.73352575302124, -5.470349311828613, -5.207172393798828, -4.943995952606201, -4.680819511413574, -4.417642593383789, -4.154466152191162, -3.891289234161377, -3.62811279296875, -3.364936113357544, -3.101759433746338, -2.838582992553711, -2.575406312942505, -2.312229633331299, -2.0490529537200928, -1.7858763933181763, -1.5226998329162598, -1.2595231533050537, -0.9963464736938477, -0.7331699132919312, -0.46999335289001465, -0.206817626953125, 0.05635899305343628, 0.31953561305999756, 0.5827122330665588, 0.8458888530731201, 1.1090655326843262, 1.3722420930862427, 1.6354186534881592, 1.8985953330993652, 2.1617720127105713, 2.4249486923217773, 2.6881251335144043, 2.9513018131256104, 3.2144784927368164, 3.4776549339294434, 3.7408316135406494, 4.0040082931518555, 4.267184734344482, 4.530361652374268, 4.7935380935668945, 5.05671501159668, 5.319891452789307, 5.583067893981934, 5.846244812011719, 6.109421253204346, 6.372597694396973, 6.635774612426758, 6.898951053619385, 7.162127494812012, 7.425304412841797, 7.688480854034424, 7.951657295227051, 8.214834213256836]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 6.0, 13.0, 8.0, 17.0, 31.0, 54.0, 82.0, 145.0, 195.0, 308.0, 460.0, 782.0, 1265.0, 1978.0, 3040.0, 5105.0, 8483.0, 13812.0, 23936.0, 41313.0, 73325.0, 131326.0, 237232.0, 421691.0, 680588.0, 838742.0, 696741.0, 439024.0, 249284.0, 139194.0, 77792.0, 44190.0, 25287.0, 14968.0, 8928.0, 5495.0, 3381.0, 2122.0, 1406.0, 859.0, 608.0, 359.0, 235.0, 165.0, 110.0, 77.0, 50.0, 27.0, 9.0, 14.0, 16.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.2890625, -7.0423583984375, -6.795654296875, -6.5489501953125, -6.30224609375, -6.0555419921875, -5.808837890625, -5.5621337890625, -5.3154296875, -5.0687255859375, -4.822021484375, -4.5753173828125, -4.32861328125, -4.0819091796875, -3.835205078125, -3.5885009765625, -3.341796875, -3.0950927734375, -2.848388671875, -2.6016845703125, -2.35498046875, -2.1082763671875, -1.861572265625, -1.6148681640625, -1.3681640625, -1.1214599609375, -0.874755859375, -0.6280517578125, -0.38134765625, -0.1346435546875, 0.112060546875, 0.3587646484375, 0.60546875, 0.8521728515625, 1.098876953125, 1.3455810546875, 1.59228515625, 1.8389892578125, 2.085693359375, 2.3323974609375, 2.5791015625, 2.8258056640625, 3.072509765625, 3.3192138671875, 3.56591796875, 3.8126220703125, 4.059326171875, 4.3060302734375, 4.552734375, 4.7994384765625, 5.046142578125, 5.2928466796875, 5.53955078125, 5.7862548828125, 6.032958984375, 6.2796630859375, 6.5263671875, 6.7730712890625, 7.019775390625, 7.2664794921875, 7.51318359375, 7.7598876953125, 8.006591796875, 8.2532958984375, 8.5]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 1.0, 7.0, 10.0, 8.0, 12.0, 16.0, 7.0, 13.0, 15.0, 20.0, 15.0, 24.0, 30.0, 38.0, 42.0, 23.0, 40.0, 39.0, 41.0, 46.0, 47.0, 52.0, 49.0, 37.0, 42.0, 41.0, 28.0, 38.0, 30.0, 32.0, 29.0, 21.0, 12.0, 20.0, 21.0, 15.0, 5.0, 6.0, 4.0, 7.0, 6.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.6640625, -6.4718017578125, -6.279541015625, -6.0872802734375, -5.89501953125, -5.7027587890625, -5.510498046875, -5.3182373046875, -5.1259765625, -4.9337158203125, -4.741455078125, -4.5491943359375, -4.35693359375, -4.1646728515625, -3.972412109375, -3.7801513671875, -3.587890625, -3.3956298828125, -3.203369140625, -3.0111083984375, -2.81884765625, -2.6265869140625, -2.434326171875, -2.2420654296875, -2.0498046875, -1.8575439453125, -1.665283203125, -1.4730224609375, -1.28076171875, -1.0885009765625, -0.896240234375, -0.7039794921875, -0.51171875, -0.3194580078125, -0.127197265625, 0.0650634765625, 0.25732421875, 0.4495849609375, 0.641845703125, 0.8341064453125, 1.0263671875, 1.2186279296875, 1.410888671875, 1.6031494140625, 1.79541015625, 1.9876708984375, 2.179931640625, 2.3721923828125, 2.564453125, 2.7567138671875, 2.948974609375, 3.1412353515625, 3.33349609375, 3.5257568359375, 3.718017578125, 3.9102783203125, 4.1025390625, 4.2947998046875, 4.487060546875, 4.6793212890625, 4.87158203125, 5.0638427734375, 5.256103515625, 5.4483642578125, 5.640625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 7.0, 8.0, 11.0, 17.0, 35.0, 47.0, 71.0, 117.0, 169.0, 300.0, 494.0, 875.0, 1504.0, 2571.0, 4612.0, 8759.0, 16050.0, 30089.0, 58689.0, 112885.0, 215436.0, 394811.0, 644897.0, 828412.0, 754277.0, 507912.0, 289148.0, 153042.0, 79776.0, 41530.0, 21627.0, 11402.0, 6382.0, 3404.0, 1931.0, 1188.0, 666.0, 421.0, 267.0, 147.0, 107.0, 67.0, 44.0, 31.0, 17.0, 14.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0], "bins": [-9.2734375, -9.0064697265625, -8.739501953125, -8.4725341796875, -8.20556640625, -7.9385986328125, -7.671630859375, -7.4046630859375, -7.1376953125, -6.8707275390625, -6.603759765625, -6.3367919921875, -6.06982421875, -5.8028564453125, -5.535888671875, -5.2689208984375, -5.001953125, -4.7349853515625, -4.468017578125, -4.2010498046875, -3.93408203125, -3.6671142578125, -3.400146484375, -3.1331787109375, -2.8662109375, -2.5992431640625, -2.332275390625, -2.0653076171875, -1.79833984375, -1.5313720703125, -1.264404296875, -0.9974365234375, -0.73046875, -0.4635009765625, -0.196533203125, 0.0704345703125, 0.33740234375, 0.6043701171875, 0.871337890625, 1.1383056640625, 1.4052734375, 1.6722412109375, 1.939208984375, 2.2061767578125, 2.47314453125, 2.7401123046875, 3.007080078125, 3.2740478515625, 3.541015625, 3.8079833984375, 4.074951171875, 4.3419189453125, 4.60888671875, 4.8758544921875, 5.142822265625, 5.4097900390625, 5.6767578125, 5.9437255859375, 6.210693359375, 6.4776611328125, 6.74462890625, 7.0115966796875, 7.278564453125, 7.5455322265625, 7.8125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 9.0, 12.0, 14.0, 21.0, 34.0, 27.0, 58.0, 70.0, 72.0, 84.0, 106.0, 132.0, 151.0, 156.0, 212.0, 243.0, 256.0, 249.0, 260.0, 234.0, 225.0, 239.0, 214.0, 157.0, 132.0, 130.0, 111.0, 98.0, 90.0, 55.0, 36.0, 38.0, 35.0, 25.0, 26.0, 18.0, 14.0, 9.0, 7.0, 5.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.826171875, -2.7208251953125, -2.615478515625, -2.5101318359375, -2.40478515625, -2.2994384765625, -2.194091796875, -2.0887451171875, -1.9833984375, -1.8780517578125, -1.772705078125, -1.6673583984375, -1.56201171875, -1.4566650390625, -1.351318359375, -1.2459716796875, -1.140625, -1.0352783203125, -0.929931640625, -0.8245849609375, -0.71923828125, -0.6138916015625, -0.508544921875, -0.4031982421875, -0.2978515625, -0.1925048828125, -0.087158203125, 0.0181884765625, 0.12353515625, 0.2288818359375, 0.334228515625, 0.4395751953125, 0.544921875, 0.6502685546875, 0.755615234375, 0.8609619140625, 0.96630859375, 1.0716552734375, 1.177001953125, 1.2823486328125, 1.3876953125, 1.4930419921875, 1.598388671875, 1.7037353515625, 1.80908203125, 1.9144287109375, 2.019775390625, 2.1251220703125, 2.23046875, 2.3358154296875, 2.441162109375, 2.5465087890625, 2.65185546875, 2.7572021484375, 2.862548828125, 2.9678955078125, 3.0732421875, 3.1785888671875, 3.283935546875, 3.3892822265625, 3.49462890625, 3.5999755859375, 3.705322265625, 3.8106689453125, 3.916015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 12.0, 5.0, 18.0, 10.0, 9.0, 16.0, 18.0, 24.0, 24.0, 37.0, 52.0, 58.0, 71.0, 55.0, 63.0, 58.0, 66.0, 71.0, 52.0, 59.0, 39.0, 30.0, 29.0, 26.0, 25.0, 15.0, 16.0, 14.0, 2.0, 2.0, 10.0, 3.0, 3.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.388952255249023, -9.080912590026855, -8.772871971130371, -8.464832305908203, -8.156791687011719, -7.848752021789551, -7.540711879730225, -7.232671737670898, -6.924631595611572, -6.616591453552246, -6.30855131149292, -6.000511169433594, -5.692471504211426, -5.384430885314941, -5.076391220092773, -4.768351078033447, -4.460310935974121, -4.152270793914795, -3.8442306518554688, -3.5361907482147217, -3.2281506061553955, -2.9201104640960693, -2.6120705604553223, -2.304030418395996, -1.99599027633667, -1.6879501342773438, -1.3799101114273071, -1.0718700885772705, -0.7638299465179443, -0.45578980445861816, -0.14774978160858154, 0.16029024124145508, 0.46833133697509766, 0.776371419429779, 1.0844115018844604, 1.392451524734497, 1.7004916667938232, 2.0085318088531494, 2.3165717124938965, 2.6246118545532227, 2.932651996612549, 3.240692138671875, 3.548732280731201, 3.8567721843719482, 4.164812088012695, 4.47285270690918, 4.780892372131348, 5.088932514190674, 5.39697265625, 5.705012798309326, 6.013052940368652, 6.3210930824279785, 6.629133224487305, 6.937172889709473, 7.245213031768799, 7.553253173828125, 7.861293315887451, 8.169333457946777, 8.477373123168945, 8.78541374206543, 9.093453407287598, 9.401494026184082, 9.70953369140625, 10.017574310302734, 10.325613975524902]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 9.0, 7.0, 12.0, 16.0, 17.0, 12.0, 21.0, 23.0, 17.0, 30.0, 33.0, 34.0, 35.0, 47.0, 47.0, 52.0, 45.0, 37.0, 55.0, 38.0, 45.0, 46.0, 43.0, 40.0, 33.0, 29.0, 32.0, 35.0, 18.0, 8.0, 8.0, 19.0, 15.0, 11.0, 7.0, 2.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.691173553466797, -10.407111167907715, -10.123048782348633, -9.838985443115234, -9.554923057556152, -9.27086067199707, -8.986797332763672, -8.70273494720459, -8.418672561645508, -8.134610176086426, -7.8505473136901855, -7.566484451293945, -7.282422065734863, -6.998359680175781, -6.714296817779541, -6.430233955383301, -6.146171569824219, -5.862109184265137, -5.5780463218688965, -5.293983459472656, -5.009921073913574, -4.725858688354492, -4.441795825958252, -4.157732963562012, -3.8736705780029297, -3.5896079540252686, -3.3055453300476074, -3.0214827060699463, -2.737420082092285, -2.453357458114624, -2.169294834136963, -1.8852322101593018, -1.6011686325073242, -1.317106008529663, -1.033043384552002, -0.7489807605743408, -0.4649181365966797, -0.18085551261901855, 0.10320711135864258, 0.3872697353363037, 0.6713323593139648, 0.955394983291626, 1.239457607269287, 1.5235202312469482, 1.8075828552246094, 2.0916454792022705, 2.3757081031799316, 2.6597707271575928, 2.943833351135254, 3.227895975112915, 3.511958599090576, 3.7960212230682373, 4.080083847045898, 4.3641462326049805, 4.648209095001221, 4.932271957397461, 5.216334342956543, 5.500396728515625, 5.784459590911865, 6.0685224533081055, 6.3525848388671875, 6.6366472244262695, 6.92071008682251, 7.20477294921875, 7.488835334777832]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 8.0, 8.0, 9.0, 15.0, 16.0, 17.0, 34.0, 59.0, 101.0, 109.0, 194.0, 284.0, 407.0, 612.0, 880.0, 1367.0, 2063.0, 3143.0, 4500.0, 7305.0, 11369.0, 17678.0, 28546.0, 45559.0, 74411.0, 119755.0, 177953.0, 190445.0, 135787.0, 84374.0, 52545.0, 32157.0, 20231.0, 12825.0, 8242.0, 5269.0, 3464.0, 2258.0, 1525.0, 1014.0, 680.0, 413.0, 306.0, 217.0, 118.0, 92.0, 62.0, 41.0, 38.0, 19.0, 13.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.86328125, -0.8355560302734375, -0.807830810546875, -0.7801055908203125, -0.75238037109375, -0.7246551513671875, -0.696929931640625, -0.6692047119140625, -0.6414794921875, -0.6137542724609375, -0.586029052734375, -0.5583038330078125, -0.53057861328125, -0.5028533935546875, -0.475128173828125, -0.4474029541015625, -0.419677734375, -0.3919525146484375, -0.364227294921875, -0.3365020751953125, -0.30877685546875, -0.2810516357421875, -0.253326416015625, -0.2256011962890625, -0.1978759765625, -0.1701507568359375, -0.142425537109375, -0.1147003173828125, -0.08697509765625, -0.0592498779296875, -0.031524658203125, -0.0037994384765625, 0.02392578125, 0.0516510009765625, 0.079376220703125, 0.1071014404296875, 0.13482666015625, 0.1625518798828125, 0.190277099609375, 0.2180023193359375, 0.2457275390625, 0.2734527587890625, 0.301177978515625, 0.3289031982421875, 0.35662841796875, 0.3843536376953125, 0.412078857421875, 0.4398040771484375, 0.467529296875, 0.4952545166015625, 0.522979736328125, 0.5507049560546875, 0.57843017578125, 0.6061553955078125, 0.633880615234375, 0.6616058349609375, 0.6893310546875, 0.7170562744140625, 0.744781494140625, 0.7725067138671875, 0.80023193359375, 0.8279571533203125, 0.855682373046875, 0.8834075927734375, 0.9111328125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 8.0, 4.0, 12.0, 16.0, 12.0, 7.0, 21.0, 22.0, 27.0, 25.0, 26.0, 38.0, 45.0, 52.0, 38.0, 36.0, 51.0, 50.0, 41.0, 55.0, 48.0, 47.0, 39.0, 45.0, 31.0, 37.0, 31.0, 21.0, 23.0, 16.0, 17.0, 10.0, 9.0, 8.0, 8.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0], "bins": [-11.2578125, -10.9622802734375, -10.666748046875, -10.3712158203125, -10.07568359375, -9.7801513671875, -9.484619140625, -9.1890869140625, -8.8935546875, -8.5980224609375, -8.302490234375, -8.0069580078125, -7.71142578125, -7.4158935546875, -7.120361328125, -6.8248291015625, -6.529296875, -6.2337646484375, -5.938232421875, -5.6427001953125, -5.34716796875, -5.0516357421875, -4.756103515625, -4.4605712890625, -4.1650390625, -3.8695068359375, -3.573974609375, -3.2784423828125, -2.98291015625, -2.6873779296875, -2.391845703125, -2.0963134765625, -1.80078125, -1.5052490234375, -1.209716796875, -0.9141845703125, -0.61865234375, -0.3231201171875, -0.027587890625, 0.2679443359375, 0.5634765625, 0.8590087890625, 1.154541015625, 1.4500732421875, 1.74560546875, 2.0411376953125, 2.336669921875, 2.6322021484375, 2.927734375, 3.2232666015625, 3.518798828125, 3.8143310546875, 4.10986328125, 4.4053955078125, 4.700927734375, 4.9964599609375, 5.2919921875, 5.5875244140625, 5.883056640625, 6.1785888671875, 6.47412109375, 6.7696533203125, 7.065185546875, 7.3607177734375, 7.65625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 8.0, 10.0, 13.0, 26.0, 41.0, 52.0, 90.0, 140.0, 246.0, 395.0, 631.0, 1143.0, 1933.0, 3245.0, 5931.0, 10343.0, 18644.0, 33578.0, 60009.0, 108751.0, 188162.0, 241004.0, 164183.0, 92822.0, 51717.0, 28352.0, 16198.0, 8977.0, 5095.0, 2718.0, 1647.0, 1020.0, 530.0, 351.0, 220.0, 116.0, 69.0, 56.0, 27.0, 18.0, 14.0, 8.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1572265625, -1.120330810546875, -1.08343505859375, -1.046539306640625, -1.0096435546875, -0.972747802734375, -0.93585205078125, -0.898956298828125, -0.862060546875, -0.825164794921875, -0.78826904296875, -0.751373291015625, -0.7144775390625, -0.677581787109375, -0.64068603515625, -0.603790283203125, -0.56689453125, -0.529998779296875, -0.49310302734375, -0.456207275390625, -0.4193115234375, -0.382415771484375, -0.34552001953125, -0.308624267578125, -0.271728515625, -0.234832763671875, -0.19793701171875, -0.161041259765625, -0.1241455078125, -0.087249755859375, -0.05035400390625, -0.013458251953125, 0.0234375, 0.060333251953125, 0.09722900390625, 0.134124755859375, 0.1710205078125, 0.207916259765625, 0.24481201171875, 0.281707763671875, 0.318603515625, 0.355499267578125, 0.39239501953125, 0.429290771484375, 0.4661865234375, 0.503082275390625, 0.53997802734375, 0.576873779296875, 0.61376953125, 0.650665283203125, 0.68756103515625, 0.724456787109375, 0.7613525390625, 0.798248291015625, 0.83514404296875, 0.872039794921875, 0.908935546875, 0.945831298828125, 0.98272705078125, 1.019622802734375, 1.0565185546875, 1.093414306640625, 1.13031005859375, 1.167205810546875, 1.2041015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 9.0, 5.0, 11.0, 19.0, 14.0, 21.0, 21.0, 24.0, 20.0, 28.0, 31.0, 27.0, 23.0, 42.0, 38.0, 45.0, 47.0, 36.0, 39.0, 28.0, 33.0, 38.0, 38.0, 43.0, 43.0, 35.0, 16.0, 23.0, 24.0, 26.0, 20.0, 15.0, 17.0, 11.0, 15.0, 11.0, 11.0, 6.0, 3.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-5.01953125, -4.86822509765625, -4.7169189453125, -4.56561279296875, -4.414306640625, -4.26300048828125, -4.1116943359375, -3.96038818359375, -3.80908203125, -3.65777587890625, -3.5064697265625, -3.35516357421875, -3.203857421875, -3.05255126953125, -2.9012451171875, -2.74993896484375, -2.5986328125, -2.44732666015625, -2.2960205078125, -2.14471435546875, -1.993408203125, -1.84210205078125, -1.6907958984375, -1.53948974609375, -1.38818359375, -1.23687744140625, -1.0855712890625, -0.93426513671875, -0.782958984375, -0.63165283203125, -0.4803466796875, -0.32904052734375, -0.177734375, -0.02642822265625, 0.1248779296875, 0.27618408203125, 0.427490234375, 0.57879638671875, 0.7301025390625, 0.88140869140625, 1.03271484375, 1.18402099609375, 1.3353271484375, 1.48663330078125, 1.637939453125, 1.78924560546875, 1.9405517578125, 2.09185791015625, 2.2431640625, 2.39447021484375, 2.5457763671875, 2.69708251953125, 2.848388671875, 2.99969482421875, 3.1510009765625, 3.30230712890625, 3.45361328125, 3.60491943359375, 3.7562255859375, 3.90753173828125, 4.058837890625, 4.21014404296875, 4.3614501953125, 4.51275634765625, 4.6640625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 12.0, 12.0, 25.0, 30.0, 41.0, 42.0, 73.0, 99.0, 138.0, 181.0, 290.0, 371.0, 612.0, 883.0, 1264.0, 1919.0, 3079.0, 5108.0, 8707.0, 16542.0, 33718.0, 78557.0, 205700.0, 371261.0, 181622.0, 70607.0, 30556.0, 15216.0, 8375.0, 4880.0, 2870.0, 1872.0, 1190.0, 833.0, 524.0, 393.0, 277.0, 190.0, 128.0, 99.0, 72.0, 42.0, 42.0, 29.0, 17.0, 13.0, 12.0, 9.0, 4.0, 6.0, 3.0, 2.0, 2.0], "bins": [-0.144775390625, -0.14057159423828125, -0.1363677978515625, -0.13216400146484375, -0.127960205078125, -0.12375640869140625, -0.1195526123046875, -0.11534881591796875, -0.11114501953125, -0.10694122314453125, -0.1027374267578125, -0.09853363037109375, -0.094329833984375, -0.09012603759765625, -0.0859222412109375, -0.08171844482421875, -0.0775146484375, -0.07331085205078125, -0.0691070556640625, -0.06490325927734375, -0.060699462890625, -0.05649566650390625, -0.0522918701171875, -0.04808807373046875, -0.04388427734375, -0.03968048095703125, -0.0354766845703125, -0.03127288818359375, -0.027069091796875, -0.02286529541015625, -0.0186614990234375, -0.01445770263671875, -0.01025390625, -0.00605010986328125, -0.0018463134765625, 0.00235748291015625, 0.006561279296875, 0.01076507568359375, 0.0149688720703125, 0.01917266845703125, 0.02337646484375, 0.02758026123046875, 0.0317840576171875, 0.03598785400390625, 0.040191650390625, 0.04439544677734375, 0.0485992431640625, 0.05280303955078125, 0.0570068359375, 0.06121063232421875, 0.0654144287109375, 0.06961822509765625, 0.073822021484375, 0.07802581787109375, 0.0822296142578125, 0.08643341064453125, 0.09063720703125, 0.09484100341796875, 0.0990447998046875, 0.10324859619140625, 0.107452392578125, 0.11165618896484375, 0.1158599853515625, 0.12006378173828125, 0.124267578125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 3.0, 6.0, 8.0, 5.0, 8.0, 12.0, 19.0, 10.0, 27.0, 17.0, 31.0, 26.0, 27.0, 37.0, 53.0, 35.0, 41.0, 55.0, 53.0, 63.0, 43.0, 55.0, 55.0, 44.0, 42.0, 42.0, 33.0, 28.0, 23.0, 17.0, 13.0, 11.0, 15.0, 3.0, 9.0, 6.0, 2.0, 9.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1742115020751953e-05, -1.1350959539413452e-05, -1.0959804058074951e-05, -1.056864857673645e-05, -1.017749309539795e-05, -9.786337614059448e-06, -9.395182132720947e-06, -9.004026651382446e-06, -8.612871170043945e-06, -8.221715688705444e-06, -7.830560207366943e-06, -7.439404726028442e-06, -7.048249244689941e-06, -6.6570937633514404e-06, -6.2659382820129395e-06, -5.8747828006744385e-06, -5.4836273193359375e-06, -5.0924718379974365e-06, -4.7013163566589355e-06, -4.3101608753204346e-06, -3.919005393981934e-06, -3.5278499126434326e-06, -3.1366944313049316e-06, -2.7455389499664307e-06, -2.3543834686279297e-06, -1.9632279872894287e-06, -1.5720725059509277e-06, -1.1809170246124268e-06, -7.897615432739258e-07, -3.986060619354248e-07, -7.450580596923828e-09, 3.8370490074157715e-07, 7.748603820800781e-07, 1.166015863418579e-06, 1.55717134475708e-06, 1.948326826095581e-06, 2.339482307434082e-06, 2.730637788772583e-06, 3.121793270111084e-06, 3.512948751449585e-06, 3.904104232788086e-06, 4.295259714126587e-06, 4.686415195465088e-06, 5.077570676803589e-06, 5.46872615814209e-06, 5.859881639480591e-06, 6.251037120819092e-06, 6.642192602157593e-06, 7.033348083496094e-06, 7.424503564834595e-06, 7.815659046173096e-06, 8.206814527511597e-06, 8.597970008850098e-06, 8.989125490188599e-06, 9.3802809715271e-06, 9.7714364528656e-06, 1.0162591934204102e-05, 1.0553747415542603e-05, 1.0944902896881104e-05, 1.1336058378219604e-05, 1.1727213859558105e-05, 1.2118369340896606e-05, 1.2509524822235107e-05, 1.2900680303573608e-05, 1.329183578491211e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 8.0, 19.0, 30.0, 42.0, 44.0, 94.0, 131.0, 196.0, 285.0, 344.0, 576.0, 875.0, 1380.0, 2020.0, 3164.0, 4961.0, 7748.0, 12401.0, 21306.0, 37058.0, 67442.0, 126334.0, 237786.0, 238675.0, 125894.0, 67200.0, 36995.0, 21140.0, 12487.0, 7802.0, 4804.0, 3181.0, 2035.0, 1345.0, 926.0, 554.0, 421.0, 260.0, 187.0, 138.0, 86.0, 56.0, 43.0, 26.0, 13.0, 20.0, 9.0, 6.0, 5.0, 1.0, 3.0], "bins": [-0.1370849609375, -0.13327693939208984, -0.1294689178466797, -0.12566089630126953, -0.12185287475585938, -0.11804485321044922, -0.11423683166503906, -0.1104288101196289, -0.10662078857421875, -0.1028127670288086, -0.09900474548339844, -0.09519672393798828, -0.09138870239257812, -0.08758068084716797, -0.08377265930175781, -0.07996463775634766, -0.0761566162109375, -0.07234859466552734, -0.06854057312011719, -0.06473255157470703, -0.060924530029296875, -0.05711650848388672, -0.05330848693847656, -0.049500465393066406, -0.04569244384765625, -0.041884422302246094, -0.03807640075683594, -0.03426837921142578, -0.030460357666015625, -0.02665233612060547, -0.022844314575195312, -0.019036293029785156, -0.015228271484375, -0.011420249938964844, -0.0076122283935546875, -0.0038042068481445312, 3.814697265625e-06, 0.0038118362426757812, 0.0076198577880859375, 0.011427879333496094, 0.01523590087890625, 0.019043922424316406, 0.022851943969726562, 0.02665996551513672, 0.030467987060546875, 0.03427600860595703, 0.03808403015136719, 0.041892051696777344, 0.0457000732421875, 0.049508094787597656, 0.05331611633300781, 0.05712413787841797, 0.060932159423828125, 0.06474018096923828, 0.06854820251464844, 0.0723562240600586, 0.07616424560546875, 0.0799722671508789, 0.08378028869628906, 0.08758831024169922, 0.09139633178710938, 0.09520435333251953, 0.09901237487792969, 0.10282039642333984, 0.10662841796875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 10.0, 4.0, 4.0, 7.0, 8.0, 18.0, 21.0, 17.0, 28.0, 32.0, 43.0, 42.0, 66.0, 62.0, 72.0, 65.0, 79.0, 62.0, 54.0, 49.0, 44.0, 41.0, 41.0, 33.0, 29.0, 22.0, 6.0, 6.0, 7.0, 8.0, 5.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.047698974609375, -0.046099185943603516, -0.04449939727783203, -0.04289960861206055, -0.04129981994628906, -0.03970003128051758, -0.038100242614746094, -0.03650045394897461, -0.034900665283203125, -0.03330087661743164, -0.031701087951660156, -0.030101299285888672, -0.028501510620117188, -0.026901721954345703, -0.02530193328857422, -0.023702144622802734, -0.02210235595703125, -0.020502567291259766, -0.01890277862548828, -0.017302989959716797, -0.015703201293945312, -0.014103412628173828, -0.012503623962402344, -0.01090383529663086, -0.009304046630859375, -0.007704257965087891, -0.006104469299316406, -0.004504680633544922, -0.0029048919677734375, -0.0013051033020019531, 0.00029468536376953125, 0.0018944740295410156, 0.0034942626953125, 0.005094051361083984, 0.006693840026855469, 0.008293628692626953, 0.009893417358398438, 0.011493206024169922, 0.013092994689941406, 0.01469278335571289, 0.016292572021484375, 0.01789236068725586, 0.019492149353027344, 0.021091938018798828, 0.022691726684570312, 0.024291515350341797, 0.02589130401611328, 0.027491092681884766, 0.02909088134765625, 0.030690670013427734, 0.03229045867919922, 0.0338902473449707, 0.03549003601074219, 0.03708982467651367, 0.038689613342285156, 0.04028940200805664, 0.041889190673828125, 0.04348897933959961, 0.045088768005371094, 0.04668855667114258, 0.04828834533691406, 0.04988813400268555, 0.05148792266845703, 0.053087711334228516, 0.0546875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 10.0, 12.0, 11.0, 11.0, 11.0, 13.0, 21.0, 24.0, 27.0, 38.0, 53.0, 64.0, 66.0, 57.0, 60.0, 58.0, 78.0, 62.0, 56.0, 51.0, 39.0, 29.0, 31.0, 29.0, 17.0, 22.0, 13.0, 10.0, 3.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.430907249450684, -9.120040893554688, -8.809173583984375, -8.498307228088379, -8.187440872192383, -7.876574516296387, -7.565707683563232, -7.254840850830078, -6.943974494934082, -6.633108139038086, -6.322241306304932, -6.011374473571777, -5.700508117675781, -5.389641761779785, -5.078774929046631, -4.767908096313477, -4.4570417404174805, -4.146175384521484, -3.83530855178833, -3.524441957473755, -3.2135753631591797, -2.9027087688446045, -2.5918421745300293, -2.280975580215454, -1.970108985900879, -1.6592423915863037, -1.3483757972717285, -1.0375092029571533, -0.7266426086425781, -0.41577601432800293, -0.10490942001342773, 0.20595717430114746, 0.5168228149414062, 0.8276894092559814, 1.1385560035705566, 1.4494225978851318, 1.760289192199707, 2.0711557865142822, 2.3820223808288574, 2.6928889751434326, 3.003755569458008, 3.314622163772583, 3.625488758087158, 3.9363553524017334, 4.247221946716309, 4.558088302612305, 4.868955135345459, 5.179821968078613, 5.490688323974609, 5.8015546798706055, 6.11242151260376, 6.423288345336914, 6.73415470123291, 7.045021057128906, 7.3558878898620605, 7.666754722595215, 7.977621078491211, 8.288487434387207, 8.599353790283203, 8.910221099853516, 9.221087455749512, 9.531953811645508, 9.84282112121582, 10.153687477111816, 10.464553833007812]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 6.0, 4.0, 10.0, 8.0, 11.0, 17.0, 16.0, 13.0, 18.0, 25.0, 19.0, 27.0, 37.0, 32.0, 36.0, 45.0, 48.0, 54.0, 42.0, 38.0, 56.0, 37.0, 47.0, 44.0, 45.0, 37.0, 34.0, 28.0, 34.0, 35.0, 16.0, 9.0, 8.0, 21.0, 12.0, 11.0, 7.0, 2.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.669071197509766, -10.385933876037598, -10.102797508239746, -9.819660186767578, -9.53652286529541, -9.253385543823242, -8.97024917602539, -8.687111854553223, -8.403974533081055, -8.120837211608887, -7.837700366973877, -7.554563522338867, -7.271426200866699, -6.9882893562316895, -6.70515251159668, -6.422015190124512, -6.13887882232666, -5.85574197769165, -5.572604656219482, -5.289467811584473, -5.006330490112305, -4.723193645477295, -4.440056800842285, -4.156919479370117, -3.8737826347351074, -3.5906455516815186, -3.3075084686279297, -3.02437162399292, -2.741234540939331, -2.458097457885742, -2.1749606132507324, -1.8918235301971436, -1.608687400817871, -1.3255503177642822, -1.042413353919983, -0.7592763304710388, -0.4761393070220947, -0.19300222396850586, 0.09013473987579346, 0.3732717037200928, 0.6564087867736816, 0.9395458102226257, 1.2226828336715698, 1.5058197975158691, 1.788956880569458, 2.072093963623047, 2.3552308082580566, 2.6383678913116455, 2.9215049743652344, 3.2046420574188232, 3.487779140472412, 3.770915985107422, 4.05405330657959, 4.3371901512146, 4.620326995849609, 4.903464317321777, 5.186601161956787, 5.469738006591797, 5.752875328063965, 6.036012172698975, 6.319149017333984, 6.602286338806152, 6.885423183441162, 7.168560028076172, 7.45169734954834]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 6.0, 6.0, 6.0, 17.0, 22.0, 29.0, 27.0, 55.0, 87.0, 111.0, 179.0, 277.0, 393.0, 634.0, 934.0, 1377.0, 2058.0, 3116.0, 4603.0, 7039.0, 10524.0, 15208.0, 22700.0, 32853.0, 47443.0, 66128.0, 87660.0, 108130.0, 120720.0, 120336.0, 105160.0, 84567.0, 63611.0, 45042.0, 31725.0, 21589.0, 14496.0, 9807.0, 6577.0, 4396.0, 3050.0, 1950.0, 1258.0, 861.0, 577.0, 382.0, 285.0, 199.0, 132.0, 77.0, 45.0, 31.0, 21.0, 27.0, 11.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-4.87890625, -4.72613525390625, -4.5733642578125, -4.42059326171875, -4.267822265625, -4.11505126953125, -3.9622802734375, -3.80950927734375, -3.65673828125, -3.50396728515625, -3.3511962890625, -3.19842529296875, -3.045654296875, -2.89288330078125, -2.7401123046875, -2.58734130859375, -2.4345703125, -2.28179931640625, -2.1290283203125, -1.97625732421875, -1.823486328125, -1.67071533203125, -1.5179443359375, -1.36517333984375, -1.21240234375, -1.05963134765625, -0.9068603515625, -0.75408935546875, -0.601318359375, -0.44854736328125, -0.2957763671875, -0.14300537109375, 0.009765625, 0.16253662109375, 0.3153076171875, 0.46807861328125, 0.620849609375, 0.77362060546875, 0.9263916015625, 1.07916259765625, 1.23193359375, 1.38470458984375, 1.5374755859375, 1.69024658203125, 1.843017578125, 1.99578857421875, 2.1485595703125, 2.30133056640625, 2.4541015625, 2.60687255859375, 2.7596435546875, 2.91241455078125, 3.065185546875, 3.21795654296875, 3.3707275390625, 3.52349853515625, 3.67626953125, 3.82904052734375, 3.9818115234375, 4.13458251953125, 4.287353515625, 4.44012451171875, 4.5928955078125, 4.74566650390625, 4.8984375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 7.0, 6.0, 8.0, 16.0, 6.0, 14.0, 22.0, 20.0, 18.0, 21.0, 21.0, 33.0, 29.0, 43.0, 32.0, 41.0, 47.0, 46.0, 34.0, 41.0, 43.0, 49.0, 34.0, 39.0, 43.0, 45.0, 30.0, 23.0, 42.0, 19.0, 18.0, 20.0, 11.0, 11.0, 11.0, 15.0, 11.0, 6.0, 2.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.265625, -8.9969482421875, -8.728271484375, -8.4595947265625, -8.19091796875, -7.9222412109375, -7.653564453125, -7.3848876953125, -7.1162109375, -6.8475341796875, -6.578857421875, -6.3101806640625, -6.04150390625, -5.7728271484375, -5.504150390625, -5.2354736328125, -4.966796875, -4.6981201171875, -4.429443359375, -4.1607666015625, -3.89208984375, -3.6234130859375, -3.354736328125, -3.0860595703125, -2.8173828125, -2.5487060546875, -2.280029296875, -2.0113525390625, -1.74267578125, -1.4739990234375, -1.205322265625, -0.9366455078125, -0.66796875, -0.3992919921875, -0.130615234375, 0.1380615234375, 0.40673828125, 0.6754150390625, 0.944091796875, 1.2127685546875, 1.4814453125, 1.7501220703125, 2.018798828125, 2.2874755859375, 2.55615234375, 2.8248291015625, 3.093505859375, 3.3621826171875, 3.630859375, 3.8995361328125, 4.168212890625, 4.4368896484375, 4.70556640625, 4.9742431640625, 5.242919921875, 5.5115966796875, 5.7802734375, 6.0489501953125, 6.317626953125, 6.5863037109375, 6.85498046875, 7.1236572265625, 7.392333984375, 7.6610107421875, 7.9296875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 6.0, 10.0, 8.0, 22.0, 34.0, 60.0, 79.0, 109.0, 214.0, 353.0, 514.0, 785.0, 1241.0, 2045.0, 3158.0, 5047.0, 7954.0, 12743.0, 20003.0, 31557.0, 48545.0, 72520.0, 100533.0, 127087.0, 139474.0, 132112.0, 109315.0, 80128.0, 54564.0, 36053.0, 23013.0, 14646.0, 9117.0, 5728.0, 3552.0, 2299.0, 1472.0, 836.0, 581.0, 383.0, 244.0, 134.0, 97.0, 70.0, 51.0, 29.0, 16.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.03515625, -4.859375, -4.68359375, -4.5078125, -4.33203125, -4.15625, -3.98046875, -3.8046875, -3.62890625, -3.453125, -3.27734375, -3.1015625, -2.92578125, -2.75, -2.57421875, -2.3984375, -2.22265625, -2.046875, -1.87109375, -1.6953125, -1.51953125, -1.34375, -1.16796875, -0.9921875, -0.81640625, -0.640625, -0.46484375, -0.2890625, -0.11328125, 0.0625, 0.23828125, 0.4140625, 0.58984375, 0.765625, 0.94140625, 1.1171875, 1.29296875, 1.46875, 1.64453125, 1.8203125, 1.99609375, 2.171875, 2.34765625, 2.5234375, 2.69921875, 2.875, 3.05078125, 3.2265625, 3.40234375, 3.578125, 3.75390625, 3.9296875, 4.10546875, 4.28125, 4.45703125, 4.6328125, 4.80859375, 4.984375, 5.16015625, 5.3359375, 5.51171875, 5.6875, 5.86328125, 6.0390625, 6.21484375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 5.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 9.0, 9.0, 8.0, 10.0, 13.0, 20.0, 13.0, 15.0, 18.0, 19.0, 19.0, 26.0, 27.0, 30.0, 43.0, 23.0, 39.0, 38.0, 38.0, 38.0, 34.0, 33.0, 35.0, 35.0, 37.0, 41.0, 30.0, 39.0, 28.0, 24.0, 32.0, 19.0, 25.0, 19.0, 16.0, 13.0, 16.0, 7.0, 8.0, 6.0, 5.0, 2.0, 4.0, 6.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.37890625, -4.2364501953125, -4.093994140625, -3.9515380859375, -3.80908203125, -3.6666259765625, -3.524169921875, -3.3817138671875, -3.2392578125, -3.0968017578125, -2.954345703125, -2.8118896484375, -2.66943359375, -2.5269775390625, -2.384521484375, -2.2420654296875, -2.099609375, -1.9571533203125, -1.814697265625, -1.6722412109375, -1.52978515625, -1.3873291015625, -1.244873046875, -1.1024169921875, -0.9599609375, -0.8175048828125, -0.675048828125, -0.5325927734375, -0.39013671875, -0.2476806640625, -0.105224609375, 0.0372314453125, 0.1796875, 0.3221435546875, 0.464599609375, 0.6070556640625, 0.74951171875, 0.8919677734375, 1.034423828125, 1.1768798828125, 1.3193359375, 1.4617919921875, 1.604248046875, 1.7467041015625, 1.88916015625, 2.0316162109375, 2.174072265625, 2.3165283203125, 2.458984375, 2.6014404296875, 2.743896484375, 2.8863525390625, 3.02880859375, 3.1712646484375, 3.313720703125, 3.4561767578125, 3.5986328125, 3.7410888671875, 3.883544921875, 4.0260009765625, 4.16845703125, 4.3109130859375, 4.453369140625, 4.5958251953125, 4.73828125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 7.0, 10.0, 9.0, 28.0, 25.0, 38.0, 74.0, 84.0, 123.0, 211.0, 318.0, 441.0, 625.0, 928.0, 1368.0, 2220.0, 3339.0, 5104.0, 8497.0, 13450.0, 21930.0, 34785.0, 56620.0, 87585.0, 127119.0, 159138.0, 158776.0, 127183.0, 87824.0, 56946.0, 35335.0, 21628.0, 13486.0, 8262.0, 5397.0, 3303.0, 2129.0, 1346.0, 927.0, 583.0, 426.0, 306.0, 200.0, 122.0, 90.0, 64.0, 43.0, 34.0, 23.0, 13.0, 9.0, 9.0, 5.0, 3.0, 4.0, 0.0, 2.0, 3.0], "bins": [-2.12890625, -2.0623779296875, -1.995849609375, -1.9293212890625, -1.86279296875, -1.7962646484375, -1.729736328125, -1.6632080078125, -1.5966796875, -1.5301513671875, -1.463623046875, -1.3970947265625, -1.33056640625, -1.2640380859375, -1.197509765625, -1.1309814453125, -1.064453125, -0.9979248046875, -0.931396484375, -0.8648681640625, -0.79833984375, -0.7318115234375, -0.665283203125, -0.5987548828125, -0.5322265625, -0.4656982421875, -0.399169921875, -0.3326416015625, -0.26611328125, -0.1995849609375, -0.133056640625, -0.0665283203125, 0.0, 0.0665283203125, 0.133056640625, 0.1995849609375, 0.26611328125, 0.3326416015625, 0.399169921875, 0.4656982421875, 0.5322265625, 0.5987548828125, 0.665283203125, 0.7318115234375, 0.79833984375, 0.8648681640625, 0.931396484375, 0.9979248046875, 1.064453125, 1.1309814453125, 1.197509765625, 1.2640380859375, 1.33056640625, 1.3970947265625, 1.463623046875, 1.5301513671875, 1.5966796875, 1.6632080078125, 1.729736328125, 1.7962646484375, 1.86279296875, 1.9293212890625, 1.995849609375, 2.0623779296875, 2.12890625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 10.0, 12.0, 19.0, 14.0, 25.0, 18.0, 29.0, 26.0, 34.0, 34.0, 38.0, 46.0, 63.0, 38.0, 63.0, 58.0, 44.0, 58.0, 46.0, 31.0, 36.0, 39.0, 40.0, 28.0, 21.0, 21.0, 21.0, 11.0, 17.0, 12.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015425682067871094, -0.00014942511916160583, -0.00014459341764450073, -0.00013976171612739563, -0.00013493001461029053, -0.00013009831309318542, -0.00012526661157608032, -0.00012043491005897522, -0.00011560320854187012, -0.00011077150702476501, -0.00010593980550765991, -0.00010110810399055481, -9.627640247344971e-05, -9.14447009563446e-05, -8.66129994392395e-05, -8.17812979221344e-05, -7.69495964050293e-05, -7.21178948879242e-05, -6.728619337081909e-05, -6.245449185371399e-05, -5.762279033660889e-05, -5.2791088819503784e-05, -4.795938730239868e-05, -4.312768578529358e-05, -3.8295984268188477e-05, -3.3464282751083374e-05, -2.863258123397827e-05, -2.380087971687317e-05, -1.8969178199768066e-05, -1.4137476682662964e-05, -9.305775165557861e-06, -4.474073648452759e-06, 3.5762786865234375e-07, 5.189329385757446e-06, 1.0021030902862549e-05, 1.4852732419967651e-05, 1.9684433937072754e-05, 2.4516135454177856e-05, 2.934783697128296e-05, 3.417953848838806e-05, 3.9011240005493164e-05, 4.3842941522598267e-05, 4.867464303970337e-05, 5.350634455680847e-05, 5.8338046073913574e-05, 6.316974759101868e-05, 6.800144910812378e-05, 7.283315062522888e-05, 7.766485214233398e-05, 8.249655365943909e-05, 8.732825517654419e-05, 9.215995669364929e-05, 9.69916582107544e-05, 0.0001018233597278595, 0.0001066550612449646, 0.0001114867627620697, 0.0001163184642791748, 0.00012115016579627991, 0.000125981867313385, 0.0001308135688304901, 0.00013564527034759521, 0.00014047697186470032, 0.00014530867338180542, 0.00015014037489891052, 0.00015497207641601562]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 6.0, 7.0, 9.0, 9.0, 25.0, 36.0, 47.0, 80.0, 124.0, 189.0, 342.0, 518.0, 820.0, 1292.0, 2251.0, 3733.0, 6419.0, 11007.0, 19307.0, 34446.0, 59659.0, 99203.0, 148480.0, 181496.0, 170532.0, 123594.0, 77690.0, 45624.0, 25851.0, 14852.0, 8458.0, 4995.0, 2947.0, 1677.0, 1075.0, 711.0, 374.0, 249.0, 160.0, 95.0, 53.0, 45.0, 29.0, 15.0, 10.0, 3.0, 6.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.45703125, -2.38201904296875, -2.3070068359375, -2.23199462890625, -2.156982421875, -2.08197021484375, -2.0069580078125, -1.93194580078125, -1.85693359375, -1.78192138671875, -1.7069091796875, -1.63189697265625, -1.556884765625, -1.48187255859375, -1.4068603515625, -1.33184814453125, -1.2568359375, -1.18182373046875, -1.1068115234375, -1.03179931640625, -0.956787109375, -0.88177490234375, -0.8067626953125, -0.73175048828125, -0.65673828125, -0.58172607421875, -0.5067138671875, -0.43170166015625, -0.356689453125, -0.28167724609375, -0.2066650390625, -0.13165283203125, -0.056640625, 0.01837158203125, 0.0933837890625, 0.16839599609375, 0.243408203125, 0.31842041015625, 0.3934326171875, 0.46844482421875, 0.54345703125, 0.61846923828125, 0.6934814453125, 0.76849365234375, 0.843505859375, 0.91851806640625, 0.9935302734375, 1.06854248046875, 1.1435546875, 1.21856689453125, 1.2935791015625, 1.36859130859375, 1.443603515625, 1.51861572265625, 1.5936279296875, 1.66864013671875, 1.74365234375, 1.81866455078125, 1.8936767578125, 1.96868896484375, 2.043701171875, 2.11871337890625, 2.1937255859375, 2.26873779296875, 2.34375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 7.0, 5.0, 12.0, 12.0, 8.0, 20.0, 20.0, 23.0, 23.0, 31.0, 37.0, 56.0, 59.0, 58.0, 56.0, 68.0, 67.0, 60.0, 64.0, 63.0, 49.0, 33.0, 42.0, 22.0, 20.0, 13.0, 19.0, 9.0, 17.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9208984375, -0.891082763671875, -0.86126708984375, -0.831451416015625, -0.8016357421875, -0.771820068359375, -0.74200439453125, -0.712188720703125, -0.682373046875, -0.652557373046875, -0.62274169921875, -0.592926025390625, -0.5631103515625, -0.533294677734375, -0.50347900390625, -0.473663330078125, -0.44384765625, -0.414031982421875, -0.38421630859375, -0.354400634765625, -0.3245849609375, -0.294769287109375, -0.26495361328125, -0.235137939453125, -0.205322265625, -0.175506591796875, -0.14569091796875, -0.115875244140625, -0.0860595703125, -0.056243896484375, -0.02642822265625, 0.003387451171875, 0.033203125, 0.063018798828125, 0.09283447265625, 0.122650146484375, 0.1524658203125, 0.182281494140625, 0.21209716796875, 0.241912841796875, 0.271728515625, 0.301544189453125, 0.33135986328125, 0.361175537109375, 0.3909912109375, 0.420806884765625, 0.45062255859375, 0.480438232421875, 0.51025390625, 0.540069580078125, 0.56988525390625, 0.599700927734375, 0.6295166015625, 0.659332275390625, 0.68914794921875, 0.718963623046875, 0.748779296875, 0.778594970703125, 0.80841064453125, 0.838226318359375, 0.8680419921875, 0.897857666015625, 0.92767333984375, 0.957489013671875, 0.9873046875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 12.0, 8.0, 5.0, 15.0, 7.0, 20.0, 18.0, 29.0, 43.0, 39.0, 55.0, 60.0, 69.0, 59.0, 82.0, 68.0, 54.0, 66.0, 45.0, 46.0, 28.0, 30.0, 34.0, 21.0, 17.0, 18.0, 7.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.878427505493164, -8.569231033325195, -8.260034561157227, -7.950839042663574, -7.6416425704956055, -7.332446098327637, -7.023250102996826, -6.714054107666016, -6.404857635498047, -6.095661163330078, -5.786465167999268, -5.477269172668457, -5.168072700500488, -4.8588762283325195, -4.549680233001709, -4.240484237670898, -3.9312877655029297, -3.62209153175354, -3.3128952980041504, -3.0036990642547607, -2.694502830505371, -2.3853065967559814, -2.076110363006592, -1.7669141292572021, -1.4577178955078125, -1.1485216617584229, -0.8393254280090332, -0.5301291942596436, -0.2209329605102539, 0.08826327323913574, 0.3974595069885254, 0.706655740737915, 1.0158510208129883, 1.325047254562378, 1.6342434883117676, 1.9434397220611572, 2.252635955810547, 2.5618321895599365, 2.871028423309326, 3.180224657058716, 3.4894208908081055, 3.798617124557495, 4.107813358306885, 4.417009353637695, 4.726205825805664, 5.035402297973633, 5.344598293304443, 5.653794288635254, 5.962990760803223, 6.272187232971191, 6.581383228302002, 6.8905792236328125, 7.199775695800781, 7.50897216796875, 7.8181681632995605, 8.127364158630371, 8.43656063079834, 8.745757102966309, 9.054952621459961, 9.36414909362793, 9.673345565795898, 9.982542037963867, 10.291738510131836, 10.600934028625488, 10.910130500793457]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 11.0, 6.0, 8.0, 6.0, 24.0, 14.0, 15.0, 19.0, 30.0, 22.0, 36.0, 40.0, 37.0, 36.0, 31.0, 44.0, 43.0, 51.0, 54.0, 39.0, 53.0, 48.0, 44.0, 52.0, 40.0, 36.0, 21.0, 28.0, 18.0, 20.0, 15.0, 16.0, 9.0, 12.0, 6.0, 3.0, 4.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.905338287353516, -10.5968017578125, -10.288265228271484, -9.979727745056152, -9.671191215515137, -9.362654685974121, -9.054118156433105, -8.74558162689209, -8.437044143676758, -8.128507614135742, -7.819970607757568, -7.511434078216553, -7.202897071838379, -6.894360542297363, -6.585824012756348, -6.277287483215332, -5.968750953674316, -5.660214424133301, -5.351677417755127, -5.043140888214111, -4.7346038818359375, -4.426067352294922, -4.117530822753906, -3.8089940547943115, -3.500457286834717, -3.191920518875122, -2.8833837509155273, -2.5748472213745117, -2.266310453414917, -1.9577736854553223, -1.649237036705017, -1.340700387954712, -1.0321645736694336, -0.7236278653144836, -0.4150911569595337, -0.10655444860458374, 0.2019822597503662, 0.5105190277099609, 0.8190556764602661, 1.1275923252105713, 1.436129093170166, 1.7446658611297607, 2.0532026290893555, 2.361739158630371, 2.670275926589966, 2.9788126945495605, 3.287349224090576, 3.595885992050171, 3.9044227600097656, 4.212959289550781, 4.521496295928955, 4.830032825469971, 5.1385698318481445, 5.44710636138916, 5.755642890930176, 6.064179420471191, 6.372716426849365, 6.681252956390381, 6.989789962768555, 7.29832649230957, 7.606863021850586, 7.91540002822876, 8.223937034606934, 8.53247356414795, 8.841010093688965]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 15.0, 25.0, 35.0, 49.0, 60.0, 86.0, 135.0, 241.0, 375.0, 523.0, 764.0, 1262.0, 1832.0, 3000.0, 4738.0, 7424.0, 11752.0, 19359.0, 32092.0, 53778.0, 91386.0, 156742.0, 267505.0, 440519.0, 651205.0, 751954.0, 637281.0, 426705.0, 260109.0, 151511.0, 88867.0, 52230.0, 30791.0, 18806.0, 11485.0, 7181.0, 4336.0, 2810.0, 1750.0, 1200.0, 777.0, 523.0, 305.0, 203.0, 166.0, 123.0, 92.0, 61.0, 33.0, 30.0, 12.0, 11.0, 9.0, 10.0, 1.0, 2.0, 1.0, 2.0], "bins": [-7.39453125, -7.15948486328125, -6.9244384765625, -6.68939208984375, -6.454345703125, -6.21929931640625, -5.9842529296875, -5.74920654296875, -5.51416015625, -5.27911376953125, -5.0440673828125, -4.80902099609375, -4.573974609375, -4.33892822265625, -4.1038818359375, -3.86883544921875, -3.6337890625, -3.39874267578125, -3.1636962890625, -2.92864990234375, -2.693603515625, -2.45855712890625, -2.2235107421875, -1.98846435546875, -1.75341796875, -1.51837158203125, -1.2833251953125, -1.04827880859375, -0.813232421875, -0.57818603515625, -0.3431396484375, -0.10809326171875, 0.126953125, 0.36199951171875, 0.5970458984375, 0.83209228515625, 1.067138671875, 1.30218505859375, 1.5372314453125, 1.77227783203125, 2.00732421875, 2.24237060546875, 2.4774169921875, 2.71246337890625, 2.947509765625, 3.18255615234375, 3.4176025390625, 3.65264892578125, 3.8876953125, 4.12274169921875, 4.3577880859375, 4.59283447265625, 4.827880859375, 5.06292724609375, 5.2979736328125, 5.53302001953125, 5.76806640625, 6.00311279296875, 6.2381591796875, 6.47320556640625, 6.708251953125, 6.94329833984375, 7.1783447265625, 7.41339111328125, 7.6484375]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 7.0, 4.0, 7.0, 3.0, 10.0, 14.0, 19.0, 20.0, 17.0, 22.0, 25.0, 30.0, 38.0, 43.0, 32.0, 22.0, 44.0, 52.0, 49.0, 40.0, 49.0, 38.0, 54.0, 51.0, 54.0, 37.0, 35.0, 34.0, 23.0, 21.0, 19.0, 22.0, 19.0, 11.0, 5.0, 11.0, 6.0, 7.0, 5.0, 2.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.39434814453125, -7.1754150390625, -6.95648193359375, -6.737548828125, -6.51861572265625, -6.2996826171875, -6.08074951171875, -5.86181640625, -5.64288330078125, -5.4239501953125, -5.20501708984375, -4.986083984375, -4.76715087890625, -4.5482177734375, -4.32928466796875, -4.1103515625, -3.89141845703125, -3.6724853515625, -3.45355224609375, -3.234619140625, -3.01568603515625, -2.7967529296875, -2.57781982421875, -2.35888671875, -2.13995361328125, -1.9210205078125, -1.70208740234375, -1.483154296875, -1.26422119140625, -1.0452880859375, -0.82635498046875, -0.607421875, -0.38848876953125, -0.1695556640625, 0.04937744140625, 0.268310546875, 0.48724365234375, 0.7061767578125, 0.92510986328125, 1.14404296875, 1.36297607421875, 1.5819091796875, 1.80084228515625, 2.019775390625, 2.23870849609375, 2.4576416015625, 2.67657470703125, 2.8955078125, 3.11444091796875, 3.3333740234375, 3.55230712890625, 3.771240234375, 3.99017333984375, 4.2091064453125, 4.42803955078125, 4.64697265625, 4.86590576171875, 5.0848388671875, 5.30377197265625, 5.522705078125, 5.74163818359375, 5.9605712890625, 6.17950439453125, 6.3984375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 16.0, 22.0, 35.0, 51.0, 81.0, 139.0, 176.0, 262.0, 449.0, 705.0, 1112.0, 1805.0, 2973.0, 4888.0, 8150.0, 13340.0, 22795.0, 39086.0, 66768.0, 114266.0, 192461.0, 311351.0, 471418.0, 621272.0, 671736.0, 577079.0, 414177.0, 266085.0, 160986.0, 94553.0, 55298.0, 32489.0, 19265.0, 11414.0, 6861.0, 4072.0, 2480.0, 1499.0, 979.0, 613.0, 379.0, 257.0, 149.0, 100.0, 57.0, 51.0, 24.0, 20.0, 6.0, 10.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0], "bins": [-7.30078125, -7.074951171875, -6.84912109375, -6.623291015625, -6.3974609375, -6.171630859375, -5.94580078125, -5.719970703125, -5.494140625, -5.268310546875, -5.04248046875, -4.816650390625, -4.5908203125, -4.364990234375, -4.13916015625, -3.913330078125, -3.6875, -3.461669921875, -3.23583984375, -3.010009765625, -2.7841796875, -2.558349609375, -2.33251953125, -2.106689453125, -1.880859375, -1.655029296875, -1.42919921875, -1.203369140625, -0.9775390625, -0.751708984375, -0.52587890625, -0.300048828125, -0.07421875, 0.151611328125, 0.37744140625, 0.603271484375, 0.8291015625, 1.054931640625, 1.28076171875, 1.506591796875, 1.732421875, 1.958251953125, 2.18408203125, 2.409912109375, 2.6357421875, 2.861572265625, 3.08740234375, 3.313232421875, 3.5390625, 3.764892578125, 3.99072265625, 4.216552734375, 4.4423828125, 4.668212890625, 4.89404296875, 5.119873046875, 5.345703125, 5.571533203125, 5.79736328125, 6.023193359375, 6.2490234375, 6.474853515625, 6.70068359375, 6.926513671875, 7.15234375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 11.0, 7.0, 14.0, 13.0, 18.0, 33.0, 43.0, 50.0, 70.0, 60.0, 103.0, 103.0, 130.0, 159.0, 155.0, 186.0, 171.0, 215.0, 212.0, 231.0, 223.0, 231.0, 209.0, 198.0, 164.0, 173.0, 144.0, 112.0, 110.0, 97.0, 74.0, 80.0, 46.0, 48.0, 37.0, 24.0, 28.0, 19.0, 16.0, 11.0, 6.0, 8.0, 10.0, 1.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.921875, -2.823272705078125, -2.72467041015625, -2.626068115234375, -2.5274658203125, -2.428863525390625, -2.33026123046875, -2.231658935546875, -2.133056640625, -2.034454345703125, -1.93585205078125, -1.837249755859375, -1.7386474609375, -1.640045166015625, -1.54144287109375, -1.442840576171875, -1.34423828125, -1.245635986328125, -1.14703369140625, -1.048431396484375, -0.9498291015625, -0.851226806640625, -0.75262451171875, -0.654022216796875, -0.555419921875, -0.456817626953125, -0.35821533203125, -0.259613037109375, -0.1610107421875, -0.062408447265625, 0.03619384765625, 0.134796142578125, 0.2333984375, 0.332000732421875, 0.43060302734375, 0.529205322265625, 0.6278076171875, 0.726409912109375, 0.82501220703125, 0.923614501953125, 1.022216796875, 1.120819091796875, 1.21942138671875, 1.318023681640625, 1.4166259765625, 1.515228271484375, 1.61383056640625, 1.712432861328125, 1.81103515625, 1.909637451171875, 2.00823974609375, 2.106842041015625, 2.2054443359375, 2.304046630859375, 2.40264892578125, 2.501251220703125, 2.599853515625, 2.698455810546875, 2.79705810546875, 2.895660400390625, 2.9942626953125, 3.092864990234375, 3.19146728515625, 3.290069580078125, 3.388671875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 13.0, 8.0, 20.0, 27.0, 27.0, 28.0, 35.0, 38.0, 44.0, 47.0, 55.0, 51.0, 49.0, 64.0, 65.0, 72.0, 47.0, 36.0, 44.0, 27.0, 35.0, 35.0, 17.0, 13.0, 20.0, 10.0, 6.0, 5.0, 7.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.171043872833252, -6.890178203582764, -6.609313011169434, -6.328447341918945, -6.047582149505615, -5.766716480255127, -5.485851287841797, -5.204985618591309, -4.92411994934082, -4.643254280090332, -4.362389087677002, -4.081523418426514, -3.8006582260131836, -3.5197925567626953, -3.238927125930786, -2.958061695098877, -2.677196502685547, -2.3963310718536377, -2.1154656410217285, -1.8346000909805298, -1.5537346601486206, -1.2728692293167114, -0.9920036792755127, -0.7111382484436035, -0.43027281761169434, -0.14940735697746277, 0.1314581036567688, 0.41232359409332275, 0.6931890249252319, 0.9740544557571411, 1.2549200057983398, 1.535785436630249, 1.816650390625, 2.097515821456909, 2.3783812522888184, 2.6592469215393066, 2.9401121139526367, 3.220977783203125, 3.501843214035034, 3.7827086448669434, 4.063573837280273, 4.344439506530762, 4.625304698944092, 4.90617036819458, 5.18703556060791, 5.467901229858398, 5.748766899108887, 6.029632091522217, 6.310497760772705, 6.591363430023193, 6.872228622436523, 7.153094291687012, 7.433959484100342, 7.71482515335083, 7.99569034576416, 8.276556015014648, 8.557421684265137, 8.838287353515625, 9.119153022766113, 9.400017738342285, 9.680883407592773, 9.961749076843262, 10.24261474609375, 10.523479461669922, 10.80434513092041]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 8.0, 9.0, 17.0, 25.0, 24.0, 22.0, 22.0, 23.0, 34.0, 35.0, 38.0, 33.0, 40.0, 44.0, 35.0, 45.0, 37.0, 40.0, 49.0, 47.0, 46.0, 37.0, 29.0, 34.0, 32.0, 23.0, 22.0, 25.0, 26.0, 15.0, 15.0, 11.0, 8.0, 11.0, 5.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-9.94472599029541, -9.664044380187988, -9.383363723754883, -9.102682113647461, -8.822000503540039, -8.541318893432617, -8.260638236999512, -7.97995662689209, -7.699275493621826, -7.4185943603515625, -7.137912750244141, -6.857231616973877, -6.576550483703613, -6.295868873596191, -6.015187740325928, -5.734506607055664, -5.453824996948242, -5.1731438636779785, -4.892462253570557, -4.611781120300293, -4.331099510192871, -4.050418376922607, -3.7697372436523438, -3.489055871963501, -3.208374500274658, -2.9276931285858154, -2.6470117568969727, -2.366330623626709, -2.085649251937866, -1.8049678802490234, -1.5242866277694702, -1.243605375289917, -0.9629230499267578, -0.6822417378425598, -0.4015604257583618, -0.12087911367416382, 0.15980219841003418, 0.44048357009887695, 0.7211648225784302, 1.0018460750579834, 1.2825274467468262, 1.563208818435669, 1.8438900709152222, 2.1245713233947754, 2.405252695083618, 2.685934066772461, 2.9666152000427246, 3.2472965717315674, 3.52797794342041, 3.808659315109253, 4.089340686798096, 4.370021820068359, 4.650703430175781, 4.931384563446045, 5.212065696716309, 5.4927473068237305, 5.773428440093994, 6.054109573364258, 6.33479118347168, 6.615472316741943, 6.896153450012207, 7.176835060119629, 7.457516193389893, 7.738197326660156, 8.018878936767578]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 9.0, 7.0, 29.0, 23.0, 60.0, 68.0, 110.0, 127.0, 214.0, 341.0, 473.0, 736.0, 1077.0, 1550.0, 2388.0, 3721.0, 5557.0, 8412.0, 13026.0, 20701.0, 32773.0, 53770.0, 87639.0, 140381.0, 200329.0, 175136.0, 113473.0, 69432.0, 42937.0, 26698.0, 16473.0, 10461.0, 6912.0, 4536.0, 2952.0, 1947.0, 1309.0, 896.0, 603.0, 388.0, 290.0, 175.0, 145.0, 89.0, 55.0, 33.0, 30.0, 20.0, 21.0, 5.0, 7.0, 4.0, 3.0, 3.0], "bins": [-0.97900390625, -0.9508438110351562, -0.9226837158203125, -0.8945236206054688, -0.866363525390625, -0.8382034301757812, -0.8100433349609375, -0.7818832397460938, -0.75372314453125, -0.7255630493164062, -0.6974029541015625, -0.6692428588867188, -0.641082763671875, -0.6129226684570312, -0.5847625732421875, -0.5566024780273438, -0.5284423828125, -0.5002822875976562, -0.4721221923828125, -0.44396209716796875, -0.415802001953125, -0.38764190673828125, -0.3594818115234375, -0.33132171630859375, -0.30316162109375, -0.27500152587890625, -0.2468414306640625, -0.21868133544921875, -0.190521240234375, -0.16236114501953125, -0.1342010498046875, -0.10604095458984375, -0.077880859375, -0.04972076416015625, -0.0215606689453125, 0.00659942626953125, 0.034759521484375, 0.06291961669921875, 0.0910797119140625, 0.11923980712890625, 0.14739990234375, 0.17555999755859375, 0.2037200927734375, 0.23188018798828125, 0.260040283203125, 0.28820037841796875, 0.3163604736328125, 0.34452056884765625, 0.3726806640625, 0.40084075927734375, 0.4290008544921875, 0.45716094970703125, 0.485321044921875, 0.5134811401367188, 0.5416412353515625, 0.5698013305664062, 0.59796142578125, 0.6261215209960938, 0.6542816162109375, 0.6824417114257812, 0.710601806640625, 0.7387619018554688, 0.7669219970703125, 0.7950820922851562, 0.8232421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 3.0, 6.0, 10.0, 13.0, 13.0, 16.0, 16.0, 15.0, 34.0, 32.0, 32.0, 32.0, 32.0, 40.0, 45.0, 36.0, 33.0, 38.0, 48.0, 41.0, 54.0, 43.0, 44.0, 37.0, 38.0, 26.0, 34.0, 28.0, 23.0, 16.0, 25.0, 20.0, 18.0, 12.0, 7.0, 4.0, 6.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-9.6015625, -9.314453125, -9.02734375, -8.740234375, -8.453125, -8.166015625, -7.87890625, -7.591796875, -7.3046875, -7.017578125, -6.73046875, -6.443359375, -6.15625, -5.869140625, -5.58203125, -5.294921875, -5.0078125, -4.720703125, -4.43359375, -4.146484375, -3.859375, -3.572265625, -3.28515625, -2.998046875, -2.7109375, -2.423828125, -2.13671875, -1.849609375, -1.5625, -1.275390625, -0.98828125, -0.701171875, -0.4140625, -0.126953125, 0.16015625, 0.447265625, 0.734375, 1.021484375, 1.30859375, 1.595703125, 1.8828125, 2.169921875, 2.45703125, 2.744140625, 3.03125, 3.318359375, 3.60546875, 3.892578125, 4.1796875, 4.466796875, 4.75390625, 5.041015625, 5.328125, 5.615234375, 5.90234375, 6.189453125, 6.4765625, 6.763671875, 7.05078125, 7.337890625, 7.625, 7.912109375, 8.19921875, 8.486328125, 8.7734375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 7.0, 9.0, 16.0, 37.0, 44.0, 72.0, 128.0, 215.0, 367.0, 553.0, 1110.0, 1914.0, 3415.0, 6239.0, 11514.0, 21062.0, 39035.0, 72261.0, 131787.0, 228163.0, 232572.0, 135511.0, 74241.0, 40191.0, 21655.0, 11861.0, 6396.0, 3539.0, 1935.0, 1103.0, 681.0, 362.0, 211.0, 132.0, 75.0, 44.0, 29.0, 24.0, 15.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.375, -1.3357391357421875, -1.296478271484375, -1.2572174072265625, -1.21795654296875, -1.1786956787109375, -1.139434814453125, -1.1001739501953125, -1.0609130859375, -1.0216522216796875, -0.982391357421875, -0.9431304931640625, -0.90386962890625, -0.8646087646484375, -0.825347900390625, -0.7860870361328125, -0.746826171875, -0.7075653076171875, -0.668304443359375, -0.6290435791015625, -0.58978271484375, -0.5505218505859375, -0.511260986328125, -0.4720001220703125, -0.4327392578125, -0.3934783935546875, -0.354217529296875, -0.3149566650390625, -0.27569580078125, -0.2364349365234375, -0.197174072265625, -0.1579132080078125, -0.11865234375, -0.0793914794921875, -0.040130615234375, -0.0008697509765625, 0.03839111328125, 0.0776519775390625, 0.116912841796875, 0.1561737060546875, 0.1954345703125, 0.2346954345703125, 0.273956298828125, 0.3132171630859375, 0.35247802734375, 0.3917388916015625, 0.430999755859375, 0.4702606201171875, 0.509521484375, 0.5487823486328125, 0.588043212890625, 0.6273040771484375, 0.66656494140625, 0.7058258056640625, 0.745086669921875, 0.7843475341796875, 0.8236083984375, 0.8628692626953125, 0.902130126953125, 0.9413909912109375, 0.98065185546875, 1.0199127197265625, 1.059173583984375, 1.0984344482421875, 1.1376953125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 5.0, 5.0, 10.0, 8.0, 10.0, 10.0, 19.0, 12.0, 20.0, 15.0, 13.0, 22.0, 29.0, 28.0, 29.0, 25.0, 34.0, 34.0, 37.0, 41.0, 33.0, 30.0, 50.0, 39.0, 40.0, 36.0, 24.0, 35.0, 28.0, 38.0, 37.0, 12.0, 30.0, 19.0, 29.0, 22.0, 16.0, 15.0, 15.0, 6.0, 9.0, 6.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-5.25390625, -5.09539794921875, -4.9368896484375, -4.77838134765625, -4.619873046875, -4.46136474609375, -4.3028564453125, -4.14434814453125, -3.98583984375, -3.82733154296875, -3.6688232421875, -3.51031494140625, -3.351806640625, -3.19329833984375, -3.0347900390625, -2.87628173828125, -2.7177734375, -2.55926513671875, -2.4007568359375, -2.24224853515625, -2.083740234375, -1.92523193359375, -1.7667236328125, -1.60821533203125, -1.44970703125, -1.29119873046875, -1.1326904296875, -0.97418212890625, -0.815673828125, -0.65716552734375, -0.4986572265625, -0.34014892578125, -0.181640625, -0.02313232421875, 0.1353759765625, 0.29388427734375, 0.452392578125, 0.61090087890625, 0.7694091796875, 0.92791748046875, 1.08642578125, 1.24493408203125, 1.4034423828125, 1.56195068359375, 1.720458984375, 1.87896728515625, 2.0374755859375, 2.19598388671875, 2.3544921875, 2.51300048828125, 2.6715087890625, 2.83001708984375, 2.988525390625, 3.14703369140625, 3.3055419921875, 3.46405029296875, 3.62255859375, 3.78106689453125, 3.9395751953125, 4.09808349609375, 4.256591796875, 4.41510009765625, 4.5736083984375, 4.73211669921875, 4.890625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 13.0, 15.0, 17.0, 24.0, 48.0, 68.0, 84.0, 117.0, 190.0, 238.0, 410.0, 583.0, 910.0, 1516.0, 2344.0, 4229.0, 7626.0, 14965.0, 34713.0, 99619.0, 350590.0, 358404.0, 102265.0, 35659.0, 15331.0, 7751.0, 4117.0, 2459.0, 1444.0, 967.0, 580.0, 394.0, 258.0, 180.0, 113.0, 100.0, 59.0, 52.0, 32.0, 23.0, 11.0, 11.0, 8.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.181396484375, -0.1759014129638672, -0.17040634155273438, -0.16491127014160156, -0.15941619873046875, -0.15392112731933594, -0.14842605590820312, -0.1429309844970703, -0.1374359130859375, -0.1319408416748047, -0.12644577026367188, -0.12095069885253906, -0.11545562744140625, -0.10996055603027344, -0.10446548461914062, -0.09897041320800781, -0.093475341796875, -0.08798027038574219, -0.08248519897460938, -0.07699012756347656, -0.07149505615234375, -0.06599998474121094, -0.060504913330078125, -0.05500984191894531, -0.0495147705078125, -0.04401969909667969, -0.038524627685546875, -0.03302955627441406, -0.02753448486328125, -0.022039413452148438, -0.016544342041015625, -0.011049270629882812, -0.00555419921875, -5.91278076171875e-05, 0.005435943603515625, 0.010931015014648438, 0.01642608642578125, 0.021921157836914062, 0.027416229248046875, 0.03291130065917969, 0.0384063720703125, 0.04390144348144531, 0.049396514892578125, 0.05489158630371094, 0.06038665771484375, 0.06588172912597656, 0.07137680053710938, 0.07687187194824219, 0.082366943359375, 0.08786201477050781, 0.09335708618164062, 0.09885215759277344, 0.10434722900390625, 0.10984230041503906, 0.11533737182617188, 0.12083244323730469, 0.1263275146484375, 0.1318225860595703, 0.13731765747070312, 0.14281272888183594, 0.14830780029296875, 0.15380287170410156, 0.15929794311523438, 0.1647930145263672, 0.1702880859375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 4.0, 8.0, 11.0, 12.0, 22.0, 21.0, 18.0, 24.0, 31.0, 40.0, 35.0, 38.0, 45.0, 60.0, 48.0, 65.0, 53.0, 54.0, 67.0, 47.0, 44.0, 35.0, 36.0, 32.0, 30.0, 29.0, 27.0, 13.0, 11.0, 10.0, 8.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.245737075805664e-05, -1.2054108083248138e-05, -1.1650845408439636e-05, -1.1247582733631134e-05, -1.0844320058822632e-05, -1.044105738401413e-05, -1.0037794709205627e-05, -9.634532034397125e-06, -9.231269359588623e-06, -8.828006684780121e-06, -8.424744009971619e-06, -8.021481335163116e-06, -7.618218660354614e-06, -7.214955985546112e-06, -6.81169331073761e-06, -6.408430635929108e-06, -6.0051679611206055e-06, -5.601905286312103e-06, -5.198642611503601e-06, -4.795379936695099e-06, -4.392117261886597e-06, -3.9888545870780945e-06, -3.5855919122695923e-06, -3.18232923746109e-06, -2.779066562652588e-06, -2.3758038878440857e-06, -1.9725412130355835e-06, -1.5692785382270813e-06, -1.166015863418579e-06, -7.627531886100769e-07, -3.594905138015747e-07, 4.377216100692749e-08, 4.470348358154297e-07, 8.502975106239319e-07, 1.253560185432434e-06, 1.6568228602409363e-06, 2.0600855350494385e-06, 2.4633482098579407e-06, 2.866610884666443e-06, 3.269873559474945e-06, 3.6731362342834473e-06, 4.0763989090919495e-06, 4.479661583900452e-06, 4.882924258708954e-06, 5.286186933517456e-06, 5.689449608325958e-06, 6.0927122831344604e-06, 6.495974957942963e-06, 6.899237632751465e-06, 7.302500307559967e-06, 7.70576298236847e-06, 8.109025657176971e-06, 8.512288331985474e-06, 8.915551006793976e-06, 9.318813681602478e-06, 9.72207635641098e-06, 1.0125339031219482e-05, 1.0528601706027985e-05, 1.0931864380836487e-05, 1.1335127055644989e-05, 1.1738389730453491e-05, 1.2141652405261993e-05, 1.2544915080070496e-05, 1.2948177754878998e-05, 1.33514404296875e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 10.0, 18.0, 25.0, 23.0, 39.0, 72.0, 113.0, 161.0, 235.0, 454.0, 697.0, 1229.0, 2040.0, 3563.0, 6756.0, 13172.0, 27554.0, 66211.0, 193132.0, 424352.0, 188958.0, 64439.0, 27162.0, 12812.0, 6691.0, 3604.0, 1951.0, 1136.0, 709.0, 422.0, 288.0, 162.0, 106.0, 81.0, 56.0, 41.0, 23.0, 9.0, 13.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.225341796875, -0.2189922332763672, -0.21264266967773438, -0.20629310607910156, -0.19994354248046875, -0.19359397888183594, -0.18724441528320312, -0.1808948516845703, -0.1745452880859375, -0.1681957244873047, -0.16184616088867188, -0.15549659729003906, -0.14914703369140625, -0.14279747009277344, -0.13644790649414062, -0.1300983428955078, -0.123748779296875, -0.11739921569824219, -0.11104965209960938, -0.10470008850097656, -0.09835052490234375, -0.09200096130371094, -0.08565139770507812, -0.07930183410644531, -0.0729522705078125, -0.06660270690917969, -0.060253143310546875, -0.05390357971191406, -0.04755401611328125, -0.04120445251464844, -0.034854888916015625, -0.028505325317382812, -0.02215576171875, -0.015806198120117188, -0.009456634521484375, -0.0031070709228515625, 0.00324249267578125, 0.009592056274414062, 0.015941619873046875, 0.022291183471679688, 0.0286407470703125, 0.03499031066894531, 0.041339874267578125, 0.04768943786621094, 0.05403900146484375, 0.06038856506347656, 0.06673812866210938, 0.07308769226074219, 0.079437255859375, 0.08578681945800781, 0.09213638305664062, 0.09848594665527344, 0.10483551025390625, 0.11118507385253906, 0.11753463745117188, 0.12388420104980469, 0.1302337646484375, 0.1365833282470703, 0.14293289184570312, 0.14928245544433594, 0.15563201904296875, 0.16198158264160156, 0.16833114624023438, 0.1746807098388672, 0.1810302734375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 5.0, 3.0, 14.0, 8.0, 17.0, 19.0, 14.0, 24.0, 25.0, 33.0, 39.0, 56.0, 54.0, 57.0, 87.0, 71.0, 81.0, 65.0, 58.0, 49.0, 35.0, 27.0, 22.0, 18.0, 25.0, 13.0, 18.0, 10.0, 9.0, 6.0, 3.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057891845703125, -0.05584001541137695, -0.053788185119628906, -0.05173635482788086, -0.04968452453613281, -0.047632694244384766, -0.04558086395263672, -0.04352903366088867, -0.041477203369140625, -0.03942537307739258, -0.03737354278564453, -0.035321712493896484, -0.03326988220214844, -0.03121805191040039, -0.029166221618652344, -0.027114391326904297, -0.02506256103515625, -0.023010730743408203, -0.020958900451660156, -0.01890707015991211, -0.016855239868164062, -0.014803409576416016, -0.012751579284667969, -0.010699748992919922, -0.008647918701171875, -0.006596088409423828, -0.004544258117675781, -0.0024924278259277344, -0.0004405975341796875, 0.0016112327575683594, 0.0036630630493164062, 0.005714893341064453, 0.0077667236328125, 0.009818553924560547, 0.011870384216308594, 0.01392221450805664, 0.015974044799804688, 0.018025875091552734, 0.02007770538330078, 0.022129535675048828, 0.024181365966796875, 0.026233196258544922, 0.02828502655029297, 0.030336856842041016, 0.03238868713378906, 0.03444051742553711, 0.036492347717285156, 0.0385441780090332, 0.04059600830078125, 0.0426478385925293, 0.044699668884277344, 0.04675149917602539, 0.04880332946777344, 0.050855159759521484, 0.05290699005126953, 0.05495882034301758, 0.057010650634765625, 0.05906248092651367, 0.06111431121826172, 0.06316614151000977, 0.06521797180175781, 0.06726980209350586, 0.0693216323852539, 0.07137346267700195, 0.07342529296875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 14.0, 11.0, 9.0, 19.0, 22.0, 31.0, 25.0, 36.0, 39.0, 43.0, 53.0, 46.0, 52.0, 48.0, 65.0, 59.0, 71.0, 64.0, 29.0, 42.0, 31.0, 32.0, 32.0, 19.0, 21.0, 17.0, 9.0, 8.0, 4.0, 8.0, 4.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.143039226531982, -6.864068984985352, -6.5850982666015625, -6.306127548217773, -6.027157306671143, -5.748187065124512, -5.469216346740723, -5.190245628356934, -4.911275386810303, -4.632305145263672, -4.353334426879883, -4.074363708496094, -3.795393466949463, -3.516422986984253, -3.237452507019043, -2.958482027053833, -2.679511547088623, -2.400541067123413, -2.121570587158203, -1.8426001071929932, -1.5636296272277832, -1.2846591472625732, -1.0056886672973633, -0.7267181873321533, -0.44774770736694336, -0.1687772274017334, 0.11019325256347656, 0.3891637325286865, 0.6681342124938965, 0.9471046924591064, 1.2260751724243164, 1.5050456523895264, 1.7840166091918945, 2.0629870891571045, 2.3419575691223145, 2.6209280490875244, 2.8998985290527344, 3.1788690090179443, 3.4578394889831543, 3.7368099689483643, 4.015780448913574, 4.294751167297363, 4.573721408843994, 4.852691650390625, 5.131662368774414, 5.410633087158203, 5.689603328704834, 5.968573570251465, 6.247544288635254, 6.526515007019043, 6.805485248565674, 7.084455490112305, 7.363426208496094, 7.642396926879883, 7.921367168426514, 8.200337409973145, 8.479308128356934, 8.758278846740723, 9.037248611450195, 9.316219329833984, 9.595190048217773, 9.874160766601562, 10.153131484985352, 10.432101249694824, 10.711071968078613]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 8.0, 9.0, 18.0, 24.0, 25.0, 23.0, 21.0, 25.0, 32.0, 33.0, 41.0, 32.0, 42.0, 42.0, 37.0, 44.0, 38.0, 38.0, 50.0, 46.0, 46.0, 39.0, 27.0, 37.0, 29.0, 26.0, 18.0, 28.0, 24.0, 14.0, 15.0, 11.0, 9.0, 10.0, 5.0, 0.0, 4.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-9.90362548828125, -9.623322486877441, -9.34302043914795, -9.06271743774414, -8.782415390014648, -8.50211238861084, -8.221809387207031, -7.941506862640381, -7.6612043380737305, -7.38090181350708, -7.10059928894043, -6.820296287536621, -6.539993762969971, -6.25969123840332, -5.979388236999512, -5.699085712432861, -5.418783187866211, -5.1384806632995605, -4.85817813873291, -4.577875137329102, -4.297572612762451, -4.017270088195801, -3.7369673252105713, -3.456664562225342, -3.1763620376586914, -2.896059513092041, -2.6157567501068115, -2.335453987121582, -2.0551514625549316, -1.7748488187789917, -1.4945461750030518, -1.2142435312271118, -0.9339399337768555, -0.6536372900009155, -0.3733346462249756, -0.09303200244903564, 0.1872706413269043, 0.46757328510284424, 0.7478759288787842, 1.0281785726547241, 1.308481216430664, 1.588783860206604, 1.869086503982544, 2.1493892669677734, 2.429691791534424, 2.709994316101074, 2.9902970790863037, 3.270599842071533, 3.5509023666381836, 3.831204891204834, 4.111507415771484, 4.391810417175293, 4.672112941741943, 4.952415466308594, 5.232718467712402, 5.513020992279053, 5.793323516845703, 6.0736260414123535, 6.353928565979004, 6.6342315673828125, 6.914534091949463, 7.194836616516113, 7.475139617919922, 7.755442142486572, 8.035744667053223]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 8.0, 8.0, 12.0, 12.0, 26.0, 38.0, 65.0, 91.0, 161.0, 191.0, 324.0, 526.0, 814.0, 1238.0, 1877.0, 2904.0, 4279.0, 7099.0, 10674.0, 16463.0, 24572.0, 37770.0, 53901.0, 74592.0, 96996.0, 116322.0, 124736.0, 119103.0, 100857.0, 78348.0, 57372.0, 39672.0, 26726.0, 17912.0, 11712.0, 7458.0, 4887.0, 3049.0, 1953.0, 1307.0, 853.0, 565.0, 358.0, 246.0, 152.0, 123.0, 79.0, 49.0, 24.0, 18.0, 12.0, 14.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.578125, -4.42340087890625, -4.2686767578125, -4.11395263671875, -3.959228515625, -3.80450439453125, -3.6497802734375, -3.49505615234375, -3.34033203125, -3.18560791015625, -3.0308837890625, -2.87615966796875, -2.721435546875, -2.56671142578125, -2.4119873046875, -2.25726318359375, -2.1025390625, -1.94781494140625, -1.7930908203125, -1.63836669921875, -1.483642578125, -1.32891845703125, -1.1741943359375, -1.01947021484375, -0.86474609375, -0.71002197265625, -0.5552978515625, -0.40057373046875, -0.245849609375, -0.09112548828125, 0.0635986328125, 0.21832275390625, 0.373046875, 0.52777099609375, 0.6824951171875, 0.83721923828125, 0.991943359375, 1.14666748046875, 1.3013916015625, 1.45611572265625, 1.61083984375, 1.76556396484375, 1.9202880859375, 2.07501220703125, 2.229736328125, 2.38446044921875, 2.5391845703125, 2.69390869140625, 2.8486328125, 3.00335693359375, 3.1580810546875, 3.31280517578125, 3.467529296875, 3.62225341796875, 3.7769775390625, 3.93170166015625, 4.08642578125, 4.24114990234375, 4.3958740234375, 4.55059814453125, 4.705322265625, 4.86004638671875, 5.0147705078125, 5.16949462890625, 5.32421875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 8.0, 4.0, 1.0, 6.0, 13.0, 11.0, 17.0, 16.0, 32.0, 24.0, 18.0, 25.0, 35.0, 27.0, 44.0, 31.0, 44.0, 37.0, 38.0, 36.0, 50.0, 41.0, 48.0, 43.0, 46.0, 42.0, 36.0, 27.0, 30.0, 27.0, 21.0, 22.0, 20.0, 15.0, 13.0, 21.0, 10.0, 7.0, 3.0, 2.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.95654296875, -8.6708984375, -8.38525390625, -8.099609375, -7.81396484375, -7.5283203125, -7.24267578125, -6.95703125, -6.67138671875, -6.3857421875, -6.10009765625, -5.814453125, -5.52880859375, -5.2431640625, -4.95751953125, -4.671875, -4.38623046875, -4.1005859375, -3.81494140625, -3.529296875, -3.24365234375, -2.9580078125, -2.67236328125, -2.38671875, -2.10107421875, -1.8154296875, -1.52978515625, -1.244140625, -0.95849609375, -0.6728515625, -0.38720703125, -0.1015625, 0.18408203125, 0.4697265625, 0.75537109375, 1.041015625, 1.32666015625, 1.6123046875, 1.89794921875, 2.18359375, 2.46923828125, 2.7548828125, 3.04052734375, 3.326171875, 3.61181640625, 3.8974609375, 4.18310546875, 4.46875, 4.75439453125, 5.0400390625, 5.32568359375, 5.611328125, 5.89697265625, 6.1826171875, 6.46826171875, 6.75390625, 7.03955078125, 7.3251953125, 7.61083984375, 7.896484375, 8.18212890625, 8.4677734375, 8.75341796875, 9.0390625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 11.0, 14.0, 16.0, 28.0, 22.0, 42.0, 90.0, 114.0, 201.0, 308.0, 481.0, 742.0, 1103.0, 1807.0, 2838.0, 4546.0, 7251.0, 11124.0, 17586.0, 26701.0, 40024.0, 58792.0, 81085.0, 105129.0, 123839.0, 128428.0, 118359.0, 96215.0, 72136.0, 51446.0, 34340.0, 22976.0, 14918.0, 9382.0, 6084.0, 3787.0, 2391.0, 1522.0, 955.0, 630.0, 397.0, 237.0, 173.0, 107.0, 78.0, 51.0, 19.0, 14.0, 8.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.40625, -5.24395751953125, -5.0816650390625, -4.91937255859375, -4.757080078125, -4.59478759765625, -4.4324951171875, -4.27020263671875, -4.10791015625, -3.94561767578125, -3.7833251953125, -3.62103271484375, -3.458740234375, -3.29644775390625, -3.1341552734375, -2.97186279296875, -2.8095703125, -2.64727783203125, -2.4849853515625, -2.32269287109375, -2.160400390625, -1.99810791015625, -1.8358154296875, -1.67352294921875, -1.51123046875, -1.34893798828125, -1.1866455078125, -1.02435302734375, -0.862060546875, -0.69976806640625, -0.5374755859375, -0.37518310546875, -0.212890625, -0.05059814453125, 0.1116943359375, 0.27398681640625, 0.436279296875, 0.59857177734375, 0.7608642578125, 0.92315673828125, 1.08544921875, 1.24774169921875, 1.4100341796875, 1.57232666015625, 1.734619140625, 1.89691162109375, 2.0592041015625, 2.22149658203125, 2.3837890625, 2.54608154296875, 2.7083740234375, 2.87066650390625, 3.032958984375, 3.19525146484375, 3.3575439453125, 3.51983642578125, 3.68212890625, 3.84442138671875, 4.0067138671875, 4.16900634765625, 4.331298828125, 4.49359130859375, 4.6558837890625, 4.81817626953125, 4.98046875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 2.0, 5.0, 8.0, 9.0, 12.0, 11.0, 12.0, 16.0, 19.0, 27.0, 33.0, 25.0, 35.0, 27.0, 29.0, 45.0, 41.0, 37.0, 48.0, 42.0, 43.0, 36.0, 33.0, 38.0, 34.0, 39.0, 33.0, 25.0, 32.0, 35.0, 19.0, 25.0, 11.0, 24.0, 16.0, 15.0, 15.0, 10.0, 9.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.95703125, -4.790771484375, -4.62451171875, -4.458251953125, -4.2919921875, -4.125732421875, -3.95947265625, -3.793212890625, -3.626953125, -3.460693359375, -3.29443359375, -3.128173828125, -2.9619140625, -2.795654296875, -2.62939453125, -2.463134765625, -2.296875, -2.130615234375, -1.96435546875, -1.798095703125, -1.6318359375, -1.465576171875, -1.29931640625, -1.133056640625, -0.966796875, -0.800537109375, -0.63427734375, -0.468017578125, -0.3017578125, -0.135498046875, 0.03076171875, 0.197021484375, 0.36328125, 0.529541015625, 0.69580078125, 0.862060546875, 1.0283203125, 1.194580078125, 1.36083984375, 1.527099609375, 1.693359375, 1.859619140625, 2.02587890625, 2.192138671875, 2.3583984375, 2.524658203125, 2.69091796875, 2.857177734375, 3.0234375, 3.189697265625, 3.35595703125, 3.522216796875, 3.6884765625, 3.854736328125, 4.02099609375, 4.187255859375, 4.353515625, 4.519775390625, 4.68603515625, 4.852294921875, 5.0185546875, 5.184814453125, 5.35107421875, 5.517333984375, 5.68359375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 12.0, 16.0, 17.0, 17.0, 52.0, 57.0, 98.0, 196.0, 288.0, 520.0, 896.0, 1579.0, 2957.0, 5107.0, 9152.0, 16181.0, 29030.0, 50459.0, 85386.0, 133233.0, 176711.0, 179834.0, 139642.0, 91243.0, 54153.0, 31155.0, 17505.0, 10216.0, 5624.0, 3077.0, 1754.0, 1013.0, 557.0, 323.0, 177.0, 123.0, 72.0, 48.0, 31.0, 11.0, 9.0, 12.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-2.576171875, -2.5047454833984375, -2.433319091796875, -2.3618927001953125, -2.29046630859375, -2.2190399169921875, -2.147613525390625, -2.0761871337890625, -2.0047607421875, -1.9333343505859375, -1.861907958984375, -1.7904815673828125, -1.71905517578125, -1.6476287841796875, -1.576202392578125, -1.5047760009765625, -1.433349609375, -1.3619232177734375, -1.290496826171875, -1.2190704345703125, -1.14764404296875, -1.0762176513671875, -1.004791259765625, -0.9333648681640625, -0.8619384765625, -0.7905120849609375, -0.719085693359375, -0.6476593017578125, -0.57623291015625, -0.5048065185546875, -0.433380126953125, -0.3619537353515625, -0.29052734375, -0.2191009521484375, -0.147674560546875, -0.0762481689453125, -0.00482177734375, 0.0666046142578125, 0.138031005859375, 0.2094573974609375, 0.2808837890625, 0.3523101806640625, 0.423736572265625, 0.4951629638671875, 0.56658935546875, 0.6380157470703125, 0.709442138671875, 0.7808685302734375, 0.852294921875, 0.9237213134765625, 0.995147705078125, 1.0665740966796875, 1.13800048828125, 1.2094268798828125, 1.280853271484375, 1.3522796630859375, 1.4237060546875, 1.4951324462890625, 1.566558837890625, 1.6379852294921875, 1.70941162109375, 1.7808380126953125, 1.852264404296875, 1.9236907958984375, 1.9951171875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 8.0, 12.0, 16.0, 20.0, 19.0, 25.0, 29.0, 22.0, 25.0, 30.0, 31.0, 44.0, 39.0, 45.0, 39.0, 38.0, 43.0, 41.0, 34.0, 29.0, 57.0, 30.0, 30.0, 43.0, 40.0, 26.0, 31.0, 24.0, 19.0, 17.0, 19.0, 9.0, 14.0, 9.0, 9.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00014507770538330078, -0.0001409156247973442, -0.00013675354421138763, -0.00013259146362543106, -0.0001284293830394745, -0.00012426730245351791, -0.00012010522186756134, -0.00011594314128160477, -0.0001117810606956482, -0.00010761898010969162, -0.00010345689952373505, -9.929481893777847e-05, -9.51327383518219e-05, -9.097065776586533e-05, -8.680857717990875e-05, -8.264649659395218e-05, -7.84844160079956e-05, -7.432233542203903e-05, -7.016025483608246e-05, -6.599817425012589e-05, -6.183609366416931e-05, -5.767401307821274e-05, -5.3511932492256165e-05, -4.934985190629959e-05, -4.518777132034302e-05, -4.1025690734386444e-05, -3.686361014842987e-05, -3.27015295624733e-05, -2.8539448976516724e-05, -2.437736839056015e-05, -2.0215287804603577e-05, -1.6053207218647003e-05, -1.189112663269043e-05, -7.729046046733856e-06, -3.5669654607772827e-06, 5.951151251792908e-07, 4.757195711135864e-06, 8.919276297092438e-06, 1.3081356883049011e-05, 1.7243437469005585e-05, 2.1405518054962158e-05, 2.556759864091873e-05, 2.9729679226875305e-05, 3.389175981283188e-05, 3.805384039878845e-05, 4.2215920984745026e-05, 4.63780015707016e-05, 5.054008215665817e-05, 5.4702162742614746e-05, 5.886424332857132e-05, 6.302632391452789e-05, 6.718840450048447e-05, 7.135048508644104e-05, 7.551256567239761e-05, 7.967464625835419e-05, 8.383672684431076e-05, 8.799880743026733e-05, 9.216088801622391e-05, 9.632296860218048e-05, 0.00010048504918813705, 0.00010464712977409363, 0.0001088092103600502, 0.00011297129094600677, 0.00011713337153196335, 0.00012129545211791992]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 11.0, 14.0, 16.0, 35.0, 39.0, 71.0, 102.0, 191.0, 244.0, 419.0, 660.0, 1094.0, 1859.0, 2902.0, 4783.0, 7826.0, 12271.0, 20070.0, 31957.0, 50346.0, 76896.0, 110515.0, 140727.0, 152460.0, 135221.0, 103226.0, 70811.0, 46403.0, 29532.0, 18324.0, 11420.0, 6757.0, 4292.0, 2677.0, 1687.0, 976.0, 614.0, 424.0, 249.0, 161.0, 86.0, 61.0, 42.0, 27.0, 17.0, 17.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9420166015625, -1.882080078125, -1.8221435546875, -1.76220703125, -1.7022705078125, -1.642333984375, -1.5823974609375, -1.5224609375, -1.4625244140625, -1.402587890625, -1.3426513671875, -1.28271484375, -1.2227783203125, -1.162841796875, -1.1029052734375, -1.04296875, -0.9830322265625, -0.923095703125, -0.8631591796875, -0.80322265625, -0.7432861328125, -0.683349609375, -0.6234130859375, -0.5634765625, -0.5035400390625, -0.443603515625, -0.3836669921875, -0.32373046875, -0.2637939453125, -0.203857421875, -0.1439208984375, -0.083984375, -0.0240478515625, 0.035888671875, 0.0958251953125, 0.15576171875, 0.2156982421875, 0.275634765625, 0.3355712890625, 0.3955078125, 0.4554443359375, 0.515380859375, 0.5753173828125, 0.63525390625, 0.6951904296875, 0.755126953125, 0.8150634765625, 0.875, 0.9349365234375, 0.994873046875, 1.0548095703125, 1.11474609375, 1.1746826171875, 1.234619140625, 1.2945556640625, 1.3544921875, 1.4144287109375, 1.474365234375, 1.5343017578125, 1.59423828125, 1.6541748046875, 1.714111328125, 1.7740478515625, 1.833984375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 8.0, 8.0, 5.0, 13.0, 20.0, 22.0, 18.0, 23.0, 25.0, 34.0, 43.0, 57.0, 55.0, 56.0, 50.0, 52.0, 68.0, 55.0, 59.0, 53.0, 50.0, 35.0, 44.0, 26.0, 23.0, 15.0, 29.0, 14.0, 10.0, 7.0, 9.0, 6.0, 4.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90625, -0.8791046142578125, -0.851959228515625, -0.8248138427734375, -0.79766845703125, -0.7705230712890625, -0.743377685546875, -0.7162322998046875, -0.6890869140625, -0.6619415283203125, -0.634796142578125, -0.6076507568359375, -0.58050537109375, -0.5533599853515625, -0.526214599609375, -0.4990692138671875, -0.471923828125, -0.4447784423828125, -0.417633056640625, -0.3904876708984375, -0.36334228515625, -0.3361968994140625, -0.309051513671875, -0.2819061279296875, -0.2547607421875, -0.2276153564453125, -0.200469970703125, -0.1733245849609375, -0.14617919921875, -0.1190338134765625, -0.091888427734375, -0.0647430419921875, -0.03759765625, -0.0104522705078125, 0.016693115234375, 0.0438385009765625, 0.07098388671875, 0.0981292724609375, 0.125274658203125, 0.1524200439453125, 0.1795654296875, 0.2067108154296875, 0.233856201171875, 0.2610015869140625, 0.28814697265625, 0.3152923583984375, 0.342437744140625, 0.3695831298828125, 0.396728515625, 0.4238739013671875, 0.451019287109375, 0.4781646728515625, 0.50531005859375, 0.5324554443359375, 0.559600830078125, 0.5867462158203125, 0.6138916015625, 0.6410369873046875, 0.668182373046875, 0.6953277587890625, 0.72247314453125, 0.7496185302734375, 0.776763916015625, 0.8039093017578125, 0.8310546875]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 8.0, 5.0, 12.0, 15.0, 23.0, 21.0, 26.0, 34.0, 28.0, 35.0, 54.0, 59.0, 53.0, 56.0, 54.0, 71.0, 57.0, 70.0, 47.0, 43.0, 43.0, 31.0, 34.0, 19.0, 17.0, 18.0, 9.0, 10.0, 4.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.817793369293213, -7.5197343826293945, -7.221674919128418, -6.9236159324646, -6.625556945800781, -6.327497482299805, -6.029438495635986, -5.731379508972168, -5.433320045471191, -5.135261058807373, -4.8372015953063965, -4.539142608642578, -4.241083145141602, -3.943024158477783, -3.644965171813965, -3.3469059467315674, -3.04884672164917, -2.7507874965667725, -2.452728271484375, -2.1546692848205566, -1.8566100597381592, -1.5585508346557617, -1.2604917287826538, -0.9624326229095459, -0.6643733978271484, -0.36631423234939575, -0.06825506687164307, 0.22980409860610962, 0.5278632640838623, 0.8259224891662598, 1.1239815950393677, 1.4220407009124756, 1.7201004028320312, 2.0181596279144287, 2.316218852996826, 2.6142778396606445, 2.912337064743042, 3.2103962898254395, 3.508455276489258, 3.8065145015716553, 4.104573726654053, 4.402632713317871, 4.700692176818848, 4.998751163482666, 5.296810150146484, 5.594869613647461, 5.892928600311279, 6.190987586975098, 6.489047050476074, 6.787106037139893, 7.085165500640869, 7.3832244873046875, 7.681283950805664, 7.979342937469482, 8.2774019241333, 8.575461387634277, 8.873519897460938, 9.171579360961914, 9.469637870788574, 9.76769733428955, 10.065756797790527, 10.363815307617188, 10.661874771118164, 10.95993423461914, 11.257993698120117]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 5.0, 4.0, 15.0, 10.0, 13.0, 13.0, 18.0, 30.0, 16.0, 24.0, 36.0, 34.0, 33.0, 41.0, 53.0, 34.0, 38.0, 43.0, 39.0, 46.0, 48.0, 43.0, 37.0, 40.0, 38.0, 40.0, 31.0, 36.0, 29.0, 20.0, 20.0, 13.0, 12.0, 13.0, 9.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.205642700195312, -10.89029312133789, -10.574943542480469, -10.25959300994873, -9.944243431091309, -9.628893852233887, -9.313543319702148, -8.998193740844727, -8.682844161987305, -8.367494583129883, -8.052145004272461, -7.736794471740723, -7.421444892883301, -7.106095314025879, -6.790745258331299, -6.475395202636719, -6.160045623779297, -5.844696044921875, -5.529345989227295, -5.213995933532715, -4.898646354675293, -4.583296775817871, -4.267946720123291, -3.95259690284729, -3.637247085571289, -3.321897268295288, -3.006547451019287, -2.691197633743286, -2.375847816467285, -2.060497999191284, -1.7451481819152832, -1.4297983646392822, -1.1144475936889648, -0.7990977764129639, -0.4837479591369629, -0.16839814186096191, 0.14695167541503906, 0.46230149269104004, 0.777651309967041, 1.093001127243042, 1.408350944519043, 1.723700761795044, 2.039050579071045, 2.354400396347046, 2.669750213623047, 2.985100030899048, 3.300449848175049, 3.61579966545105, 3.931149482727051, 4.246499061584473, 4.561849117279053, 4.877199172973633, 5.192548751831055, 5.507898330688477, 5.823248386383057, 6.138598442077637, 6.453948020935059, 6.7692975997924805, 7.0846476554870605, 7.399997711181641, 7.7153472900390625, 8.030696868896484, 8.346046447753906, 8.661396980285645, 8.976746559143066]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 3.0, 13.0, 20.0, 25.0, 33.0, 31.0, 90.0, 131.0, 192.0, 309.0, 431.0, 655.0, 983.0, 1386.0, 2301.0, 3354.0, 5316.0, 8323.0, 12967.0, 20851.0, 33856.0, 55190.0, 90856.0, 151445.0, 253354.0, 410468.0, 601548.0, 718311.0, 646450.0, 460026.0, 287748.0, 171087.0, 100802.0, 60221.0, 36152.0, 21784.0, 13633.0, 8595.0, 5411.0, 3372.0, 2282.0, 1393.0, 913.0, 642.0, 415.0, 310.0, 166.0, 120.0, 121.0, 66.0, 48.0, 26.0, 20.0, 12.0, 10.0, 10.0, 3.0, 7.0, 5.0, 1.0, 1.0], "bins": [-7.2109375, -6.975341796875, -6.73974609375, -6.504150390625, -6.2685546875, -6.032958984375, -5.79736328125, -5.561767578125, -5.326171875, -5.090576171875, -4.85498046875, -4.619384765625, -4.3837890625, -4.148193359375, -3.91259765625, -3.677001953125, -3.44140625, -3.205810546875, -2.97021484375, -2.734619140625, -2.4990234375, -2.263427734375, -2.02783203125, -1.792236328125, -1.556640625, -1.321044921875, -1.08544921875, -0.849853515625, -0.6142578125, -0.378662109375, -0.14306640625, 0.092529296875, 0.328125, 0.563720703125, 0.79931640625, 1.034912109375, 1.2705078125, 1.506103515625, 1.74169921875, 1.977294921875, 2.212890625, 2.448486328125, 2.68408203125, 2.919677734375, 3.1552734375, 3.390869140625, 3.62646484375, 3.862060546875, 4.09765625, 4.333251953125, 4.56884765625, 4.804443359375, 5.0400390625, 5.275634765625, 5.51123046875, 5.746826171875, 5.982421875, 6.218017578125, 6.45361328125, 6.689208984375, 6.9248046875, 7.160400390625, 7.39599609375, 7.631591796875, 7.8671875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 5.0, 8.0, 6.0, 20.0, 13.0, 14.0, 22.0, 26.0, 33.0, 25.0, 27.0, 34.0, 39.0, 44.0, 33.0, 53.0, 59.0, 42.0, 38.0, 64.0, 43.0, 29.0, 50.0, 42.0, 42.0, 47.0, 23.0, 24.0, 14.0, 20.0, 16.0, 10.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.86041259765625, -7.6114501953125, -7.36248779296875, -7.113525390625, -6.86456298828125, -6.6156005859375, -6.36663818359375, -6.11767578125, -5.86871337890625, -5.6197509765625, -5.37078857421875, -5.121826171875, -4.87286376953125, -4.6239013671875, -4.37493896484375, -4.1259765625, -3.87701416015625, -3.6280517578125, -3.37908935546875, -3.130126953125, -2.88116455078125, -2.6322021484375, -2.38323974609375, -2.13427734375, -1.88531494140625, -1.6363525390625, -1.38739013671875, -1.138427734375, -0.88946533203125, -0.6405029296875, -0.39154052734375, -0.142578125, 0.10638427734375, 0.3553466796875, 0.60430908203125, 0.853271484375, 1.10223388671875, 1.3511962890625, 1.60015869140625, 1.84912109375, 2.09808349609375, 2.3470458984375, 2.59600830078125, 2.844970703125, 3.09393310546875, 3.3428955078125, 3.59185791015625, 3.8408203125, 4.08978271484375, 4.3387451171875, 4.58770751953125, 4.836669921875, 5.08563232421875, 5.3345947265625, 5.58355712890625, 5.83251953125, 6.08148193359375, 6.3304443359375, 6.57940673828125, 6.828369140625, 7.07733154296875, 7.3262939453125, 7.57525634765625, 7.82421875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 9.0, 3.0, 14.0, 16.0, 30.0, 45.0, 86.0, 115.0, 202.0, 363.0, 562.0, 1007.0, 1723.0, 3201.0, 5623.0, 10564.0, 19431.0, 37267.0, 71517.0, 138417.0, 259305.0, 455050.0, 685399.0, 800778.0, 688273.0, 458184.0, 262633.0, 139842.0, 72954.0, 37980.0, 20103.0, 10470.0, 5722.0, 3148.0, 1797.0, 990.0, 605.0, 357.0, 192.0, 118.0, 69.0, 45.0, 30.0, 17.0, 17.0, 11.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.03125, -8.74462890625, -8.4580078125, -8.17138671875, -7.884765625, -7.59814453125, -7.3115234375, -7.02490234375, -6.73828125, -6.45166015625, -6.1650390625, -5.87841796875, -5.591796875, -5.30517578125, -5.0185546875, -4.73193359375, -4.4453125, -4.15869140625, -3.8720703125, -3.58544921875, -3.298828125, -3.01220703125, -2.7255859375, -2.43896484375, -2.15234375, -1.86572265625, -1.5791015625, -1.29248046875, -1.005859375, -0.71923828125, -0.4326171875, -0.14599609375, 0.140625, 0.42724609375, 0.7138671875, 1.00048828125, 1.287109375, 1.57373046875, 1.8603515625, 2.14697265625, 2.43359375, 2.72021484375, 3.0068359375, 3.29345703125, 3.580078125, 3.86669921875, 4.1533203125, 4.43994140625, 4.7265625, 5.01318359375, 5.2998046875, 5.58642578125, 5.873046875, 6.15966796875, 6.4462890625, 6.73291015625, 7.01953125, 7.30615234375, 7.5927734375, 7.87939453125, 8.166015625, 8.45263671875, 8.7392578125, 9.02587890625, 9.3125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 2.0, 3.0, 5.0, 3.0, 7.0, 13.0, 21.0, 19.0, 30.0, 41.0, 52.0, 55.0, 84.0, 86.0, 100.0, 126.0, 142.0, 179.0, 212.0, 192.0, 196.0, 220.0, 273.0, 199.0, 245.0, 201.0, 190.0, 185.0, 158.0, 150.0, 118.0, 101.0, 88.0, 74.0, 60.0, 59.0, 41.0, 25.0, 28.0, 29.0, 9.0, 11.0, 10.0, 8.0, 10.0, 1.0, 8.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.884765625, -2.774810791015625, -2.66485595703125, -2.554901123046875, -2.4449462890625, -2.334991455078125, -2.22503662109375, -2.115081787109375, -2.005126953125, -1.895172119140625, -1.78521728515625, -1.675262451171875, -1.5653076171875, -1.455352783203125, -1.34539794921875, -1.235443115234375, -1.12548828125, -1.015533447265625, -0.90557861328125, -0.795623779296875, -0.6856689453125, -0.575714111328125, -0.46575927734375, -0.355804443359375, -0.245849609375, -0.135894775390625, -0.02593994140625, 0.084014892578125, 0.1939697265625, 0.303924560546875, 0.41387939453125, 0.523834228515625, 0.6337890625, 0.743743896484375, 0.85369873046875, 0.963653564453125, 1.0736083984375, 1.183563232421875, 1.29351806640625, 1.403472900390625, 1.513427734375, 1.623382568359375, 1.73333740234375, 1.843292236328125, 1.9532470703125, 2.063201904296875, 2.17315673828125, 2.283111572265625, 2.39306640625, 2.503021240234375, 2.61297607421875, 2.722930908203125, 2.8328857421875, 2.942840576171875, 3.05279541015625, 3.162750244140625, 3.272705078125, 3.382659912109375, 3.49261474609375, 3.602569580078125, 3.7125244140625, 3.822479248046875, 3.93243408203125, 4.042388916015625, 4.15234375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 8.0, 17.0, 23.0, 29.0, 29.0, 46.0, 61.0, 59.0, 52.0, 66.0, 90.0, 94.0, 69.0, 73.0, 56.0, 44.0, 38.0, 33.0, 16.0, 26.0, 11.0, 10.0, 8.0, 9.0, 8.0, 6.0, 2.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.803152084350586, -12.393132209777832, -11.983112335205078, -11.573092460632324, -11.16307258605957, -10.753052711486816, -10.343032836914062, -9.933013916015625, -9.522993087768555, -9.1129732131958, -8.702953338623047, -8.292933464050293, -7.882913589477539, -7.472893714904785, -7.0628743171691895, -6.6528544425964355, -6.24283504486084, -5.832815170288086, -5.422795295715332, -5.012775421142578, -4.602755546569824, -4.19273567199707, -3.7827162742614746, -3.3726963996887207, -2.962676525115967, -2.552656650543213, -2.142636775970459, -1.7326171398162842, -1.3225972652435303, -0.9125773906707764, -0.5025577545166016, -0.09253787994384766, 0.31748294830322266, 0.7275027632713318, 1.137522578239441, 1.5475423336029053, 1.9575622081756592, 2.367582082748413, 2.777601718902588, 3.187621593475342, 3.5976414680480957, 4.00766134262085, 4.4176812171936035, 4.827700614929199, 5.237720489501953, 5.647740364074707, 6.057760238647461, 6.467780113220215, 6.877799987792969, 7.287819862365723, 7.697839736938477, 8.10785961151123, 8.517879486083984, 8.927899360656738, 9.337919235229492, 9.74793815612793, 10.157958984375, 10.567978858947754, 10.977998733520508, 11.388018608093262, 11.798038482666016, 12.20805835723877, 12.618078231811523, 13.028097152709961, 13.438117027282715]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 7.0, 7.0, 5.0, 12.0, 5.0, 15.0, 11.0, 15.0, 22.0, 20.0, 23.0, 36.0, 31.0, 37.0, 38.0, 49.0, 43.0, 50.0, 46.0, 34.0, 37.0, 38.0, 41.0, 44.0, 37.0, 30.0, 44.0, 39.0, 31.0, 24.0, 31.0, 13.0, 16.0, 19.0, 9.0, 9.0, 6.0, 10.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.15987777709961, -10.839599609375, -10.519322395324707, -10.199045181274414, -9.878767013549805, -9.558488845825195, -9.238211631774902, -8.91793441772461, -8.59765625, -8.27737808227539, -7.957100868225098, -7.6368231773376465, -7.316545486450195, -6.996267795562744, -6.675990104675293, -6.355712413787842, -6.035434722900391, -5.7151570320129395, -5.394879341125488, -5.074601650238037, -4.754323959350586, -4.434046268463135, -4.113768577575684, -3.7934908866882324, -3.4732131958007812, -3.15293550491333, -2.832657814025879, -2.5123801231384277, -2.1921024322509766, -1.8718247413635254, -1.5515470504760742, -1.231269359588623, -0.9109907150268555, -0.5907130241394043, -0.2704353332519531, 0.04984235763549805, 0.3701200485229492, 0.6903977394104004, 1.0106754302978516, 1.3309531211853027, 1.651230812072754, 1.971508502960205, 2.2917861938476562, 2.6120638847351074, 2.9323415756225586, 3.2526192665100098, 3.572896957397461, 3.893174648284912, 4.213452339172363, 4.5337300300598145, 4.854007720947266, 5.174285411834717, 5.494563102722168, 5.814840793609619, 6.13511848449707, 6.4553961753845215, 6.775673866271973, 7.095951557159424, 7.416229248046875, 7.736506938934326, 8.056784629821777, 8.37706184387207, 8.69734001159668, 9.017618179321289, 9.337895393371582]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 8.0, 17.0, 17.0, 25.0, 46.0, 83.0, 105.0, 131.0, 256.0, 313.0, 485.0, 715.0, 1163.0, 1823.0, 2814.0, 4432.0, 6710.0, 10690.0, 16809.0, 27615.0, 44547.0, 72537.0, 116988.0, 179743.0, 198951.0, 136338.0, 85190.0, 52282.0, 32728.0, 20096.0, 12640.0, 7997.0, 5158.0, 3152.0, 2077.0, 1362.0, 864.0, 546.0, 359.0, 254.0, 167.0, 120.0, 72.0, 43.0, 29.0, 25.0, 12.0, 6.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.9912109375, -0.95941162109375, -0.9276123046875, -0.89581298828125, -0.864013671875, -0.83221435546875, -0.8004150390625, -0.76861572265625, -0.73681640625, -0.70501708984375, -0.6732177734375, -0.64141845703125, -0.609619140625, -0.57781982421875, -0.5460205078125, -0.51422119140625, -0.482421875, -0.45062255859375, -0.4188232421875, -0.38702392578125, -0.355224609375, -0.32342529296875, -0.2916259765625, -0.25982666015625, -0.22802734375, -0.19622802734375, -0.1644287109375, -0.13262939453125, -0.100830078125, -0.06903076171875, -0.0372314453125, -0.00543212890625, 0.0263671875, 0.05816650390625, 0.0899658203125, 0.12176513671875, 0.153564453125, 0.18536376953125, 0.2171630859375, 0.24896240234375, 0.28076171875, 0.31256103515625, 0.3443603515625, 0.37615966796875, 0.407958984375, 0.43975830078125, 0.4715576171875, 0.50335693359375, 0.53515625, 0.56695556640625, 0.5987548828125, 0.63055419921875, 0.662353515625, 0.69415283203125, 0.7259521484375, 0.75775146484375, 0.78955078125, 0.82135009765625, 0.8531494140625, 0.88494873046875, 0.916748046875, 0.94854736328125, 0.9803466796875, 1.01214599609375, 1.0439453125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 5.0, 13.0, 10.0, 8.0, 14.0, 23.0, 24.0, 26.0, 27.0, 34.0, 34.0, 44.0, 48.0, 41.0, 47.0, 45.0, 55.0, 43.0, 42.0, 48.0, 39.0, 46.0, 47.0, 34.0, 31.0, 26.0, 26.0, 17.0, 22.0, 22.0, 9.0, 12.0, 6.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.9453125, -12.5919189453125, -12.238525390625, -11.8851318359375, -11.53173828125, -11.1783447265625, -10.824951171875, -10.4715576171875, -10.1181640625, -9.7647705078125, -9.411376953125, -9.0579833984375, -8.70458984375, -8.3511962890625, -7.997802734375, -7.6444091796875, -7.291015625, -6.9376220703125, -6.584228515625, -6.2308349609375, -5.87744140625, -5.5240478515625, -5.170654296875, -4.8172607421875, -4.4638671875, -4.1104736328125, -3.757080078125, -3.4036865234375, -3.05029296875, -2.6968994140625, -2.343505859375, -1.9901123046875, -1.63671875, -1.2833251953125, -0.929931640625, -0.5765380859375, -0.22314453125, 0.1302490234375, 0.483642578125, 0.8370361328125, 1.1904296875, 1.5438232421875, 1.897216796875, 2.2506103515625, 2.60400390625, 2.9573974609375, 3.310791015625, 3.6641845703125, 4.017578125, 4.3709716796875, 4.724365234375, 5.0777587890625, 5.43115234375, 5.7845458984375, 6.137939453125, 6.4913330078125, 6.8447265625, 7.1981201171875, 7.551513671875, 7.9049072265625, 8.25830078125, 8.6116943359375, 8.965087890625, 9.3184814453125, 9.671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 8.0, 14.0, 10.0, 31.0, 47.0, 69.0, 104.0, 181.0, 323.0, 535.0, 932.0, 1529.0, 2623.0, 4441.0, 7924.0, 13931.0, 24134.0, 42643.0, 73749.0, 126655.0, 210595.0, 219130.0, 134867.0, 78272.0, 45250.0, 25843.0, 14878.0, 8219.0, 4903.0, 2771.0, 1590.0, 955.0, 561.0, 310.0, 204.0, 126.0, 70.0, 47.0, 25.0, 21.0, 10.0, 9.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.2239227294921875, -1.183197021484375, -1.1424713134765625, -1.10174560546875, -1.0610198974609375, -1.020294189453125, -0.9795684814453125, -0.9388427734375, -0.8981170654296875, -0.857391357421875, -0.8166656494140625, -0.77593994140625, -0.7352142333984375, -0.694488525390625, -0.6537628173828125, -0.613037109375, -0.5723114013671875, -0.531585693359375, -0.4908599853515625, -0.45013427734375, -0.4094085693359375, -0.368682861328125, -0.3279571533203125, -0.2872314453125, -0.2465057373046875, -0.205780029296875, -0.1650543212890625, -0.12432861328125, -0.0836029052734375, -0.042877197265625, -0.0021514892578125, 0.03857421875, 0.0792999267578125, 0.120025634765625, 0.1607513427734375, 0.20147705078125, 0.2422027587890625, 0.282928466796875, 0.3236541748046875, 0.3643798828125, 0.4051055908203125, 0.445831298828125, 0.4865570068359375, 0.52728271484375, 0.5680084228515625, 0.608734130859375, 0.6494598388671875, 0.690185546875, 0.7309112548828125, 0.771636962890625, 0.8123626708984375, 0.85308837890625, 0.8938140869140625, 0.934539794921875, 0.9752655029296875, 1.0159912109375, 1.0567169189453125, 1.097442626953125, 1.1381683349609375, 1.17889404296875, 1.2196197509765625, 1.260345458984375, 1.3010711669921875, 1.341796875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 4.0, 14.0, 3.0, 10.0, 14.0, 11.0, 18.0, 16.0, 19.0, 34.0, 27.0, 26.0, 22.0, 38.0, 28.0, 39.0, 31.0, 39.0, 40.0, 49.0, 34.0, 48.0, 40.0, 49.0, 38.0, 25.0, 28.0, 35.0, 22.0, 18.0, 14.0, 33.0, 26.0, 10.0, 12.0, 16.0, 15.0, 11.0, 4.0, 8.0, 3.0, 4.0, 2.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.09375, -5.908203125, -5.72265625, -5.537109375, -5.3515625, -5.166015625, -4.98046875, -4.794921875, -4.609375, -4.423828125, -4.23828125, -4.052734375, -3.8671875, -3.681640625, -3.49609375, -3.310546875, -3.125, -2.939453125, -2.75390625, -2.568359375, -2.3828125, -2.197265625, -2.01171875, -1.826171875, -1.640625, -1.455078125, -1.26953125, -1.083984375, -0.8984375, -0.712890625, -0.52734375, -0.341796875, -0.15625, 0.029296875, 0.21484375, 0.400390625, 0.5859375, 0.771484375, 0.95703125, 1.142578125, 1.328125, 1.513671875, 1.69921875, 1.884765625, 2.0703125, 2.255859375, 2.44140625, 2.626953125, 2.8125, 2.998046875, 3.18359375, 3.369140625, 3.5546875, 3.740234375, 3.92578125, 4.111328125, 4.296875, 4.482421875, 4.66796875, 4.853515625, 5.0390625, 5.224609375, 5.41015625, 5.595703125, 5.78125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 10.0, 4.0, 14.0, 20.0, 21.0, 45.0, 63.0, 84.0, 160.0, 264.0, 497.0, 793.0, 1460.0, 2833.0, 5790.0, 13917.0, 42196.0, 203706.0, 596710.0, 128116.0, 30714.0, 11083.0, 4737.0, 2316.0, 1221.0, 700.0, 437.0, 234.0, 141.0, 98.0, 62.0, 42.0, 26.0, 10.0, 12.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.296142578125, -0.2860603332519531, -0.27597808837890625, -0.2658958435058594, -0.2558135986328125, -0.24573135375976562, -0.23564910888671875, -0.22556686401367188, -0.215484619140625, -0.20540237426757812, -0.19532012939453125, -0.18523788452148438, -0.1751556396484375, -0.16507339477539062, -0.15499114990234375, -0.14490890502929688, -0.13482666015625, -0.12474441528320312, -0.11466217041015625, -0.10457992553710938, -0.0944976806640625, -0.08441543579101562, -0.07433319091796875, -0.06425094604492188, -0.054168701171875, -0.044086456298828125, -0.03400421142578125, -0.023921966552734375, -0.0138397216796875, -0.003757476806640625, 0.00632476806640625, 0.016407012939453125, 0.0264892578125, 0.036571502685546875, 0.04665374755859375, 0.056735992431640625, 0.0668182373046875, 0.07690048217773438, 0.08698272705078125, 0.09706497192382812, 0.107147216796875, 0.11722946166992188, 0.12731170654296875, 0.13739395141601562, 0.1474761962890625, 0.15755844116210938, 0.16764068603515625, 0.17772293090820312, 0.18780517578125, 0.19788742065429688, 0.20796966552734375, 0.21805191040039062, 0.2281341552734375, 0.23821640014648438, 0.24829864501953125, 0.2583808898925781, 0.268463134765625, 0.2785453796386719, 0.28862762451171875, 0.2987098693847656, 0.3087921142578125, 0.3188743591308594, 0.32895660400390625, 0.3390388488769531, 0.34912109375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 6.0, 10.0, 7.0, 15.0, 10.0, 20.0, 21.0, 32.0, 29.0, 29.0, 31.0, 47.0, 56.0, 44.0, 47.0, 69.0, 61.0, 49.0, 53.0, 46.0, 39.0, 47.0, 28.0, 37.0, 27.0, 24.0, 17.0, 19.0, 20.0, 10.0, 9.0, 5.0, 3.0, 8.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4901161193847656e-05, -1.447182148694992e-05, -1.4042481780052185e-05, -1.361314207315445e-05, -1.3183802366256714e-05, -1.2754462659358978e-05, -1.2325122952461243e-05, -1.1895783245563507e-05, -1.1466443538665771e-05, -1.1037103831768036e-05, -1.06077641248703e-05, -1.0178424417972565e-05, -9.749084711074829e-06, -9.319745004177094e-06, -8.890405297279358e-06, -8.461065590381622e-06, -8.031725883483887e-06, -7.602386176586151e-06, -7.1730464696884155e-06, -6.74370676279068e-06, -6.314367055892944e-06, -5.885027348995209e-06, -5.455687642097473e-06, -5.0263479351997375e-06, -4.597008228302002e-06, -4.167668521404266e-06, -3.7383288145065308e-06, -3.308989107608795e-06, -2.8796494007110596e-06, -2.450309693813324e-06, -2.0209699869155884e-06, -1.5916302800178528e-06, -1.1622905731201172e-06, -7.329508662223816e-07, -3.03611159324646e-07, 1.257285475730896e-07, 5.550682544708252e-07, 9.844079613685608e-07, 1.4137476682662964e-06, 1.843087375164032e-06, 2.2724270820617676e-06, 2.701766788959503e-06, 3.1311064958572388e-06, 3.5604462027549744e-06, 3.98978590965271e-06, 4.4191256165504456e-06, 4.848465323448181e-06, 5.277805030345917e-06, 5.707144737243652e-06, 6.136484444141388e-06, 6.5658241510391235e-06, 6.995163857936859e-06, 7.424503564834595e-06, 7.85384327173233e-06, 8.283182978630066e-06, 8.712522685527802e-06, 9.141862392425537e-06, 9.571202099323273e-06, 1.0000541806221008e-05, 1.0429881513118744e-05, 1.085922122001648e-05, 1.1288560926914215e-05, 1.171790063381195e-05, 1.2147240340709686e-05, 1.2576580047607422e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 8.0, 16.0, 15.0, 26.0, 47.0, 37.0, 62.0, 71.0, 108.0, 154.0, 190.0, 265.0, 409.0, 587.0, 897.0, 1325.0, 1889.0, 2890.0, 4347.0, 6971.0, 11247.0, 19193.0, 34153.0, 65384.0, 135824.0, 275744.0, 241989.0, 113362.0, 55871.0, 29658.0, 17029.0, 10259.0, 6326.0, 4111.0, 2557.0, 1682.0, 1094.0, 787.0, 554.0, 403.0, 299.0, 216.0, 164.0, 111.0, 70.0, 42.0, 33.0, 31.0, 15.0, 13.0, 11.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.1695556640625, -0.16423797607421875, -0.1589202880859375, -0.15360260009765625, -0.148284912109375, -0.14296722412109375, -0.1376495361328125, -0.13233184814453125, -0.12701416015625, -0.12169647216796875, -0.1163787841796875, -0.11106109619140625, -0.105743408203125, -0.10042572021484375, -0.0951080322265625, -0.08979034423828125, -0.08447265625, -0.07915496826171875, -0.0738372802734375, -0.06851959228515625, -0.063201904296875, -0.05788421630859375, -0.0525665283203125, -0.04724884033203125, -0.04193115234375, -0.03661346435546875, -0.0312957763671875, -0.02597808837890625, -0.020660400390625, -0.01534271240234375, -0.0100250244140625, -0.00470733642578125, 0.0006103515625, 0.00592803955078125, 0.0112457275390625, 0.01656341552734375, 0.021881103515625, 0.02719879150390625, 0.0325164794921875, 0.03783416748046875, 0.04315185546875, 0.04846954345703125, 0.0537872314453125, 0.05910491943359375, 0.064422607421875, 0.06974029541015625, 0.0750579833984375, 0.08037567138671875, 0.085693359375, 0.09101104736328125, 0.0963287353515625, 0.10164642333984375, 0.106964111328125, 0.11228179931640625, 0.1175994873046875, 0.12291717529296875, 0.12823486328125, 0.13355255126953125, 0.1388702392578125, 0.14418792724609375, 0.149505615234375, 0.15482330322265625, 0.1601409912109375, 0.16545867919921875, 0.1707763671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 2.0, 5.0, 9.0, 5.0, 9.0, 13.0, 14.0, 16.0, 14.0, 14.0, 16.0, 35.0, 37.0, 46.0, 46.0, 81.0, 96.0, 100.0, 83.0, 74.0, 56.0, 36.0, 30.0, 23.0, 21.0, 24.0, 12.0, 14.0, 10.0, 7.0, 3.0, 7.0, 8.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.07666015625, -0.07453441619873047, -0.07240867614746094, -0.0702829360961914, -0.06815719604492188, -0.06603145599365234, -0.06390571594238281, -0.06177997589111328, -0.05965423583984375, -0.05752849578857422, -0.05540275573730469, -0.053277015686035156, -0.051151275634765625, -0.049025535583496094, -0.04689979553222656, -0.04477405548095703, -0.0426483154296875, -0.04052257537841797, -0.03839683532714844, -0.036271095275878906, -0.034145355224609375, -0.032019615173339844, -0.029893875122070312, -0.02776813507080078, -0.02564239501953125, -0.02351665496826172, -0.021390914916992188, -0.019265174865722656, -0.017139434814453125, -0.015013694763183594, -0.012887954711914062, -0.010762214660644531, -0.008636474609375, -0.006510734558105469, -0.0043849945068359375, -0.0022592544555664062, -0.000133514404296875, 0.0019922256469726562, 0.0041179656982421875, 0.006243705749511719, 0.00836944580078125, 0.010495185852050781, 0.012620925903320312, 0.014746665954589844, 0.016872406005859375, 0.018998146057128906, 0.021123886108398438, 0.02324962615966797, 0.0253753662109375, 0.02750110626220703, 0.029626846313476562, 0.031752586364746094, 0.033878326416015625, 0.036004066467285156, 0.03812980651855469, 0.04025554656982422, 0.04238128662109375, 0.04450702667236328, 0.04663276672363281, 0.048758506774902344, 0.050884246826171875, 0.053009986877441406, 0.05513572692871094, 0.05726146697998047, 0.05938720703125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 6.0, 17.0, 24.0, 22.0, 30.0, 40.0, 56.0, 59.0, 58.0, 56.0, 87.0, 91.0, 74.0, 78.0, 58.0, 50.0, 42.0, 33.0, 17.0, 27.0, 13.0, 13.0, 5.0, 10.0, 9.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.890151023864746, -12.481563568115234, -12.072975158691406, -11.664387702941895, -11.255800247192383, -10.847211837768555, -10.438624382019043, -10.030036926269531, -9.621448516845703, -9.212861061096191, -8.804272651672363, -8.395685195922852, -7.987097263336182, -7.578509330749512, -7.169921875, -6.76133394241333, -6.35274600982666, -5.94415807723999, -5.53557014465332, -5.126982688903809, -4.718394756317139, -4.309806823730469, -3.901219129562378, -3.492631435394287, -3.084043502807617, -2.6754555702209473, -2.2668678760528564, -1.858280062675476, -1.4496922492980957, -1.0411043167114258, -0.632516622543335, -0.22392892837524414, 0.1846599578857422, 0.5932477712631226, 1.001835584640503, 1.4104233980178833, 1.8190112113952637, 2.2275991439819336, 2.6361868381500244, 3.0447745323181152, 3.453362464904785, 3.861950397491455, 4.270538330078125, 4.679125785827637, 5.087713718414307, 5.496301651000977, 5.904889106750488, 6.313477039337158, 6.722064971923828, 7.130652904510498, 7.539240837097168, 7.94782829284668, 8.356416702270508, 8.76500415802002, 9.173591613769531, 9.58218002319336, 9.990767478942871, 10.399354934692383, 10.807943344116211, 11.216530799865723, 11.625118255615234, 12.033706665039062, 12.442294120788574, 12.850881576538086, 13.259469985961914]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 7.0, 5.0, 11.0, 6.0, 15.0, 11.0, 16.0, 20.0, 21.0, 22.0, 35.0, 33.0, 38.0, 38.0, 46.0, 47.0, 49.0, 45.0, 35.0, 39.0, 35.0, 43.0, 42.0, 37.0, 29.0, 44.0, 40.0, 32.0, 23.0, 31.0, 15.0, 14.0, 20.0, 9.0, 8.0, 8.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.100275039672852, -10.780584335327148, -10.460893630981445, -10.141202926635742, -9.821513175964355, -9.501822471618652, -9.18213176727295, -8.862441062927246, -8.542750358581543, -8.22305965423584, -7.903369426727295, -7.583678722381592, -7.263988018035889, -6.944297790527344, -6.624607086181641, -6.3049163818359375, -5.985226154327393, -5.6655354499816895, -5.3458452224731445, -5.026154518127441, -4.706463813781738, -4.386773109436035, -4.06708288192749, -3.747392177581787, -3.427701711654663, -3.108011245727539, -2.788320541381836, -2.468630075454712, -2.148939609527588, -1.8292489051818848, -1.5095584392547607, -1.1898677349090576, -0.8701772689819336, -0.55048668384552, -0.23079615831375122, 0.08889436721801758, 0.40858495235443115, 0.7282755374908447, 1.0479660034179688, 1.3676567077636719, 1.687347173690796, 2.00703763961792, 2.326728343963623, 2.646418809890747, 2.966109275817871, 3.285799980163574, 3.6054904460906982, 3.9251811504364014, 4.244871616363525, 4.5645623207092285, 4.884252548217773, 5.203943252563477, 5.52363395690918, 5.843324661254883, 6.163014888763428, 6.482705593109131, 6.802395820617676, 7.122086524963379, 7.441776752471924, 7.761467456817627, 8.081157684326172, 8.400848388671875, 8.720539093017578, 9.040229797363281, 9.359920501708984]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 8.0, 8.0, 15.0, 11.0, 21.0, 44.0, 64.0, 86.0, 138.0, 187.0, 320.0, 459.0, 779.0, 1220.0, 1870.0, 3150.0, 5186.0, 8796.0, 14425.0, 23504.0, 37767.0, 57948.0, 85489.0, 114630.0, 138401.0, 142533.0, 126173.0, 98335.0, 68361.0, 45215.0, 28334.0, 17639.0, 10520.0, 6497.0, 3900.0, 2366.0, 1501.0, 969.0, 588.0, 369.0, 270.0, 156.0, 107.0, 68.0, 44.0, 27.0, 28.0, 11.0, 13.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.09765625, -5.9083251953125, -5.718994140625, -5.5296630859375, -5.34033203125, -5.1510009765625, -4.961669921875, -4.7723388671875, -4.5830078125, -4.3936767578125, -4.204345703125, -4.0150146484375, -3.82568359375, -3.6363525390625, -3.447021484375, -3.2576904296875, -3.068359375, -2.8790283203125, -2.689697265625, -2.5003662109375, -2.31103515625, -2.1217041015625, -1.932373046875, -1.7430419921875, -1.5537109375, -1.3643798828125, -1.175048828125, -0.9857177734375, -0.79638671875, -0.6070556640625, -0.417724609375, -0.2283935546875, -0.0390625, 0.1502685546875, 0.339599609375, 0.5289306640625, 0.71826171875, 0.9075927734375, 1.096923828125, 1.2862548828125, 1.4755859375, 1.6649169921875, 1.854248046875, 2.0435791015625, 2.23291015625, 2.4222412109375, 2.611572265625, 2.8009033203125, 2.990234375, 3.1795654296875, 3.368896484375, 3.5582275390625, 3.74755859375, 3.9368896484375, 4.126220703125, 4.3155517578125, 4.5048828125, 4.6942138671875, 4.883544921875, 5.0728759765625, 5.26220703125, 5.4515380859375, 5.640869140625, 5.8302001953125, 6.01953125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 0.0, 2.0, 5.0, 12.0, 5.0, 11.0, 10.0, 21.0, 9.0, 14.0, 24.0, 23.0, 25.0, 33.0, 43.0, 34.0, 37.0, 55.0, 35.0, 46.0, 37.0, 34.0, 39.0, 55.0, 40.0, 36.0, 32.0, 38.0, 33.0, 27.0, 39.0, 24.0, 21.0, 13.0, 20.0, 16.0, 12.0, 7.0, 7.0, 5.0, 10.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-11.8984375, -11.586669921875, -11.27490234375, -10.963134765625, -10.6513671875, -10.339599609375, -10.02783203125, -9.716064453125, -9.404296875, -9.092529296875, -8.78076171875, -8.468994140625, -8.1572265625, -7.845458984375, -7.53369140625, -7.221923828125, -6.91015625, -6.598388671875, -6.28662109375, -5.974853515625, -5.6630859375, -5.351318359375, -5.03955078125, -4.727783203125, -4.416015625, -4.104248046875, -3.79248046875, -3.480712890625, -3.1689453125, -2.857177734375, -2.54541015625, -2.233642578125, -1.921875, -1.610107421875, -1.29833984375, -0.986572265625, -0.6748046875, -0.363037109375, -0.05126953125, 0.260498046875, 0.572265625, 0.884033203125, 1.19580078125, 1.507568359375, 1.8193359375, 2.131103515625, 2.44287109375, 2.754638671875, 3.06640625, 3.378173828125, 3.68994140625, 4.001708984375, 4.3134765625, 4.625244140625, 4.93701171875, 5.248779296875, 5.560546875, 5.872314453125, 6.18408203125, 6.495849609375, 6.8076171875, 7.119384765625, 7.43115234375, 7.742919921875, 8.0546875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 8.0, 13.0, 25.0, 44.0, 63.0, 93.0, 124.0, 203.0, 315.0, 457.0, 647.0, 937.0, 1475.0, 2114.0, 3141.0, 4545.0, 6695.0, 9834.0, 14350.0, 20602.0, 29656.0, 40967.0, 56675.0, 73591.0, 91944.0, 105907.0, 111190.0, 106551.0, 93312.0, 75254.0, 57836.0, 42161.0, 30125.0, 21431.0, 14628.0, 10233.0, 6997.0, 4632.0, 3169.0, 2094.0, 1461.0, 970.0, 697.0, 444.0, 328.0, 202.0, 139.0, 72.0, 62.0, 53.0, 31.0, 25.0, 14.0, 8.0, 3.0, 2.0, 1.0], "bins": [-4.90234375, -4.75616455078125, -4.6099853515625, -4.46380615234375, -4.317626953125, -4.17144775390625, -4.0252685546875, -3.87908935546875, -3.73291015625, -3.58673095703125, -3.4405517578125, -3.29437255859375, -3.148193359375, -3.00201416015625, -2.8558349609375, -2.70965576171875, -2.5634765625, -2.41729736328125, -2.2711181640625, -2.12493896484375, -1.978759765625, -1.83258056640625, -1.6864013671875, -1.54022216796875, -1.39404296875, -1.24786376953125, -1.1016845703125, -0.95550537109375, -0.809326171875, -0.66314697265625, -0.5169677734375, -0.37078857421875, -0.224609375, -0.07843017578125, 0.0677490234375, 0.21392822265625, 0.360107421875, 0.50628662109375, 0.6524658203125, 0.79864501953125, 0.94482421875, 1.09100341796875, 1.2371826171875, 1.38336181640625, 1.529541015625, 1.67572021484375, 1.8218994140625, 1.96807861328125, 2.1142578125, 2.26043701171875, 2.4066162109375, 2.55279541015625, 2.698974609375, 2.84515380859375, 2.9913330078125, 3.13751220703125, 3.28369140625, 3.42987060546875, 3.5760498046875, 3.72222900390625, 3.868408203125, 4.01458740234375, 4.1607666015625, 4.30694580078125, 4.453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 4.0, 4.0, 5.0, 12.0, 6.0, 10.0, 17.0, 29.0, 19.0, 22.0, 21.0, 27.0, 23.0, 31.0, 26.0, 25.0, 30.0, 33.0, 40.0, 41.0, 38.0, 46.0, 34.0, 34.0, 39.0, 36.0, 35.0, 28.0, 24.0, 30.0, 19.0, 20.0, 30.0, 26.0, 21.0, 14.0, 14.0, 12.0, 12.0, 9.0, 9.0, 8.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-5.14453125, -4.98590087890625, -4.8272705078125, -4.66864013671875, -4.510009765625, -4.35137939453125, -4.1927490234375, -4.03411865234375, -3.87548828125, -3.71685791015625, -3.5582275390625, -3.39959716796875, -3.240966796875, -3.08233642578125, -2.9237060546875, -2.76507568359375, -2.6064453125, -2.44781494140625, -2.2891845703125, -2.13055419921875, -1.971923828125, -1.81329345703125, -1.6546630859375, -1.49603271484375, -1.33740234375, -1.17877197265625, -1.0201416015625, -0.86151123046875, -0.702880859375, -0.54425048828125, -0.3856201171875, -0.22698974609375, -0.068359375, 0.09027099609375, 0.2489013671875, 0.40753173828125, 0.566162109375, 0.72479248046875, 0.8834228515625, 1.04205322265625, 1.20068359375, 1.35931396484375, 1.5179443359375, 1.67657470703125, 1.835205078125, 1.99383544921875, 2.1524658203125, 2.31109619140625, 2.4697265625, 2.62835693359375, 2.7869873046875, 2.94561767578125, 3.104248046875, 3.26287841796875, 3.4215087890625, 3.58013916015625, 3.73876953125, 3.89739990234375, 4.0560302734375, 4.21466064453125, 4.373291015625, 4.53192138671875, 4.6905517578125, 4.84918212890625, 5.0078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 3.0, 11.0, 14.0, 21.0, 34.0, 40.0, 78.0, 97.0, 153.0, 278.0, 383.0, 642.0, 994.0, 1608.0, 2748.0, 4511.0, 7810.0, 13223.0, 22696.0, 38672.0, 64104.0, 99395.0, 138071.0, 162990.0, 156139.0, 122865.0, 83802.0, 51910.0, 31057.0, 18116.0, 10612.0, 6129.0, 3623.0, 2112.0, 1395.0, 838.0, 521.0, 300.0, 206.0, 112.0, 85.0, 55.0, 31.0, 26.0, 17.0, 11.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.2109375, -2.13671875, -2.0625, -1.98828125, -1.9140625, -1.83984375, -1.765625, -1.69140625, -1.6171875, -1.54296875, -1.46875, -1.39453125, -1.3203125, -1.24609375, -1.171875, -1.09765625, -1.0234375, -0.94921875, -0.875, -0.80078125, -0.7265625, -0.65234375, -0.578125, -0.50390625, -0.4296875, -0.35546875, -0.28125, -0.20703125, -0.1328125, -0.05859375, 0.015625, 0.08984375, 0.1640625, 0.23828125, 0.3125, 0.38671875, 0.4609375, 0.53515625, 0.609375, 0.68359375, 0.7578125, 0.83203125, 0.90625, 0.98046875, 1.0546875, 1.12890625, 1.203125, 1.27734375, 1.3515625, 1.42578125, 1.5, 1.57421875, 1.6484375, 1.72265625, 1.796875, 1.87109375, 1.9453125, 2.01953125, 2.09375, 2.16796875, 2.2421875, 2.31640625, 2.390625, 2.46484375, 2.5390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 5.0, 1.0, 11.0, 14.0, 16.0, 21.0, 23.0, 28.0, 27.0, 33.0, 33.0, 45.0, 53.0, 53.0, 50.0, 65.0, 58.0, 68.0, 58.0, 48.0, 57.0, 36.0, 38.0, 25.0, 25.0, 18.0, 17.0, 17.0, 17.0, 11.0, 5.0, 2.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00020647048950195312, -0.00020047277212142944, -0.00019447505474090576, -0.00018847733736038208, -0.0001824796199798584, -0.00017648190259933472, -0.00017048418521881104, -0.00016448646783828735, -0.00015848875045776367, -0.00015249103307724, -0.0001464933156967163, -0.00014049559831619263, -0.00013449788093566895, -0.00012850016355514526, -0.00012250244617462158, -0.0001165047287940979, -0.00011050701141357422, -0.00010450929403305054, -9.851157665252686e-05, -9.251385927200317e-05, -8.651614189147949e-05, -8.051842451095581e-05, -7.452070713043213e-05, -6.852298974990845e-05, -6.252527236938477e-05, -5.6527554988861084e-05, -5.05298376083374e-05, -4.453212022781372e-05, -3.853440284729004e-05, -3.253668546676636e-05, -2.6538968086242676e-05, -2.0541250705718994e-05, -1.4543533325195312e-05, -8.545815944671631e-06, -2.5480985641479492e-06, 3.4496188163757324e-06, 9.447336196899414e-06, 1.5445053577423096e-05, 2.1442770957946777e-05, 2.744048833847046e-05, 3.343820571899414e-05, 3.943592309951782e-05, 4.5433640480041504e-05, 5.1431357860565186e-05, 5.742907524108887e-05, 6.342679262161255e-05, 6.942451000213623e-05, 7.542222738265991e-05, 8.14199447631836e-05, 8.741766214370728e-05, 9.341537952423096e-05, 9.941309690475464e-05, 0.00010541081428527832, 0.000111408531665802, 0.00011740624904632568, 0.00012340396642684937, 0.00012940168380737305, 0.00013539940118789673, 0.0001413971185684204, 0.0001473948359489441, 0.00015339255332946777, 0.00015939027070999146, 0.00016538798809051514, 0.00017138570547103882, 0.0001773834228515625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 10.0, 7.0, 11.0, 11.0, 26.0, 40.0, 51.0, 76.0, 87.0, 156.0, 241.0, 307.0, 582.0, 853.0, 1273.0, 1964.0, 2942.0, 4940.0, 7728.0, 12149.0, 19603.0, 31902.0, 50358.0, 76814.0, 109384.0, 138643.0, 150198.0, 135087.0, 104363.0, 72218.0, 47041.0, 29790.0, 18584.0, 11406.0, 7175.0, 4365.0, 2809.0, 1833.0, 1177.0, 782.0, 516.0, 342.0, 227.0, 156.0, 114.0, 58.0, 46.0, 41.0, 21.0, 20.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0], "bins": [-2.3359375, -2.26605224609375, -2.1961669921875, -2.12628173828125, -2.056396484375, -1.98651123046875, -1.9166259765625, -1.84674072265625, -1.77685546875, -1.70697021484375, -1.6370849609375, -1.56719970703125, -1.497314453125, -1.42742919921875, -1.3575439453125, -1.28765869140625, -1.2177734375, -1.14788818359375, -1.0780029296875, -1.00811767578125, -0.938232421875, -0.86834716796875, -0.7984619140625, -0.72857666015625, -0.65869140625, -0.58880615234375, -0.5189208984375, -0.44903564453125, -0.379150390625, -0.30926513671875, -0.2393798828125, -0.16949462890625, -0.099609375, -0.02972412109375, 0.0401611328125, 0.11004638671875, 0.179931640625, 0.24981689453125, 0.3197021484375, 0.38958740234375, 0.45947265625, 0.52935791015625, 0.5992431640625, 0.66912841796875, 0.739013671875, 0.80889892578125, 0.8787841796875, 0.94866943359375, 1.0185546875, 1.08843994140625, 1.1583251953125, 1.22821044921875, 1.298095703125, 1.36798095703125, 1.4378662109375, 1.50775146484375, 1.57763671875, 1.64752197265625, 1.7174072265625, 1.78729248046875, 1.857177734375, 1.92706298828125, 1.9969482421875, 2.06683349609375, 2.13671875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 12.0, 10.0, 14.0, 10.0, 15.0, 21.0, 23.0, 28.0, 33.0, 39.0, 57.0, 54.0, 57.0, 45.0, 51.0, 60.0, 46.0, 59.0, 63.0, 48.0, 36.0, 40.0, 30.0, 27.0, 19.0, 23.0, 10.0, 17.0, 9.0, 11.0, 5.0, 6.0, 3.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.107421875, -1.0767440795898438, -1.0460662841796875, -1.0153884887695312, -0.984710693359375, -0.9540328979492188, -0.9233551025390625, -0.8926773071289062, -0.86199951171875, -0.8313217163085938, -0.8006439208984375, -0.7699661254882812, -0.739288330078125, -0.7086105346679688, -0.6779327392578125, -0.6472549438476562, -0.6165771484375, -0.5858993530273438, -0.5552215576171875, -0.5245437622070312, -0.493865966796875, -0.46318817138671875, -0.4325103759765625, -0.40183258056640625, -0.37115478515625, -0.34047698974609375, -0.3097991943359375, -0.27912139892578125, -0.248443603515625, -0.21776580810546875, -0.1870880126953125, -0.15641021728515625, -0.125732421875, -0.09505462646484375, -0.0643768310546875, -0.03369903564453125, -0.003021240234375, 0.02765655517578125, 0.0583343505859375, 0.08901214599609375, 0.11968994140625, 0.15036773681640625, 0.1810455322265625, 0.21172332763671875, 0.242401123046875, 0.27307891845703125, 0.3037567138671875, 0.33443450927734375, 0.3651123046875, 0.39579010009765625, 0.4264678955078125, 0.45714569091796875, 0.487823486328125, 0.5185012817382812, 0.5491790771484375, 0.5798568725585938, 0.61053466796875, 0.6412124633789062, 0.6718902587890625, 0.7025680541992188, 0.733245849609375, 0.7639236450195312, 0.7946014404296875, 0.8252792358398438, 0.85595703125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 7.0, 7.0, 6.0, 14.0, 19.0, 28.0, 35.0, 34.0, 42.0, 57.0, 51.0, 68.0, 78.0, 75.0, 82.0, 65.0, 62.0, 62.0, 33.0, 41.0, 31.0, 21.0, 22.0, 16.0, 11.0, 7.0, 7.0, 3.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.136466026306152, -11.742730140686035, -11.348994255065918, -10.9552583694458, -10.561522483825684, -10.167786598205566, -9.774051666259766, -9.380315780639648, -8.986579895019531, -8.592844009399414, -8.199108123779297, -7.80537223815918, -7.4116363525390625, -7.017900466918945, -6.624165058135986, -6.230429172515869, -5.836692810058594, -5.442956924438477, -5.049221038818359, -4.655485153198242, -4.261749267578125, -3.868013620376587, -3.474277973175049, -3.0805420875549316, -2.6868062019348145, -2.2930703163146973, -1.8993345499038696, -1.505598783493042, -1.1118628978729248, -0.7181270122528076, -0.32439136505126953, 0.06934452056884766, 0.46308040618896484, 0.8568162322044373, 1.2505520582199097, 1.6442878246307373, 2.0380237102508545, 2.4317595958709717, 2.8254952430725098, 3.219231128692627, 3.612967014312744, 4.006702899932861, 4.4004387855529785, 4.7941741943359375, 5.187910079956055, 5.581645965576172, 5.975381851196289, 6.369117736816406, 6.762853622436523, 7.156589508056641, 7.550325393676758, 7.944061279296875, 8.337797164916992, 8.73153305053711, 9.125268936157227, 9.519004821777344, 9.912740707397461, 10.306476593017578, 10.700212478637695, 11.093948364257812, 11.48768424987793, 11.881420135498047, 12.275156021118164, 12.668891906738281, 13.062626838684082]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 14.0, 7.0, 9.0, 8.0, 16.0, 26.0, 18.0, 26.0, 24.0, 41.0, 33.0, 34.0, 33.0, 54.0, 48.0, 37.0, 42.0, 49.0, 34.0, 50.0, 37.0, 51.0, 32.0, 46.0, 38.0, 33.0, 27.0, 20.0, 22.0, 16.0, 10.0, 10.0, 10.0, 8.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.84339427947998, -11.506845474243164, -11.170297622680664, -10.833748817443848, -10.497200012207031, -10.160651206970215, -9.824102401733398, -9.487554550170898, -9.151005744934082, -8.814456939697266, -8.477909088134766, -8.14136028289795, -7.804811477661133, -7.468262672424316, -7.131714344024658, -6.795166015625, -6.458617210388184, -6.122068405151367, -5.785520076751709, -5.448971748352051, -5.112422943115234, -4.775874137878418, -4.43932580947876, -4.102777481079102, -3.766228675842285, -3.429680109024048, -3.0931315422058105, -2.7565829753875732, -2.420034408569336, -2.0834858417510986, -1.7469372749328613, -1.410388708114624, -1.0738401412963867, -0.7372915744781494, -0.4007430076599121, -0.0641944408416748, 0.2723541259765625, 0.6089026927947998, 0.9454512596130371, 1.2819998264312744, 1.6185483932495117, 1.955096960067749, 2.2916455268859863, 2.6281940937042236, 2.964742660522461, 3.3012912273406982, 3.6378397941589355, 3.974388360977173, 4.31093692779541, 4.647485733032227, 4.984034061431885, 5.320582389831543, 5.657131195068359, 5.993680000305176, 6.330228328704834, 6.666776657104492, 7.003325462341309, 7.339874267578125, 7.676422595977783, 8.012970924377441, 8.349519729614258, 8.686068534851074, 9.02261734008789, 9.35916519165039, 9.695713996887207]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 13.0, 12.0, 12.0, 19.0, 34.0, 36.0, 63.0, 86.0, 139.0, 204.0, 284.0, 425.0, 628.0, 929.0, 1362.0, 2089.0, 3326.0, 5103.0, 8198.0, 13137.0, 20647.0, 33638.0, 55476.0, 90821.0, 149306.0, 242505.0, 381354.0, 549613.0, 666334.0, 635893.0, 487745.0, 325219.0, 203556.0, 123293.0, 74869.0, 45279.0, 27772.0, 16639.0, 10466.0, 6576.0, 3956.0, 2539.0, 1634.0, 1035.0, 711.0, 451.0, 284.0, 191.0, 125.0, 91.0, 62.0, 43.0, 25.0, 16.0, 11.0, 9.0, 7.0, 1.0, 1.0, 3.0], "bins": [-8.0234375, -7.77880859375, -7.5341796875, -7.28955078125, -7.044921875, -6.80029296875, -6.5556640625, -6.31103515625, -6.06640625, -5.82177734375, -5.5771484375, -5.33251953125, -5.087890625, -4.84326171875, -4.5986328125, -4.35400390625, -4.109375, -3.86474609375, -3.6201171875, -3.37548828125, -3.130859375, -2.88623046875, -2.6416015625, -2.39697265625, -2.15234375, -1.90771484375, -1.6630859375, -1.41845703125, -1.173828125, -0.92919921875, -0.6845703125, -0.43994140625, -0.1953125, 0.04931640625, 0.2939453125, 0.53857421875, 0.783203125, 1.02783203125, 1.2724609375, 1.51708984375, 1.76171875, 2.00634765625, 2.2509765625, 2.49560546875, 2.740234375, 2.98486328125, 3.2294921875, 3.47412109375, 3.71875, 3.96337890625, 4.2080078125, 4.45263671875, 4.697265625, 4.94189453125, 5.1865234375, 5.43115234375, 5.67578125, 5.92041015625, 6.1650390625, 6.40966796875, 6.654296875, 6.89892578125, 7.1435546875, 7.38818359375, 7.6328125]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 3.0, 8.0, 8.0, 16.0, 6.0, 9.0, 20.0, 16.0, 17.0, 22.0, 20.0, 42.0, 28.0, 43.0, 30.0, 27.0, 34.0, 35.0, 55.0, 42.0, 41.0, 42.0, 44.0, 44.0, 39.0, 26.0, 33.0, 35.0, 45.0, 19.0, 27.0, 16.0, 20.0, 20.0, 12.0, 8.0, 10.0, 9.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.9921875, -7.7569580078125, -7.521728515625, -7.2864990234375, -7.05126953125, -6.8160400390625, -6.580810546875, -6.3455810546875, -6.1103515625, -5.8751220703125, -5.639892578125, -5.4046630859375, -5.16943359375, -4.9342041015625, -4.698974609375, -4.4637451171875, -4.228515625, -3.9932861328125, -3.758056640625, -3.5228271484375, -3.28759765625, -3.0523681640625, -2.817138671875, -2.5819091796875, -2.3466796875, -2.1114501953125, -1.876220703125, -1.6409912109375, -1.40576171875, -1.1705322265625, -0.935302734375, -0.7000732421875, -0.46484375, -0.2296142578125, 0.005615234375, 0.2408447265625, 0.47607421875, 0.7113037109375, 0.946533203125, 1.1817626953125, 1.4169921875, 1.6522216796875, 1.887451171875, 2.1226806640625, 2.35791015625, 2.5931396484375, 2.828369140625, 3.0635986328125, 3.298828125, 3.5340576171875, 3.769287109375, 4.0045166015625, 4.23974609375, 4.4749755859375, 4.710205078125, 4.9454345703125, 5.1806640625, 5.4158935546875, 5.651123046875, 5.8863525390625, 6.12158203125, 6.3568115234375, 6.592041015625, 6.8272705078125, 7.0625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 14.0, 7.0, 25.0, 33.0, 64.0, 79.0, 149.0, 247.0, 361.0, 540.0, 854.0, 1467.0, 2488.0, 4078.0, 6887.0, 11513.0, 19449.0, 33221.0, 57155.0, 95938.0, 159327.0, 253220.0, 381740.0, 517694.0, 605501.0, 597154.0, 493021.0, 356977.0, 234253.0, 146126.0, 88138.0, 51819.0, 30501.0, 17617.0, 10581.0, 6346.0, 3660.0, 2244.0, 1381.0, 906.0, 570.0, 361.0, 210.0, 129.0, 74.0, 46.0, 29.0, 36.0, 20.0, 9.0, 9.0, 7.0, 6.0, 0.0, 3.0], "bins": [-8.34375, -8.09771728515625, -7.8516845703125, -7.60565185546875, -7.359619140625, -7.11358642578125, -6.8675537109375, -6.62152099609375, -6.37548828125, -6.12945556640625, -5.8834228515625, -5.63739013671875, -5.391357421875, -5.14532470703125, -4.8992919921875, -4.65325927734375, -4.4072265625, -4.16119384765625, -3.9151611328125, -3.66912841796875, -3.423095703125, -3.17706298828125, -2.9310302734375, -2.68499755859375, -2.43896484375, -2.19293212890625, -1.9468994140625, -1.70086669921875, -1.454833984375, -1.20880126953125, -0.9627685546875, -0.71673583984375, -0.470703125, -0.22467041015625, 0.0213623046875, 0.26739501953125, 0.513427734375, 0.75946044921875, 1.0054931640625, 1.25152587890625, 1.49755859375, 1.74359130859375, 1.9896240234375, 2.23565673828125, 2.481689453125, 2.72772216796875, 2.9737548828125, 3.21978759765625, 3.4658203125, 3.71185302734375, 3.9578857421875, 4.20391845703125, 4.449951171875, 4.69598388671875, 4.9420166015625, 5.18804931640625, 5.43408203125, 5.68011474609375, 5.9261474609375, 6.17218017578125, 6.418212890625, 6.66424560546875, 6.9102783203125, 7.15631103515625, 7.40234375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 9.0, 15.0, 26.0, 35.0, 29.0, 50.0, 48.0, 88.0, 92.0, 120.0, 119.0, 147.0, 163.0, 186.0, 204.0, 218.0, 223.0, 226.0, 261.0, 223.0, 207.0, 180.0, 178.0, 163.0, 154.0, 123.0, 93.0, 91.0, 74.0, 68.0, 50.0, 43.0, 40.0, 24.0, 21.0, 15.0, 14.0, 11.0, 13.0, 4.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.150390625, -3.030364990234375, -2.91033935546875, -2.790313720703125, -2.6702880859375, -2.550262451171875, -2.43023681640625, -2.310211181640625, -2.190185546875, -2.070159912109375, -1.95013427734375, -1.830108642578125, -1.7100830078125, -1.590057373046875, -1.47003173828125, -1.350006103515625, -1.22998046875, -1.109954833984375, -0.98992919921875, -0.869903564453125, -0.7498779296875, -0.629852294921875, -0.50982666015625, -0.389801025390625, -0.269775390625, -0.149749755859375, -0.02972412109375, 0.090301513671875, 0.2103271484375, 0.330352783203125, 0.45037841796875, 0.570404052734375, 0.6904296875, 0.810455322265625, 0.93048095703125, 1.050506591796875, 1.1705322265625, 1.290557861328125, 1.41058349609375, 1.530609130859375, 1.650634765625, 1.770660400390625, 1.89068603515625, 2.010711669921875, 2.1307373046875, 2.250762939453125, 2.37078857421875, 2.490814208984375, 2.61083984375, 2.730865478515625, 2.85089111328125, 2.970916748046875, 3.0909423828125, 3.210968017578125, 3.33099365234375, 3.451019287109375, 3.571044921875, 3.691070556640625, 3.81109619140625, 3.931121826171875, 4.0511474609375, 4.171173095703125, 4.29119873046875, 4.411224365234375, 4.53125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 9.0, 10.0, 16.0, 11.0, 14.0, 19.0, 19.0, 26.0, 26.0, 41.0, 32.0, 40.0, 57.0, 75.0, 55.0, 64.0, 58.0, 57.0, 54.0, 44.0, 51.0, 32.0, 40.0, 31.0, 18.0, 19.0, 20.0, 10.0, 11.0, 12.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.193255424499512, -9.852581977844238, -9.511909484863281, -9.171236038208008, -8.83056354522705, -8.489890098571777, -8.14921760559082, -7.808544158935547, -7.467871189117432, -7.127198219299316, -6.786525249481201, -6.445852279663086, -6.1051788330078125, -5.7645063400268555, -5.423832893371582, -5.083159923553467, -4.742486953735352, -4.401813983917236, -4.061141014099121, -3.7204678058624268, -3.3797948360443115, -3.0391218662261963, -2.698448657989502, -2.3577756881713867, -2.0171027183532715, -1.6764297485351562, -1.3357566595077515, -0.9950835704803467, -0.6544106006622314, -0.3137376308441162, 0.026935577392578125, 0.36760854721069336, 0.708282470703125, 1.0489554405212402, 1.389628529548645, 1.7303016185760498, 2.070974588394165, 2.4116475582122803, 2.7523207664489746, 3.09299373626709, 3.433666706085205, 3.7743396759033203, 4.1150126457214355, 4.455685615539551, 4.796359062194824, 5.137031555175781, 5.477705001831055, 5.81837797164917, 6.159050941467285, 6.4997239112854, 6.840396881103516, 7.181070327758789, 7.521742820739746, 7.8624162673950195, 8.203088760375977, 8.54376220703125, 8.884435653686523, 9.225109100341797, 9.565781593322754, 9.906455039978027, 10.247127532958984, 10.587800979614258, 10.928474426269531, 11.269146919250488, 11.609819412231445]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 13.0, 10.0, 11.0, 18.0, 20.0, 18.0, 24.0, 18.0, 16.0, 25.0, 25.0, 34.0, 36.0, 40.0, 45.0, 32.0, 44.0, 40.0, 38.0, 29.0, 45.0, 44.0, 42.0, 33.0, 29.0, 36.0, 33.0, 31.0, 23.0, 20.0, 23.0, 21.0, 18.0, 6.0, 11.0, 11.0, 7.0, 6.0, 5.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.02999496459961, -9.70927619934082, -9.388557434082031, -9.067838668823242, -8.747119903564453, -8.42640209197998, -8.105683326721191, -7.784964561462402, -7.464245796203613, -7.143527030944824, -6.822808265686035, -6.502089977264404, -6.181371212005615, -5.860652446746826, -5.539934158325195, -5.219215393066406, -4.898496627807617, -4.577777862548828, -4.257059097290039, -3.936340808868408, -3.615622043609619, -3.29490327835083, -2.97418475151062, -2.65346622467041, -2.332747459411621, -2.012028694152832, -1.691310167312622, -1.3705915212631226, -1.049872875213623, -0.7291542291641235, -0.408435583114624, -0.08771705627441406, 0.2330007553100586, 0.5537194013595581, 0.8744380474090576, 1.1951566934585571, 1.5158753395080566, 1.8365939855575562, 2.1573126316070557, 2.4780311584472656, 2.7987499237060547, 3.1194686889648438, 3.4401872158050537, 3.7609057426452637, 4.081624507904053, 4.402343273162842, 4.723061561584473, 5.043780326843262, 5.364499092102051, 5.68521785736084, 6.005936622619629, 6.32665491104126, 6.647373676300049, 6.968092441558838, 7.288810729980469, 7.609529495239258, 7.930248260498047, 8.250967025756836, 8.571685791015625, 8.892404556274414, 9.213123321533203, 9.533841133117676, 9.854559898376465, 10.175278663635254, 10.495997428894043]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 13.0, 12.0, 19.0, 32.0, 37.0, 71.0, 118.0, 158.0, 242.0, 373.0, 550.0, 866.0, 1402.0, 2216.0, 3384.0, 5494.0, 8798.0, 14087.0, 23149.0, 38502.0, 63435.0, 104892.0, 165156.0, 206972.0, 156591.0, 98357.0, 59912.0, 36199.0, 21654.0, 13357.0, 8400.0, 5247.0, 3185.0, 2008.0, 1301.0, 831.0, 564.0, 344.0, 228.0, 118.0, 88.0, 65.0, 53.0, 31.0, 14.0, 17.0, 3.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0], "bins": [-1.255859375, -1.219390869140625, -1.18292236328125, -1.146453857421875, -1.1099853515625, -1.073516845703125, -1.03704833984375, -1.000579833984375, -0.964111328125, -0.927642822265625, -0.89117431640625, -0.854705810546875, -0.8182373046875, -0.781768798828125, -0.74530029296875, -0.708831787109375, -0.67236328125, -0.635894775390625, -0.59942626953125, -0.562957763671875, -0.5264892578125, -0.490020751953125, -0.45355224609375, -0.417083740234375, -0.380615234375, -0.344146728515625, -0.30767822265625, -0.271209716796875, -0.2347412109375, -0.198272705078125, -0.16180419921875, -0.125335693359375, -0.0888671875, -0.052398681640625, -0.01593017578125, 0.020538330078125, 0.0570068359375, 0.093475341796875, 0.12994384765625, 0.166412353515625, 0.202880859375, 0.239349365234375, 0.27581787109375, 0.312286376953125, 0.3487548828125, 0.385223388671875, 0.42169189453125, 0.458160400390625, 0.49462890625, 0.531097412109375, 0.56756591796875, 0.604034423828125, 0.6405029296875, 0.676971435546875, 0.71343994140625, 0.749908447265625, 0.786376953125, 0.822845458984375, 0.85931396484375, 0.895782470703125, 0.9322509765625, 0.968719482421875, 1.00518798828125, 1.041656494140625, 1.078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 7.0, 17.0, 14.0, 14.0, 23.0, 24.0, 27.0, 28.0, 24.0, 32.0, 39.0, 42.0, 48.0, 51.0, 50.0, 39.0, 45.0, 46.0, 50.0, 45.0, 53.0, 37.0, 39.0, 40.0, 32.0, 21.0, 23.0, 19.0, 22.0, 9.0, 9.0, 7.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.78125, -13.3870849609375, -12.992919921875, -12.5987548828125, -12.20458984375, -11.8104248046875, -11.416259765625, -11.0220947265625, -10.6279296875, -10.2337646484375, -9.839599609375, -9.4454345703125, -9.05126953125, -8.6571044921875, -8.262939453125, -7.8687744140625, -7.474609375, -7.0804443359375, -6.686279296875, -6.2921142578125, -5.89794921875, -5.5037841796875, -5.109619140625, -4.7154541015625, -4.3212890625, -3.9271240234375, -3.532958984375, -3.1387939453125, -2.74462890625, -2.3504638671875, -1.956298828125, -1.5621337890625, -1.16796875, -0.7738037109375, -0.379638671875, 0.0145263671875, 0.40869140625, 0.8028564453125, 1.197021484375, 1.5911865234375, 1.9853515625, 2.3795166015625, 2.773681640625, 3.1678466796875, 3.56201171875, 3.9561767578125, 4.350341796875, 4.7445068359375, 5.138671875, 5.5328369140625, 5.927001953125, 6.3211669921875, 6.71533203125, 7.1094970703125, 7.503662109375, 7.8978271484375, 8.2919921875, 8.6861572265625, 9.080322265625, 9.4744873046875, 9.86865234375, 10.2628173828125, 10.656982421875, 11.0511474609375, 11.4453125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 6.0, 9.0, 10.0, 17.0, 31.0, 38.0, 69.0, 108.0, 176.0, 302.0, 525.0, 922.0, 1582.0, 2933.0, 5428.0, 10079.0, 18517.0, 35471.0, 65259.0, 119962.0, 211385.0, 246769.0, 149691.0, 82782.0, 44486.0, 23951.0, 12697.0, 6843.0, 3745.0, 1995.0, 1180.0, 634.0, 383.0, 218.0, 148.0, 83.0, 44.0, 29.0, 21.0, 9.0, 8.0, 5.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4921875, -1.4427642822265625, -1.393341064453125, -1.3439178466796875, -1.29449462890625, -1.2450714111328125, -1.195648193359375, -1.1462249755859375, -1.0968017578125, -1.0473785400390625, -0.997955322265625, -0.9485321044921875, -0.89910888671875, -0.8496856689453125, -0.800262451171875, -0.7508392333984375, -0.701416015625, -0.6519927978515625, -0.602569580078125, -0.5531463623046875, -0.50372314453125, -0.4542999267578125, -0.404876708984375, -0.3554534912109375, -0.3060302734375, -0.2566070556640625, -0.207183837890625, -0.1577606201171875, -0.10833740234375, -0.0589141845703125, -0.009490966796875, 0.0399322509765625, 0.08935546875, 0.1387786865234375, 0.188201904296875, 0.2376251220703125, 0.28704833984375, 0.3364715576171875, 0.385894775390625, 0.4353179931640625, 0.4847412109375, 0.5341644287109375, 0.583587646484375, 0.6330108642578125, 0.68243408203125, 0.7318572998046875, 0.781280517578125, 0.8307037353515625, 0.880126953125, 0.9295501708984375, 0.978973388671875, 1.0283966064453125, 1.07781982421875, 1.1272430419921875, 1.176666259765625, 1.2260894775390625, 1.2755126953125, 1.3249359130859375, 1.374359130859375, 1.4237823486328125, 1.47320556640625, 1.5226287841796875, 1.572052001953125, 1.6214752197265625, 1.6708984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 6.0, 8.0, 16.0, 14.0, 20.0, 14.0, 19.0, 24.0, 20.0, 18.0, 27.0, 42.0, 31.0, 36.0, 38.0, 52.0, 51.0, 43.0, 40.0, 41.0, 48.0, 50.0, 36.0, 37.0, 24.0, 27.0, 35.0, 13.0, 36.0, 17.0, 27.0, 20.0, 11.0, 7.0, 10.0, 9.0, 6.0, 5.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.31640625, -6.1024169921875, -5.888427734375, -5.6744384765625, -5.46044921875, -5.2464599609375, -5.032470703125, -4.8184814453125, -4.6044921875, -4.3905029296875, -4.176513671875, -3.9625244140625, -3.74853515625, -3.5345458984375, -3.320556640625, -3.1065673828125, -2.892578125, -2.6785888671875, -2.464599609375, -2.2506103515625, -2.03662109375, -1.8226318359375, -1.608642578125, -1.3946533203125, -1.1806640625, -0.9666748046875, -0.752685546875, -0.5386962890625, -0.32470703125, -0.1107177734375, 0.103271484375, 0.3172607421875, 0.53125, 0.7452392578125, 0.959228515625, 1.1732177734375, 1.38720703125, 1.6011962890625, 1.815185546875, 2.0291748046875, 2.2431640625, 2.4571533203125, 2.671142578125, 2.8851318359375, 3.09912109375, 3.3131103515625, 3.527099609375, 3.7410888671875, 3.955078125, 4.1690673828125, 4.383056640625, 4.5970458984375, 4.81103515625, 5.0250244140625, 5.239013671875, 5.4530029296875, 5.6669921875, 5.8809814453125, 6.094970703125, 6.3089599609375, 6.52294921875, 6.7369384765625, 6.950927734375, 7.1649169921875, 7.37890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 4.0, 13.0, 14.0, 14.0, 19.0, 44.0, 56.0, 84.0, 118.0, 191.0, 250.0, 469.0, 768.0, 1339.0, 2721.0, 5505.0, 14220.0, 48138.0, 266650.0, 562351.0, 104091.0, 24757.0, 8496.0, 3708.0, 1860.0, 1023.0, 594.0, 366.0, 217.0, 159.0, 106.0, 50.0, 44.0, 23.0, 26.0, 19.0, 14.0, 6.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.35498046875, -0.3443031311035156, -0.33362579345703125, -0.3229484558105469, -0.3122711181640625, -0.3015937805175781, -0.29091644287109375, -0.2802391052246094, -0.269561767578125, -0.2588844299316406, -0.24820709228515625, -0.23752975463867188, -0.2268524169921875, -0.21617507934570312, -0.20549774169921875, -0.19482040405273438, -0.18414306640625, -0.17346572875976562, -0.16278839111328125, -0.15211105346679688, -0.1414337158203125, -0.13075637817382812, -0.12007904052734375, -0.10940170288085938, -0.098724365234375, -0.08804702758789062, -0.07736968994140625, -0.06669235229492188, -0.0560150146484375, -0.045337677001953125, -0.03466033935546875, -0.023983001708984375, -0.0133056640625, -0.002628326416015625, 0.00804901123046875, 0.018726348876953125, 0.0294036865234375, 0.040081024169921875, 0.05075836181640625, 0.061435699462890625, 0.072113037109375, 0.08279037475585938, 0.09346771240234375, 0.10414505004882812, 0.1148223876953125, 0.12549972534179688, 0.13617706298828125, 0.14685440063476562, 0.15753173828125, 0.16820907592773438, 0.17888641357421875, 0.18956375122070312, 0.2002410888671875, 0.21091842651367188, 0.22159576416015625, 0.23227310180664062, 0.242950439453125, 0.2536277770996094, 0.26430511474609375, 0.2749824523925781, 0.2856597900390625, 0.2963371276855469, 0.30701446533203125, 0.3176918029785156, 0.328369140625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 13.0, 30.0, 23.0, 37.0, 48.0, 70.0, 72.0, 104.0, 96.0, 79.0, 76.0, 87.0, 74.0, 49.0, 47.0, 28.0, 20.0, 15.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-05, -2.3562461137771606e-05, -2.2687017917633057e-05, -2.1811574697494507e-05, -2.0936131477355957e-05, -2.0060688257217407e-05, -1.9185245037078857e-05, -1.8309801816940308e-05, -1.7434358596801758e-05, -1.6558915376663208e-05, -1.5683472156524658e-05, -1.4808028936386108e-05, -1.3932585716247559e-05, -1.3057142496109009e-05, -1.2181699275970459e-05, -1.130625605583191e-05, -1.043081283569336e-05, -9.55536961555481e-06, -8.67992639541626e-06, -7.80448317527771e-06, -6.92903995513916e-06, -6.05359673500061e-06, -5.1781535148620605e-06, -4.302710294723511e-06, -3.427267074584961e-06, -2.551823854446411e-06, -1.6763806343078613e-06, -8.009374141693115e-07, 7.450580596923828e-08, 9.499490261077881e-07, 1.8253922462463379e-06, 2.7008354663848877e-06, 3.5762786865234375e-06, 4.451721906661987e-06, 5.327165126800537e-06, 6.202608346939087e-06, 7.078051567077637e-06, 7.953494787216187e-06, 8.828938007354736e-06, 9.704381227493286e-06, 1.0579824447631836e-05, 1.1455267667770386e-05, 1.2330710887908936e-05, 1.3206154108047485e-05, 1.4081597328186035e-05, 1.4957040548324585e-05, 1.5832483768463135e-05, 1.6707926988601685e-05, 1.7583370208740234e-05, 1.8458813428878784e-05, 1.9334256649017334e-05, 2.0209699869155884e-05, 2.1085143089294434e-05, 2.1960586309432983e-05, 2.2836029529571533e-05, 2.3711472749710083e-05, 2.4586915969848633e-05, 2.5462359189987183e-05, 2.6337802410125732e-05, 2.7213245630264282e-05, 2.8088688850402832e-05, 2.8964132070541382e-05, 2.983957529067993e-05, 3.071501851081848e-05, 3.159046173095703e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 6.0, 10.0, 18.0, 20.0, 20.0, 32.0, 49.0, 71.0, 78.0, 125.0, 180.0, 240.0, 393.0, 579.0, 881.0, 1444.0, 2592.0, 4776.0, 9660.0, 21028.0, 51899.0, 144398.0, 393558.0, 262856.0, 88696.0, 34437.0, 14592.0, 6892.0, 3591.0, 1986.0, 1163.0, 737.0, 474.0, 320.0, 226.0, 136.0, 117.0, 78.0, 47.0, 42.0, 27.0, 18.0, 14.0, 12.0, 8.0, 3.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.2578125, -0.24915313720703125, -0.2404937744140625, -0.23183441162109375, -0.223175048828125, -0.21451568603515625, -0.2058563232421875, -0.19719696044921875, -0.18853759765625, -0.17987823486328125, -0.1712188720703125, -0.16255950927734375, -0.153900146484375, -0.14524078369140625, -0.1365814208984375, -0.12792205810546875, -0.1192626953125, -0.11060333251953125, -0.1019439697265625, -0.09328460693359375, -0.084625244140625, -0.07596588134765625, -0.0673065185546875, -0.05864715576171875, -0.04998779296875, -0.04132843017578125, -0.0326690673828125, -0.02400970458984375, -0.015350341796875, -0.00669097900390625, 0.0019683837890625, 0.01062774658203125, 0.019287109375, 0.02794647216796875, 0.0366058349609375, 0.04526519775390625, 0.053924560546875, 0.06258392333984375, 0.0712432861328125, 0.07990264892578125, 0.08856201171875, 0.09722137451171875, 0.1058807373046875, 0.11454010009765625, 0.123199462890625, 0.13185882568359375, 0.1405181884765625, 0.14917755126953125, 0.1578369140625, 0.16649627685546875, 0.1751556396484375, 0.18381500244140625, 0.192474365234375, 0.20113372802734375, 0.2097930908203125, 0.21845245361328125, 0.22711181640625, 0.23577117919921875, 0.2444305419921875, 0.25308990478515625, 0.261749267578125, 0.27040863037109375, 0.2790679931640625, 0.28772735595703125, 0.29638671875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 12.0, 7.0, 13.0, 24.0, 18.0, 40.0, 69.0, 78.0, 117.0, 112.0, 122.0, 100.0, 90.0, 51.0, 39.0, 27.0, 19.0, 20.0, 11.0, 5.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10968017578125, -0.1057577133178711, -0.10183525085449219, -0.09791278839111328, -0.09399032592773438, -0.09006786346435547, -0.08614540100097656, -0.08222293853759766, -0.07830047607421875, -0.07437801361083984, -0.07045555114746094, -0.06653308868408203, -0.06261062622070312, -0.05868816375732422, -0.05476570129394531, -0.050843238830566406, -0.0469207763671875, -0.042998313903808594, -0.03907585144042969, -0.03515338897705078, -0.031230926513671875, -0.02730846405029297, -0.023386001586914062, -0.019463539123535156, -0.01554107666015625, -0.011618614196777344, -0.0076961517333984375, -0.0037736892700195312, 0.000148773193359375, 0.004071235656738281, 0.007993698120117188, 0.011916160583496094, 0.015838623046875, 0.019761085510253906, 0.023683547973632812, 0.02760601043701172, 0.031528472900390625, 0.03545093536376953, 0.03937339782714844, 0.043295860290527344, 0.04721832275390625, 0.051140785217285156, 0.05506324768066406, 0.05898571014404297, 0.06290817260742188, 0.06683063507080078, 0.07075309753417969, 0.0746755599975586, 0.0785980224609375, 0.0825204849243164, 0.08644294738769531, 0.09036540985107422, 0.09428787231445312, 0.09821033477783203, 0.10213279724121094, 0.10605525970458984, 0.10997772216796875, 0.11390018463134766, 0.11782264709472656, 0.12174510955810547, 0.12566757202148438, 0.12959003448486328, 0.1335124969482422, 0.1374349594116211, 0.141357421875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 11.0, 11.0, 10.0, 14.0, 20.0, 16.0, 26.0, 19.0, 34.0, 41.0, 39.0, 46.0, 73.0, 60.0, 63.0, 58.0, 53.0, 58.0, 44.0, 52.0, 43.0, 38.0, 33.0, 24.0, 19.0, 20.0, 15.0, 7.0, 11.0, 10.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.984786987304688, -9.644575119018555, -9.304364204406738, -8.964152336120605, -8.623940467834473, -8.283729553222656, -7.943517684936523, -7.603305816650391, -7.263094425201416, -6.922883033752441, -6.582671165466309, -6.242459774017334, -5.902248382568359, -5.562036514282227, -5.221825122833252, -4.881613731384277, -4.5414018630981445, -4.20119047164917, -3.860978603363037, -3.5207672119140625, -3.180555582046509, -2.840343952178955, -2.5001325607299805, -2.1599209308624268, -1.819709300994873, -1.4794976711273193, -1.1392861604690552, -0.799074649810791, -0.4588630199432373, -0.1186513900756836, 0.22156000137329102, 0.5617716312408447, 0.9019832611083984, 1.2421948909759521, 1.5824064016342163, 1.9226179122924805, 2.262829542160034, 2.603041172027588, 2.9432525634765625, 3.283464193344116, 3.62367582321167, 3.9638874530792236, 4.304099082946777, 4.644310474395752, 4.984521865844727, 5.324733734130859, 5.664945125579834, 6.005156517028809, 6.345368385314941, 6.685579776763916, 7.025791645050049, 7.366003036499023, 7.706214904785156, 8.046426773071289, 8.386637687683105, 8.726849555969238, 9.067060470581055, 9.407272338867188, 9.747483253479004, 10.087695121765137, 10.42790699005127, 10.768117904663086, 11.108329772949219, 11.448541641235352, 11.788753509521484]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 13.0, 8.0, 13.0, 17.0, 20.0, 18.0, 22.0, 21.0, 16.0, 21.0, 30.0, 32.0, 34.0, 39.0, 46.0, 32.0, 46.0, 39.0, 40.0, 29.0, 42.0, 46.0, 42.0, 32.0, 32.0, 33.0, 34.0, 30.0, 25.0, 20.0, 23.0, 21.0, 18.0, 5.0, 12.0, 11.0, 7.0, 6.0, 5.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.070302963256836, -9.749284744262695, -9.428267478942871, -9.107250213623047, -8.786231994628906, -8.465213775634766, -8.144196510314941, -7.823178768157959, -7.502161026000977, -7.181143283843994, -6.860125541687012, -6.539107799530029, -6.218090057373047, -5.8970723152160645, -5.576054573059082, -5.2550368309021, -4.934019088745117, -4.613001346588135, -4.291983604431152, -3.97096586227417, -3.6499481201171875, -3.328930377960205, -3.0079126358032227, -2.6868948936462402, -2.365877151489258, -2.0448594093322754, -1.723841667175293, -1.4028239250183105, -1.0818061828613281, -0.7607884407043457, -0.4397706985473633, -0.11875295639038086, 0.20226573944091797, 0.5232834815979004, 0.8443012237548828, 1.1653189659118652, 1.4863367080688477, 1.80735445022583, 2.1283721923828125, 2.449389934539795, 2.7704076766967773, 3.0914254188537598, 3.412443161010742, 3.7334609031677246, 4.054478645324707, 4.3754963874816895, 4.696514129638672, 5.017531871795654, 5.338549613952637, 5.659567356109619, 5.980585098266602, 6.301602840423584, 6.622620582580566, 6.943638324737549, 7.264656066894531, 7.585673809051514, 7.906691551208496, 8.22770881652832, 8.548727035522461, 8.869745254516602, 9.190762519836426, 9.51177978515625, 9.83279800415039, 10.153816223144531, 10.474833488464355]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 7.0, 15.0, 12.0, 25.0, 39.0, 76.0, 119.0, 133.0, 210.0, 337.0, 512.0, 824.0, 1184.0, 1827.0, 2694.0, 4337.0, 6604.0, 10200.0, 15775.0, 23879.0, 35354.0, 52297.0, 73199.0, 95805.0, 115655.0, 126066.0, 120524.0, 102585.0, 80591.0, 58682.0, 40287.0, 26986.0, 17970.0, 11959.0, 7625.0, 4953.0, 3171.0, 2096.0, 1384.0, 844.0, 573.0, 423.0, 244.0, 158.0, 128.0, 56.0, 55.0, 30.0, 27.0, 14.0, 4.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.98388671875, -4.8037109375, -4.62353515625, -4.443359375, -4.26318359375, -4.0830078125, -3.90283203125, -3.72265625, -3.54248046875, -3.3623046875, -3.18212890625, -3.001953125, -2.82177734375, -2.6416015625, -2.46142578125, -2.28125, -2.10107421875, -1.9208984375, -1.74072265625, -1.560546875, -1.38037109375, -1.2001953125, -1.02001953125, -0.83984375, -0.65966796875, -0.4794921875, -0.29931640625, -0.119140625, 0.06103515625, 0.2412109375, 0.42138671875, 0.6015625, 0.78173828125, 0.9619140625, 1.14208984375, 1.322265625, 1.50244140625, 1.6826171875, 1.86279296875, 2.04296875, 2.22314453125, 2.4033203125, 2.58349609375, 2.763671875, 2.94384765625, 3.1240234375, 3.30419921875, 3.484375, 3.66455078125, 3.8447265625, 4.02490234375, 4.205078125, 4.38525390625, 4.5654296875, 4.74560546875, 4.92578125, 5.10595703125, 5.2861328125, 5.46630859375, 5.646484375, 5.82666015625, 6.0068359375, 6.18701171875, 6.3671875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 7.0, 4.0, 13.0, 11.0, 15.0, 12.0, 18.0, 18.0, 21.0, 19.0, 24.0, 30.0, 27.0, 30.0, 36.0, 28.0, 48.0, 36.0, 48.0, 31.0, 46.0, 39.0, 40.0, 39.0, 29.0, 36.0, 39.0, 36.0, 33.0, 25.0, 26.0, 24.0, 23.0, 18.0, 12.0, 9.0, 16.0, 7.0, 7.0, 4.0, 2.0, 4.0, 5.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.0390625, -9.716552734375, -9.39404296875, -9.071533203125, -8.7490234375, -8.426513671875, -8.10400390625, -7.781494140625, -7.458984375, -7.136474609375, -6.81396484375, -6.491455078125, -6.1689453125, -5.846435546875, -5.52392578125, -5.201416015625, -4.87890625, -4.556396484375, -4.23388671875, -3.911376953125, -3.5888671875, -3.266357421875, -2.94384765625, -2.621337890625, -2.298828125, -1.976318359375, -1.65380859375, -1.331298828125, -1.0087890625, -0.686279296875, -0.36376953125, -0.041259765625, 0.28125, 0.603759765625, 0.92626953125, 1.248779296875, 1.5712890625, 1.893798828125, 2.21630859375, 2.538818359375, 2.861328125, 3.183837890625, 3.50634765625, 3.828857421875, 4.1513671875, 4.473876953125, 4.79638671875, 5.118896484375, 5.44140625, 5.763916015625, 6.08642578125, 6.408935546875, 6.7314453125, 7.053955078125, 7.37646484375, 7.698974609375, 8.021484375, 8.343994140625, 8.66650390625, 8.989013671875, 9.3115234375, 9.634033203125, 9.95654296875, 10.279052734375, 10.6015625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 15.0, 16.0, 37.0, 75.0, 87.0, 143.0, 210.0, 345.0, 514.0, 746.0, 1257.0, 1920.0, 2876.0, 4468.0, 6896.0, 10716.0, 15852.0, 24127.0, 35147.0, 49450.0, 68228.0, 88282.0, 105981.0, 115614.0, 114453.0, 103112.0, 85061.0, 65640.0, 47684.0, 33620.0, 22649.0, 15088.0, 9895.0, 6412.0, 4169.0, 2771.0, 1715.0, 1162.0, 779.0, 483.0, 282.0, 210.0, 124.0, 90.0, 61.0, 34.0, 12.0, 16.0, 10.0, 6.0, 2.0, 1.0, 2.0], "bins": [-5.98828125, -5.81683349609375, -5.6453857421875, -5.47393798828125, -5.302490234375, -5.13104248046875, -4.9595947265625, -4.78814697265625, -4.61669921875, -4.44525146484375, -4.2738037109375, -4.10235595703125, -3.930908203125, -3.75946044921875, -3.5880126953125, -3.41656494140625, -3.2451171875, -3.07366943359375, -2.9022216796875, -2.73077392578125, -2.559326171875, -2.38787841796875, -2.2164306640625, -2.04498291015625, -1.87353515625, -1.70208740234375, -1.5306396484375, -1.35919189453125, -1.187744140625, -1.01629638671875, -0.8448486328125, -0.67340087890625, -0.501953125, -0.33050537109375, -0.1590576171875, 0.01239013671875, 0.183837890625, 0.35528564453125, 0.5267333984375, 0.69818115234375, 0.86962890625, 1.04107666015625, 1.2125244140625, 1.38397216796875, 1.555419921875, 1.72686767578125, 1.8983154296875, 2.06976318359375, 2.2412109375, 2.41265869140625, 2.5841064453125, 2.75555419921875, 2.927001953125, 3.09844970703125, 3.2698974609375, 3.44134521484375, 3.61279296875, 3.78424072265625, 3.9556884765625, 4.12713623046875, 4.298583984375, 4.47003173828125, 4.6414794921875, 4.81292724609375, 4.984375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 7.0, 2.0, 4.0, 11.0, 13.0, 7.0, 7.0, 16.0, 19.0, 12.0, 23.0, 22.0, 34.0, 25.0, 26.0, 32.0, 34.0, 33.0, 38.0, 40.0, 46.0, 37.0, 33.0, 40.0, 41.0, 29.0, 31.0, 26.0, 40.0, 36.0, 23.0, 27.0, 36.0, 20.0, 18.0, 16.0, 14.0, 8.0, 11.0, 16.0, 10.0, 7.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.8515625, -5.67041015625, -5.4892578125, -5.30810546875, -5.126953125, -4.94580078125, -4.7646484375, -4.58349609375, -4.40234375, -4.22119140625, -4.0400390625, -3.85888671875, -3.677734375, -3.49658203125, -3.3154296875, -3.13427734375, -2.953125, -2.77197265625, -2.5908203125, -2.40966796875, -2.228515625, -2.04736328125, -1.8662109375, -1.68505859375, -1.50390625, -1.32275390625, -1.1416015625, -0.96044921875, -0.779296875, -0.59814453125, -0.4169921875, -0.23583984375, -0.0546875, 0.12646484375, 0.3076171875, 0.48876953125, 0.669921875, 0.85107421875, 1.0322265625, 1.21337890625, 1.39453125, 1.57568359375, 1.7568359375, 1.93798828125, 2.119140625, 2.30029296875, 2.4814453125, 2.66259765625, 2.84375, 3.02490234375, 3.2060546875, 3.38720703125, 3.568359375, 3.74951171875, 3.9306640625, 4.11181640625, 4.29296875, 4.47412109375, 4.6552734375, 4.83642578125, 5.017578125, 5.19873046875, 5.3798828125, 5.56103515625, 5.7421875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 9.0, 17.0, 32.0, 29.0, 52.0, 84.0, 106.0, 162.0, 249.0, 385.0, 589.0, 892.0, 1461.0, 2102.0, 3448.0, 5587.0, 8938.0, 14759.0, 23809.0, 37422.0, 58098.0, 85968.0, 117471.0, 140557.0, 144778.0, 125681.0, 95371.0, 65418.0, 43061.0, 27105.0, 16789.0, 10467.0, 6585.0, 4057.0, 2562.0, 1576.0, 1024.0, 631.0, 425.0, 272.0, 181.0, 120.0, 80.0, 52.0, 33.0, 25.0, 12.0, 5.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-2.330078125, -2.257598876953125, -2.18511962890625, -2.112640380859375, -2.0401611328125, -1.967681884765625, -1.89520263671875, -1.822723388671875, -1.750244140625, -1.677764892578125, -1.60528564453125, -1.532806396484375, -1.4603271484375, -1.387847900390625, -1.31536865234375, -1.242889404296875, -1.17041015625, -1.097930908203125, -1.02545166015625, -0.952972412109375, -0.8804931640625, -0.808013916015625, -0.73553466796875, -0.663055419921875, -0.590576171875, -0.518096923828125, -0.44561767578125, -0.373138427734375, -0.3006591796875, -0.228179931640625, -0.15570068359375, -0.083221435546875, -0.0107421875, 0.061737060546875, 0.13421630859375, 0.206695556640625, 0.2791748046875, 0.351654052734375, 0.42413330078125, 0.496612548828125, 0.569091796875, 0.641571044921875, 0.71405029296875, 0.786529541015625, 0.8590087890625, 0.931488037109375, 1.00396728515625, 1.076446533203125, 1.14892578125, 1.221405029296875, 1.29388427734375, 1.366363525390625, 1.4388427734375, 1.511322021484375, 1.58380126953125, 1.656280517578125, 1.728759765625, 1.801239013671875, 1.87371826171875, 1.946197509765625, 2.0186767578125, 2.091156005859375, 2.16363525390625, 2.236114501953125, 2.30859375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 1.0, 9.0, 6.0, 12.0, 10.0, 14.0, 14.0, 20.0, 27.0, 27.0, 38.0, 30.0, 26.0, 53.0, 33.0, 49.0, 46.0, 55.0, 56.0, 52.0, 61.0, 45.0, 42.0, 40.0, 31.0, 36.0, 42.0, 27.0, 21.0, 13.0, 24.0, 11.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00022900104522705078, -0.00022259168326854706, -0.00021618232131004333, -0.0002097729593515396, -0.0002033635973930359, -0.00019695423543453217, -0.00019054487347602844, -0.00018413551151752472, -0.000177726149559021, -0.00017131678760051727, -0.00016490742564201355, -0.00015849806368350983, -0.0001520887017250061, -0.00014567933976650238, -0.00013926997780799866, -0.00013286061584949493, -0.0001264512538909912, -0.00012004189193248749, -0.00011363252997398376, -0.00010722316801548004, -0.00010081380605697632, -9.44044440984726e-05, -8.799508213996887e-05, -8.158572018146515e-05, -7.517635822296143e-05, -6.87669962644577e-05, -6.235763430595398e-05, -5.5948272347450256e-05, -4.953891038894653e-05, -4.312954843044281e-05, -3.672018647193909e-05, -3.0310824513435364e-05, -2.390146255493164e-05, -1.7492100596427917e-05, -1.1082738637924194e-05, -4.673376679420471e-06, 1.735985279083252e-06, 8.145347237586975e-06, 1.4554709196090698e-05, 2.096407115459442e-05, 2.7373433113098145e-05, 3.378279507160187e-05, 4.019215703010559e-05, 4.6601518988609314e-05, 5.301088094711304e-05, 5.942024290561676e-05, 6.582960486412048e-05, 7.22389668226242e-05, 7.864832878112793e-05, 8.505769073963165e-05, 9.146705269813538e-05, 9.78764146566391e-05, 0.00010428577661514282, 0.00011069513857364655, 0.00011710450053215027, 0.000123513862490654, 0.00012992322444915771, 0.00013633258640766144, 0.00014274194836616516, 0.00014915131032466888, 0.0001555606722831726, 0.00016197003424167633, 0.00016837939620018005, 0.00017478875815868378, 0.0001811981201171875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 13.0, 9.0, 10.0, 16.0, 23.0, 26.0, 42.0, 66.0, 109.0, 160.0, 251.0, 396.0, 640.0, 1035.0, 1636.0, 2491.0, 4205.0, 6747.0, 11027.0, 18128.0, 29057.0, 46806.0, 71922.0, 103628.0, 134148.0, 149248.0, 139296.0, 111325.0, 78935.0, 52234.0, 32319.0, 20133.0, 12554.0, 7399.0, 4702.0, 2877.0, 1801.0, 1159.0, 666.0, 445.0, 302.0, 194.0, 118.0, 96.0, 61.0, 31.0, 23.0, 26.0, 7.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3125, -2.236968994140625, -2.16143798828125, -2.085906982421875, -2.0103759765625, -1.934844970703125, -1.85931396484375, -1.783782958984375, -1.708251953125, -1.632720947265625, -1.55718994140625, -1.481658935546875, -1.4061279296875, -1.330596923828125, -1.25506591796875, -1.179534912109375, -1.10400390625, -1.028472900390625, -0.95294189453125, -0.877410888671875, -0.8018798828125, -0.726348876953125, -0.65081787109375, -0.575286865234375, -0.499755859375, -0.424224853515625, -0.34869384765625, -0.273162841796875, -0.1976318359375, -0.122100830078125, -0.04656982421875, 0.028961181640625, 0.1044921875, 0.180023193359375, 0.25555419921875, 0.331085205078125, 0.4066162109375, 0.482147216796875, 0.55767822265625, 0.633209228515625, 0.708740234375, 0.784271240234375, 0.85980224609375, 0.935333251953125, 1.0108642578125, 1.086395263671875, 1.16192626953125, 1.237457275390625, 1.31298828125, 1.388519287109375, 1.46405029296875, 1.539581298828125, 1.6151123046875, 1.690643310546875, 1.76617431640625, 1.841705322265625, 1.917236328125, 1.992767333984375, 2.06829833984375, 2.143829345703125, 2.2193603515625, 2.294891357421875, 2.37042236328125, 2.445953369140625, 2.521484375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 3.0, 5.0, 11.0, 4.0, 12.0, 18.0, 10.0, 30.0, 22.0, 28.0, 39.0, 32.0, 29.0, 37.0, 35.0, 54.0, 40.0, 45.0, 41.0, 48.0, 42.0, 46.0, 44.0, 40.0, 39.0, 39.0, 31.0, 19.0, 25.0, 14.0, 20.0, 19.0, 15.0, 8.0, 10.0, 11.0, 5.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8673553466796875, -0.841644287109375, -0.8159332275390625, -0.79022216796875, -0.7645111083984375, -0.738800048828125, -0.7130889892578125, -0.6873779296875, -0.6616668701171875, -0.635955810546875, -0.6102447509765625, -0.58453369140625, -0.5588226318359375, -0.533111572265625, -0.5074005126953125, -0.481689453125, -0.4559783935546875, -0.430267333984375, -0.4045562744140625, -0.37884521484375, -0.3531341552734375, -0.327423095703125, -0.3017120361328125, -0.2760009765625, -0.2502899169921875, -0.224578857421875, -0.1988677978515625, -0.17315673828125, -0.1474456787109375, -0.121734619140625, -0.0960235595703125, -0.0703125, -0.0446014404296875, -0.018890380859375, 0.0068206787109375, 0.03253173828125, 0.0582427978515625, 0.083953857421875, 0.1096649169921875, 0.1353759765625, 0.1610870361328125, 0.186798095703125, 0.2125091552734375, 0.23822021484375, 0.2639312744140625, 0.289642333984375, 0.3153533935546875, 0.341064453125, 0.3667755126953125, 0.392486572265625, 0.4181976318359375, 0.44390869140625, 0.4696197509765625, 0.495330810546875, 0.5210418701171875, 0.5467529296875, 0.5724639892578125, 0.598175048828125, 0.6238861083984375, 0.64959716796875, 0.6753082275390625, 0.701019287109375, 0.7267303466796875, 0.75244140625]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 5.0, 7.0, 7.0, 8.0, 9.0, 14.0, 13.0, 23.0, 22.0, 24.0, 27.0, 34.0, 32.0, 52.0, 51.0, 43.0, 56.0, 55.0, 41.0, 55.0, 48.0, 37.0, 37.0, 34.0, 28.0, 39.0, 34.0, 30.0, 19.0, 12.0, 12.0, 17.0, 12.0, 16.0, 6.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.205920219421387, -7.918777942657471, -7.631636142730713, -7.344493865966797, -7.057351589202881, -6.770209312438965, -6.483067512512207, -6.195925235748291, -5.908782958984375, -5.621640682220459, -5.334498882293701, -5.047356605529785, -4.760214328765869, -4.473072052001953, -4.185930252075195, -3.8987879753112793, -3.6116461753845215, -3.3245041370391846, -3.0373618602752686, -2.7502198219299316, -2.4630775451660156, -2.1759355068206787, -1.8887934684753418, -1.6016511917114258, -1.3145091533660889, -1.0273669958114624, -0.7402248978614807, -0.453082799911499, -0.16594064235687256, 0.1212015151977539, 0.4083435535430908, 0.6954858303070068, 0.9826278686523438, 1.2697700262069702, 1.5569121837615967, 1.8440542221069336, 2.1311964988708496, 2.4183385372161865, 2.7054805755615234, 2.9926228523254395, 3.2797648906707764, 3.5669069290161133, 3.8540492057800293, 4.141191482543945, 4.428333282470703, 4.715475559234619, 5.002617835998535, 5.289759635925293, 5.576901912689209, 5.864044189453125, 6.151185989379883, 6.438328266143799, 6.725470542907715, 7.012612342834473, 7.299754619598389, 7.586896896362305, 7.8740386962890625, 8.16118049621582, 8.448323249816895, 8.735465049743652, 9.02260684967041, 9.309749603271484, 9.596891403198242, 9.884033203125, 10.171175956726074]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 12.0, 10.0, 7.0, 10.0, 13.0, 15.0, 14.0, 11.0, 20.0, 27.0, 39.0, 34.0, 26.0, 37.0, 34.0, 40.0, 53.0, 46.0, 33.0, 38.0, 40.0, 36.0, 45.0, 35.0, 40.0, 28.0, 39.0, 35.0, 21.0, 21.0, 19.0, 23.0, 17.0, 12.0, 14.0, 10.0, 10.0, 3.0, 4.0, 8.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.337403297424316, -9.99757194519043, -9.657740592956543, -9.317909240722656, -8.978078842163086, -8.6382474899292, -8.298416137695312, -7.958584785461426, -7.618753910064697, -7.2789225578308105, -6.939091682434082, -6.599260330200195, -6.259428977966309, -5.91959810256958, -5.579766750335693, -5.239935874938965, -4.900104522705078, -4.560273170471191, -4.220442295074463, -3.880610942840576, -3.5407798290252686, -3.200948715209961, -2.861117362976074, -2.5212862491607666, -2.181455135345459, -1.8416240215301514, -1.5017927885055542, -1.161961555480957, -0.8221304416656494, -0.4822993278503418, -0.14246797561645508, 0.19736313819885254, 0.5371952056884766, 0.877026379108429, 1.2168575525283813, 1.5566887855529785, 1.8965198993682861, 2.2363510131835938, 2.5761823654174805, 2.916013479232788, 3.2558445930480957, 3.5956757068634033, 3.935506820678711, 4.275338172912598, 4.615169525146484, 4.955000400543213, 5.2948317527771, 5.634662628173828, 5.974493980407715, 6.314325332641602, 6.65415620803833, 6.993987560272217, 7.333818435668945, 7.673649787902832, 8.013481140136719, 8.353312492370605, 8.693143844604492, 9.032975196838379, 9.372806549072266, 9.712636947631836, 10.052468299865723, 10.39229965209961, 10.732131004333496, 11.071962356567383, 11.411792755126953]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 14.0, 16.0, 44.0, 39.0, 72.0, 107.0, 204.0, 309.0, 456.0, 778.0, 1371.0, 2240.0, 3680.0, 6560.0, 11261.0, 19922.0, 35711.0, 63602.0, 112842.0, 199783.0, 336536.0, 528159.0, 702170.0, 723044.0, 568486.0, 372019.0, 220660.0, 124580.0, 69275.0, 38762.0, 21869.0, 12194.0, 7060.0, 4195.0, 2389.0, 1434.0, 927.0, 556.0, 331.0, 235.0, 138.0, 89.0, 60.0, 36.0, 16.0, 18.0, 12.0, 5.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0], "bins": [-10.0546875, -9.7508544921875, -9.447021484375, -9.1431884765625, -8.83935546875, -8.5355224609375, -8.231689453125, -7.9278564453125, -7.6240234375, -7.3201904296875, -7.016357421875, -6.7125244140625, -6.40869140625, -6.1048583984375, -5.801025390625, -5.4971923828125, -5.193359375, -4.8895263671875, -4.585693359375, -4.2818603515625, -3.97802734375, -3.6741943359375, -3.370361328125, -3.0665283203125, -2.7626953125, -2.4588623046875, -2.155029296875, -1.8511962890625, -1.54736328125, -1.2435302734375, -0.939697265625, -0.6358642578125, -0.33203125, -0.0281982421875, 0.275634765625, 0.5794677734375, 0.88330078125, 1.1871337890625, 1.490966796875, 1.7947998046875, 2.0986328125, 2.4024658203125, 2.706298828125, 3.0101318359375, 3.31396484375, 3.6177978515625, 3.921630859375, 4.2254638671875, 4.529296875, 4.8331298828125, 5.136962890625, 5.4407958984375, 5.74462890625, 6.0484619140625, 6.352294921875, 6.6561279296875, 6.9599609375, 7.2637939453125, 7.567626953125, 7.8714599609375, 8.17529296875, 8.4791259765625, 8.782958984375, 9.0867919921875, 9.390625]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 9.0, 9.0, 10.0, 10.0, 9.0, 15.0, 15.0, 15.0, 16.0, 14.0, 35.0, 31.0, 34.0, 38.0, 37.0, 39.0, 49.0, 36.0, 47.0, 37.0, 27.0, 41.0, 41.0, 31.0, 40.0, 40.0, 37.0, 26.0, 40.0, 25.0, 26.0, 24.0, 13.0, 15.0, 9.0, 15.0, 6.0, 11.0, 9.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.171875, -7.90673828125, -7.6416015625, -7.37646484375, -7.111328125, -6.84619140625, -6.5810546875, -6.31591796875, -6.05078125, -5.78564453125, -5.5205078125, -5.25537109375, -4.990234375, -4.72509765625, -4.4599609375, -4.19482421875, -3.9296875, -3.66455078125, -3.3994140625, -3.13427734375, -2.869140625, -2.60400390625, -2.3388671875, -2.07373046875, -1.80859375, -1.54345703125, -1.2783203125, -1.01318359375, -0.748046875, -0.48291015625, -0.2177734375, 0.04736328125, 0.3125, 0.57763671875, 0.8427734375, 1.10791015625, 1.373046875, 1.63818359375, 1.9033203125, 2.16845703125, 2.43359375, 2.69873046875, 2.9638671875, 3.22900390625, 3.494140625, 3.75927734375, 4.0244140625, 4.28955078125, 4.5546875, 4.81982421875, 5.0849609375, 5.35009765625, 5.615234375, 5.88037109375, 6.1455078125, 6.41064453125, 6.67578125, 6.94091796875, 7.2060546875, 7.47119140625, 7.736328125, 8.00146484375, 8.2666015625, 8.53173828125, 8.796875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 12.0, 18.0, 35.0, 44.0, 95.0, 173.0, 244.0, 446.0, 714.0, 1154.0, 2053.0, 3526.0, 6060.0, 10207.0, 17986.0, 30780.0, 52435.0, 88357.0, 144845.0, 227874.0, 337485.0, 460291.0, 556429.0, 580489.0, 517303.0, 403822.0, 283068.0, 186243.0, 114320.0, 69657.0, 41267.0, 23927.0, 13667.0, 7998.0, 4640.0, 2675.0, 1542.0, 928.0, 569.0, 356.0, 199.0, 124.0, 79.0, 49.0, 34.0, 22.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.1796875, -7.909423828125, -7.63916015625, -7.368896484375, -7.0986328125, -6.828369140625, -6.55810546875, -6.287841796875, -6.017578125, -5.747314453125, -5.47705078125, -5.206787109375, -4.9365234375, -4.666259765625, -4.39599609375, -4.125732421875, -3.85546875, -3.585205078125, -3.31494140625, -3.044677734375, -2.7744140625, -2.504150390625, -2.23388671875, -1.963623046875, -1.693359375, -1.423095703125, -1.15283203125, -0.882568359375, -0.6123046875, -0.342041015625, -0.07177734375, 0.198486328125, 0.46875, 0.739013671875, 1.00927734375, 1.279541015625, 1.5498046875, 1.820068359375, 2.09033203125, 2.360595703125, 2.630859375, 2.901123046875, 3.17138671875, 3.441650390625, 3.7119140625, 3.982177734375, 4.25244140625, 4.522705078125, 4.79296875, 5.063232421875, 5.33349609375, 5.603759765625, 5.8740234375, 6.144287109375, 6.41455078125, 6.684814453125, 6.955078125, 7.225341796875, 7.49560546875, 7.765869140625, 8.0361328125, 8.306396484375, 8.57666015625, 8.846923828125, 9.1171875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 12.0, 16.0, 14.0, 25.0, 27.0, 27.0, 36.0, 61.0, 60.0, 60.0, 80.0, 88.0, 104.0, 140.0, 157.0, 174.0, 143.0, 202.0, 182.0, 183.0, 177.0, 204.0, 211.0, 190.0, 178.0, 151.0, 174.0, 120.0, 104.0, 97.0, 98.0, 87.0, 73.0, 67.0, 61.0, 52.0, 43.0, 35.0, 30.0, 36.0, 18.0, 14.0, 11.0, 8.0, 8.0, 5.0, 4.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.53515625, -3.41497802734375, -3.2947998046875, -3.17462158203125, -3.054443359375, -2.93426513671875, -2.8140869140625, -2.69390869140625, -2.57373046875, -2.45355224609375, -2.3333740234375, -2.21319580078125, -2.093017578125, -1.97283935546875, -1.8526611328125, -1.73248291015625, -1.6123046875, -1.49212646484375, -1.3719482421875, -1.25177001953125, -1.131591796875, -1.01141357421875, -0.8912353515625, -0.77105712890625, -0.65087890625, -0.53070068359375, -0.4105224609375, -0.29034423828125, -0.170166015625, -0.04998779296875, 0.0701904296875, 0.19036865234375, 0.310546875, 0.43072509765625, 0.5509033203125, 0.67108154296875, 0.791259765625, 0.91143798828125, 1.0316162109375, 1.15179443359375, 1.27197265625, 1.39215087890625, 1.5123291015625, 1.63250732421875, 1.752685546875, 1.87286376953125, 1.9930419921875, 2.11322021484375, 2.2333984375, 2.35357666015625, 2.4737548828125, 2.59393310546875, 2.714111328125, 2.83428955078125, 2.9544677734375, 3.07464599609375, 3.19482421875, 3.31500244140625, 3.4351806640625, 3.55535888671875, 3.675537109375, 3.79571533203125, 3.9158935546875, 4.03607177734375, 4.15625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 9.0, 5.0, 7.0, 6.0, 7.0, 11.0, 9.0, 17.0, 15.0, 21.0, 22.0, 38.0, 41.0, 33.0, 46.0, 40.0, 47.0, 51.0, 49.0, 42.0, 52.0, 41.0, 43.0, 42.0, 50.0, 32.0, 37.0, 22.0, 24.0, 21.0, 23.0, 13.0, 12.0, 18.0, 14.0, 14.0, 5.0, 5.0, 5.0, 4.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.852096557617188, -9.52309799194336, -9.194098472595215, -8.865099906921387, -8.536100387573242, -8.207101821899414, -7.878103256225586, -7.5491042137146, -7.220105171203613, -6.891106128692627, -6.562107086181641, -6.2331085205078125, -5.904109477996826, -5.57511043548584, -5.246111869812012, -4.917112827301025, -4.588113784790039, -4.259114742279053, -3.9301159381866455, -3.6011171340942383, -3.272118091583252, -2.9431190490722656, -2.6141202449798584, -2.285121440887451, -1.9561223983764648, -1.627123475074768, -1.2981245517730713, -0.9691256284713745, -0.6401267051696777, -0.31112778186798096, 0.01787114143371582, 0.34686994552612305, 0.675868034362793, 1.0048669576644897, 1.3338658809661865, 1.6628648042678833, 1.99186372756958, 2.3208627700805664, 2.6498615741729736, 2.978860378265381, 3.307859420776367, 3.6368584632873535, 3.9658572673797607, 4.294856071472168, 4.623855113983154, 4.952854156494141, 5.281852722167969, 5.610851764678955, 5.939850807189941, 6.268849849700928, 6.597848892211914, 6.926847457885742, 7.2558465003967285, 7.584845542907715, 7.913844108581543, 8.242843627929688, 8.571842193603516, 8.900840759277344, 9.229840278625488, 9.558838844299316, 9.887838363647461, 10.216836929321289, 10.545835494995117, 10.874834060668945, 11.20383358001709]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 8.0, 6.0, 6.0, 9.0, 6.0, 13.0, 16.0, 17.0, 15.0, 18.0, 27.0, 20.0, 28.0, 27.0, 27.0, 33.0, 37.0, 46.0, 32.0, 41.0, 37.0, 34.0, 42.0, 41.0, 33.0, 46.0, 40.0, 39.0, 29.0, 34.0, 24.0, 19.0, 26.0, 26.0, 21.0, 10.0, 17.0, 9.0, 6.0, 14.0, 4.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.876531600952148, -10.519359588623047, -10.162187576293945, -9.805015563964844, -9.447843551635742, -9.09067153930664, -8.733499526977539, -8.376327514648438, -8.019155502319336, -7.661983489990234, -7.304811477661133, -6.947639465332031, -6.59046745300293, -6.233295440673828, -5.876123905181885, -5.518951892852783, -5.16178035736084, -4.804608345031738, -4.447436332702637, -4.090264320373535, -3.7330925464630127, -3.375920534133911, -3.0187487602233887, -2.661576747894287, -2.3044047355651855, -1.947232723236084, -1.590060830116272, -1.23288893699646, -0.8757169246673584, -0.5185449123382568, -0.16137313842773438, 0.1957988739013672, 0.5529708862304688, 0.9101428389549255, 1.2673147916793823, 1.6244866847991943, 1.981658697128296, 2.3388307094573975, 2.69600248336792, 3.0531744956970215, 3.410346508026123, 3.7675185203552246, 4.124690532684326, 4.4818620681762695, 4.839034080505371, 5.196206092834473, 5.553378105163574, 5.910550117492676, 6.267722129821777, 6.624894142150879, 6.9820661544799805, 7.339238166809082, 7.696410179138184, 8.053582191467285, 8.41075325012207, 8.767925262451172, 9.125097274780273, 9.482269287109375, 9.839441299438477, 10.196613311767578, 10.55378532409668, 10.910957336425781, 11.268129348754883, 11.625301361083984, 11.982473373413086]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 9.0, 12.0, 16.0, 21.0, 28.0, 53.0, 69.0, 98.0, 135.0, 221.0, 343.0, 467.0, 638.0, 1021.0, 1518.0, 2211.0, 3462.0, 5093.0, 7820.0, 12284.0, 18860.0, 30179.0, 47972.0, 76339.0, 120024.0, 175788.0, 185130.0, 130115.0, 83380.0, 52820.0, 32857.0, 21011.0, 13294.0, 8514.0, 5566.0, 3684.0, 2437.0, 1682.0, 1079.0, 731.0, 527.0, 321.0, 245.0, 137.0, 123.0, 78.0, 56.0, 23.0, 29.0, 20.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1796875, -1.141754150390625, -1.10382080078125, -1.065887451171875, -1.0279541015625, -0.990020751953125, -0.95208740234375, -0.914154052734375, -0.876220703125, -0.838287353515625, -0.80035400390625, -0.762420654296875, -0.7244873046875, -0.686553955078125, -0.64862060546875, -0.610687255859375, -0.57275390625, -0.534820556640625, -0.49688720703125, -0.458953857421875, -0.4210205078125, -0.383087158203125, -0.34515380859375, -0.307220458984375, -0.269287109375, -0.231353759765625, -0.19342041015625, -0.155487060546875, -0.1175537109375, -0.079620361328125, -0.04168701171875, -0.003753662109375, 0.0341796875, 0.072113037109375, 0.11004638671875, 0.147979736328125, 0.1859130859375, 0.223846435546875, 0.26177978515625, 0.299713134765625, 0.337646484375, 0.375579833984375, 0.41351318359375, 0.451446533203125, 0.4893798828125, 0.527313232421875, 0.56524658203125, 0.603179931640625, 0.64111328125, 0.679046630859375, 0.71697998046875, 0.754913330078125, 0.7928466796875, 0.830780029296875, 0.86871337890625, 0.906646728515625, 0.944580078125, 0.982513427734375, 1.02044677734375, 1.058380126953125, 1.0963134765625, 1.134246826171875, 1.17218017578125, 1.210113525390625, 1.248046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 9.0, 10.0, 5.0, 9.0, 20.0, 21.0, 21.0, 27.0, 26.0, 34.0, 28.0, 35.0, 43.0, 43.0, 36.0, 33.0, 38.0, 50.0, 40.0, 44.0, 35.0, 43.0, 46.0, 37.0, 45.0, 29.0, 21.0, 38.0, 17.0, 22.0, 17.0, 17.0, 13.0, 7.0, 8.0, 4.0, 8.0, 3.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.5704345703125, -10.164306640625, -9.7581787109375, -9.35205078125, -8.9459228515625, -8.539794921875, -8.1336669921875, -7.7275390625, -7.3214111328125, -6.915283203125, -6.5091552734375, -6.10302734375, -5.6968994140625, -5.290771484375, -4.8846435546875, -4.478515625, -4.0723876953125, -3.666259765625, -3.2601318359375, -2.85400390625, -2.4478759765625, -2.041748046875, -1.6356201171875, -1.2294921875, -0.8233642578125, -0.417236328125, -0.0111083984375, 0.39501953125, 0.8011474609375, 1.207275390625, 1.6134033203125, 2.01953125, 2.4256591796875, 2.831787109375, 3.2379150390625, 3.64404296875, 4.0501708984375, 4.456298828125, 4.8624267578125, 5.2685546875, 5.6746826171875, 6.080810546875, 6.4869384765625, 6.89306640625, 7.2991943359375, 7.705322265625, 8.1114501953125, 8.517578125, 8.9237060546875, 9.329833984375, 9.7359619140625, 10.14208984375, 10.5482177734375, 10.954345703125, 11.3604736328125, 11.7666015625, 12.1727294921875, 12.578857421875, 12.9849853515625, 13.39111328125, 13.7972412109375, 14.203369140625, 14.6094970703125, 15.015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 0.0, 5.0, 17.0, 12.0, 23.0, 37.0, 53.0, 73.0, 113.0, 220.0, 361.0, 691.0, 1090.0, 2015.0, 3578.0, 6444.0, 11759.0, 21156.0, 38322.0, 70560.0, 127496.0, 220742.0, 234403.0, 139341.0, 76931.0, 41577.0, 22585.0, 12729.0, 7066.0, 3999.0, 2167.0, 1236.0, 751.0, 400.0, 230.0, 147.0, 93.0, 43.0, 31.0, 15.0, 17.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6624908447265625, -1.607208251953125, -1.5519256591796875, -1.49664306640625, -1.4413604736328125, -1.386077880859375, -1.3307952880859375, -1.2755126953125, -1.2202301025390625, -1.164947509765625, -1.1096649169921875, -1.05438232421875, -0.9990997314453125, -0.943817138671875, -0.8885345458984375, -0.833251953125, -0.7779693603515625, -0.722686767578125, -0.6674041748046875, -0.61212158203125, -0.5568389892578125, -0.501556396484375, -0.4462738037109375, -0.3909912109375, -0.3357086181640625, -0.280426025390625, -0.2251434326171875, -0.16986083984375, -0.1145782470703125, -0.059295654296875, -0.0040130615234375, 0.05126953125, 0.1065521240234375, 0.161834716796875, 0.2171173095703125, 0.27239990234375, 0.3276824951171875, 0.382965087890625, 0.4382476806640625, 0.4935302734375, 0.5488128662109375, 0.604095458984375, 0.6593780517578125, 0.71466064453125, 0.7699432373046875, 0.825225830078125, 0.8805084228515625, 0.935791015625, 0.9910736083984375, 1.046356201171875, 1.1016387939453125, 1.15692138671875, 1.2122039794921875, 1.267486572265625, 1.3227691650390625, 1.3780517578125, 1.4333343505859375, 1.488616943359375, 1.5438995361328125, 1.59918212890625, 1.6544647216796875, 1.709747314453125, 1.7650299072265625, 1.8203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 2.0, 2.0, 8.0, 10.0, 11.0, 13.0, 14.0, 18.0, 23.0, 24.0, 36.0, 29.0, 36.0, 46.0, 48.0, 40.0, 57.0, 39.0, 44.0, 44.0, 49.0, 47.0, 46.0, 46.0, 49.0, 33.0, 41.0, 32.0, 25.0, 9.0, 24.0, 13.0, 5.0, 7.0, 8.0, 6.0, 11.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.62548828125, -8.3369140625, -8.04833984375, -7.759765625, -7.47119140625, -7.1826171875, -6.89404296875, -6.60546875, -6.31689453125, -6.0283203125, -5.73974609375, -5.451171875, -5.16259765625, -4.8740234375, -4.58544921875, -4.296875, -4.00830078125, -3.7197265625, -3.43115234375, -3.142578125, -2.85400390625, -2.5654296875, -2.27685546875, -1.98828125, -1.69970703125, -1.4111328125, -1.12255859375, -0.833984375, -0.54541015625, -0.2568359375, 0.03173828125, 0.3203125, 0.60888671875, 0.8974609375, 1.18603515625, 1.474609375, 1.76318359375, 2.0517578125, 2.34033203125, 2.62890625, 2.91748046875, 3.2060546875, 3.49462890625, 3.783203125, 4.07177734375, 4.3603515625, 4.64892578125, 4.9375, 5.22607421875, 5.5146484375, 5.80322265625, 6.091796875, 6.38037109375, 6.6689453125, 6.95751953125, 7.24609375, 7.53466796875, 7.8232421875, 8.11181640625, 8.400390625, 8.68896484375, 8.9775390625, 9.26611328125, 9.5546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 8.0, 7.0, 2.0, 3.0, 9.0, 13.0, 30.0, 20.0, 29.0, 41.0, 78.0, 82.0, 141.0, 189.0, 286.0, 472.0, 802.0, 1530.0, 3299.0, 9400.0, 36485.0, 293295.0, 612084.0, 66597.0, 14345.0, 4710.0, 2025.0, 923.0, 559.0, 351.0, 201.0, 157.0, 108.0, 71.0, 54.0, 43.0, 30.0, 16.0, 15.0, 17.0, 11.0, 8.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50146484375, -0.48427581787109375, -0.4670867919921875, -0.44989776611328125, -0.432708740234375, -0.41551971435546875, -0.3983306884765625, -0.38114166259765625, -0.36395263671875, -0.34676361083984375, -0.3295745849609375, -0.31238555908203125, -0.295196533203125, -0.27800750732421875, -0.2608184814453125, -0.24362945556640625, -0.2264404296875, -0.20925140380859375, -0.1920623779296875, -0.17487335205078125, -0.157684326171875, -0.14049530029296875, -0.1233062744140625, -0.10611724853515625, -0.08892822265625, -0.07173919677734375, -0.0545501708984375, -0.03736114501953125, -0.020172119140625, -0.00298309326171875, 0.0142059326171875, 0.03139495849609375, 0.048583984375, 0.06577301025390625, 0.0829620361328125, 0.10015106201171875, 0.117340087890625, 0.13452911376953125, 0.1517181396484375, 0.16890716552734375, 0.18609619140625, 0.20328521728515625, 0.2204742431640625, 0.23766326904296875, 0.254852294921875, 0.27204132080078125, 0.2892303466796875, 0.30641937255859375, 0.3236083984375, 0.34079742431640625, 0.3579864501953125, 0.37517547607421875, 0.392364501953125, 0.40955352783203125, 0.4267425537109375, 0.44393157958984375, 0.46112060546875, 0.47830963134765625, 0.4954986572265625, 0.5126876831054688, 0.529876708984375, 0.5470657348632812, 0.5642547607421875, 0.5814437866210938, 0.5986328125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 8.0, 13.0, 19.0, 20.0, 27.0, 29.0, 30.0, 51.0, 63.0, 71.0, 68.0, 78.0, 69.0, 65.0, 62.0, 52.0, 58.0, 50.0, 33.0, 29.0, 21.0, 13.0, 16.0, 12.0, 12.0, 7.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5570392608642578e-05, -2.48616561293602e-05, -2.415291965007782e-05, -2.344418317079544e-05, -2.273544669151306e-05, -2.2026710212230682e-05, -2.1317973732948303e-05, -2.0609237253665924e-05, -1.9900500774383545e-05, -1.9191764295101166e-05, -1.8483027815818787e-05, -1.7774291336536407e-05, -1.706555485725403e-05, -1.635681837797165e-05, -1.564808189868927e-05, -1.4939345419406891e-05, -1.4230608940124512e-05, -1.3521872460842133e-05, -1.2813135981559753e-05, -1.2104399502277374e-05, -1.1395663022994995e-05, -1.0686926543712616e-05, -9.978190064430237e-06, -9.269453585147858e-06, -8.560717105865479e-06, -7.8519806265831e-06, -7.14324414730072e-06, -6.434507668018341e-06, -5.725771188735962e-06, -5.017034709453583e-06, -4.308298230171204e-06, -3.5995617508888245e-06, -2.8908252716064453e-06, -2.182088792324066e-06, -1.473352313041687e-06, -7.646158337593079e-07, -5.587935447692871e-08, 6.528571248054504e-07, 1.3615936040878296e-06, 2.0703300833702087e-06, 2.779066562652588e-06, 3.487803041934967e-06, 4.196539521217346e-06, 4.905276000499725e-06, 5.6140124797821045e-06, 6.322748959064484e-06, 7.031485438346863e-06, 7.740221917629242e-06, 8.448958396911621e-06, 9.157694876194e-06, 9.86643135547638e-06, 1.0575167834758759e-05, 1.1283904314041138e-05, 1.1992640793323517e-05, 1.2701377272605896e-05, 1.3410113751888275e-05, 1.4118850231170654e-05, 1.4827586710453033e-05, 1.5536323189735413e-05, 1.6245059669017792e-05, 1.695379614830017e-05, 1.766253262758255e-05, 1.837126910686493e-05, 1.908000558614731e-05, 1.9788742065429688e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 12.0, 14.0, 13.0, 15.0, 27.0, 34.0, 47.0, 70.0, 96.0, 129.0, 241.0, 304.0, 541.0, 1065.0, 1935.0, 4510.0, 12897.0, 53918.0, 403052.0, 481898.0, 63510.0, 14472.0, 4878.0, 2130.0, 1102.0, 572.0, 346.0, 206.0, 158.0, 101.0, 59.0, 46.0, 27.0, 28.0, 22.0, 24.0, 12.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6388931274414062, -0.6176300048828125, -0.5963668823242188, -0.575103759765625, -0.5538406372070312, -0.5325775146484375, -0.5113143920898438, -0.49005126953125, -0.46878814697265625, -0.4475250244140625, -0.42626190185546875, -0.404998779296875, -0.38373565673828125, -0.3624725341796875, -0.34120941162109375, -0.3199462890625, -0.29868316650390625, -0.2774200439453125, -0.25615692138671875, -0.234893798828125, -0.21363067626953125, -0.1923675537109375, -0.17110443115234375, -0.14984130859375, -0.12857818603515625, -0.1073150634765625, -0.08605194091796875, -0.064788818359375, -0.04352569580078125, -0.0222625732421875, -0.00099945068359375, 0.020263671875, 0.04152679443359375, 0.0627899169921875, 0.08405303955078125, 0.105316162109375, 0.12657928466796875, 0.1478424072265625, 0.16910552978515625, 0.19036865234375, 0.21163177490234375, 0.2328948974609375, 0.25415802001953125, 0.275421142578125, 0.29668426513671875, 0.3179473876953125, 0.33921051025390625, 0.3604736328125, 0.38173675537109375, 0.4029998779296875, 0.42426300048828125, 0.445526123046875, 0.46678924560546875, 0.4880523681640625, 0.5093154907226562, 0.53057861328125, 0.5518417358398438, 0.5731048583984375, 0.5943679809570312, 0.615631103515625, 0.6368942260742188, 0.6581573486328125, 0.6794204711914062, 0.70068359375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 10.0, 20.0, 35.0, 76.0, 145.0, 203.0, 220.0, 124.0, 58.0, 41.0, 18.0, 14.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.416015625, -0.4061012268066406, -0.39618682861328125, -0.3862724304199219, -0.3763580322265625, -0.3664436340332031, -0.35652923583984375, -0.3466148376464844, -0.336700439453125, -0.3267860412597656, -0.31687164306640625, -0.3069572448730469, -0.2970428466796875, -0.2871284484863281, -0.27721405029296875, -0.2672996520996094, -0.25738525390625, -0.24747085571289062, -0.23755645751953125, -0.22764205932617188, -0.2177276611328125, -0.20781326293945312, -0.19789886474609375, -0.18798446655273438, -0.178070068359375, -0.16815567016601562, -0.15824127197265625, -0.14832687377929688, -0.1384124755859375, -0.12849807739257812, -0.11858367919921875, -0.10866928100585938, -0.0987548828125, -0.08884048461914062, -0.07892608642578125, -0.06901168823242188, -0.0590972900390625, -0.049182891845703125, -0.03926849365234375, -0.029354095458984375, -0.019439697265625, -0.009525299072265625, 0.00038909912109375, 0.010303497314453125, 0.0202178955078125, 0.030132293701171875, 0.04004669189453125, 0.049961090087890625, 0.05987548828125, 0.06978988647460938, 0.07970428466796875, 0.08961868286132812, 0.0995330810546875, 0.10944747924804688, 0.11936187744140625, 0.12927627563476562, 0.139190673828125, 0.14910507202148438, 0.15901947021484375, 0.16893386840820312, 0.1788482666015625, 0.18876266479492188, 0.19867706298828125, 0.20859146118164062, 0.218505859375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 6.0, 7.0, 6.0, 9.0, 8.0, 8.0, 9.0, 18.0, 16.0, 19.0, 26.0, 35.0, 40.0, 39.0, 43.0, 42.0, 44.0, 48.0, 53.0, 47.0, 48.0, 41.0, 45.0, 44.0, 46.0, 34.0, 31.0, 29.0, 23.0, 18.0, 20.0, 13.0, 16.0, 15.0, 11.0, 15.0, 8.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.78907299041748, -9.460570335388184, -9.13206672668457, -8.803564071655273, -8.47506046295166, -8.146557807922363, -7.818054676055908, -7.489551544189453, -7.161048412322998, -6.832545280456543, -6.504042148590088, -6.175539016723633, -5.847036361694336, -5.518532752990723, -5.190030097961426, -4.861526966094971, -4.533023834228516, -4.2045207023620605, -3.8760175704956055, -3.5475146770477295, -3.2190115451812744, -2.8905084133148193, -2.5620055198669434, -2.2335023880004883, -1.9049992561340332, -1.5764961242675781, -1.2479931116104126, -0.9194900393486023, -0.590986967086792, -0.2624838352203369, 0.06601917743682861, 0.39452219009399414, 0.7230253219604492, 1.0515284538269043, 1.3800314664840698, 1.7085344791412354, 2.0370376110076904, 2.3655407428741455, 2.6940436363220215, 3.0225467681884766, 3.3510499000549316, 3.6795530319213867, 4.008056163787842, 4.336559295654297, 4.665061950683594, 4.993565559387207, 5.322068214416504, 5.650571346282959, 5.979074478149414, 6.307577610015869, 6.636080741882324, 6.964583873748779, 7.293087005615234, 7.621589660644531, 7.950092792510986, 8.278595924377441, 8.607099533081055, 8.935602188110352, 9.264105796813965, 9.592608451843262, 9.921112060546875, 10.249614715576172, 10.578118324279785, 10.906620979309082, 11.235123634338379]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 4.0, 9.0, 7.0, 9.0, 6.0, 12.0, 16.0, 17.0, 16.0, 18.0, 24.0, 19.0, 31.0, 28.0, 27.0, 29.0, 38.0, 45.0, 37.0, 39.0, 34.0, 35.0, 43.0, 38.0, 36.0, 47.0, 39.0, 39.0, 28.0, 34.0, 25.0, 19.0, 24.0, 30.0, 19.0, 12.0, 17.0, 10.0, 5.0, 14.0, 4.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.970178604125977, -10.6133394241333, -10.256500244140625, -9.899662017822266, -9.54282283782959, -9.185983657836914, -8.829144477844238, -8.472305297851562, -8.115467071533203, -7.758627891540527, -7.40178918838501, -7.044950008392334, -6.688111305236816, -6.331272125244141, -5.974432945251465, -5.617593765258789, -5.260754585266113, -4.9039154052734375, -4.54707670211792, -4.190237522125244, -3.8333985805511475, -3.476559638977051, -3.119720458984375, -2.7628815174102783, -2.4060425758361816, -2.049203634262085, -1.6923645734786987, -1.3355255126953125, -0.9786865711212158, -0.6218476295471191, -0.26500844955444336, 0.09183049201965332, 0.4486703872680664, 0.8055093884468079, 1.1623483896255493, 1.5191874504089355, 1.8760263919830322, 2.232865333557129, 2.5897045135498047, 2.9465434551239014, 3.303382396697998, 3.6602213382720947, 4.017060279846191, 4.373899459838867, 4.730738639831543, 5.0875773429870605, 5.444416522979736, 5.801255226135254, 6.15809440612793, 6.5149335861206055, 6.871772289276123, 7.228611469268799, 7.585450172424316, 7.942289352416992, 8.299128532409668, 8.655967712402344, 9.012805938720703, 9.369645118713379, 9.726484298706055, 10.083322525024414, 10.44016170501709, 10.797000885009766, 11.153840065002441, 11.510679244995117, 11.867518424987793]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 21.0, 31.0, 61.0, 68.0, 110.0, 155.0, 206.0, 362.0, 532.0, 733.0, 1198.0, 1757.0, 2736.0, 4148.0, 5961.0, 8878.0, 13216.0, 19103.0, 27373.0, 38701.0, 52803.0, 68219.0, 85154.0, 99787.0, 107231.0, 105946.0, 96895.0, 80615.0, 64340.0, 48287.0, 35521.0, 25082.0, 17506.0, 11541.0, 8005.0, 5519.0, 3505.0, 2501.0, 1583.0, 1077.0, 679.0, 450.0, 311.0, 230.0, 125.0, 81.0, 80.0, 46.0, 26.0, 15.0, 13.0, 11.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.2109375, -5.0421142578125, -4.873291015625, -4.7044677734375, -4.53564453125, -4.3668212890625, -4.197998046875, -4.0291748046875, -3.8603515625, -3.6915283203125, -3.522705078125, -3.3538818359375, -3.18505859375, -3.0162353515625, -2.847412109375, -2.6785888671875, -2.509765625, -2.3409423828125, -2.172119140625, -2.0032958984375, -1.83447265625, -1.6656494140625, -1.496826171875, -1.3280029296875, -1.1591796875, -0.9903564453125, -0.821533203125, -0.6527099609375, -0.48388671875, -0.3150634765625, -0.146240234375, 0.0225830078125, 0.19140625, 0.3602294921875, 0.529052734375, 0.6978759765625, 0.86669921875, 1.0355224609375, 1.204345703125, 1.3731689453125, 1.5419921875, 1.7108154296875, 1.879638671875, 2.0484619140625, 2.21728515625, 2.3861083984375, 2.554931640625, 2.7237548828125, 2.892578125, 3.0614013671875, 3.230224609375, 3.3990478515625, 3.56787109375, 3.7366943359375, 3.905517578125, 4.0743408203125, 4.2431640625, 4.4119873046875, 4.580810546875, 4.7496337890625, 4.91845703125, 5.0872802734375, 5.256103515625, 5.4249267578125, 5.59375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 2.0, 8.0, 5.0, 9.0, 2.0, 12.0, 10.0, 15.0, 14.0, 15.0, 14.0, 20.0, 30.0, 30.0, 18.0, 34.0, 26.0, 28.0, 43.0, 39.0, 40.0, 41.0, 35.0, 31.0, 46.0, 39.0, 30.0, 39.0, 42.0, 27.0, 32.0, 34.0, 28.0, 25.0, 21.0, 15.0, 15.0, 16.0, 14.0, 13.0, 12.0, 9.0, 5.0, 4.0, 2.0, 4.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-11.7578125, -11.406005859375, -11.05419921875, -10.702392578125, -10.3505859375, -9.998779296875, -9.64697265625, -9.295166015625, -8.943359375, -8.591552734375, -8.23974609375, -7.887939453125, -7.5361328125, -7.184326171875, -6.83251953125, -6.480712890625, -6.12890625, -5.777099609375, -5.42529296875, -5.073486328125, -4.7216796875, -4.369873046875, -4.01806640625, -3.666259765625, -3.314453125, -2.962646484375, -2.61083984375, -2.259033203125, -1.9072265625, -1.555419921875, -1.20361328125, -0.851806640625, -0.5, -0.148193359375, 0.20361328125, 0.555419921875, 0.9072265625, 1.259033203125, 1.61083984375, 1.962646484375, 2.314453125, 2.666259765625, 3.01806640625, 3.369873046875, 3.7216796875, 4.073486328125, 4.42529296875, 4.777099609375, 5.12890625, 5.480712890625, 5.83251953125, 6.184326171875, 6.5361328125, 6.887939453125, 7.23974609375, 7.591552734375, 7.943359375, 8.295166015625, 8.64697265625, 8.998779296875, 9.3505859375, 9.702392578125, 10.05419921875, 10.406005859375, 10.7578125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 12.0, 9.0, 22.0, 36.0, 39.0, 76.0, 112.0, 191.0, 300.0, 411.0, 668.0, 1068.0, 1573.0, 2379.0, 3656.0, 5700.0, 8618.0, 12915.0, 18459.0, 27183.0, 39014.0, 53644.0, 71033.0, 88406.0, 102722.0, 110290.0, 108656.0, 96913.0, 81319.0, 63129.0, 46648.0, 33470.0, 23136.0, 15679.0, 10492.0, 6983.0, 4741.0, 3130.0, 2016.0, 1268.0, 842.0, 584.0, 358.0, 248.0, 136.0, 99.0, 71.0, 33.0, 20.0, 16.0, 13.0, 9.0, 4.0, 7.0, 3.0, 0.0, 1.0], "bins": [-5.76953125, -5.593505859375, -5.41748046875, -5.241455078125, -5.0654296875, -4.889404296875, -4.71337890625, -4.537353515625, -4.361328125, -4.185302734375, -4.00927734375, -3.833251953125, -3.6572265625, -3.481201171875, -3.30517578125, -3.129150390625, -2.953125, -2.777099609375, -2.60107421875, -2.425048828125, -2.2490234375, -2.072998046875, -1.89697265625, -1.720947265625, -1.544921875, -1.368896484375, -1.19287109375, -1.016845703125, -0.8408203125, -0.664794921875, -0.48876953125, -0.312744140625, -0.13671875, 0.039306640625, 0.21533203125, 0.391357421875, 0.5673828125, 0.743408203125, 0.91943359375, 1.095458984375, 1.271484375, 1.447509765625, 1.62353515625, 1.799560546875, 1.9755859375, 2.151611328125, 2.32763671875, 2.503662109375, 2.6796875, 2.855712890625, 3.03173828125, 3.207763671875, 3.3837890625, 3.559814453125, 3.73583984375, 3.911865234375, 4.087890625, 4.263916015625, 4.43994140625, 4.615966796875, 4.7919921875, 4.968017578125, 5.14404296875, 5.320068359375, 5.49609375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 0.0, 6.0, 10.0, 4.0, 5.0, 4.0, 8.0, 14.0, 10.0, 18.0, 17.0, 12.0, 16.0, 21.0, 26.0, 34.0, 33.0, 25.0, 31.0, 45.0, 44.0, 48.0, 47.0, 37.0, 43.0, 29.0, 37.0, 32.0, 27.0, 27.0, 32.0, 31.0, 23.0, 22.0, 28.0, 27.0, 25.0, 21.0, 16.0, 15.0, 6.0, 11.0, 7.0, 6.0, 6.0, 7.0, 0.0, 6.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96484375, -5.75311279296875, -5.5413818359375, -5.32965087890625, -5.117919921875, -4.90618896484375, -4.6944580078125, -4.48272705078125, -4.27099609375, -4.05926513671875, -3.8475341796875, -3.63580322265625, -3.424072265625, -3.21234130859375, -3.0006103515625, -2.78887939453125, -2.5771484375, -2.36541748046875, -2.1536865234375, -1.94195556640625, -1.730224609375, -1.51849365234375, -1.3067626953125, -1.09503173828125, -0.88330078125, -0.67156982421875, -0.4598388671875, -0.24810791015625, -0.036376953125, 0.17535400390625, 0.3870849609375, 0.59881591796875, 0.810546875, 1.02227783203125, 1.2340087890625, 1.44573974609375, 1.657470703125, 1.86920166015625, 2.0809326171875, 2.29266357421875, 2.50439453125, 2.71612548828125, 2.9278564453125, 3.13958740234375, 3.351318359375, 3.56304931640625, 3.7747802734375, 3.98651123046875, 4.1982421875, 4.40997314453125, 4.6217041015625, 4.83343505859375, 5.045166015625, 5.25689697265625, 5.4686279296875, 5.68035888671875, 5.89208984375, 6.10382080078125, 6.3155517578125, 6.52728271484375, 6.739013671875, 6.95074462890625, 7.1624755859375, 7.37420654296875, 7.5859375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 10.0, 13.0, 17.0, 46.0, 71.0, 99.0, 184.0, 273.0, 441.0, 704.0, 1060.0, 1621.0, 2688.0, 4256.0, 6628.0, 10729.0, 17150.0, 26998.0, 42039.0, 63288.0, 87736.0, 112925.0, 130164.0, 131999.0, 117977.0, 93615.0, 67908.0, 46364.0, 30206.0, 18995.0, 12148.0, 7440.0, 4679.0, 2859.0, 1843.0, 1252.0, 795.0, 517.0, 308.0, 207.0, 108.0, 77.0, 57.0, 23.0, 19.0, 14.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.369140625, -2.292999267578125, -2.21685791015625, -2.140716552734375, -2.0645751953125, -1.988433837890625, -1.91229248046875, -1.836151123046875, -1.760009765625, -1.683868408203125, -1.60772705078125, -1.531585693359375, -1.4554443359375, -1.379302978515625, -1.30316162109375, -1.227020263671875, -1.15087890625, -1.074737548828125, -0.99859619140625, -0.922454833984375, -0.8463134765625, -0.770172119140625, -0.69403076171875, -0.617889404296875, -0.541748046875, -0.465606689453125, -0.38946533203125, -0.313323974609375, -0.2371826171875, -0.161041259765625, -0.08489990234375, -0.008758544921875, 0.0673828125, 0.143524169921875, 0.21966552734375, 0.295806884765625, 0.3719482421875, 0.448089599609375, 0.52423095703125, 0.600372314453125, 0.676513671875, 0.752655029296875, 0.82879638671875, 0.904937744140625, 0.9810791015625, 1.057220458984375, 1.13336181640625, 1.209503173828125, 1.28564453125, 1.361785888671875, 1.43792724609375, 1.514068603515625, 1.5902099609375, 1.666351318359375, 1.74249267578125, 1.818634033203125, 1.894775390625, 1.970916748046875, 2.04705810546875, 2.123199462890625, 2.1993408203125, 2.275482177734375, 2.35162353515625, 2.427764892578125, 2.50390625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 15.0, 9.0, 13.0, 18.0, 17.0, 28.0, 36.0, 44.0, 36.0, 33.0, 36.0, 47.0, 49.0, 77.0, 59.0, 54.0, 49.0, 37.0, 44.0, 29.0, 50.0, 26.0, 24.0, 28.0, 20.0, 34.0, 16.0, 11.0, 7.0, 6.0, 8.0, 7.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002434253692626953, -0.00023545324802398682, -0.00022748112678527832, -0.00021950900554656982, -0.00021153688430786133, -0.00020356476306915283, -0.00019559264183044434, -0.00018762052059173584, -0.00017964839935302734, -0.00017167627811431885, -0.00016370415687561035, -0.00015573203563690186, -0.00014775991439819336, -0.00013978779315948486, -0.00013181567192077637, -0.00012384355068206787, -0.00011587142944335938, -0.00010789930820465088, -9.992718696594238e-05, -9.195506572723389e-05, -8.398294448852539e-05, -7.60108232498169e-05, -6.80387020111084e-05, -6.00665807723999e-05, -5.2094459533691406e-05, -4.412233829498291e-05, -3.6150217056274414e-05, -2.8178095817565918e-05, -2.0205974578857422e-05, -1.2233853340148926e-05, -4.26173210144043e-06, 3.7103891372680664e-06, 1.1682510375976562e-05, 1.965463161468506e-05, 2.7626752853393555e-05, 3.559887409210205e-05, 4.357099533081055e-05, 5.154311656951904e-05, 5.951523780822754e-05, 6.748735904693604e-05, 7.545948028564453e-05, 8.343160152435303e-05, 9.140372276306152e-05, 9.937584400177002e-05, 0.00010734796524047852, 0.00011532008647918701, 0.0001232922077178955, 0.000131264328956604, 0.0001392364501953125, 0.000147208571434021, 0.0001551806926727295, 0.000163152813911438, 0.00017112493515014648, 0.00017909705638885498, 0.00018706917762756348, 0.00019504129886627197, 0.00020301342010498047, 0.00021098554134368896, 0.00021895766258239746, 0.00022692978382110596, 0.00023490190505981445, 0.00024287402629852295, 0.00025084614753723145, 0.00025881826877593994, 0.00026679039001464844]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 11.0, 28.0, 26.0, 45.0, 67.0, 81.0, 144.0, 195.0, 296.0, 439.0, 687.0, 1119.0, 1780.0, 2714.0, 4612.0, 7326.0, 11935.0, 19137.0, 31103.0, 50059.0, 75332.0, 107741.0, 135110.0, 146985.0, 135671.0, 107665.0, 75830.0, 49846.0, 31373.0, 19435.0, 11879.0, 7338.0, 4535.0, 2929.0, 1835.0, 1159.0, 737.0, 476.0, 287.0, 196.0, 143.0, 81.0, 60.0, 34.0, 25.0, 14.0, 10.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.912109375, -2.8251953125, -2.73828125, -2.6513671875, -2.564453125, -2.4775390625, -2.390625, -2.3037109375, -2.216796875, -2.1298828125, -2.04296875, -1.9560546875, -1.869140625, -1.7822265625, -1.6953125, -1.6083984375, -1.521484375, -1.4345703125, -1.34765625, -1.2607421875, -1.173828125, -1.0869140625, -1.0, -0.9130859375, -0.826171875, -0.7392578125, -0.65234375, -0.5654296875, -0.478515625, -0.3916015625, -0.3046875, -0.2177734375, -0.130859375, -0.0439453125, 0.04296875, 0.1298828125, 0.216796875, 0.3037109375, 0.390625, 0.4775390625, 0.564453125, 0.6513671875, 0.73828125, 0.8251953125, 0.912109375, 0.9990234375, 1.0859375, 1.1728515625, 1.259765625, 1.3466796875, 1.43359375, 1.5205078125, 1.607421875, 1.6943359375, 1.78125, 1.8681640625, 1.955078125, 2.0419921875, 2.12890625, 2.2158203125, 2.302734375, 2.3896484375, 2.4765625, 2.5634765625, 2.650390625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 8.0, 6.0, 7.0, 4.0, 7.0, 7.0, 7.0, 9.0, 14.0, 16.0, 16.0, 21.0, 20.0, 19.0, 41.0, 44.0, 50.0, 46.0, 49.0, 58.0, 49.0, 60.0, 64.0, 46.0, 31.0, 36.0, 46.0, 43.0, 33.0, 22.0, 28.0, 19.0, 18.0, 8.0, 12.0, 6.0, 7.0, 10.0, 10.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.99310302734375, -0.9598388671875, -0.92657470703125, -0.893310546875, -0.86004638671875, -0.8267822265625, -0.79351806640625, -0.76025390625, -0.72698974609375, -0.6937255859375, -0.66046142578125, -0.627197265625, -0.59393310546875, -0.5606689453125, -0.52740478515625, -0.494140625, -0.46087646484375, -0.4276123046875, -0.39434814453125, -0.361083984375, -0.32781982421875, -0.2945556640625, -0.26129150390625, -0.22802734375, -0.19476318359375, -0.1614990234375, -0.12823486328125, -0.094970703125, -0.06170654296875, -0.0284423828125, 0.00482177734375, 0.0380859375, 0.07135009765625, 0.1046142578125, 0.13787841796875, 0.171142578125, 0.20440673828125, 0.2376708984375, 0.27093505859375, 0.30419921875, 0.33746337890625, 0.3707275390625, 0.40399169921875, 0.437255859375, 0.47052001953125, 0.5037841796875, 0.53704833984375, 0.5703125, 0.60357666015625, 0.6368408203125, 0.67010498046875, 0.703369140625, 0.73663330078125, 0.7698974609375, 0.80316162109375, 0.83642578125, 0.86968994140625, 0.9029541015625, 0.93621826171875, 0.969482421875, 1.00274658203125, 1.0360107421875, 1.06927490234375, 1.1025390625]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 6.0, 9.0, 3.0, 8.0, 17.0, 20.0, 9.0, 18.0, 26.0, 40.0, 41.0, 54.0, 41.0, 51.0, 47.0, 51.0, 51.0, 50.0, 47.0, 45.0, 54.0, 38.0, 42.0, 36.0, 21.0, 28.0, 21.0, 17.0, 19.0, 21.0, 14.0, 7.0, 6.0, 10.0, 5.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.257930755615234, -8.916497230529785, -8.575063705444336, -8.23362922668457, -7.892195701599121, -7.550762176513672, -7.2093281745910645, -6.867894172668457, -6.526460647583008, -6.185027122497559, -5.843593120574951, -5.502159118652344, -5.1607255935668945, -4.819292068481445, -4.477858066558838, -4.1364240646362305, -3.7949905395507812, -3.453556776046753, -3.1121230125427246, -2.7706892490386963, -2.429255485534668, -2.0878217220306396, -1.7463879585266113, -1.404954195022583, -1.0635204315185547, -0.7220866680145264, -0.38065290451049805, -0.03921914100646973, 0.3022146224975586, 0.6436483860015869, 0.9850821495056152, 1.3265159130096436, 1.6679506301879883, 2.0093843936920166, 2.350818157196045, 2.6922519207000732, 3.0336856842041016, 3.37511944770813, 3.716553211212158, 4.057987213134766, 4.399420738220215, 4.740854263305664, 5.0822882652282715, 5.423722267150879, 5.765155792236328, 6.106589317321777, 6.448023319244385, 6.789457321166992, 7.130890846252441, 7.472324371337891, 7.813758373260498, 8.155192375183105, 8.496625900268555, 8.838059425354004, 9.179492950439453, 9.520927429199219, 9.862360954284668, 10.203794479370117, 10.545228958129883, 10.886662483215332, 11.228096008300781, 11.56952953338623, 11.91096305847168, 12.252397537231445, 12.593831062316895]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 6.0, 4.0, 11.0, 7.0, 13.0, 11.0, 16.0, 12.0, 19.0, 17.0, 19.0, 14.0, 18.0, 31.0, 26.0, 36.0, 38.0, 39.0, 31.0, 39.0, 30.0, 37.0, 31.0, 36.0, 44.0, 31.0, 46.0, 39.0, 32.0, 37.0, 31.0, 30.0, 23.0, 19.0, 17.0, 24.0, 16.0, 10.0, 11.0, 11.0, 7.0, 10.0, 4.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-10.321619033813477, -9.971513748168945, -9.621408462524414, -9.271303176879883, -8.921198844909668, -8.571093559265137, -8.220988273620605, -7.870882987976074, -7.520778179168701, -7.17067289352417, -6.820568084716797, -6.470462799072266, -6.120357513427734, -5.770252704620361, -5.42014741897583, -5.070042610168457, -4.719937324523926, -4.3698320388793945, -4.0197272300720215, -3.6696219444274902, -3.319516897201538, -2.969411849975586, -2.6193065643310547, -2.2692015171051025, -1.9190964698791504, -1.5689914226531982, -1.2188862562179565, -0.8687810897827148, -0.5186760425567627, -0.16857099533081055, 0.1815342903137207, 0.5316393375396729, 0.8817434310913086, 1.2318484783172607, 1.5819536447525024, 1.9320588111877441, 2.2821638584136963, 2.6322689056396484, 2.9823741912841797, 3.332479238510132, 3.682584285736084, 4.032689571380615, 4.382794380187988, 4.7328996658325195, 5.083004951477051, 5.433109760284424, 5.783215045928955, 6.133319854736328, 6.483425140380859, 6.833530426025391, 7.183635234832764, 7.533740520477295, 7.883845329284668, 8.2339506149292, 8.58405590057373, 8.934161186218262, 9.284265518188477, 9.634370803833008, 9.984476089477539, 10.33458137512207, 10.684685707092285, 11.034790992736816, 11.384896278381348, 11.735001564025879, 12.08510684967041]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 10.0, 13.0, 10.0, 15.0, 35.0, 40.0, 70.0, 133.0, 152.0, 258.0, 402.0, 638.0, 1095.0, 1771.0, 2878.0, 4861.0, 8457.0, 14347.0, 25136.0, 43814.0, 75908.0, 129843.0, 219190.0, 349233.0, 509567.0, 642925.0, 656622.0, 541660.0, 380593.0, 242005.0, 144469.0, 84580.0, 48533.0, 27395.0, 15686.0, 8910.0, 5338.0, 3173.0, 1800.0, 1115.0, 586.0, 404.0, 224.0, 153.0, 88.0, 53.0, 36.0, 28.0, 16.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.5234375, -10.195556640625, -9.86767578125, -9.539794921875, -9.2119140625, -8.884033203125, -8.55615234375, -8.228271484375, -7.900390625, -7.572509765625, -7.24462890625, -6.916748046875, -6.5888671875, -6.260986328125, -5.93310546875, -5.605224609375, -5.27734375, -4.949462890625, -4.62158203125, -4.293701171875, -3.9658203125, -3.637939453125, -3.31005859375, -2.982177734375, -2.654296875, -2.326416015625, -1.99853515625, -1.670654296875, -1.3427734375, -1.014892578125, -0.68701171875, -0.359130859375, -0.03125, 0.296630859375, 0.62451171875, 0.952392578125, 1.2802734375, 1.608154296875, 1.93603515625, 2.263916015625, 2.591796875, 2.919677734375, 3.24755859375, 3.575439453125, 3.9033203125, 4.231201171875, 4.55908203125, 4.886962890625, 5.21484375, 5.542724609375, 5.87060546875, 6.198486328125, 6.5263671875, 6.854248046875, 7.18212890625, 7.510009765625, 7.837890625, 8.165771484375, 8.49365234375, 8.821533203125, 9.1494140625, 9.477294921875, 9.80517578125, 10.133056640625, 10.4609375]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 4.0, 7.0, 7.0, 12.0, 13.0, 14.0, 20.0, 18.0, 23.0, 24.0, 23.0, 32.0, 39.0, 32.0, 44.0, 34.0, 35.0, 38.0, 47.0, 42.0, 36.0, 46.0, 42.0, 35.0, 32.0, 35.0, 41.0, 37.0, 33.0, 21.0, 18.0, 17.0, 21.0, 13.0, 9.0, 10.0, 7.0, 7.0, 3.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.6640625, -9.3546142578125, -9.045166015625, -8.7357177734375, -8.42626953125, -8.1168212890625, -7.807373046875, -7.4979248046875, -7.1884765625, -6.8790283203125, -6.569580078125, -6.2601318359375, -5.95068359375, -5.6412353515625, -5.331787109375, -5.0223388671875, -4.712890625, -4.4034423828125, -4.093994140625, -3.7845458984375, -3.47509765625, -3.1656494140625, -2.856201171875, -2.5467529296875, -2.2373046875, -1.9278564453125, -1.618408203125, -1.3089599609375, -0.99951171875, -0.6900634765625, -0.380615234375, -0.0711669921875, 0.23828125, 0.5477294921875, 0.857177734375, 1.1666259765625, 1.47607421875, 1.7855224609375, 2.094970703125, 2.4044189453125, 2.7138671875, 3.0233154296875, 3.332763671875, 3.6422119140625, 3.95166015625, 4.2611083984375, 4.570556640625, 4.8800048828125, 5.189453125, 5.4989013671875, 5.808349609375, 6.1177978515625, 6.42724609375, 6.7366943359375, 7.046142578125, 7.3555908203125, 7.6650390625, 7.9744873046875, 8.283935546875, 8.5933837890625, 8.90283203125, 9.2122802734375, 9.521728515625, 9.8311767578125, 10.140625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 6.0, 6.0, 16.0, 16.0, 24.0, 56.0, 82.0, 188.0, 282.0, 475.0, 877.0, 1814.0, 3329.0, 6693.0, 12945.0, 25386.0, 49473.0, 93950.0, 171525.0, 297375.0, 462686.0, 622612.0, 694038.0, 623245.0, 462366.0, 296538.0, 172118.0, 94115.0, 49560.0, 25481.0, 13035.0, 6655.0, 3393.0, 1808.0, 948.0, 501.0, 246.0, 183.0, 96.0, 53.0, 34.0, 15.0, 11.0, 11.0, 6.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -12.0396728515625, -11.657470703125, -11.2752685546875, -10.89306640625, -10.5108642578125, -10.128662109375, -9.7464599609375, -9.3642578125, -8.9820556640625, -8.599853515625, -8.2176513671875, -7.83544921875, -7.4532470703125, -7.071044921875, -6.6888427734375, -6.306640625, -5.9244384765625, -5.542236328125, -5.1600341796875, -4.77783203125, -4.3956298828125, -4.013427734375, -3.6312255859375, -3.2490234375, -2.8668212890625, -2.484619140625, -2.1024169921875, -1.72021484375, -1.3380126953125, -0.955810546875, -0.5736083984375, -0.19140625, 0.1907958984375, 0.572998046875, 0.9552001953125, 1.33740234375, 1.7196044921875, 2.101806640625, 2.4840087890625, 2.8662109375, 3.2484130859375, 3.630615234375, 4.0128173828125, 4.39501953125, 4.7772216796875, 5.159423828125, 5.5416259765625, 5.923828125, 6.3060302734375, 6.688232421875, 7.0704345703125, 7.45263671875, 7.8348388671875, 8.217041015625, 8.5992431640625, 8.9814453125, 9.3636474609375, 9.745849609375, 10.1280517578125, 10.51025390625, 10.8924560546875, 11.274658203125, 11.6568603515625, 12.0390625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 7.0, 8.0, 20.0, 24.0, 35.0, 54.0, 64.0, 84.0, 112.0, 131.0, 167.0, 181.0, 209.0, 239.0, 244.0, 267.0, 267.0, 266.0, 268.0, 218.0, 233.0, 174.0, 158.0, 136.0, 108.0, 88.0, 73.0, 61.0, 49.0, 30.0, 21.0, 19.0, 15.0, 13.0, 3.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.109375, -4.9188232421875, -4.728271484375, -4.5377197265625, -4.34716796875, -4.1566162109375, -3.966064453125, -3.7755126953125, -3.5849609375, -3.3944091796875, -3.203857421875, -3.0133056640625, -2.82275390625, -2.6322021484375, -2.441650390625, -2.2510986328125, -2.060546875, -1.8699951171875, -1.679443359375, -1.4888916015625, -1.29833984375, -1.1077880859375, -0.917236328125, -0.7266845703125, -0.5361328125, -0.3455810546875, -0.155029296875, 0.0355224609375, 0.22607421875, 0.4166259765625, 0.607177734375, 0.7977294921875, 0.98828125, 1.1788330078125, 1.369384765625, 1.5599365234375, 1.75048828125, 1.9410400390625, 2.131591796875, 2.3221435546875, 2.5126953125, 2.7032470703125, 2.893798828125, 3.0843505859375, 3.27490234375, 3.4654541015625, 3.656005859375, 3.8465576171875, 4.037109375, 4.2276611328125, 4.418212890625, 4.6087646484375, 4.79931640625, 4.9898681640625, 5.180419921875, 5.3709716796875, 5.5615234375, 5.7520751953125, 5.942626953125, 6.1331787109375, 6.32373046875, 6.5142822265625, 6.704833984375, 6.8953857421875, 7.0859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 5.0, 3.0, 14.0, 11.0, 14.0, 13.0, 22.0, 18.0, 26.0, 27.0, 35.0, 46.0, 58.0, 58.0, 47.0, 60.0, 62.0, 60.0, 52.0, 59.0, 37.0, 41.0, 38.0, 31.0, 22.0, 29.0, 18.0, 16.0, 11.0, 9.0, 14.0, 7.0, 8.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.418883323669434, -10.989507675170898, -10.560132026672363, -10.130756378173828, -9.70138168334961, -9.272006034851074, -8.842630386352539, -8.413254737854004, -7.983879566192627, -7.554503917694092, -7.125128746032715, -6.69575309753418, -6.2663774490356445, -5.837002277374268, -5.407626628875732, -4.9782514572143555, -4.54887580871582, -4.119500160217285, -3.690124988555908, -3.260749340057373, -2.831373929977417, -2.401998519897461, -1.9726228713989258, -1.5432474613189697, -1.1138720512390137, -0.6844965815544128, -0.255121111869812, 0.1742544174194336, 0.6036298274993896, 1.0330052375793457, 1.4623808860778809, 1.891756296157837, 2.3211326599121094, 2.7505080699920654, 3.1798834800720215, 3.6092591285705566, 4.038634300231934, 4.468009948730469, 4.897385597229004, 5.326761245727539, 5.756136417388916, 6.185512065887451, 6.614887237548828, 7.044262886047363, 7.473638534545898, 7.903013706207275, 8.332389831542969, 8.761764526367188, 9.191140174865723, 9.620515823364258, 10.049891471862793, 10.479267120361328, 10.908641815185547, 11.338017463684082, 11.767393112182617, 12.196768760681152, 12.626144409179688, 13.055520057678223, 13.484895706176758, 13.914270401000977, 14.343646049499512, 14.773021697998047, 15.202397346496582, 15.631772994995117, 16.061147689819336]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 3.0, 4.0, 3.0, 9.0, 6.0, 14.0, 15.0, 15.0, 19.0, 22.0, 26.0, 28.0, 19.0, 19.0, 43.0, 30.0, 35.0, 52.0, 43.0, 48.0, 53.0, 49.0, 41.0, 32.0, 38.0, 43.0, 29.0, 32.0, 32.0, 38.0, 20.0, 29.0, 22.0, 19.0, 16.0, 9.0, 9.0, 7.0, 7.0, 8.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.117353439331055, -12.66727352142334, -12.217193603515625, -11.76711368560791, -11.317033767700195, -10.86695384979248, -10.416873931884766, -9.966794967651367, -9.516714096069336, -9.066634178161621, -8.616554260253906, -8.166474342346191, -7.716394424438477, -7.266314506530762, -6.816235065460205, -6.36615514755249, -5.916075706481934, -5.465995788574219, -5.015915870666504, -4.565835952758789, -4.115756034851074, -3.6656763553619385, -3.2155966758728027, -2.765516757965088, -2.315436840057373, -1.8653569221496582, -1.415277123451233, -0.9651973247528076, -0.5151174068450928, -0.06503748893737793, 0.3850421905517578, 0.8351221084594727, 1.285201072692871, 1.735280990600586, 2.185360908508301, 2.6354405879974365, 3.0855205059051514, 3.535600423812866, 3.985680103302002, 4.435760021209717, 4.885839939117432, 5.3359198570251465, 5.785999774932861, 6.236079216003418, 6.686159133911133, 7.136239051818848, 7.5863189697265625, 8.036398887634277, 8.486478805541992, 8.936558723449707, 9.386638641357422, 9.836718559265137, 10.286798477172852, 10.736878395080566, 11.186958312988281, 11.63703727722168, 12.087118148803711, 12.537198066711426, 12.98727798461914, 13.437357902526855, 13.88743782043457, 14.337517738342285, 14.78759765625, 15.237676620483398, 15.687756538391113]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 4.0, 9.0, 9.0, 20.0, 20.0, 46.0, 56.0, 79.0, 151.0, 195.0, 279.0, 421.0, 626.0, 846.0, 1345.0, 1980.0, 2747.0, 4177.0, 6395.0, 9714.0, 14791.0, 22943.0, 37449.0, 60720.0, 98337.0, 155480.0, 201441.0, 158144.0, 100877.0, 61992.0, 38435.0, 24052.0, 15228.0, 9752.0, 6616.0, 4284.0, 2919.0, 1885.0, 1343.0, 910.0, 595.0, 384.0, 284.0, 185.0, 129.0, 83.0, 64.0, 38.0, 24.0, 17.0, 19.0, 11.0, 5.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.533203125, -1.4874725341796875, -1.441741943359375, -1.3960113525390625, -1.35028076171875, -1.3045501708984375, -1.258819580078125, -1.2130889892578125, -1.1673583984375, -1.1216278076171875, -1.075897216796875, -1.0301666259765625, -0.98443603515625, -0.9387054443359375, -0.892974853515625, -0.8472442626953125, -0.801513671875, -0.7557830810546875, -0.710052490234375, -0.6643218994140625, -0.61859130859375, -0.5728607177734375, -0.527130126953125, -0.4813995361328125, -0.4356689453125, -0.3899383544921875, -0.344207763671875, -0.2984771728515625, -0.25274658203125, -0.2070159912109375, -0.161285400390625, -0.1155548095703125, -0.06982421875, -0.0240936279296875, 0.021636962890625, 0.0673675537109375, 0.11309814453125, 0.1588287353515625, 0.204559326171875, 0.2502899169921875, 0.2960205078125, 0.3417510986328125, 0.387481689453125, 0.4332122802734375, 0.47894287109375, 0.5246734619140625, 0.570404052734375, 0.6161346435546875, 0.661865234375, 0.7075958251953125, 0.753326416015625, 0.7990570068359375, 0.84478759765625, 0.8905181884765625, 0.936248779296875, 0.9819793701171875, 1.0277099609375, 1.0734405517578125, 1.119171142578125, 1.1649017333984375, 1.21063232421875, 1.2563629150390625, 1.302093505859375, 1.3478240966796875, 1.3935546875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 5.0, 6.0, 8.0, 9.0, 11.0, 17.0, 14.0, 18.0, 22.0, 24.0, 25.0, 23.0, 30.0, 28.0, 45.0, 33.0, 50.0, 54.0, 49.0, 37.0, 49.0, 41.0, 40.0, 39.0, 32.0, 37.0, 33.0, 36.0, 21.0, 28.0, 29.0, 19.0, 13.0, 20.0, 8.0, 7.0, 7.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.515625, -13.0576171875, -12.599609375, -12.1416015625, -11.68359375, -11.2255859375, -10.767578125, -10.3095703125, -9.8515625, -9.3935546875, -8.935546875, -8.4775390625, -8.01953125, -7.5615234375, -7.103515625, -6.6455078125, -6.1875, -5.7294921875, -5.271484375, -4.8134765625, -4.35546875, -3.8974609375, -3.439453125, -2.9814453125, -2.5234375, -2.0654296875, -1.607421875, -1.1494140625, -0.69140625, -0.2333984375, 0.224609375, 0.6826171875, 1.140625, 1.5986328125, 2.056640625, 2.5146484375, 2.97265625, 3.4306640625, 3.888671875, 4.3466796875, 4.8046875, 5.2626953125, 5.720703125, 6.1787109375, 6.63671875, 7.0947265625, 7.552734375, 8.0107421875, 8.46875, 8.9267578125, 9.384765625, 9.8427734375, 10.30078125, 10.7587890625, 11.216796875, 11.6748046875, 12.1328125, 12.5908203125, 13.048828125, 13.5068359375, 13.96484375, 14.4228515625, 14.880859375, 15.3388671875, 15.796875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 11.0, 19.0, 30.0, 50.0, 70.0, 117.0, 155.0, 279.0, 519.0, 785.0, 1330.0, 2417.0, 4124.0, 7227.0, 12469.0, 22017.0, 38721.0, 67150.0, 114220.0, 187661.0, 226902.0, 150211.0, 90355.0, 52004.0, 29814.0, 16865.0, 9728.0, 5509.0, 3147.0, 1903.0, 1060.0, 603.0, 391.0, 245.0, 151.0, 100.0, 68.0, 50.0, 24.0, 14.0, 6.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.763671875, -1.705413818359375, -1.64715576171875, -1.588897705078125, -1.5306396484375, -1.472381591796875, -1.41412353515625, -1.355865478515625, -1.297607421875, -1.239349365234375, -1.18109130859375, -1.122833251953125, -1.0645751953125, -1.006317138671875, -0.94805908203125, -0.889801025390625, -0.83154296875, -0.773284912109375, -0.71502685546875, -0.656768798828125, -0.5985107421875, -0.540252685546875, -0.48199462890625, -0.423736572265625, -0.365478515625, -0.307220458984375, -0.24896240234375, -0.190704345703125, -0.1324462890625, -0.074188232421875, -0.01593017578125, 0.042327880859375, 0.1005859375, 0.158843994140625, 0.21710205078125, 0.275360107421875, 0.3336181640625, 0.391876220703125, 0.45013427734375, 0.508392333984375, 0.566650390625, 0.624908447265625, 0.68316650390625, 0.741424560546875, 0.7996826171875, 0.857940673828125, 0.91619873046875, 0.974456787109375, 1.03271484375, 1.090972900390625, 1.14923095703125, 1.207489013671875, 1.2657470703125, 1.324005126953125, 1.38226318359375, 1.440521240234375, 1.498779296875, 1.557037353515625, 1.61529541015625, 1.673553466796875, 1.7318115234375, 1.790069580078125, 1.84832763671875, 1.906585693359375, 1.96484375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 15.0, 11.0, 11.0, 20.0, 16.0, 20.0, 29.0, 18.0, 25.0, 23.0, 32.0, 35.0, 39.0, 41.0, 48.0, 36.0, 42.0, 57.0, 38.0, 37.0, 32.0, 47.0, 42.0, 38.0, 32.0, 30.0, 26.0, 25.0, 15.0, 30.0, 17.0, 15.0, 11.0, 8.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.9139404296875, -7.632568359375, -7.3511962890625, -7.06982421875, -6.7884521484375, -6.507080078125, -6.2257080078125, -5.9443359375, -5.6629638671875, -5.381591796875, -5.1002197265625, -4.81884765625, -4.5374755859375, -4.256103515625, -3.9747314453125, -3.693359375, -3.4119873046875, -3.130615234375, -2.8492431640625, -2.56787109375, -2.2864990234375, -2.005126953125, -1.7237548828125, -1.4423828125, -1.1610107421875, -0.879638671875, -0.5982666015625, -0.31689453125, -0.0355224609375, 0.245849609375, 0.5272216796875, 0.80859375, 1.0899658203125, 1.371337890625, 1.6527099609375, 1.93408203125, 2.2154541015625, 2.496826171875, 2.7781982421875, 3.0595703125, 3.3409423828125, 3.622314453125, 3.9036865234375, 4.18505859375, 4.4664306640625, 4.747802734375, 5.0291748046875, 5.310546875, 5.5919189453125, 5.873291015625, 6.1546630859375, 6.43603515625, 6.7174072265625, 6.998779296875, 7.2801513671875, 7.5615234375, 7.8428955078125, 8.124267578125, 8.4056396484375, 8.68701171875, 8.9683837890625, 9.249755859375, 9.5311279296875, 9.8125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 7.0, 15.0, 11.0, 20.0, 26.0, 38.0, 50.0, 78.0, 100.0, 145.0, 219.0, 268.0, 439.0, 639.0, 1003.0, 1463.0, 2349.0, 3772.0, 6407.0, 10990.0, 21270.0, 47469.0, 120776.0, 333907.0, 301394.0, 106813.0, 42611.0, 19928.0, 10491.0, 5749.0, 3579.0, 2124.0, 1419.0, 953.0, 642.0, 397.0, 305.0, 209.0, 150.0, 89.0, 57.0, 63.0, 33.0, 30.0, 15.0, 10.0, 12.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.250213623046875, -0.24212646484375, -0.234039306640625, -0.2259521484375, -0.217864990234375, -0.20977783203125, -0.201690673828125, -0.193603515625, -0.185516357421875, -0.17742919921875, -0.169342041015625, -0.1612548828125, -0.153167724609375, -0.14508056640625, -0.136993408203125, -0.12890625, -0.120819091796875, -0.11273193359375, -0.104644775390625, -0.0965576171875, -0.088470458984375, -0.08038330078125, -0.072296142578125, -0.064208984375, -0.056121826171875, -0.04803466796875, -0.039947509765625, -0.0318603515625, -0.023773193359375, -0.01568603515625, -0.007598876953125, 0.00048828125, 0.008575439453125, 0.01666259765625, 0.024749755859375, 0.0328369140625, 0.040924072265625, 0.04901123046875, 0.057098388671875, 0.065185546875, 0.073272705078125, 0.08135986328125, 0.089447021484375, 0.0975341796875, 0.105621337890625, 0.11370849609375, 0.121795654296875, 0.1298828125, 0.137969970703125, 0.14605712890625, 0.154144287109375, 0.1622314453125, 0.170318603515625, 0.17840576171875, 0.186492919921875, 0.194580078125, 0.202667236328125, 0.21075439453125, 0.218841552734375, 0.2269287109375, 0.235015869140625, 0.24310302734375, 0.251190185546875, 0.25927734375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 9.0, 12.0, 14.0, 13.0, 16.0, 30.0, 25.0, 30.0, 32.0, 36.0, 54.0, 36.0, 45.0, 60.0, 55.0, 52.0, 64.0, 62.0, 51.0, 45.0, 44.0, 36.0, 37.0, 26.0, 23.0, 22.0, 15.0, 12.0, 11.0, 9.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7940998077392578e-05, -1.7272308468818665e-05, -1.660361886024475e-05, -1.5934929251670837e-05, -1.5266239643096924e-05, -1.459755003452301e-05, -1.3928860425949097e-05, -1.3260170817375183e-05, -1.259148120880127e-05, -1.1922791600227356e-05, -1.1254101991653442e-05, -1.0585412383079529e-05, -9.916722774505615e-06, -9.248033165931702e-06, -8.579343557357788e-06, -7.910653948783875e-06, -7.241964340209961e-06, -6.573274731636047e-06, -5.904585123062134e-06, -5.23589551448822e-06, -4.567205905914307e-06, -3.898516297340393e-06, -3.2298266887664795e-06, -2.561137080192566e-06, -1.8924474716186523e-06, -1.2237578630447388e-06, -5.550682544708252e-07, 1.1362135410308838e-07, 7.82310962677002e-07, 1.4510005712509155e-06, 2.119690179824829e-06, 2.7883797883987427e-06, 3.4570693969726562e-06, 4.12575900554657e-06, 4.794448614120483e-06, 5.463138222694397e-06, 6.1318278312683105e-06, 6.800517439842224e-06, 7.469207048416138e-06, 8.137896656990051e-06, 8.806586265563965e-06, 9.475275874137878e-06, 1.0143965482711792e-05, 1.0812655091285706e-05, 1.1481344699859619e-05, 1.2150034308433533e-05, 1.2818723917007446e-05, 1.348741352558136e-05, 1.4156103134155273e-05, 1.4824792742729187e-05, 1.54934823513031e-05, 1.6162171959877014e-05, 1.6830861568450928e-05, 1.749955117702484e-05, 1.8168240785598755e-05, 1.883693039417267e-05, 1.9505620002746582e-05, 2.0174309611320496e-05, 2.084299921989441e-05, 2.1511688828468323e-05, 2.2180378437042236e-05, 2.284906804561615e-05, 2.3517757654190063e-05, 2.4186447262763977e-05, 2.485513687133789e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 10.0, 12.0, 27.0, 37.0, 44.0, 70.0, 102.0, 151.0, 206.0, 289.0, 444.0, 685.0, 1044.0, 1440.0, 2216.0, 3309.0, 5278.0, 8486.0, 13801.0, 23863.0, 42924.0, 83269.0, 174666.0, 293346.0, 191169.0, 89939.0, 45947.0, 25935.0, 14839.0, 8855.0, 5576.0, 3499.0, 2392.0, 1551.0, 952.0, 678.0, 470.0, 311.0, 238.0, 143.0, 112.0, 73.0, 54.0, 30.0, 20.0, 18.0, 9.0, 7.0, 3.0, 9.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.271728515625, -0.2628364562988281, -0.25394439697265625, -0.24505233764648438, -0.2361602783203125, -0.22726821899414062, -0.21837615966796875, -0.20948410034179688, -0.200592041015625, -0.19169998168945312, -0.18280792236328125, -0.17391586303710938, -0.1650238037109375, -0.15613174438476562, -0.14723968505859375, -0.13834762573242188, -0.12945556640625, -0.12056350708007812, -0.11167144775390625, -0.10277938842773438, -0.0938873291015625, -0.08499526977539062, -0.07610321044921875, -0.06721115112304688, -0.058319091796875, -0.049427032470703125, -0.04053497314453125, -0.031642913818359375, -0.0227508544921875, -0.013858795166015625, -0.00496673583984375, 0.003925323486328125, 0.0128173828125, 0.021709442138671875, 0.03060150146484375, 0.039493560791015625, 0.0483856201171875, 0.057277679443359375, 0.06616973876953125, 0.07506179809570312, 0.083953857421875, 0.09284591674804688, 0.10173797607421875, 0.11063003540039062, 0.1195220947265625, 0.12841415405273438, 0.13730621337890625, 0.14619827270507812, 0.15509033203125, 0.16398239135742188, 0.17287445068359375, 0.18176651000976562, 0.1906585693359375, 0.19955062866210938, 0.20844268798828125, 0.21733474731445312, 0.226226806640625, 0.23511886596679688, 0.24401092529296875, 0.2529029846191406, 0.2617950439453125, 0.2706871032714844, 0.27957916259765625, 0.2884712219238281, 0.29736328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 9.0, 18.0, 8.0, 16.0, 21.0, 28.0, 29.0, 46.0, 60.0, 57.0, 69.0, 68.0, 96.0, 76.0, 70.0, 62.0, 57.0, 48.0, 30.0, 28.0, 25.0, 13.0, 13.0, 10.0, 5.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.118896484375, -0.1151437759399414, -0.11139106750488281, -0.10763835906982422, -0.10388565063476562, -0.10013294219970703, -0.09638023376464844, -0.09262752532958984, -0.08887481689453125, -0.08512210845947266, -0.08136940002441406, -0.07761669158935547, -0.07386398315429688, -0.07011127471923828, -0.06635856628417969, -0.0626058578491211, -0.0588531494140625, -0.055100440979003906, -0.05134773254394531, -0.04759502410888672, -0.043842315673828125, -0.04008960723876953, -0.03633689880371094, -0.032584190368652344, -0.02883148193359375, -0.025078773498535156, -0.021326065063476562, -0.01757335662841797, -0.013820648193359375, -0.010067939758300781, -0.0063152313232421875, -0.0025625228881835938, 0.001190185546875, 0.004942893981933594, 0.008695602416992188, 0.012448310852050781, 0.016201019287109375, 0.01995372772216797, 0.023706436157226562, 0.027459144592285156, 0.03121185302734375, 0.034964561462402344, 0.03871726989746094, 0.04246997833251953, 0.046222686767578125, 0.04997539520263672, 0.05372810363769531, 0.057480812072753906, 0.0612335205078125, 0.0649862289428711, 0.06873893737792969, 0.07249164581298828, 0.07624435424804688, 0.07999706268310547, 0.08374977111816406, 0.08750247955322266, 0.09125518798828125, 0.09500789642333984, 0.09876060485839844, 0.10251331329345703, 0.10626602172851562, 0.11001873016357422, 0.11377143859863281, 0.1175241470336914, 0.12127685546875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 4.0, 6.0, 6.0, 3.0, 13.0, 10.0, 15.0, 13.0, 20.0, 16.0, 27.0, 29.0, 34.0, 37.0, 60.0, 58.0, 49.0, 67.0, 52.0, 62.0, 55.0, 56.0, 45.0, 41.0, 34.0, 35.0, 22.0, 30.0, 16.0, 15.0, 13.0, 10.0, 14.0, 7.0, 6.0, 9.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.500151634216309, -11.069215774536133, -10.63827896118164, -10.207343101501465, -9.776407241821289, -9.345471382141113, -8.914535522460938, -8.483598709106445, -8.05266284942627, -7.621726989746094, -7.19079065322876, -6.759854316711426, -6.32891845703125, -5.897982597351074, -5.46704626083374, -5.036109924316406, -4.6051740646362305, -4.174238204956055, -3.7433018684387207, -3.312365770339966, -2.881429672241211, -2.450493574142456, -2.019557476043701, -1.5886213779449463, -1.1576852798461914, -0.7267491817474365, -0.29581308364868164, 0.13512301445007324, 0.5660591125488281, 0.996995210647583, 1.427931308746338, 1.8588674068450928, 2.2898025512695312, 2.720738649368286, 3.151674747467041, 3.582610845565796, 4.013546943664551, 4.444482803344727, 4.8754191398620605, 5.3063554763793945, 5.73729133605957, 6.168227195739746, 6.59916353225708, 7.030099868774414, 7.46103572845459, 7.891971588134766, 8.322908401489258, 8.753844261169434, 9.18478012084961, 9.615715980529785, 10.046651840209961, 10.477588653564453, 10.908524513244629, 11.339460372924805, 11.770397186279297, 12.201333045959473, 12.632268905639648, 13.063204765319824, 13.494140625, 13.925077438354492, 14.356013298034668, 14.786949157714844, 15.217885971069336, 15.648821830749512, 16.079757690429688]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 9.0, 3.0, 5.0, 3.0, 8.0, 6.0, 14.0, 15.0, 15.0, 20.0, 22.0, 27.0, 27.0, 19.0, 25.0, 37.0, 32.0, 35.0, 50.0, 45.0, 47.0, 56.0, 47.0, 39.0, 34.0, 37.0, 41.0, 31.0, 31.0, 31.0, 37.0, 22.0, 30.0, 24.0, 17.0, 15.0, 8.0, 9.0, 8.0, 6.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.017990112304688, -12.567744255065918, -12.117498397827148, -11.667251586914062, -11.217005729675293, -10.766759872436523, -10.316514015197754, -9.866268157958984, -9.416021347045898, -8.965775489807129, -8.51552963256836, -8.065282821655273, -7.615036964416504, -7.164791107177734, -6.714545249938965, -6.264299392700195, -5.814053535461426, -5.363807678222656, -4.9135613441467285, -4.463315486907959, -4.013069152832031, -3.5628232955932617, -3.112577438354492, -2.6623313426971436, -2.212085247039795, -1.7618391513824463, -1.3115931749343872, -0.8613471984863281, -0.4111011028289795, 0.03914499282836914, 0.48939085006713867, 0.9396369457244873, 1.3898839950561523, 1.840130090713501, 2.2903761863708496, 2.740622043609619, 3.1908681392669678, 3.6411142349243164, 4.091360092163086, 4.5416059494018555, 4.991852283477783, 5.442098140716553, 5.8923444747924805, 6.34259033203125, 6.7928361892700195, 7.243082523345947, 7.693328380584717, 8.143574714660645, 8.593820571899414, 9.044066429138184, 9.494312286376953, 9.944559097290039, 10.394804954528809, 10.845050811767578, 11.295296669006348, 11.745542526245117, 12.195789337158203, 12.646035194396973, 13.096281051635742, 13.546527862548828, 13.996773719787598, 14.447019577026367, 14.897265434265137, 15.347511291503906, 15.797757148742676]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 9.0, 10.0, 14.0, 15.0, 30.0, 49.0, 79.0, 110.0, 179.0, 285.0, 457.0, 661.0, 1099.0, 1785.0, 2732.0, 4273.0, 6766.0, 10920.0, 16967.0, 26290.0, 39299.0, 56899.0, 78621.0, 101073.0, 119037.0, 124708.0, 117378.0, 99516.0, 76242.0, 55565.0, 37759.0, 24951.0, 16379.0, 10387.0, 6497.0, 4262.0, 2697.0, 1713.0, 1047.0, 669.0, 443.0, 250.0, 149.0, 103.0, 69.0, 40.0, 22.0, 18.0, 17.0, 12.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.2076416015625, -5.989501953125, -5.7713623046875, -5.55322265625, -5.3350830078125, -5.116943359375, -4.8988037109375, -4.6806640625, -4.4625244140625, -4.244384765625, -4.0262451171875, -3.80810546875, -3.5899658203125, -3.371826171875, -3.1536865234375, -2.935546875, -2.7174072265625, -2.499267578125, -2.2811279296875, -2.06298828125, -1.8448486328125, -1.626708984375, -1.4085693359375, -1.1904296875, -0.9722900390625, -0.754150390625, -0.5360107421875, -0.31787109375, -0.0997314453125, 0.118408203125, 0.3365478515625, 0.5546875, 0.7728271484375, 0.990966796875, 1.2091064453125, 1.42724609375, 1.6453857421875, 1.863525390625, 2.0816650390625, 2.2998046875, 2.5179443359375, 2.736083984375, 2.9542236328125, 3.17236328125, 3.3905029296875, 3.608642578125, 3.8267822265625, 4.044921875, 4.2630615234375, 4.481201171875, 4.6993408203125, 4.91748046875, 5.1356201171875, 5.353759765625, 5.5718994140625, 5.7900390625, 6.0081787109375, 6.226318359375, 6.4444580078125, 6.66259765625, 6.8807373046875, 7.098876953125, 7.3170166015625, 7.53515625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 4.0, 8.0, 5.0, 8.0, 8.0, 11.0, 18.0, 12.0, 24.0, 18.0, 19.0, 28.0, 27.0, 38.0, 41.0, 23.0, 31.0, 46.0, 43.0, 43.0, 42.0, 44.0, 47.0, 33.0, 37.0, 27.0, 25.0, 46.0, 34.0, 28.0, 22.0, 15.0, 21.0, 26.0, 11.0, 16.0, 14.0, 7.0, 6.0, 8.0, 5.0, 8.0, 3.0, 6.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.09375, -11.6724853515625, -11.251220703125, -10.8299560546875, -10.40869140625, -9.9874267578125, -9.566162109375, -9.1448974609375, -8.7236328125, -8.3023681640625, -7.881103515625, -7.4598388671875, -7.03857421875, -6.6173095703125, -6.196044921875, -5.7747802734375, -5.353515625, -4.9322509765625, -4.510986328125, -4.0897216796875, -3.66845703125, -3.2471923828125, -2.825927734375, -2.4046630859375, -1.9833984375, -1.5621337890625, -1.140869140625, -0.7196044921875, -0.29833984375, 0.1229248046875, 0.544189453125, 0.9654541015625, 1.38671875, 1.8079833984375, 2.229248046875, 2.6505126953125, 3.07177734375, 3.4930419921875, 3.914306640625, 4.3355712890625, 4.7568359375, 5.1781005859375, 5.599365234375, 6.0206298828125, 6.44189453125, 6.8631591796875, 7.284423828125, 7.7056884765625, 8.126953125, 8.5482177734375, 8.969482421875, 9.3907470703125, 9.81201171875, 10.2332763671875, 10.654541015625, 11.0758056640625, 11.4970703125, 11.9183349609375, 12.339599609375, 12.7608642578125, 13.18212890625, 13.6033935546875, 14.024658203125, 14.4459228515625, 14.8671875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 11.0, 14.0, 12.0, 26.0, 37.0, 60.0, 93.0, 154.0, 237.0, 356.0, 549.0, 870.0, 1453.0, 2298.0, 3717.0, 5846.0, 9445.0, 14923.0, 22873.0, 34343.0, 50239.0, 69351.0, 90200.0, 108597.0, 119422.0, 117964.0, 105944.0, 86737.0, 65373.0, 47266.0, 31918.0, 21273.0, 13854.0, 8586.0, 5418.0, 3434.0, 2146.0, 1287.0, 806.0, 485.0, 341.0, 219.0, 144.0, 96.0, 60.0, 25.0, 15.0, 14.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.9453125, -6.7276611328125, -6.510009765625, -6.2923583984375, -6.07470703125, -5.8570556640625, -5.639404296875, -5.4217529296875, -5.2041015625, -4.9864501953125, -4.768798828125, -4.5511474609375, -4.33349609375, -4.1158447265625, -3.898193359375, -3.6805419921875, -3.462890625, -3.2452392578125, -3.027587890625, -2.8099365234375, -2.59228515625, -2.3746337890625, -2.156982421875, -1.9393310546875, -1.7216796875, -1.5040283203125, -1.286376953125, -1.0687255859375, -0.85107421875, -0.6334228515625, -0.415771484375, -0.1981201171875, 0.01953125, 0.2371826171875, 0.454833984375, 0.6724853515625, 0.89013671875, 1.1077880859375, 1.325439453125, 1.5430908203125, 1.7607421875, 1.9783935546875, 2.196044921875, 2.4136962890625, 2.63134765625, 2.8489990234375, 3.066650390625, 3.2843017578125, 3.501953125, 3.7196044921875, 3.937255859375, 4.1549072265625, 4.37255859375, 4.5902099609375, 4.807861328125, 5.0255126953125, 5.2431640625, 5.4608154296875, 5.678466796875, 5.8961181640625, 6.11376953125, 6.3314208984375, 6.549072265625, 6.7667236328125, 6.984375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 8.0, 10.0, 16.0, 4.0, 18.0, 14.0, 10.0, 20.0, 19.0, 24.0, 19.0, 27.0, 35.0, 32.0, 41.0, 30.0, 53.0, 49.0, 41.0, 38.0, 38.0, 29.0, 41.0, 42.0, 39.0, 38.0, 43.0, 31.0, 23.0, 21.0, 23.0, 22.0, 18.0, 18.0, 15.0, 12.0, 8.0, 5.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.83203125, -7.55206298828125, -7.2720947265625, -6.99212646484375, -6.712158203125, -6.43218994140625, -6.1522216796875, -5.87225341796875, -5.59228515625, -5.31231689453125, -5.0323486328125, -4.75238037109375, -4.472412109375, -4.19244384765625, -3.9124755859375, -3.63250732421875, -3.3525390625, -3.07257080078125, -2.7926025390625, -2.51263427734375, -2.232666015625, -1.95269775390625, -1.6727294921875, -1.39276123046875, -1.11279296875, -0.83282470703125, -0.5528564453125, -0.27288818359375, 0.007080078125, 0.28704833984375, 0.5670166015625, 0.84698486328125, 1.126953125, 1.40692138671875, 1.6868896484375, 1.96685791015625, 2.246826171875, 2.52679443359375, 2.8067626953125, 3.08673095703125, 3.36669921875, 3.64666748046875, 3.9266357421875, 4.20660400390625, 4.486572265625, 4.76654052734375, 5.0465087890625, 5.32647705078125, 5.6064453125, 5.88641357421875, 6.1663818359375, 6.44635009765625, 6.726318359375, 7.00628662109375, 7.2862548828125, 7.56622314453125, 7.84619140625, 8.12615966796875, 8.4061279296875, 8.68609619140625, 8.966064453125, 9.24603271484375, 9.5260009765625, 9.80596923828125, 10.0859375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 13.0, 8.0, 15.0, 29.0, 50.0, 55.0, 99.0, 161.0, 213.0, 359.0, 530.0, 871.0, 1462.0, 2412.0, 3647.0, 5878.0, 9490.0, 14824.0, 23260.0, 34833.0, 50770.0, 70017.0, 90680.0, 108339.0, 119156.0, 117560.0, 105415.0, 86617.0, 65800.0, 47074.0, 31844.0, 20766.0, 13587.0, 8434.0, 5420.0, 3255.0, 2059.0, 1329.0, 768.0, 491.0, 347.0, 204.0, 141.0, 102.0, 52.0, 47.0, 29.0, 12.0, 13.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.52734375, -2.45050048828125, -2.3736572265625, -2.29681396484375, -2.219970703125, -2.14312744140625, -2.0662841796875, -1.98944091796875, -1.91259765625, -1.83575439453125, -1.7589111328125, -1.68206787109375, -1.605224609375, -1.52838134765625, -1.4515380859375, -1.37469482421875, -1.2978515625, -1.22100830078125, -1.1441650390625, -1.06732177734375, -0.990478515625, -0.91363525390625, -0.8367919921875, -0.75994873046875, -0.68310546875, -0.60626220703125, -0.5294189453125, -0.45257568359375, -0.375732421875, -0.29888916015625, -0.2220458984375, -0.14520263671875, -0.068359375, 0.00848388671875, 0.0853271484375, 0.16217041015625, 0.239013671875, 0.31585693359375, 0.3927001953125, 0.46954345703125, 0.54638671875, 0.62322998046875, 0.7000732421875, 0.77691650390625, 0.853759765625, 0.93060302734375, 1.0074462890625, 1.08428955078125, 1.1611328125, 1.23797607421875, 1.3148193359375, 1.39166259765625, 1.468505859375, 1.54534912109375, 1.6221923828125, 1.69903564453125, 1.77587890625, 1.85272216796875, 1.9295654296875, 2.00640869140625, 2.083251953125, 2.16009521484375, 2.2369384765625, 2.31378173828125, 2.390625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 3.0, 3.0, 4.0, 10.0, 9.0, 10.0, 16.0, 23.0, 23.0, 31.0, 23.0, 37.0, 37.0, 48.0, 40.0, 59.0, 53.0, 40.0, 57.0, 55.0, 53.0, 44.0, 37.0, 47.0, 36.0, 30.0, 33.0, 28.0, 27.0, 16.0, 18.0, 10.0, 10.0, 6.0, 7.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00028204917907714844, -0.00027300044894218445, -0.00026395171880722046, -0.00025490298867225647, -0.0002458542585372925, -0.0002368055284023285, -0.0002277567982673645, -0.0002187080681324005, -0.00020965933799743652, -0.00020061060786247253, -0.00019156187772750854, -0.00018251314759254456, -0.00017346441745758057, -0.00016441568732261658, -0.0001553669571876526, -0.0001463182270526886, -0.0001372694969177246, -0.00012822076678276062, -0.00011917203664779663, -0.00011012330651283264, -0.00010107457637786865, -9.202584624290466e-05, -8.297711610794067e-05, -7.392838597297668e-05, -6.48796558380127e-05, -5.5830925703048706e-05, -4.678219556808472e-05, -3.773346543312073e-05, -2.8684735298156738e-05, -1.963600516319275e-05, -1.058727502822876e-05, -1.5385448932647705e-06, 7.510185241699219e-06, 1.6558915376663208e-05, 2.5607645511627197e-05, 3.4656375646591187e-05, 4.3705105781555176e-05, 5.2753835916519165e-05, 6.180256605148315e-05, 7.085129618644714e-05, 7.990002632141113e-05, 8.894875645637512e-05, 9.799748659133911e-05, 0.0001070462167263031, 0.00011609494686126709, 0.00012514367699623108, 0.00013419240713119507, 0.00014324113726615906, 0.00015228986740112305, 0.00016133859753608704, 0.00017038732767105103, 0.00017943605780601501, 0.000188484787940979, 0.000197533518075943, 0.00020658224821090698, 0.00021563097834587097, 0.00022467970848083496, 0.00023372843861579895, 0.00024277716875076294, 0.00025182589888572693, 0.0002608746290206909, 0.0002699233591556549, 0.0002789720892906189, 0.0002880208194255829, 0.0002970695495605469]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 8.0, 5.0, 11.0, 17.0, 25.0, 56.0, 85.0, 133.0, 242.0, 377.0, 594.0, 1024.0, 1587.0, 2681.0, 4369.0, 7396.0, 12473.0, 20377.0, 32713.0, 51315.0, 76146.0, 103983.0, 128844.0, 139798.0, 131941.0, 108758.0, 79507.0, 54592.0, 34747.0, 21546.0, 13166.0, 8009.0, 4694.0, 2884.0, 1717.0, 1071.0, 623.0, 398.0, 249.0, 140.0, 82.0, 68.0, 40.0, 21.0, 13.0, 15.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.92578125, -2.833099365234375, -2.74041748046875, -2.647735595703125, -2.5550537109375, -2.462371826171875, -2.36968994140625, -2.277008056640625, -2.184326171875, -2.091644287109375, -1.99896240234375, -1.906280517578125, -1.8135986328125, -1.720916748046875, -1.62823486328125, -1.535552978515625, -1.44287109375, -1.350189208984375, -1.25750732421875, -1.164825439453125, -1.0721435546875, -0.979461669921875, -0.88677978515625, -0.794097900390625, -0.701416015625, -0.608734130859375, -0.51605224609375, -0.423370361328125, -0.3306884765625, -0.238006591796875, -0.14532470703125, -0.052642822265625, 0.0400390625, 0.132720947265625, 0.22540283203125, 0.318084716796875, 0.4107666015625, 0.503448486328125, 0.59613037109375, 0.688812255859375, 0.781494140625, 0.874176025390625, 0.96685791015625, 1.059539794921875, 1.1522216796875, 1.244903564453125, 1.33758544921875, 1.430267333984375, 1.52294921875, 1.615631103515625, 1.70831298828125, 1.800994873046875, 1.8936767578125, 1.986358642578125, 2.07904052734375, 2.171722412109375, 2.264404296875, 2.357086181640625, 2.44976806640625, 2.542449951171875, 2.6351318359375, 2.727813720703125, 2.82049560546875, 2.913177490234375, 3.005859375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 2.0, 8.0, 12.0, 9.0, 10.0, 18.0, 24.0, 36.0, 34.0, 39.0, 33.0, 61.0, 46.0, 48.0, 62.0, 51.0, 79.0, 56.0, 52.0, 49.0, 48.0, 41.0, 28.0, 26.0, 31.0, 23.0, 20.0, 15.0, 7.0, 9.0, 7.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4443359375, -1.400482177734375, -1.35662841796875, -1.312774658203125, -1.2689208984375, -1.225067138671875, -1.18121337890625, -1.137359619140625, -1.093505859375, -1.049652099609375, -1.00579833984375, -0.961944580078125, -0.9180908203125, -0.874237060546875, -0.83038330078125, -0.786529541015625, -0.74267578125, -0.698822021484375, -0.65496826171875, -0.611114501953125, -0.5672607421875, -0.523406982421875, -0.47955322265625, -0.435699462890625, -0.391845703125, -0.347991943359375, -0.30413818359375, -0.260284423828125, -0.2164306640625, -0.172576904296875, -0.12872314453125, -0.084869384765625, -0.041015625, 0.002838134765625, 0.04669189453125, 0.090545654296875, 0.1343994140625, 0.178253173828125, 0.22210693359375, 0.265960693359375, 0.309814453125, 0.353668212890625, 0.39752197265625, 0.441375732421875, 0.4852294921875, 0.529083251953125, 0.57293701171875, 0.616790771484375, 0.66064453125, 0.704498291015625, 0.74835205078125, 0.792205810546875, 0.8360595703125, 0.879913330078125, 0.92376708984375, 0.967620849609375, 1.011474609375, 1.055328369140625, 1.09918212890625, 1.143035888671875, 1.1868896484375, 1.230743408203125, 1.27459716796875, 1.318450927734375, 1.3623046875]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 9.0, 10.0, 5.0, 8.0, 16.0, 20.0, 20.0, 20.0, 27.0, 28.0, 37.0, 40.0, 59.0, 65.0, 60.0, 57.0, 60.0, 52.0, 61.0, 52.0, 42.0, 37.0, 32.0, 31.0, 24.0, 31.0, 12.0, 15.0, 13.0, 15.0, 10.0, 3.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8134126663208, -10.368483543395996, -9.923553466796875, -9.47862434387207, -9.03369426727295, -8.588765144348145, -8.143835067749023, -7.698905944824219, -7.253976345062256, -6.809046745300293, -6.36411714553833, -5.919187545776367, -5.4742584228515625, -5.029328346252441, -4.584399223327637, -4.139469623565674, -3.694540023803711, -3.249610424041748, -2.804680824279785, -2.3597514629364014, -1.9148218631744385, -1.4698922634124756, -1.0249629020690918, -0.5800333023071289, -0.13510370254516602, 0.3098258376121521, 0.7547553777694702, 1.1996848583221436, 1.6446144580841064, 2.0895440578460693, 2.534473419189453, 2.979403018951416, 3.4243335723876953, 3.869263172149658, 4.314192771911621, 4.759121894836426, 5.204051971435547, 5.648981094360352, 6.0939106941223145, 6.538840293884277, 6.98376989364624, 7.428699493408203, 7.873629093170166, 8.318558692932129, 8.763487815856934, 9.208417892456055, 9.65334701538086, 10.098276138305664, 10.543206214904785, 10.98813533782959, 11.433065414428711, 11.877994537353516, 12.322924613952637, 12.767853736877441, 13.212783813476562, 13.657712936401367, 14.102642059326172, 14.547571182250977, 14.992501258850098, 15.437430381774902, 15.882360458374023, 16.327289581298828, 16.772218704223633, 17.217147827148438, 17.662078857421875]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 6.0, 5.0, 7.0, 9.0, 9.0, 8.0, 13.0, 23.0, 26.0, 29.0, 21.0, 27.0, 30.0, 32.0, 37.0, 43.0, 42.0, 28.0, 40.0, 54.0, 32.0, 59.0, 42.0, 40.0, 26.0, 38.0, 30.0, 24.0, 35.0, 25.0, 21.0, 35.0, 17.0, 21.0, 12.0, 10.0, 9.0, 4.0, 4.0, 6.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.13102912902832, -12.675093650817871, -12.219158172607422, -11.763222694396973, -11.307287216186523, -10.85135269165039, -10.395417213439941, -9.939481735229492, -9.483546257019043, -9.027610778808594, -8.571675300598145, -8.115739822387695, -7.659804821014404, -7.203869342803955, -6.747934341430664, -6.291998863220215, -5.836063385009766, -5.380127906799316, -4.924192428588867, -4.468257427215576, -4.012321949005127, -3.5563864707946777, -3.1004512310028076, -2.6445159912109375, -2.1885805130004883, -1.7326451539993286, -1.276709794998169, -0.8207744359970093, -0.3648390769958496, 0.09109640121459961, 0.5470316410064697, 1.0029668807983398, 1.458902359008789, 1.9148377180099487, 2.3707730770111084, 2.8267083168029785, 3.2826437950134277, 3.738579273223877, 4.194514274597168, 4.650449752807617, 5.106385231018066, 5.562320709228516, 6.018256187438965, 6.474191188812256, 6.930126667022705, 7.386062145233154, 7.841997146606445, 8.297932624816895, 8.753868103027344, 9.209803581237793, 9.665739059448242, 10.121674537658691, 10.57761001586914, 11.033544540405273, 11.489480018615723, 11.945415496826172, 12.401350975036621, 12.85728645324707, 13.31322193145752, 13.769157409667969, 14.225091934204102, 14.681028366088867, 15.136962890625, 15.59289836883545, 16.0488338470459]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 21.0, 19.0, 61.0, 91.0, 131.0, 226.0, 379.0, 572.0, 996.0, 1598.0, 2646.0, 4341.0, 6872.0, 11124.0, 18313.0, 29430.0, 47716.0, 77063.0, 121230.0, 187040.0, 277961.0, 388645.0, 495808.0, 554337.0, 535997.0, 449831.0, 338314.0, 235568.0, 155211.0, 97393.0, 60838.0, 37134.0, 22364.0, 13674.0, 8225.0, 4864.0, 3159.0, 1864.0, 1211.0, 716.0, 449.0, 296.0, 202.0, 117.0, 73.0, 46.0, 35.0, 28.0, 17.0, 8.0, 9.0, 5.0, 6.0, 3.0, 2.0, 4.0], "bins": [-10.6875, -10.3509521484375, -10.014404296875, -9.6778564453125, -9.34130859375, -9.0047607421875, -8.668212890625, -8.3316650390625, -7.9951171875, -7.6585693359375, -7.322021484375, -6.9854736328125, -6.64892578125, -6.3123779296875, -5.975830078125, -5.6392822265625, -5.302734375, -4.9661865234375, -4.629638671875, -4.2930908203125, -3.95654296875, -3.6199951171875, -3.283447265625, -2.9468994140625, -2.6103515625, -2.2738037109375, -1.937255859375, -1.6007080078125, -1.26416015625, -0.9276123046875, -0.591064453125, -0.2545166015625, 0.08203125, 0.4185791015625, 0.755126953125, 1.0916748046875, 1.42822265625, 1.7647705078125, 2.101318359375, 2.4378662109375, 2.7744140625, 3.1109619140625, 3.447509765625, 3.7840576171875, 4.12060546875, 4.4571533203125, 4.793701171875, 5.1302490234375, 5.466796875, 5.8033447265625, 6.139892578125, 6.4764404296875, 6.81298828125, 7.1495361328125, 7.486083984375, 7.8226318359375, 8.1591796875, 8.4957275390625, 8.832275390625, 9.1688232421875, 9.50537109375, 9.8419189453125, 10.178466796875, 10.5150146484375, 10.8515625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 3.0, 11.0, 12.0, 12.0, 11.0, 15.0, 21.0, 20.0, 16.0, 26.0, 31.0, 29.0, 37.0, 25.0, 39.0, 39.0, 27.0, 58.0, 30.0, 40.0, 42.0, 36.0, 47.0, 41.0, 42.0, 37.0, 26.0, 23.0, 27.0, 24.0, 27.0, 25.0, 16.0, 16.0, 13.0, 7.0, 8.0, 6.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-10.859375, -10.4898681640625, -10.120361328125, -9.7508544921875, -9.38134765625, -9.0118408203125, -8.642333984375, -8.2728271484375, -7.9033203125, -7.5338134765625, -7.164306640625, -6.7947998046875, -6.42529296875, -6.0557861328125, -5.686279296875, -5.3167724609375, -4.947265625, -4.5777587890625, -4.208251953125, -3.8387451171875, -3.46923828125, -3.0997314453125, -2.730224609375, -2.3607177734375, -1.9912109375, -1.6217041015625, -1.252197265625, -0.8826904296875, -0.51318359375, -0.1436767578125, 0.225830078125, 0.5953369140625, 0.96484375, 1.3343505859375, 1.703857421875, 2.0733642578125, 2.44287109375, 2.8123779296875, 3.181884765625, 3.5513916015625, 3.9208984375, 4.2904052734375, 4.659912109375, 5.0294189453125, 5.39892578125, 5.7684326171875, 6.137939453125, 6.5074462890625, 6.876953125, 7.2464599609375, 7.615966796875, 7.9854736328125, 8.35498046875, 8.7244873046875, 9.093994140625, 9.4635009765625, 9.8330078125, 10.2025146484375, 10.572021484375, 10.9415283203125, 11.31103515625, 11.6805419921875, 12.050048828125, 12.4195556640625, 12.7890625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 8.0, 4.0, 5.0, 9.0, 17.0, 28.0, 44.0, 82.0, 115.0, 149.0, 294.0, 452.0, 773.0, 1221.0, 2158.0, 3795.0, 6554.0, 11010.0, 18894.0, 32321.0, 54598.0, 91574.0, 148890.0, 232315.0, 339180.0, 452660.0, 540943.0, 563354.0, 507874.0, 403802.0, 289146.0, 192011.0, 121421.0, 73664.0, 43625.0, 25164.0, 14978.0, 8773.0, 5079.0, 2892.0, 1788.0, 1009.0, 619.0, 384.0, 245.0, 154.0, 80.0, 57.0, 36.0, 19.0, 13.0, 1.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.828125, -11.4375, -11.046875, -10.65625, -10.265625, -9.875, -9.484375, -9.09375, -8.703125, -8.3125, -7.921875, -7.53125, -7.140625, -6.75, -6.359375, -5.96875, -5.578125, -5.1875, -4.796875, -4.40625, -4.015625, -3.625, -3.234375, -2.84375, -2.453125, -2.0625, -1.671875, -1.28125, -0.890625, -0.5, -0.109375, 0.28125, 0.671875, 1.0625, 1.453125, 1.84375, 2.234375, 2.625, 3.015625, 3.40625, 3.796875, 4.1875, 4.578125, 4.96875, 5.359375, 5.75, 6.140625, 6.53125, 6.921875, 7.3125, 7.703125, 8.09375, 8.484375, 8.875, 9.265625, 9.65625, 10.046875, 10.4375, 10.828125, 11.21875, 11.609375, 12.0, 12.390625, 12.78125, 13.171875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 9.0, 6.0, 10.0, 23.0, 27.0, 27.0, 37.0, 48.0, 64.0, 67.0, 103.0, 102.0, 139.0, 161.0, 170.0, 194.0, 262.0, 230.0, 232.0, 271.0, 226.0, 228.0, 206.0, 179.0, 175.0, 150.0, 123.0, 124.0, 104.0, 89.0, 62.0, 45.0, 36.0, 31.0, 25.0, 19.0, 20.0, 14.0, 12.0, 6.0, 7.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.43359375, -6.22174072265625, -6.0098876953125, -5.79803466796875, -5.586181640625, -5.37432861328125, -5.1624755859375, -4.95062255859375, -4.73876953125, -4.52691650390625, -4.3150634765625, -4.10321044921875, -3.891357421875, -3.67950439453125, -3.4676513671875, -3.25579833984375, -3.0439453125, -2.83209228515625, -2.6202392578125, -2.40838623046875, -2.196533203125, -1.98468017578125, -1.7728271484375, -1.56097412109375, -1.34912109375, -1.13726806640625, -0.9254150390625, -0.71356201171875, -0.501708984375, -0.28985595703125, -0.0780029296875, 0.13385009765625, 0.345703125, 0.55755615234375, 0.7694091796875, 0.98126220703125, 1.193115234375, 1.40496826171875, 1.6168212890625, 1.82867431640625, 2.04052734375, 2.25238037109375, 2.4642333984375, 2.67608642578125, 2.887939453125, 3.09979248046875, 3.3116455078125, 3.52349853515625, 3.7353515625, 3.94720458984375, 4.1590576171875, 4.37091064453125, 4.582763671875, 4.79461669921875, 5.0064697265625, 5.21832275390625, 5.43017578125, 5.64202880859375, 5.8538818359375, 6.06573486328125, 6.277587890625, 6.48944091796875, 6.7012939453125, 6.91314697265625, 7.125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 6.0, 7.0, 3.0, 4.0, 10.0, 7.0, 12.0, 14.0, 19.0, 22.0, 30.0, 22.0, 40.0, 49.0, 50.0, 63.0, 72.0, 70.0, 52.0, 73.0, 55.0, 47.0, 49.0, 39.0, 28.0, 26.0, 26.0, 17.0, 18.0, 18.0, 13.0, 11.0, 6.0, 6.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.496004104614258, -17.885887145996094, -17.275768280029297, -16.665651321411133, -16.05553436279297, -15.445415496826172, -14.835298538208008, -14.225180625915527, -13.615062713623047, -13.004944801330566, -12.394826889038086, -11.784709930419922, -11.174592018127441, -10.564474105834961, -9.954357147216797, -9.344239234924316, -8.734121322631836, -8.124003410339355, -7.513885974884033, -6.903768539428711, -6.2936506271362305, -5.68353271484375, -5.073415279388428, -4.4632978439331055, -3.853179931640625, -3.2430622577667236, -2.6329445838928223, -2.022826910018921, -1.4127092361450195, -0.8025915622711182, -0.1924738883972168, 0.41764354705810547, 1.0277595520019531, 1.6378772258758545, 2.247994899749756, 2.8581125736236572, 3.4682302474975586, 4.078348159790039, 4.688465595245361, 5.298583030700684, 5.908700942993164, 6.5188188552856445, 7.128936290740967, 7.739053726196289, 8.34917163848877, 8.95928955078125, 9.569406509399414, 10.179524421691895, 10.789642333984375, 11.399760246276855, 12.009878158569336, 12.6199951171875, 13.23011302947998, 13.840230941772461, 14.450347900390625, 15.060465812683105, 15.670583724975586, 16.28070068359375, 16.890819549560547, 17.50093650817871, 18.111053466796875, 18.721172332763672, 19.331289291381836, 19.94140625, 20.551525115966797]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 6.0, 22.0, 10.0, 17.0, 15.0, 22.0, 26.0, 25.0, 35.0, 34.0, 45.0, 45.0, 46.0, 36.0, 46.0, 38.0, 53.0, 48.0, 43.0, 37.0, 43.0, 52.0, 35.0, 27.0, 24.0, 14.0, 27.0, 24.0, 21.0, 14.0, 14.0, 12.0, 9.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.245445251464844, -16.63654136657715, -16.027637481689453, -15.418733596801758, -14.809828758239746, -14.20092487335205, -13.592020988464355, -12.983116149902344, -12.374212265014648, -11.765308380126953, -11.156404495239258, -10.547500610351562, -9.93859577178955, -9.329691886901855, -8.72078800201416, -8.111883163452148, -7.5029802322387695, -6.894076347351074, -6.285171985626221, -5.676268100738525, -5.067363739013672, -4.458459854125977, -3.8495559692382812, -3.2406516075134277, -2.6317477226257324, -2.022843599319458, -1.4139395952224731, -0.8050355911254883, -0.19613146781921387, 0.41277265548706055, 1.0216765403747559, 1.6305809020996094, 2.2394847869873047, 2.848388910293579, 3.4572930335998535, 4.066196918487549, 4.675101280212402, 5.284005165100098, 5.892909049987793, 6.5018134117126465, 7.110717296600342, 7.719621181488037, 8.32852554321289, 8.937429428100586, 9.546333312988281, 10.155237197875977, 10.764141082763672, 11.373045921325684, 11.981949806213379, 12.590853691101074, 13.19975757598877, 13.808662414550781, 14.417566299438477, 15.026470184326172, 15.635374069213867, 16.244277954101562, 16.853181838989258, 17.462085723876953, 18.07098960876465, 18.679893493652344, 19.28879737854004, 19.897701263427734, 20.506607055664062, 21.115510940551758, 21.724414825439453]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 4.0, 18.0, 19.0, 24.0, 32.0, 62.0, 95.0, 145.0, 183.0, 295.0, 452.0, 683.0, 1019.0, 1614.0, 2470.0, 3719.0, 5765.0, 9052.0, 14107.0, 22575.0, 36192.0, 58744.0, 97054.0, 154841.0, 206768.0, 162776.0, 102475.0, 62969.0, 38601.0, 23955.0, 14971.0, 9505.0, 6027.0, 3973.0, 2499.0, 1658.0, 1093.0, 698.0, 455.0, 333.0, 209.0, 135.0, 108.0, 83.0, 38.0, 17.0, 20.0, 9.0, 10.0, 4.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.931640625, -1.8704376220703125, -1.809234619140625, -1.7480316162109375, -1.68682861328125, -1.6256256103515625, -1.564422607421875, -1.5032196044921875, -1.4420166015625, -1.3808135986328125, -1.319610595703125, -1.2584075927734375, -1.19720458984375, -1.1360015869140625, -1.074798583984375, -1.0135955810546875, -0.952392578125, -0.8911895751953125, -0.829986572265625, -0.7687835693359375, -0.70758056640625, -0.6463775634765625, -0.585174560546875, -0.5239715576171875, -0.4627685546875, -0.4015655517578125, -0.340362548828125, -0.2791595458984375, -0.21795654296875, -0.1567535400390625, -0.095550537109375, -0.0343475341796875, 0.02685546875, 0.0880584716796875, 0.149261474609375, 0.2104644775390625, 0.27166748046875, 0.3328704833984375, 0.394073486328125, 0.4552764892578125, 0.5164794921875, 0.5776824951171875, 0.638885498046875, 0.7000885009765625, 0.76129150390625, 0.8224945068359375, 0.883697509765625, 0.9449005126953125, 1.006103515625, 1.0673065185546875, 1.128509521484375, 1.1897125244140625, 1.25091552734375, 1.3121185302734375, 1.373321533203125, 1.4345245361328125, 1.4957275390625, 1.5569305419921875, 1.618133544921875, 1.6793365478515625, 1.74053955078125, 1.8017425537109375, 1.862945556640625, 1.9241485595703125, 1.9853515625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 4.0, 3.0, 9.0, 13.0, 13.0, 18.0, 16.0, 19.0, 21.0, 30.0, 27.0, 35.0, 37.0, 44.0, 39.0, 52.0, 67.0, 42.0, 47.0, 38.0, 44.0, 31.0, 61.0, 41.0, 39.0, 30.0, 25.0, 32.0, 15.0, 30.0, 14.0, 15.0, 6.0, 16.0, 12.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.519287109375, -17.86669921875, -17.214111328125, -16.5615234375, -15.908935546875, -15.25634765625, -14.603759765625, -13.951171875, -13.298583984375, -12.64599609375, -11.993408203125, -11.3408203125, -10.688232421875, -10.03564453125, -9.383056640625, -8.73046875, -8.077880859375, -7.42529296875, -6.772705078125, -6.1201171875, -5.467529296875, -4.81494140625, -4.162353515625, -3.509765625, -2.857177734375, -2.20458984375, -1.552001953125, -0.8994140625, -0.246826171875, 0.40576171875, 1.058349609375, 1.7109375, 2.363525390625, 3.01611328125, 3.668701171875, 4.3212890625, 4.973876953125, 5.62646484375, 6.279052734375, 6.931640625, 7.584228515625, 8.23681640625, 8.889404296875, 9.5419921875, 10.194580078125, 10.84716796875, 11.499755859375, 12.15234375, 12.804931640625, 13.45751953125, 14.110107421875, 14.7626953125, 15.415283203125, 16.06787109375, 16.720458984375, 17.373046875, 18.025634765625, 18.67822265625, 19.330810546875, 19.9833984375, 20.635986328125, 21.28857421875, 21.941162109375, 22.59375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 7.0, 15.0, 15.0, 30.0, 22.0, 50.0, 104.0, 156.0, 269.0, 486.0, 814.0, 1479.0, 2645.0, 4774.0, 8582.0, 15415.0, 28181.0, 51796.0, 95028.0, 169279.0, 252426.0, 185130.0, 104391.0, 57845.0, 31120.0, 17170.0, 9513.0, 5155.0, 2912.0, 1584.0, 889.0, 521.0, 281.0, 179.0, 103.0, 74.0, 37.0, 23.0, 16.0, 9.0, 11.0, 6.0, 0.0, 7.0, 3.0, 2.0, 1.0, 1.0], "bins": [-2.978515625, -2.8970947265625, -2.815673828125, -2.7342529296875, -2.65283203125, -2.5714111328125, -2.489990234375, -2.4085693359375, -2.3271484375, -2.2457275390625, -2.164306640625, -2.0828857421875, -2.00146484375, -1.9200439453125, -1.838623046875, -1.7572021484375, -1.67578125, -1.5943603515625, -1.512939453125, -1.4315185546875, -1.35009765625, -1.2686767578125, -1.187255859375, -1.1058349609375, -1.0244140625, -0.9429931640625, -0.861572265625, -0.7801513671875, -0.69873046875, -0.6173095703125, -0.535888671875, -0.4544677734375, -0.373046875, -0.2916259765625, -0.210205078125, -0.1287841796875, -0.04736328125, 0.0340576171875, 0.115478515625, 0.1968994140625, 0.2783203125, 0.3597412109375, 0.441162109375, 0.5225830078125, 0.60400390625, 0.6854248046875, 0.766845703125, 0.8482666015625, 0.9296875, 1.0111083984375, 1.092529296875, 1.1739501953125, 1.25537109375, 1.3367919921875, 1.418212890625, 1.4996337890625, 1.5810546875, 1.6624755859375, 1.743896484375, 1.8253173828125, 1.90673828125, 1.9881591796875, 2.069580078125, 2.1510009765625, 2.232421875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 0.0, 0.0, 6.0, 3.0, 9.0, 7.0, 6.0, 9.0, 5.0, 9.0, 16.0, 12.0, 17.0, 19.0, 13.0, 21.0, 21.0, 30.0, 37.0, 29.0, 38.0, 34.0, 38.0, 28.0, 48.0, 45.0, 39.0, 40.0, 45.0, 25.0, 35.0, 31.0, 29.0, 27.0, 32.0, 32.0, 19.0, 23.0, 22.0, 17.0, 16.0, 13.0, 10.0, 18.0, 7.0, 9.0, 2.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.078125, -10.7508544921875, -10.423583984375, -10.0963134765625, -9.76904296875, -9.4417724609375, -9.114501953125, -8.7872314453125, -8.4599609375, -8.1326904296875, -7.805419921875, -7.4781494140625, -7.15087890625, -6.8236083984375, -6.496337890625, -6.1690673828125, -5.841796875, -5.5145263671875, -5.187255859375, -4.8599853515625, -4.53271484375, -4.2054443359375, -3.878173828125, -3.5509033203125, -3.2236328125, -2.8963623046875, -2.569091796875, -2.2418212890625, -1.91455078125, -1.5872802734375, -1.260009765625, -0.9327392578125, -0.60546875, -0.2781982421875, 0.049072265625, 0.3763427734375, 0.70361328125, 1.0308837890625, 1.358154296875, 1.6854248046875, 2.0126953125, 2.3399658203125, 2.667236328125, 2.9945068359375, 3.32177734375, 3.6490478515625, 3.976318359375, 4.3035888671875, 4.630859375, 4.9581298828125, 5.285400390625, 5.6126708984375, 5.93994140625, 6.2672119140625, 6.594482421875, 6.9217529296875, 7.2490234375, 7.5762939453125, 7.903564453125, 8.2308349609375, 8.55810546875, 8.8853759765625, 9.212646484375, 9.5399169921875, 9.8671875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 6.0, 6.0, 8.0, 9.0, 19.0, 23.0, 31.0, 51.0, 72.0, 89.0, 133.0, 149.0, 296.0, 380.0, 535.0, 782.0, 1238.0, 1866.0, 3086.0, 5078.0, 9040.0, 17060.0, 36085.0, 90290.0, 260037.0, 374718.0, 141992.0, 53289.0, 23248.0, 11792.0, 6479.0, 3675.0, 2363.0, 1526.0, 945.0, 696.0, 475.0, 304.0, 185.0, 153.0, 109.0, 76.0, 53.0, 39.0, 26.0, 13.0, 16.0, 12.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.31170654296875, -0.3013916015625, -0.29107666015625, -0.28076171875, -0.27044677734375, -0.2601318359375, -0.24981689453125, -0.239501953125, -0.22918701171875, -0.2188720703125, -0.20855712890625, -0.1982421875, -0.18792724609375, -0.1776123046875, -0.16729736328125, -0.156982421875, -0.14666748046875, -0.1363525390625, -0.12603759765625, -0.11572265625, -0.10540771484375, -0.0950927734375, -0.08477783203125, -0.074462890625, -0.06414794921875, -0.0538330078125, -0.04351806640625, -0.033203125, -0.02288818359375, -0.0125732421875, -0.00225830078125, 0.008056640625, 0.01837158203125, 0.0286865234375, 0.03900146484375, 0.04931640625, 0.05963134765625, 0.0699462890625, 0.08026123046875, 0.090576171875, 0.10089111328125, 0.1112060546875, 0.12152099609375, 0.1318359375, 0.14215087890625, 0.1524658203125, 0.16278076171875, 0.173095703125, 0.18341064453125, 0.1937255859375, 0.20404052734375, 0.21435546875, 0.22467041015625, 0.2349853515625, 0.24530029296875, 0.255615234375, 0.26593017578125, 0.2762451171875, 0.28656005859375, 0.296875, 0.30718994140625, 0.3175048828125, 0.32781982421875, 0.338134765625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 11.0, 6.0, 7.0, 13.0, 9.0, 10.0, 15.0, 15.0, 24.0, 31.0, 33.0, 32.0, 44.0, 37.0, 50.0, 43.0, 47.0, 45.0, 51.0, 51.0, 57.0, 51.0, 44.0, 47.0, 40.0, 41.0, 27.0, 25.0, 20.0, 17.0, 13.0, 4.0, 10.0, 8.0, 6.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.09808349609375e-05, -2.0269304513931274e-05, -1.955777406692505e-05, -1.8846243619918823e-05, -1.8134713172912598e-05, -1.7423182725906372e-05, -1.6711652278900146e-05, -1.600012183189392e-05, -1.5288591384887695e-05, -1.457706093788147e-05, -1.3865530490875244e-05, -1.3154000043869019e-05, -1.2442469596862793e-05, -1.1730939149856567e-05, -1.1019408702850342e-05, -1.0307878255844116e-05, -9.59634780883789e-06, -8.884817361831665e-06, -8.17328691482544e-06, -7.461756467819214e-06, -6.750226020812988e-06, -6.038695573806763e-06, -5.327165126800537e-06, -4.6156346797943115e-06, -3.904104232788086e-06, -3.1925737857818604e-06, -2.4810433387756348e-06, -1.7695128917694092e-06, -1.0579824447631836e-06, -3.46451997756958e-07, 3.650784492492676e-07, 1.0766088962554932e-06, 1.7881393432617188e-06, 2.4996697902679443e-06, 3.21120023727417e-06, 3.9227306842803955e-06, 4.634261131286621e-06, 5.345791578292847e-06, 6.057322025299072e-06, 6.768852472305298e-06, 7.4803829193115234e-06, 8.191913366317749e-06, 8.903443813323975e-06, 9.6149742603302e-06, 1.0326504707336426e-05, 1.1038035154342651e-05, 1.1749565601348877e-05, 1.2461096048355103e-05, 1.3172626495361328e-05, 1.3884156942367554e-05, 1.459568738937378e-05, 1.5307217836380005e-05, 1.601874828338623e-05, 1.6730278730392456e-05, 1.744180917739868e-05, 1.8153339624404907e-05, 1.8864870071411133e-05, 1.957640051841736e-05, 2.0287930965423584e-05, 2.099946141242981e-05, 2.1710991859436035e-05, 2.242252230644226e-05, 2.3134052753448486e-05, 2.3845583200454712e-05, 2.4557113647460938e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 8.0, 5.0, 15.0, 13.0, 20.0, 37.0, 41.0, 71.0, 100.0, 163.0, 227.0, 318.0, 523.0, 751.0, 1027.0, 1603.0, 2462.0, 3749.0, 5888.0, 9413.0, 15911.0, 26791.0, 47891.0, 90139.0, 179867.0, 283003.0, 175665.0, 87436.0, 47291.0, 26612.0, 15555.0, 9109.0, 5739.0, 3706.0, 2463.0, 1583.0, 1057.0, 785.0, 470.0, 316.0, 226.0, 169.0, 101.0, 72.0, 62.0, 38.0, 18.0, 15.0, 14.0, 7.0, 6.0, 5.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.294677734375, -0.2846832275390625, -0.274688720703125, -0.2646942138671875, -0.25469970703125, -0.2447052001953125, -0.234710693359375, -0.2247161865234375, -0.2147216796875, -0.2047271728515625, -0.194732666015625, -0.1847381591796875, -0.17474365234375, -0.1647491455078125, -0.154754638671875, -0.1447601318359375, -0.134765625, -0.1247711181640625, -0.114776611328125, -0.1047821044921875, -0.09478759765625, -0.0847930908203125, -0.074798583984375, -0.0648040771484375, -0.0548095703125, -0.0448150634765625, -0.034820556640625, -0.0248260498046875, -0.01483154296875, -0.0048370361328125, 0.005157470703125, 0.0151519775390625, 0.025146484375, 0.0351409912109375, 0.045135498046875, 0.0551300048828125, 0.06512451171875, 0.0751190185546875, 0.085113525390625, 0.0951080322265625, 0.1051025390625, 0.1150970458984375, 0.125091552734375, 0.1350860595703125, 0.14508056640625, 0.1550750732421875, 0.165069580078125, 0.1750640869140625, 0.18505859375, 0.1950531005859375, 0.205047607421875, 0.2150421142578125, 0.22503662109375, 0.2350311279296875, 0.245025634765625, 0.2550201416015625, 0.2650146484375, 0.2750091552734375, 0.285003662109375, 0.2949981689453125, 0.30499267578125, 0.3149871826171875, 0.324981689453125, 0.3349761962890625, 0.344970703125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 1.0, 3.0, 6.0, 2.0, 2.0, 7.0, 13.0, 6.0, 11.0, 15.0, 14.0, 15.0, 34.0, 37.0, 26.0, 45.0, 50.0, 58.0, 60.0, 66.0, 78.0, 80.0, 70.0, 46.0, 44.0, 37.0, 32.0, 16.0, 20.0, 24.0, 13.0, 8.0, 13.0, 6.0, 7.0, 7.0, 4.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.12091064453125, -0.1173715591430664, -0.11383247375488281, -0.11029338836669922, -0.10675430297851562, -0.10321521759033203, -0.09967613220214844, -0.09613704681396484, -0.09259796142578125, -0.08905887603759766, -0.08551979064941406, -0.08198070526123047, -0.07844161987304688, -0.07490253448486328, -0.07136344909667969, -0.0678243637084961, -0.0642852783203125, -0.060746192932128906, -0.05720710754394531, -0.05366802215576172, -0.050128936767578125, -0.04658985137939453, -0.04305076599121094, -0.039511680603027344, -0.03597259521484375, -0.032433509826660156, -0.028894424438476562, -0.02535533905029297, -0.021816253662109375, -0.01827716827392578, -0.014738082885742188, -0.011198997497558594, -0.007659912109375, -0.004120826721191406, -0.0005817413330078125, 0.0029573440551757812, 0.006496429443359375, 0.010035514831542969, 0.013574600219726562, 0.017113685607910156, 0.02065277099609375, 0.024191856384277344, 0.027730941772460938, 0.03127002716064453, 0.034809112548828125, 0.03834819793701172, 0.04188728332519531, 0.045426368713378906, 0.0489654541015625, 0.052504539489746094, 0.05604362487792969, 0.05958271026611328, 0.06312179565429688, 0.06666088104248047, 0.07019996643066406, 0.07373905181884766, 0.07727813720703125, 0.08081722259521484, 0.08435630798339844, 0.08789539337158203, 0.09143447875976562, 0.09497356414794922, 0.09851264953613281, 0.1020517349243164, 0.1055908203125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 4.0, 4.0, 9.0, 7.0, 12.0, 9.0, 16.0, 24.0, 24.0, 30.0, 30.0, 44.0, 48.0, 58.0, 73.0, 62.0, 62.0, 67.0, 55.0, 56.0, 45.0, 47.0, 31.0, 28.0, 25.0, 24.0, 20.0, 13.0, 14.0, 15.0, 8.0, 6.0, 7.0, 2.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.65519142150879, -18.04994010925293, -17.444686889648438, -16.839435577392578, -16.23418426513672, -15.628931045532227, -15.023679733276367, -14.418427467346191, -13.813175201416016, -13.20792293548584, -12.60267162322998, -11.997419357299805, -11.392167091369629, -10.786914825439453, -10.181663513183594, -9.576411247253418, -8.971159934997559, -8.365907669067383, -7.760655879974365, -7.155404090881348, -6.550151824951172, -5.944900035858154, -5.339648246765137, -4.734395980834961, -4.129144191741943, -3.5238921642303467, -2.91864013671875, -2.3133883476257324, -1.7081363201141357, -1.102884292602539, -0.4976325035095215, 0.1076197624206543, 0.7128715515136719, 1.3181235790252686, 1.9233754873275757, 2.528627395629883, 3.1338794231414795, 3.739131450653076, 4.344383239746094, 4.9496355056762695, 5.554887294769287, 6.160139083862305, 6.7653913497924805, 7.370643138885498, 7.975894927978516, 8.581147193908691, 9.186399459838867, 9.791650772094727, 10.396903038024902, 11.002155303955078, 11.607406616210938, 12.212658882141113, 12.817911148071289, 13.423162460327148, 14.028414726257324, 14.6336669921875, 15.23891830444336, 15.844170570373535, 16.44942283630371, 17.05467414855957, 17.65992546081543, 18.265178680419922, 18.87042999267578, 19.47568130493164, 20.080934524536133]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 7.0, 21.0, 10.0, 15.0, 17.0, 22.0, 28.0, 23.0, 38.0, 34.0, 42.0, 45.0, 48.0, 36.0, 44.0, 41.0, 52.0, 48.0, 43.0, 37.0, 43.0, 51.0, 35.0, 27.0, 23.0, 15.0, 27.0, 25.0, 20.0, 15.0, 12.0, 13.0, 9.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.161298751831055, -16.551006317138672, -15.940714836120605, -15.330422401428223, -14.720130920410156, -14.109838485717773, -13.49954605102539, -12.889253616333008, -12.278962135314941, -11.668669700622559, -11.058378219604492, -10.44808578491211, -9.837793350219727, -9.22750186920166, -8.617209434509277, -8.006917953491211, -7.396625518798828, -6.7863335609436035, -6.176041603088379, -5.565749168395996, -4.9554572105407715, -4.345165252685547, -3.734873056411743, -3.1245808601379395, -2.514288902282715, -1.9039968252182007, -1.2937047481536865, -0.6834126710891724, -0.0731205940246582, 0.5371713638305664, 1.1474635601043701, 1.7577557563781738, 2.3680496215820312, 2.978341579437256, 3.5886337757110596, 4.198925971984863, 4.809217929840088, 5.4195098876953125, 6.029802322387695, 6.64009428024292, 7.2503862380981445, 7.860678195953369, 8.470970153808594, 9.081262588500977, 9.69155502319336, 10.301846504211426, 10.912138938903809, 11.522430419921875, 12.132722854614258, 12.74301528930664, 13.353306770324707, 13.96359920501709, 14.573890686035156, 15.184183120727539, 15.794475555419922, 16.404767990112305, 17.015060424804688, 17.62535285949707, 18.235645294189453, 18.845935821533203, 19.456228256225586, 20.06652069091797, 20.67681312561035, 21.287105560302734, 21.897396087646484]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 6.0, 3.0, 13.0, 17.0, 14.0, 30.0, 37.0, 65.0, 105.0, 148.0, 200.0, 318.0, 524.0, 771.0, 1223.0, 1941.0, 3247.0, 5116.0, 8377.0, 13352.0, 21318.0, 33803.0, 51213.0, 74906.0, 101973.0, 124497.0, 135718.0, 127561.0, 107652.0, 80152.0, 55604.0, 36548.0, 23241.0, 14640.0, 9128.0, 5512.0, 3552.0, 2096.0, 1401.0, 876.0, 567.0, 377.0, 256.0, 168.0, 106.0, 74.0, 41.0, 22.0, 22.0, 17.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.7890625, -8.5018310546875, -8.214599609375, -7.9273681640625, -7.64013671875, -7.3529052734375, -7.065673828125, -6.7784423828125, -6.4912109375, -6.2039794921875, -5.916748046875, -5.6295166015625, -5.34228515625, -5.0550537109375, -4.767822265625, -4.4805908203125, -4.193359375, -3.9061279296875, -3.618896484375, -3.3316650390625, -3.04443359375, -2.7572021484375, -2.469970703125, -2.1827392578125, -1.8955078125, -1.6082763671875, -1.321044921875, -1.0338134765625, -0.74658203125, -0.4593505859375, -0.172119140625, 0.1151123046875, 0.40234375, 0.6895751953125, 0.976806640625, 1.2640380859375, 1.55126953125, 1.8385009765625, 2.125732421875, 2.4129638671875, 2.7001953125, 2.9874267578125, 3.274658203125, 3.5618896484375, 3.84912109375, 4.1363525390625, 4.423583984375, 4.7108154296875, 4.998046875, 5.2852783203125, 5.572509765625, 5.8597412109375, 6.14697265625, 6.4342041015625, 6.721435546875, 7.0086669921875, 7.2958984375, 7.5831298828125, 7.870361328125, 8.1575927734375, 8.44482421875, 8.7320556640625, 9.019287109375, 9.3065185546875, 9.59375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 13.0, 13.0, 14.0, 10.0, 21.0, 14.0, 31.0, 25.0, 39.0, 32.0, 36.0, 42.0, 55.0, 44.0, 50.0, 39.0, 56.0, 37.0, 34.0, 46.0, 47.0, 37.0, 37.0, 40.0, 28.0, 27.0, 23.0, 20.0, 19.0, 9.0, 22.0, 12.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.521728515625, -17.88720703125, -17.252685546875, -16.6181640625, -15.983642578125, -15.34912109375, -14.714599609375, -14.080078125, -13.445556640625, -12.81103515625, -12.176513671875, -11.5419921875, -10.907470703125, -10.27294921875, -9.638427734375, -9.00390625, -8.369384765625, -7.73486328125, -7.100341796875, -6.4658203125, -5.831298828125, -5.19677734375, -4.562255859375, -3.927734375, -3.293212890625, -2.65869140625, -2.024169921875, -1.3896484375, -0.755126953125, -0.12060546875, 0.513916015625, 1.1484375, 1.782958984375, 2.41748046875, 3.052001953125, 3.6865234375, 4.321044921875, 4.95556640625, 5.590087890625, 6.224609375, 6.859130859375, 7.49365234375, 8.128173828125, 8.7626953125, 9.397216796875, 10.03173828125, 10.666259765625, 11.30078125, 11.935302734375, 12.56982421875, 13.204345703125, 13.8388671875, 14.473388671875, 15.10791015625, 15.742431640625, 16.376953125, 17.011474609375, 17.64599609375, 18.280517578125, 18.9150390625, 19.549560546875, 20.18408203125, 20.818603515625, 21.453125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 27.0, 26.0, 56.0, 70.0, 116.0, 168.0, 296.0, 497.0, 786.0, 1265.0, 2140.0, 3530.0, 5891.0, 10098.0, 16995.0, 27831.0, 44880.0, 68210.0, 97683.0, 124628.0, 140222.0, 137998.0, 117521.0, 88621.0, 60776.0, 38949.0, 23634.0, 14197.0, 8536.0, 5099.0, 3090.0, 1822.0, 1123.0, 657.0, 404.0, 280.0, 158.0, 84.0, 53.0, 44.0, 27.0, 18.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.0, -9.695556640625, -9.39111328125, -9.086669921875, -8.7822265625, -8.477783203125, -8.17333984375, -7.868896484375, -7.564453125, -7.260009765625, -6.95556640625, -6.651123046875, -6.3466796875, -6.042236328125, -5.73779296875, -5.433349609375, -5.12890625, -4.824462890625, -4.52001953125, -4.215576171875, -3.9111328125, -3.606689453125, -3.30224609375, -2.997802734375, -2.693359375, -2.388916015625, -2.08447265625, -1.780029296875, -1.4755859375, -1.171142578125, -0.86669921875, -0.562255859375, -0.2578125, 0.046630859375, 0.35107421875, 0.655517578125, 0.9599609375, 1.264404296875, 1.56884765625, 1.873291015625, 2.177734375, 2.482177734375, 2.78662109375, 3.091064453125, 3.3955078125, 3.699951171875, 4.00439453125, 4.308837890625, 4.61328125, 4.917724609375, 5.22216796875, 5.526611328125, 5.8310546875, 6.135498046875, 6.43994140625, 6.744384765625, 7.048828125, 7.353271484375, 7.65771484375, 7.962158203125, 8.2666015625, 8.571044921875, 8.87548828125, 9.179931640625, 9.484375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 5.0, 10.0, 12.0, 8.0, 8.0, 12.0, 19.0, 16.0, 15.0, 18.0, 25.0, 26.0, 24.0, 23.0, 36.0, 35.0, 33.0, 42.0, 41.0, 47.0, 28.0, 43.0, 28.0, 45.0, 45.0, 38.0, 44.0, 39.0, 37.0, 22.0, 25.0, 21.0, 22.0, 18.0, 13.0, 17.0, 13.0, 5.0, 11.0, 1.0, 6.0, 4.0, 4.0, 2.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.46875, -10.14306640625, -9.8173828125, -9.49169921875, -9.166015625, -8.84033203125, -8.5146484375, -8.18896484375, -7.86328125, -7.53759765625, -7.2119140625, -6.88623046875, -6.560546875, -6.23486328125, -5.9091796875, -5.58349609375, -5.2578125, -4.93212890625, -4.6064453125, -4.28076171875, -3.955078125, -3.62939453125, -3.3037109375, -2.97802734375, -2.65234375, -2.32666015625, -2.0009765625, -1.67529296875, -1.349609375, -1.02392578125, -0.6982421875, -0.37255859375, -0.046875, 0.27880859375, 0.6044921875, 0.93017578125, 1.255859375, 1.58154296875, 1.9072265625, 2.23291015625, 2.55859375, 2.88427734375, 3.2099609375, 3.53564453125, 3.861328125, 4.18701171875, 4.5126953125, 4.83837890625, 5.1640625, 5.48974609375, 5.8154296875, 6.14111328125, 6.466796875, 6.79248046875, 7.1181640625, 7.44384765625, 7.76953125, 8.09521484375, 8.4208984375, 8.74658203125, 9.072265625, 9.39794921875, 9.7236328125, 10.04931640625, 10.375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 14.0, 24.0, 48.0, 56.0, 117.0, 179.0, 307.0, 410.0, 699.0, 1152.0, 1873.0, 3007.0, 4813.0, 7735.0, 11849.0, 18287.0, 26810.0, 38424.0, 53187.0, 68033.0, 83951.0, 97116.0, 103589.0, 103924.0, 96870.0, 84445.0, 69831.0, 53524.0, 38991.0, 27664.0, 18439.0, 12219.0, 7869.0, 4912.0, 3071.0, 1954.0, 1178.0, 783.0, 447.0, 279.0, 177.0, 108.0, 67.0, 45.0, 29.0, 21.0, 10.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.319244384765625, -2.24200439453125, -2.164764404296875, -2.0875244140625, -2.010284423828125, -1.93304443359375, -1.855804443359375, -1.778564453125, -1.701324462890625, -1.62408447265625, -1.546844482421875, -1.4696044921875, -1.392364501953125, -1.31512451171875, -1.237884521484375, -1.16064453125, -1.083404541015625, -1.00616455078125, -0.928924560546875, -0.8516845703125, -0.774444580078125, -0.69720458984375, -0.619964599609375, -0.542724609375, -0.465484619140625, -0.38824462890625, -0.311004638671875, -0.2337646484375, -0.156524658203125, -0.07928466796875, -0.002044677734375, 0.0751953125, 0.152435302734375, 0.22967529296875, 0.306915283203125, 0.3841552734375, 0.461395263671875, 0.53863525390625, 0.615875244140625, 0.693115234375, 0.770355224609375, 0.84759521484375, 0.924835205078125, 1.0020751953125, 1.079315185546875, 1.15655517578125, 1.233795166015625, 1.31103515625, 1.388275146484375, 1.46551513671875, 1.542755126953125, 1.6199951171875, 1.697235107421875, 1.77447509765625, 1.851715087890625, 1.928955078125, 2.006195068359375, 2.08343505859375, 2.160675048828125, 2.2379150390625, 2.315155029296875, 2.39239501953125, 2.469635009765625, 2.546875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 3.0, 2.0, 7.0, 11.0, 12.0, 7.0, 20.0, 22.0, 19.0, 35.0, 46.0, 34.0, 26.0, 38.0, 32.0, 47.0, 48.0, 57.0, 58.0, 44.0, 50.0, 39.0, 43.0, 44.0, 38.0, 40.0, 34.0, 30.0, 18.0, 12.0, 17.0, 9.0, 14.0, 7.0, 8.0, 7.0, 6.0, 9.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0003161430358886719, -0.0003054179251194, -0.0002946928143501282, -0.0002839677035808563, -0.00027324259281158447, -0.0002625174820423126, -0.00025179237127304077, -0.00024106726050376892, -0.00023034214973449707, -0.00021961703896522522, -0.00020889192819595337, -0.00019816681742668152, -0.00018744170665740967, -0.00017671659588813782, -0.00016599148511886597, -0.00015526637434959412, -0.00014454126358032227, -0.00013381615281105042, -0.00012309104204177856, -0.00011236593127250671, -0.00010164082050323486, -9.091570973396301e-05, -8.019059896469116e-05, -6.946548819541931e-05, -5.874037742614746e-05, -4.801526665687561e-05, -3.729015588760376e-05, -2.656504511833191e-05, -1.583993434906006e-05, -5.114823579788208e-06, 5.610287189483643e-06, 1.6335397958755493e-05, 2.7060508728027344e-05, 3.7785619497299194e-05, 4.8510730266571045e-05, 5.9235841035842896e-05, 6.996095180511475e-05, 8.06860625743866e-05, 9.141117334365845e-05, 0.0001021362841129303, 0.00011286139488220215, 0.000123586505651474, 0.00013431161642074585, 0.0001450367271900177, 0.00015576183795928955, 0.0001664869487285614, 0.00017721205949783325, 0.0001879371702671051, 0.00019866228103637695, 0.0002093873918056488, 0.00022011250257492065, 0.0002308376133441925, 0.00024156272411346436, 0.0002522878348827362, 0.00026301294565200806, 0.0002737380564212799, 0.00028446316719055176, 0.0002951882779598236, 0.00030591338872909546, 0.0003166384994983673, 0.00032736361026763916, 0.000338088721036911, 0.00034881383180618286, 0.0003595389425754547, 0.00037026405334472656]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 9.0, 4.0, 10.0, 15.0, 18.0, 29.0, 45.0, 71.0, 118.0, 188.0, 307.0, 498.0, 823.0, 1384.0, 2421.0, 4410.0, 7500.0, 13168.0, 22268.0, 36095.0, 55508.0, 79651.0, 104507.0, 124748.0, 132743.0, 125600.0, 105920.0, 81693.0, 56539.0, 37218.0, 23007.0, 13451.0, 7829.0, 4557.0, 2568.0, 1430.0, 863.0, 555.0, 287.0, 167.0, 108.0, 71.0, 51.0, 28.0, 27.0, 18.0, 11.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-3.46484375, -3.36151123046875, -3.2581787109375, -3.15484619140625, -3.051513671875, -2.94818115234375, -2.8448486328125, -2.74151611328125, -2.63818359375, -2.53485107421875, -2.4315185546875, -2.32818603515625, -2.224853515625, -2.12152099609375, -2.0181884765625, -1.91485595703125, -1.8115234375, -1.70819091796875, -1.6048583984375, -1.50152587890625, -1.398193359375, -1.29486083984375, -1.1915283203125, -1.08819580078125, -0.98486328125, -0.88153076171875, -0.7781982421875, -0.67486572265625, -0.571533203125, -0.46820068359375, -0.3648681640625, -0.26153564453125, -0.158203125, -0.05487060546875, 0.0484619140625, 0.15179443359375, 0.255126953125, 0.35845947265625, 0.4617919921875, 0.56512451171875, 0.66845703125, 0.77178955078125, 0.8751220703125, 0.97845458984375, 1.081787109375, 1.18511962890625, 1.2884521484375, 1.39178466796875, 1.4951171875, 1.59844970703125, 1.7017822265625, 1.80511474609375, 1.908447265625, 2.01177978515625, 2.1151123046875, 2.21844482421875, 2.32177734375, 2.42510986328125, 2.5284423828125, 2.63177490234375, 2.735107421875, 2.83843994140625, 2.9417724609375, 3.04510498046875, 3.1484375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 8.0, 6.0, 16.0, 14.0, 24.0, 20.0, 18.0, 29.0, 40.0, 32.0, 41.0, 66.0, 68.0, 58.0, 66.0, 62.0, 54.0, 54.0, 52.0, 52.0, 42.0, 27.0, 30.0, 23.0, 13.0, 21.0, 16.0, 13.0, 7.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5771484375, -1.5321197509765625, -1.487091064453125, -1.4420623779296875, -1.39703369140625, -1.3520050048828125, -1.306976318359375, -1.2619476318359375, -1.2169189453125, -1.1718902587890625, -1.126861572265625, -1.0818328857421875, -1.03680419921875, -0.9917755126953125, -0.946746826171875, -0.9017181396484375, -0.856689453125, -0.8116607666015625, -0.766632080078125, -0.7216033935546875, -0.67657470703125, -0.6315460205078125, -0.586517333984375, -0.5414886474609375, -0.4964599609375, -0.4514312744140625, -0.406402587890625, -0.3613739013671875, -0.31634521484375, -0.2713165283203125, -0.226287841796875, -0.1812591552734375, -0.13623046875, -0.0912017822265625, -0.046173095703125, -0.0011444091796875, 0.04388427734375, 0.0889129638671875, 0.133941650390625, 0.1789703369140625, 0.2239990234375, 0.2690277099609375, 0.314056396484375, 0.3590850830078125, 0.40411376953125, 0.4491424560546875, 0.494171142578125, 0.5391998291015625, 0.584228515625, 0.6292572021484375, 0.674285888671875, 0.7193145751953125, 0.76434326171875, 0.8093719482421875, 0.854400634765625, 0.8994293212890625, 0.9444580078125, 0.9894866943359375, 1.034515380859375, 1.0795440673828125, 1.12457275390625, 1.1696014404296875, 1.214630126953125, 1.2596588134765625, 1.3046875]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 5.0, 8.0, 9.0, 13.0, 8.0, 22.0, 21.0, 33.0, 32.0, 27.0, 41.0, 55.0, 61.0, 60.0, 72.0, 64.0, 63.0, 55.0, 51.0, 47.0, 47.0, 37.0, 26.0, 19.0, 22.0, 19.0, 17.0, 11.0, 11.0, 7.0, 9.0, 6.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.398935317993164, -17.77839469909668, -17.157854080200195, -16.53731346130371, -15.916772842407227, -15.296232223510742, -14.675692558288574, -14.05515193939209, -13.434611320495605, -12.814070701599121, -12.193530082702637, -11.572989463806152, -10.952449798583984, -10.3319091796875, -9.711368560791016, -9.090827941894531, -8.470287322998047, -7.8497467041015625, -7.229206085205078, -6.608665943145752, -5.988125324249268, -5.367584705352783, -4.747044563293457, -4.126503944396973, -3.5059633255004883, -2.885422706604004, -2.2648823261260986, -1.6443418264389038, -1.023801326751709, -0.4032607078552246, 0.21727967262268066, 0.8378200531005859, 1.4583625793457031, 2.0789031982421875, 2.6994435787200928, 3.319983959197998, 3.9405245780944824, 4.561065196990967, 5.181605339050293, 5.802145957946777, 6.422686576843262, 7.043227195739746, 7.6637678146362305, 8.284308433532715, 8.904848098754883, 9.525388717651367, 10.145929336547852, 10.766469955444336, 11.38701057434082, 12.007551193237305, 12.628091812133789, 13.248632431030273, 13.869173049926758, 14.489713668823242, 15.11025333404541, 15.730793952941895, 16.351333618164062, 16.971874237060547, 17.59241485595703, 18.212955474853516, 18.83349609375, 19.454036712646484, 20.07457733154297, 20.695117950439453, 21.315658569335938]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 6.0, 10.0, 10.0, 12.0, 17.0, 15.0, 22.0, 21.0, 31.0, 29.0, 34.0, 40.0, 36.0, 35.0, 42.0, 47.0, 45.0, 40.0, 43.0, 55.0, 43.0, 44.0, 38.0, 31.0, 42.0, 28.0, 34.0, 17.0, 23.0, 19.0, 15.0, 15.0, 16.0, 16.0, 8.0, 6.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.88784408569336, -17.223962783813477, -16.560081481933594, -15.896201133728027, -15.232319831848145, -14.568438529968262, -13.904558181762695, -13.240676879882812, -12.57679557800293, -11.912914276123047, -11.249032974243164, -10.585152626037598, -9.921271324157715, -9.257390022277832, -8.593509674072266, -7.929628372192383, -7.2657470703125, -6.601865768432617, -5.937984943389893, -5.274104118347168, -4.610222816467285, -3.9463417530059814, -3.2824606895446777, -2.618579864501953, -1.9546985626220703, -1.2908174991607666, -0.6269364356994629, 0.03694462776184082, 0.7008256912231445, 1.3647067546844482, 2.028587818145752, 2.6924686431884766, 3.3563499450683594, 4.020231246948242, 4.684112071990967, 5.347992897033691, 6.011874198913574, 6.675755500793457, 7.339636325836182, 8.003517150878906, 8.667398452758789, 9.331279754638672, 9.995161056518555, 10.659041404724121, 11.322922706604004, 11.986804008483887, 12.650684356689453, 13.314565658569336, 13.978446960449219, 14.642328262329102, 15.306209564208984, 15.97008991241455, 16.63397216796875, 17.2978515625, 17.961732864379883, 18.625614166259766, 19.28949546813965, 19.95337677001953, 20.617258071899414, 21.281139373779297, 21.945018768310547, 22.60890007019043, 23.272781372070312, 23.936662673950195, 24.600543975830078]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 15.0, 16.0, 28.0, 34.0, 67.0, 84.0, 136.0, 213.0, 335.0, 616.0, 938.0, 1565.0, 2443.0, 3979.0, 6596.0, 10965.0, 18116.0, 30242.0, 50440.0, 83858.0, 139100.0, 226594.0, 353274.0, 506121.0, 627324.0, 632072.0, 519847.0, 365974.0, 238908.0, 148920.0, 90480.0, 54308.0, 32269.0, 19309.0, 11583.0, 7024.0, 4089.0, 2532.0, 1462.0, 931.0, 546.0, 368.0, 225.0, 128.0, 70.0, 56.0, 25.0, 27.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 0.0, 2.0], "bins": [-17.0625, -16.546142578125, -16.02978515625, -15.513427734375, -14.9970703125, -14.480712890625, -13.96435546875, -13.447998046875, -12.931640625, -12.415283203125, -11.89892578125, -11.382568359375, -10.8662109375, -10.349853515625, -9.83349609375, -9.317138671875, -8.80078125, -8.284423828125, -7.76806640625, -7.251708984375, -6.7353515625, -6.218994140625, -5.70263671875, -5.186279296875, -4.669921875, -4.153564453125, -3.63720703125, -3.120849609375, -2.6044921875, -2.088134765625, -1.57177734375, -1.055419921875, -0.5390625, -0.022705078125, 0.49365234375, 1.010009765625, 1.5263671875, 2.042724609375, 2.55908203125, 3.075439453125, 3.591796875, 4.108154296875, 4.62451171875, 5.140869140625, 5.6572265625, 6.173583984375, 6.68994140625, 7.206298828125, 7.72265625, 8.239013671875, 8.75537109375, 9.271728515625, 9.7880859375, 10.304443359375, 10.82080078125, 11.337158203125, 11.853515625, 12.369873046875, 12.88623046875, 13.402587890625, 13.9189453125, 14.435302734375, 14.95166015625, 15.468017578125, 15.984375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 10.0, 14.0, 12.0, 14.0, 21.0, 23.0, 22.0, 19.0, 33.0, 35.0, 35.0, 37.0, 43.0, 41.0, 48.0, 49.0, 45.0, 48.0, 31.0, 32.0, 43.0, 32.0, 48.0, 38.0, 27.0, 28.0, 23.0, 18.0, 18.0, 16.0, 19.0, 16.0, 14.0, 9.0, 4.0, 6.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.25, -16.670654296875, -16.09130859375, -15.511962890625, -14.9326171875, -14.353271484375, -13.77392578125, -13.194580078125, -12.615234375, -12.035888671875, -11.45654296875, -10.877197265625, -10.2978515625, -9.718505859375, -9.13916015625, -8.559814453125, -7.98046875, -7.401123046875, -6.82177734375, -6.242431640625, -5.6630859375, -5.083740234375, -4.50439453125, -3.925048828125, -3.345703125, -2.766357421875, -2.18701171875, -1.607666015625, -1.0283203125, -0.448974609375, 0.13037109375, 0.709716796875, 1.2890625, 1.868408203125, 2.44775390625, 3.027099609375, 3.6064453125, 4.185791015625, 4.76513671875, 5.344482421875, 5.923828125, 6.503173828125, 7.08251953125, 7.661865234375, 8.2412109375, 8.820556640625, 9.39990234375, 9.979248046875, 10.55859375, 11.137939453125, 11.71728515625, 12.296630859375, 12.8759765625, 13.455322265625, 14.03466796875, 14.614013671875, 15.193359375, 15.772705078125, 16.35205078125, 16.931396484375, 17.5107421875, 18.090087890625, 18.66943359375, 19.248779296875, 19.828125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 11.0, 12.0, 20.0, 28.0, 38.0, 83.0, 123.0, 200.0, 330.0, 536.0, 932.0, 1524.0, 2557.0, 4407.0, 7373.0, 12945.0, 22024.0, 36930.0, 62167.0, 103033.0, 166602.0, 258934.0, 377761.0, 498406.0, 577577.0, 571242.0, 483356.0, 362155.0, 246098.0, 157352.0, 97085.0, 58142.0, 34645.0, 20621.0, 11932.0, 6948.0, 4079.0, 2489.0, 1397.0, 830.0, 517.0, 326.0, 193.0, 118.0, 73.0, 55.0, 34.0, 16.0, 13.0, 13.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.949462890625, -16.38330078125, -15.817138671875, -15.2509765625, -14.684814453125, -14.11865234375, -13.552490234375, -12.986328125, -12.420166015625, -11.85400390625, -11.287841796875, -10.7216796875, -10.155517578125, -9.58935546875, -9.023193359375, -8.45703125, -7.890869140625, -7.32470703125, -6.758544921875, -6.1923828125, -5.626220703125, -5.06005859375, -4.493896484375, -3.927734375, -3.361572265625, -2.79541015625, -2.229248046875, -1.6630859375, -1.096923828125, -0.53076171875, 0.035400390625, 0.6015625, 1.167724609375, 1.73388671875, 2.300048828125, 2.8662109375, 3.432373046875, 3.99853515625, 4.564697265625, 5.130859375, 5.697021484375, 6.26318359375, 6.829345703125, 7.3955078125, 7.961669921875, 8.52783203125, 9.093994140625, 9.66015625, 10.226318359375, 10.79248046875, 11.358642578125, 11.9248046875, 12.490966796875, 13.05712890625, 13.623291015625, 14.189453125, 14.755615234375, 15.32177734375, 15.887939453125, 16.4541015625, 17.020263671875, 17.58642578125, 18.152587890625, 18.71875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 0.0, 7.0, 2.0, 7.0, 13.0, 21.0, 20.0, 29.0, 33.0, 43.0, 50.0, 66.0, 80.0, 91.0, 106.0, 117.0, 172.0, 169.0, 190.0, 217.0, 265.0, 217.0, 221.0, 221.0, 207.0, 211.0, 189.0, 191.0, 150.0, 132.0, 109.0, 95.0, 91.0, 62.0, 59.0, 42.0, 44.0, 35.0, 29.0, 14.0, 21.0, 5.0, 10.0, 4.0, 5.0, 10.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.8741455078125, -7.576416015625, -7.2786865234375, -6.98095703125, -6.6832275390625, -6.385498046875, -6.0877685546875, -5.7900390625, -5.4923095703125, -5.194580078125, -4.8968505859375, -4.59912109375, -4.3013916015625, -4.003662109375, -3.7059326171875, -3.408203125, -3.1104736328125, -2.812744140625, -2.5150146484375, -2.21728515625, -1.9195556640625, -1.621826171875, -1.3240966796875, -1.0263671875, -0.7286376953125, -0.430908203125, -0.1331787109375, 0.16455078125, 0.4622802734375, 0.760009765625, 1.0577392578125, 1.35546875, 1.6531982421875, 1.950927734375, 2.2486572265625, 2.54638671875, 2.8441162109375, 3.141845703125, 3.4395751953125, 3.7373046875, 4.0350341796875, 4.332763671875, 4.6304931640625, 4.92822265625, 5.2259521484375, 5.523681640625, 5.8214111328125, 6.119140625, 6.4168701171875, 6.714599609375, 7.0123291015625, 7.31005859375, 7.6077880859375, 7.905517578125, 8.2032470703125, 8.5009765625, 8.7987060546875, 9.096435546875, 9.3941650390625, 9.69189453125, 9.9896240234375, 10.287353515625, 10.5850830078125, 10.8828125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 11.0, 11.0, 15.0, 17.0, 26.0, 39.0, 36.0, 35.0, 48.0, 57.0, 52.0, 60.0, 59.0, 54.0, 67.0, 67.0, 61.0, 42.0, 37.0, 32.0, 27.0, 25.0, 22.0, 13.0, 13.0, 16.0, 11.0, 8.0, 10.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.869831085205078, -28.953454971313477, -28.037078857421875, -27.120704650878906, -26.204328536987305, -25.287952423095703, -24.371578216552734, -23.455202102661133, -22.53882598876953, -21.62244987487793, -20.706073760986328, -19.78969955444336, -18.873323440551758, -17.956947326660156, -17.040573120117188, -16.124197006225586, -15.207820892333984, -14.291444778442383, -13.375069618225098, -12.458694458007812, -11.542318344116211, -10.62594223022461, -9.709567070007324, -8.793191909790039, -7.8768157958984375, -6.960440158843994, -6.044064521789551, -5.127688884735107, -4.211313247680664, -3.2949376106262207, -2.3785619735717773, -1.462186336517334, -0.5458126068115234, 0.3705630302429199, 1.2869386672973633, 2.2033143043518066, 3.11968994140625, 4.036065578460693, 4.952441215515137, 5.86881685256958, 6.785192489624023, 7.701568126678467, 8.61794376373291, 9.534318923950195, 10.450695037841797, 11.367071151733398, 12.283446311950684, 13.199821472167969, 14.11619758605957, 15.032573699951172, 15.948948860168457, 16.865324020385742, 17.781700134277344, 18.698076248168945, 19.614452362060547, 20.530826568603516, 21.447202682495117, 22.36357879638672, 23.279953002929688, 24.19632911682129, 25.11270523071289, 26.029081344604492, 26.945457458496094, 27.861831665039062, 28.778207778930664]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 8.0, 6.0, 5.0, 5.0, 8.0, 10.0, 17.0, 16.0, 14.0, 29.0, 41.0, 34.0, 34.0, 41.0, 39.0, 43.0, 54.0, 43.0, 55.0, 51.0, 55.0, 53.0, 42.0, 47.0, 33.0, 35.0, 35.0, 29.0, 16.0, 24.0, 16.0, 12.0, 11.0, 15.0, 9.0, 9.0, 6.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.736557006835938, -25.748050689697266, -24.759544372558594, -23.771038055419922, -22.782533645629883, -21.79402732849121, -20.80552101135254, -19.817014694213867, -18.828508377075195, -17.840002059936523, -16.85149574279785, -15.862990379333496, -14.874484062194824, -13.885978698730469, -12.897472381591797, -11.908966064453125, -10.92046070098877, -9.931954383850098, -8.943449020385742, -7.95494270324707, -6.966436386108398, -5.977930545806885, -4.989424705505371, -4.000918388366699, -3.0124125480651855, -2.0239064693450928, -1.0354005098342896, -0.04689455032348633, 0.9416115283966064, 1.9301176071166992, 2.918623447418213, 3.9071297645568848, 4.895635604858398, 5.884141445159912, 6.872647762298584, 7.861153602600098, 8.84965991973877, 9.838165283203125, 10.826671600341797, 11.815177917480469, 12.80368423461914, 13.792190551757812, 14.780695915222168, 15.76920223236084, 16.757707595825195, 17.746213912963867, 18.73472023010254, 19.72322654724121, 20.71173095703125, 21.700237274169922, 22.688743591308594, 23.677249908447266, 24.665754318237305, 25.654260635375977, 26.64276695251465, 27.63127326965332, 28.619779586791992, 29.608285903930664, 30.596792221069336, 31.585296630859375, 32.57380294799805, 33.56230926513672, 34.55081558227539, 35.53932189941406, 36.527828216552734]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 10.0, 12.0, 14.0, 24.0, 40.0, 41.0, 51.0, 96.0, 141.0, 190.0, 300.0, 428.0, 605.0, 967.0, 1562.0, 2291.0, 3716.0, 5721.0, 9425.0, 15496.0, 26680.0, 46011.0, 81775.0, 144231.0, 228414.0, 201643.0, 118034.0, 66039.0, 37930.0, 21785.0, 13100.0, 8066.0, 4854.0, 3055.0, 1982.0, 1265.0, 798.0, 588.0, 396.0, 249.0, 166.0, 110.0, 73.0, 53.0, 38.0, 33.0, 17.0, 17.0, 9.0, 5.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.306640625, -3.202728271484375, -3.09881591796875, -2.994903564453125, -2.8909912109375, -2.787078857421875, -2.68316650390625, -2.579254150390625, -2.475341796875, -2.371429443359375, -2.26751708984375, -2.163604736328125, -2.0596923828125, -1.955780029296875, -1.85186767578125, -1.747955322265625, -1.64404296875, -1.540130615234375, -1.43621826171875, -1.332305908203125, -1.2283935546875, -1.124481201171875, -1.02056884765625, -0.916656494140625, -0.812744140625, -0.708831787109375, -0.60491943359375, -0.501007080078125, -0.3970947265625, -0.293182373046875, -0.18927001953125, -0.085357666015625, 0.0185546875, 0.122467041015625, 0.22637939453125, 0.330291748046875, 0.4342041015625, 0.538116455078125, 0.64202880859375, 0.745941162109375, 0.849853515625, 0.953765869140625, 1.05767822265625, 1.161590576171875, 1.2655029296875, 1.369415283203125, 1.47332763671875, 1.577239990234375, 1.68115234375, 1.785064697265625, 1.88897705078125, 1.992889404296875, 2.0968017578125, 2.200714111328125, 2.30462646484375, 2.408538818359375, 2.512451171875, 2.616363525390625, 2.72027587890625, 2.824188232421875, 2.9281005859375, 3.032012939453125, 3.13592529296875, 3.239837646484375, 3.34375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 9.0, 11.0, 8.0, 17.0, 27.0, 28.0, 24.0, 41.0, 32.0, 47.0, 37.0, 36.0, 49.0, 40.0, 46.0, 51.0, 47.0, 45.0, 46.0, 47.0, 51.0, 35.0, 31.0, 29.0, 28.0, 27.0, 17.0, 9.0, 11.0, 15.0, 8.0, 7.0, 14.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.171875, -25.185302734375, -24.19873046875, -23.212158203125, -22.2255859375, -21.239013671875, -20.25244140625, -19.265869140625, -18.279296875, -17.292724609375, -16.30615234375, -15.319580078125, -14.3330078125, -13.346435546875, -12.35986328125, -11.373291015625, -10.38671875, -9.400146484375, -8.41357421875, -7.427001953125, -6.4404296875, -5.453857421875, -4.46728515625, -3.480712890625, -2.494140625, -1.507568359375, -0.52099609375, 0.465576171875, 1.4521484375, 2.438720703125, 3.42529296875, 4.411865234375, 5.3984375, 6.385009765625, 7.37158203125, 8.358154296875, 9.3447265625, 10.331298828125, 11.31787109375, 12.304443359375, 13.291015625, 14.277587890625, 15.26416015625, 16.250732421875, 17.2373046875, 18.223876953125, 19.21044921875, 20.197021484375, 21.18359375, 22.170166015625, 23.15673828125, 24.143310546875, 25.1298828125, 26.116455078125, 27.10302734375, 28.089599609375, 29.076171875, 30.062744140625, 31.04931640625, 32.035888671875, 33.0224609375, 34.009033203125, 34.99560546875, 35.982177734375, 36.96875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 3.0, 11.0, 12.0, 14.0, 24.0, 49.0, 58.0, 142.0, 213.0, 322.0, 604.0, 1046.0, 1967.0, 3581.0, 6379.0, 11815.0, 21918.0, 40511.0, 76469.0, 140496.0, 242575.0, 224902.0, 126383.0, 69048.0, 36674.0, 19579.0, 10707.0, 5727.0, 3222.0, 1783.0, 948.0, 538.0, 327.0, 195.0, 120.0, 70.0, 49.0, 23.0, 16.0, 12.0, 9.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-4.5390625, -4.416107177734375, -4.29315185546875, -4.170196533203125, -4.0472412109375, -3.924285888671875, -3.80133056640625, -3.678375244140625, -3.555419921875, -3.432464599609375, -3.30950927734375, -3.186553955078125, -3.0635986328125, -2.940643310546875, -2.81768798828125, -2.694732666015625, -2.57177734375, -2.448822021484375, -2.32586669921875, -2.202911376953125, -2.0799560546875, -1.957000732421875, -1.83404541015625, -1.711090087890625, -1.588134765625, -1.465179443359375, -1.34222412109375, -1.219268798828125, -1.0963134765625, -0.973358154296875, -0.85040283203125, -0.727447509765625, -0.6044921875, -0.481536865234375, -0.35858154296875, -0.235626220703125, -0.1126708984375, 0.010284423828125, 0.13323974609375, 0.256195068359375, 0.379150390625, 0.502105712890625, 0.62506103515625, 0.748016357421875, 0.8709716796875, 0.993927001953125, 1.11688232421875, 1.239837646484375, 1.36279296875, 1.485748291015625, 1.60870361328125, 1.731658935546875, 1.8546142578125, 1.977569580078125, 2.10052490234375, 2.223480224609375, 2.346435546875, 2.469390869140625, 2.59234619140625, 2.715301513671875, 2.8382568359375, 2.961212158203125, 3.08416748046875, 3.207122802734375, 3.330078125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 2.0, 6.0, 4.0, 3.0, 7.0, 4.0, 10.0, 10.0, 14.0, 20.0, 13.0, 21.0, 27.0, 26.0, 28.0, 35.0, 37.0, 34.0, 39.0, 35.0, 36.0, 47.0, 40.0, 32.0, 36.0, 44.0, 33.0, 39.0, 33.0, 32.0, 33.0, 33.0, 24.0, 20.0, 21.0, 16.0, 16.0, 10.0, 16.0, 10.0, 12.0, 11.0, 8.0, 5.0, 5.0, 3.0, 8.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-15.9765625, -15.4669189453125, -14.957275390625, -14.4476318359375, -13.93798828125, -13.4283447265625, -12.918701171875, -12.4090576171875, -11.8994140625, -11.3897705078125, -10.880126953125, -10.3704833984375, -9.86083984375, -9.3511962890625, -8.841552734375, -8.3319091796875, -7.822265625, -7.3126220703125, -6.802978515625, -6.2933349609375, -5.78369140625, -5.2740478515625, -4.764404296875, -4.2547607421875, -3.7451171875, -3.2354736328125, -2.725830078125, -2.2161865234375, -1.70654296875, -1.1968994140625, -0.687255859375, -0.1776123046875, 0.33203125, 0.8416748046875, 1.351318359375, 1.8609619140625, 2.37060546875, 2.8802490234375, 3.389892578125, 3.8995361328125, 4.4091796875, 4.9188232421875, 5.428466796875, 5.9381103515625, 6.44775390625, 6.9573974609375, 7.467041015625, 7.9766845703125, 8.486328125, 8.9959716796875, 9.505615234375, 10.0152587890625, 10.52490234375, 11.0345458984375, 11.544189453125, 12.0538330078125, 12.5634765625, 13.0731201171875, 13.582763671875, 14.0924072265625, 14.60205078125, 15.1116943359375, 15.621337890625, 16.1309814453125, 16.640625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 12.0, 7.0, 13.0, 6.0, 15.0, 20.0, 42.0, 43.0, 65.0, 108.0, 140.0, 200.0, 256.0, 366.0, 612.0, 879.0, 1386.0, 2132.0, 3590.0, 6236.0, 11236.0, 22808.0, 53437.0, 155392.0, 420522.0, 231725.0, 74284.0, 30100.0, 14059.0, 7313.0, 4206.0, 2550.0, 1557.0, 1041.0, 669.0, 455.0, 315.0, 216.0, 154.0, 115.0, 85.0, 54.0, 41.0, 29.0, 22.0, 9.0, 14.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.55224609375, -0.5358428955078125, -0.519439697265625, -0.5030364990234375, -0.48663330078125, -0.4702301025390625, -0.453826904296875, -0.4374237060546875, -0.4210205078125, -0.4046173095703125, -0.388214111328125, -0.3718109130859375, -0.35540771484375, -0.3390045166015625, -0.322601318359375, -0.3061981201171875, -0.289794921875, -0.2733917236328125, -0.256988525390625, -0.2405853271484375, -0.22418212890625, -0.2077789306640625, -0.191375732421875, -0.1749725341796875, -0.1585693359375, -0.1421661376953125, -0.125762939453125, -0.1093597412109375, -0.09295654296875, -0.0765533447265625, -0.060150146484375, -0.0437469482421875, -0.02734375, -0.0109405517578125, 0.005462646484375, 0.0218658447265625, 0.03826904296875, 0.0546722412109375, 0.071075439453125, 0.0874786376953125, 0.1038818359375, 0.1202850341796875, 0.136688232421875, 0.1530914306640625, 0.16949462890625, 0.1858978271484375, 0.202301025390625, 0.2187042236328125, 0.235107421875, 0.2515106201171875, 0.267913818359375, 0.2843170166015625, 0.30072021484375, 0.3171234130859375, 0.333526611328125, 0.3499298095703125, 0.3663330078125, 0.3827362060546875, 0.399139404296875, 0.4155426025390625, 0.43194580078125, 0.4483489990234375, 0.464752197265625, 0.4811553955078125, 0.49755859375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 9.0, 14.0, 15.0, 13.0, 25.0, 23.0, 39.0, 33.0, 44.0, 52.0, 53.0, 64.0, 73.0, 64.0, 64.0, 60.0, 62.0, 54.0, 62.0, 41.0, 31.0, 21.0, 22.0, 20.0, 6.0, 14.0, 5.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.612041473388672e-05, -3.486312925815582e-05, -3.360584378242493e-05, -3.234855830669403e-05, -3.1091272830963135e-05, -2.983398735523224e-05, -2.8576701879501343e-05, -2.7319416403770447e-05, -2.606213092803955e-05, -2.4804845452308655e-05, -2.354755997657776e-05, -2.2290274500846863e-05, -2.1032989025115967e-05, -1.977570354938507e-05, -1.8518418073654175e-05, -1.726113259792328e-05, -1.6003847122192383e-05, -1.4746561646461487e-05, -1.348927617073059e-05, -1.2231990694999695e-05, -1.0974705219268799e-05, -9.717419743537903e-06, -8.460134267807007e-06, -7.202848792076111e-06, -5.945563316345215e-06, -4.688277840614319e-06, -3.430992364883423e-06, -2.173706889152527e-06, -9.164214134216309e-07, 3.4086406230926514e-07, 1.5981495380401611e-06, 2.855435013771057e-06, 4.112720489501953e-06, 5.370005965232849e-06, 6.627291440963745e-06, 7.884576916694641e-06, 9.141862392425537e-06, 1.0399147868156433e-05, 1.1656433343887329e-05, 1.2913718819618225e-05, 1.4171004295349121e-05, 1.5428289771080017e-05, 1.6685575246810913e-05, 1.794286072254181e-05, 1.9200146198272705e-05, 2.04574316740036e-05, 2.1714717149734497e-05, 2.2972002625465393e-05, 2.422928810119629e-05, 2.5486573576927185e-05, 2.674385905265808e-05, 2.8001144528388977e-05, 2.9258430004119873e-05, 3.051571547985077e-05, 3.1773000955581665e-05, 3.303028643131256e-05, 3.428757190704346e-05, 3.554485738277435e-05, 3.680214285850525e-05, 3.8059428334236145e-05, 3.931671380996704e-05, 4.057399928569794e-05, 4.183128476142883e-05, 4.308857023715973e-05, 4.4345855712890625e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 15.0, 16.0, 25.0, 29.0, 47.0, 59.0, 102.0, 128.0, 255.0, 363.0, 519.0, 807.0, 1184.0, 1799.0, 2758.0, 4454.0, 7079.0, 11426.0, 19347.0, 33694.0, 62607.0, 125795.0, 263163.0, 252634.0, 118944.0, 60005.0, 32290.0, 18704.0, 11222.0, 6775.0, 4400.0, 2730.0, 1814.0, 1164.0, 742.0, 443.0, 339.0, 209.0, 148.0, 110.0, 64.0, 51.0, 38.0, 12.0, 16.0, 9.0, 10.0, 7.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.63330078125, -0.6151885986328125, -0.597076416015625, -0.5789642333984375, -0.56085205078125, -0.5427398681640625, -0.524627685546875, -0.5065155029296875, -0.4884033203125, -0.4702911376953125, -0.452178955078125, -0.4340667724609375, -0.41595458984375, -0.3978424072265625, -0.379730224609375, -0.3616180419921875, -0.343505859375, -0.3253936767578125, -0.307281494140625, -0.2891693115234375, -0.27105712890625, -0.2529449462890625, -0.234832763671875, -0.2167205810546875, -0.1986083984375, -0.1804962158203125, -0.162384033203125, -0.1442718505859375, -0.12615966796875, -0.1080474853515625, -0.089935302734375, -0.0718231201171875, -0.0537109375, -0.0355987548828125, -0.017486572265625, 0.0006256103515625, 0.01873779296875, 0.0368499755859375, 0.054962158203125, 0.0730743408203125, 0.0911865234375, 0.1092987060546875, 0.127410888671875, 0.1455230712890625, 0.16363525390625, 0.1817474365234375, 0.199859619140625, 0.2179718017578125, 0.236083984375, 0.2541961669921875, 0.272308349609375, 0.2904205322265625, 0.30853271484375, 0.3266448974609375, 0.344757080078125, 0.3628692626953125, 0.3809814453125, 0.3990936279296875, 0.417205810546875, 0.4353179931640625, 0.45343017578125, 0.4715423583984375, 0.489654541015625, 0.5077667236328125, 0.52587890625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 16.0, 16.0, 17.0, 22.0, 22.0, 40.0, 47.0, 58.0, 107.0, 98.0, 113.0, 93.0, 85.0, 56.0, 43.0, 43.0, 24.0, 23.0, 13.0, 13.0, 9.0, 10.0, 13.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.288330078125, -0.27851104736328125, -0.2686920166015625, -0.25887298583984375, -0.249053955078125, -0.23923492431640625, -0.2294158935546875, -0.21959686279296875, -0.20977783203125, -0.19995880126953125, -0.1901397705078125, -0.18032073974609375, -0.170501708984375, -0.16068267822265625, -0.1508636474609375, -0.14104461669921875, -0.1312255859375, -0.12140655517578125, -0.1115875244140625, -0.10176849365234375, -0.091949462890625, -0.08213043212890625, -0.0723114013671875, -0.06249237060546875, -0.05267333984375, -0.04285430908203125, -0.0330352783203125, -0.02321624755859375, -0.013397216796875, -0.00357818603515625, 0.0062408447265625, 0.01605987548828125, 0.02587890625, 0.03569793701171875, 0.0455169677734375, 0.05533599853515625, 0.065155029296875, 0.07497406005859375, 0.0847930908203125, 0.09461212158203125, 0.10443115234375, 0.11425018310546875, 0.1240692138671875, 0.13388824462890625, 0.143707275390625, 0.15352630615234375, 0.1633453369140625, 0.17316436767578125, 0.1829833984375, 0.19280242919921875, 0.2026214599609375, 0.21244049072265625, 0.222259521484375, 0.23207855224609375, 0.2418975830078125, 0.25171661376953125, 0.26153564453125, 0.27135467529296875, 0.2811737060546875, 0.29099273681640625, 0.300811767578125, 0.31063079833984375, 0.3204498291015625, 0.33026885986328125, 0.340087890625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 11.0, 8.0, 14.0, 16.0, 16.0, 34.0, 37.0, 34.0, 36.0, 50.0, 57.0, 53.0, 60.0, 56.0, 58.0, 60.0, 77.0, 51.0, 45.0, 33.0, 29.0, 28.0, 27.0, 20.0, 15.0, 12.0, 14.0, 9.0, 9.0, 9.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.633197784423828, -28.719789505004883, -27.806379318237305, -26.89297103881836, -25.979562759399414, -25.06615447998047, -24.15274429321289, -23.239336013793945, -22.325927734375, -21.412519454956055, -20.499109268188477, -19.58570098876953, -18.672292709350586, -17.75888442993164, -16.845474243164062, -15.932065963745117, -15.018656730651855, -14.105247497558594, -13.191839218139648, -12.278429985046387, -11.365021705627441, -10.45161247253418, -9.538204193115234, -8.624794960021973, -7.711386203765869, -6.797977447509766, -5.884568691253662, -4.971159934997559, -4.057750701904297, -3.1443419456481934, -2.23093318939209, -1.3175244331359863, -0.4041156768798828, 0.5092931389808655, 1.4227019548416138, 2.336110830307007, 3.2495195865631104, 4.162928581237793, 5.0763373374938965, 5.98974609375, 6.9031548500061035, 7.816563606262207, 8.729972839355469, 9.643381118774414, 10.556790351867676, 11.470199584960938, 12.383607864379883, 13.297016143798828, 14.21042537689209, 15.123834609985352, 16.037242889404297, 16.950651168823242, 17.86406135559082, 18.777469635009766, 19.69087791442871, 20.604286193847656, 21.517696380615234, 22.43110466003418, 23.344514846801758, 24.257923126220703, 25.17133140563965, 26.084739685058594, 26.998149871826172, 27.911558151245117, 28.824966430664062]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 8.0, 6.0, 5.0, 5.0, 8.0, 8.0, 20.0, 15.0, 14.0, 30.0, 39.0, 34.0, 36.0, 40.0, 39.0, 45.0, 53.0, 43.0, 58.0, 50.0, 54.0, 53.0, 42.0, 47.0, 33.0, 34.0, 34.0, 32.0, 15.0, 23.0, 14.0, 14.0, 11.0, 16.0, 7.0, 9.0, 6.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.855358123779297, -25.862546920776367, -24.869735717773438, -23.876924514770508, -22.884113311767578, -21.89130210876465, -20.89849090576172, -19.90567970275879, -18.91286849975586, -17.92005729675293, -16.92724609375, -15.93443489074707, -14.94162368774414, -13.948812484741211, -12.956001281738281, -11.963190078735352, -10.970379829406738, -9.977568626403809, -8.984757423400879, -7.991946220397949, -6.9991350173950195, -6.006324291229248, -5.013513088226318, -4.020701885223389, -3.027890682220459, -2.0350794792175293, -1.0422683954238892, -0.04945731163024902, 0.9433538913726807, 1.9361648559570312, 2.928976058959961, 3.9217872619628906, 4.91459846496582, 5.90740966796875, 6.90022087097168, 7.893032073974609, 8.885843276977539, 9.878654479980469, 10.871465682983398, 11.864276885986328, 12.857088088989258, 13.849899291992188, 14.842710494995117, 15.835521697998047, 16.828332901000977, 17.821144104003906, 18.813955307006836, 19.806766510009766, 20.799575805664062, 21.792387008666992, 22.785198211669922, 23.77800941467285, 24.77082061767578, 25.76363182067871, 26.75644302368164, 27.74925422668457, 28.7420654296875, 29.73487663269043, 30.72768783569336, 31.72049903869629, 32.71331024169922, 33.706119537353516, 34.69893264770508, 35.691741943359375, 36.68455505371094]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 8.0, 8.0, 11.0, 14.0, 26.0, 39.0, 47.0, 71.0, 120.0, 201.0, 267.0, 485.0, 740.0, 1268.0, 2001.0, 3384.0, 5832.0, 10312.0, 18664.0, 35129.0, 65849.0, 115989.0, 173223.0, 199124.0, 168414.0, 110472.0, 62198.0, 33263.0, 17827.0, 9833.0, 5416.0, 3264.0, 1899.0, 1175.0, 697.0, 472.0, 292.0, 170.0, 123.0, 83.0, 52.0, 37.0, 23.0, 11.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.46875, -17.8623046875, -17.255859375, -16.6494140625, -16.04296875, -15.4365234375, -14.830078125, -14.2236328125, -13.6171875, -13.0107421875, -12.404296875, -11.7978515625, -11.19140625, -10.5849609375, -9.978515625, -9.3720703125, -8.765625, -8.1591796875, -7.552734375, -6.9462890625, -6.33984375, -5.7333984375, -5.126953125, -4.5205078125, -3.9140625, -3.3076171875, -2.701171875, -2.0947265625, -1.48828125, -0.8818359375, -0.275390625, 0.3310546875, 0.9375, 1.5439453125, 2.150390625, 2.7568359375, 3.36328125, 3.9697265625, 4.576171875, 5.1826171875, 5.7890625, 6.3955078125, 7.001953125, 7.6083984375, 8.21484375, 8.8212890625, 9.427734375, 10.0341796875, 10.640625, 11.2470703125, 11.853515625, 12.4599609375, 13.06640625, 13.6728515625, 14.279296875, 14.8857421875, 15.4921875, 16.0986328125, 16.705078125, 17.3115234375, 17.91796875, 18.5244140625, 19.130859375, 19.7373046875, 20.34375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 7.0, 7.0, 9.0, 9.0, 14.0, 17.0, 27.0, 23.0, 24.0, 29.0, 42.0, 37.0, 41.0, 51.0, 40.0, 57.0, 53.0, 48.0, 53.0, 39.0, 50.0, 54.0, 42.0, 29.0, 35.0, 20.0, 24.0, 19.0, 17.0, 12.0, 10.0, 17.0, 9.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.625, -25.64208984375, -24.6591796875, -23.67626953125, -22.693359375, -21.71044921875, -20.7275390625, -19.74462890625, -18.76171875, -17.77880859375, -16.7958984375, -15.81298828125, -14.830078125, -13.84716796875, -12.8642578125, -11.88134765625, -10.8984375, -9.91552734375, -8.9326171875, -7.94970703125, -6.966796875, -5.98388671875, -5.0009765625, -4.01806640625, -3.03515625, -2.05224609375, -1.0693359375, -0.08642578125, 0.896484375, 1.87939453125, 2.8623046875, 3.84521484375, 4.828125, 5.81103515625, 6.7939453125, 7.77685546875, 8.759765625, 9.74267578125, 10.7255859375, 11.70849609375, 12.69140625, 13.67431640625, 14.6572265625, 15.64013671875, 16.623046875, 17.60595703125, 18.5888671875, 19.57177734375, 20.5546875, 21.53759765625, 22.5205078125, 23.50341796875, 24.486328125, 25.46923828125, 26.4521484375, 27.43505859375, 28.41796875, 29.40087890625, 30.3837890625, 31.36669921875, 32.349609375, 33.33251953125, 34.3154296875, 35.29833984375, 36.28125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 6.0, 14.0, 17.0, 27.0, 31.0, 67.0, 89.0, 111.0, 188.0, 277.0, 397.0, 594.0, 855.0, 1265.0, 1995.0, 3147.0, 5111.0, 8373.0, 14460.0, 24847.0, 44497.0, 78381.0, 129244.0, 178568.0, 186664.0, 147653.0, 93848.0, 53883.0, 30054.0, 17265.0, 9896.0, 6006.0, 3790.0, 2371.0, 1487.0, 1074.0, 665.0, 448.0, 279.0, 202.0, 138.0, 83.0, 51.0, 48.0, 33.0, 22.0, 16.0, 9.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-21.3125, -20.688720703125, -20.06494140625, -19.441162109375, -18.8173828125, -18.193603515625, -17.56982421875, -16.946044921875, -16.322265625, -15.698486328125, -15.07470703125, -14.450927734375, -13.8271484375, -13.203369140625, -12.57958984375, -11.955810546875, -11.33203125, -10.708251953125, -10.08447265625, -9.460693359375, -8.8369140625, -8.213134765625, -7.58935546875, -6.965576171875, -6.341796875, -5.718017578125, -5.09423828125, -4.470458984375, -3.8466796875, -3.222900390625, -2.59912109375, -1.975341796875, -1.3515625, -0.727783203125, -0.10400390625, 0.519775390625, 1.1435546875, 1.767333984375, 2.39111328125, 3.014892578125, 3.638671875, 4.262451171875, 4.88623046875, 5.510009765625, 6.1337890625, 6.757568359375, 7.38134765625, 8.005126953125, 8.62890625, 9.252685546875, 9.87646484375, 10.500244140625, 11.1240234375, 11.747802734375, 12.37158203125, 12.995361328125, 13.619140625, 14.242919921875, 14.86669921875, 15.490478515625, 16.1142578125, 16.738037109375, 17.36181640625, 17.985595703125, 18.609375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 15.0, 12.0, 11.0, 15.0, 25.0, 26.0, 27.0, 30.0, 27.0, 36.0, 32.0, 35.0, 43.0, 41.0, 45.0, 55.0, 37.0, 49.0, 43.0, 34.0, 30.0, 40.0, 39.0, 29.0, 28.0, 18.0, 25.0, 25.0, 11.0, 12.0, 18.0, 11.0, 10.0, 9.0, 6.0, 8.0, 11.0, 3.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7265625, -15.1771240234375, -14.627685546875, -14.0782470703125, -13.52880859375, -12.9793701171875, -12.429931640625, -11.8804931640625, -11.3310546875, -10.7816162109375, -10.232177734375, -9.6827392578125, -9.13330078125, -8.5838623046875, -8.034423828125, -7.4849853515625, -6.935546875, -6.3861083984375, -5.836669921875, -5.2872314453125, -4.73779296875, -4.1883544921875, -3.638916015625, -3.0894775390625, -2.5400390625, -1.9906005859375, -1.441162109375, -0.8917236328125, -0.34228515625, 0.2071533203125, 0.756591796875, 1.3060302734375, 1.85546875, 2.4049072265625, 2.954345703125, 3.5037841796875, 4.05322265625, 4.6026611328125, 5.152099609375, 5.7015380859375, 6.2509765625, 6.8004150390625, 7.349853515625, 7.8992919921875, 8.44873046875, 8.9981689453125, 9.547607421875, 10.0970458984375, 10.646484375, 11.1959228515625, 11.745361328125, 12.2947998046875, 12.84423828125, 13.3936767578125, 13.943115234375, 14.4925537109375, 15.0419921875, 15.5914306640625, 16.140869140625, 16.6903076171875, 17.23974609375, 17.7891845703125, 18.338623046875, 18.8880615234375, 19.4375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 16.0, 14.0, 19.0, 33.0, 46.0, 81.0, 130.0, 238.0, 367.0, 714.0, 1187.0, 2188.0, 3924.0, 7657.0, 14417.0, 27104.0, 49907.0, 85020.0, 128563.0, 163866.0, 170992.0, 146700.0, 103915.0, 64733.0, 35665.0, 19130.0, 9900.0, 5393.0, 2962.0, 1580.0, 893.0, 501.0, 303.0, 158.0, 99.0, 65.0, 36.0, 18.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.57421875, -6.3763427734375, -6.178466796875, -5.9805908203125, -5.78271484375, -5.5848388671875, -5.386962890625, -5.1890869140625, -4.9912109375, -4.7933349609375, -4.595458984375, -4.3975830078125, -4.19970703125, -4.0018310546875, -3.803955078125, -3.6060791015625, -3.408203125, -3.2103271484375, -3.012451171875, -2.8145751953125, -2.61669921875, -2.4188232421875, -2.220947265625, -2.0230712890625, -1.8251953125, -1.6273193359375, -1.429443359375, -1.2315673828125, -1.03369140625, -0.8358154296875, -0.637939453125, -0.4400634765625, -0.2421875, -0.0443115234375, 0.153564453125, 0.3514404296875, 0.54931640625, 0.7471923828125, 0.945068359375, 1.1429443359375, 1.3408203125, 1.5386962890625, 1.736572265625, 1.9344482421875, 2.13232421875, 2.3302001953125, 2.528076171875, 2.7259521484375, 2.923828125, 3.1217041015625, 3.319580078125, 3.5174560546875, 3.71533203125, 3.9132080078125, 4.111083984375, 4.3089599609375, 4.5068359375, 4.7047119140625, 4.902587890625, 5.1004638671875, 5.29833984375, 5.4962158203125, 5.694091796875, 5.8919677734375, 6.08984375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 7.0, 10.0, 13.0, 24.0, 27.0, 29.0, 32.0, 48.0, 33.0, 68.0, 65.0, 78.0, 53.0, 59.0, 71.0, 56.0, 57.0, 58.0, 36.0, 36.0, 40.0, 20.0, 21.0, 13.0, 8.0, 7.0, 11.0, 5.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00054168701171875, -0.0005190297961235046, -0.0004963725805282593, -0.0004737153649330139, -0.00045105814933776855, -0.0004284009337425232, -0.00040574371814727783, -0.00038308650255203247, -0.0003604292869567871, -0.00033777207136154175, -0.0003151148557662964, -0.000292457640171051, -0.00026980042457580566, -0.0002471432089805603, -0.00022448599338531494, -0.00020182877779006958, -0.00017917156219482422, -0.00015651434659957886, -0.0001338571310043335, -0.00011119991540908813, -8.854269981384277e-05, -6.588548421859741e-05, -4.322826862335205e-05, -2.057105302810669e-05, 2.086162567138672e-06, 2.4743378162384033e-05, 4.7400593757629395e-05, 7.005780935287476e-05, 9.271502494812012e-05, 0.00011537224054336548, 0.00013802945613861084, 0.0001606866717338562, 0.00018334388732910156, 0.00020600110292434692, 0.00022865831851959229, 0.00025131553411483765, 0.000273972749710083, 0.00029662996530532837, 0.00031928718090057373, 0.0003419443964958191, 0.00036460161209106445, 0.0003872588276863098, 0.0004099160432815552, 0.00043257325887680054, 0.0004552304744720459, 0.00047788769006729126, 0.0005005449056625366, 0.000523202121257782, 0.0005458593368530273, 0.0005685165524482727, 0.0005911737680435181, 0.0006138309836387634, 0.0006364881992340088, 0.0006591454148292542, 0.0006818026304244995, 0.0007044598460197449, 0.0007271170616149902, 0.0007497742772102356, 0.000772431492805481, 0.0007950887084007263, 0.0008177459239959717, 0.000840403139591217, 0.0008630603551864624, 0.0008857175707817078, 0.0009083747863769531]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 15.0, 20.0, 19.0, 39.0, 53.0, 70.0, 108.0, 149.0, 193.0, 271.0, 419.0, 598.0, 974.0, 1454.0, 2410.0, 3990.0, 7022.0, 12184.0, 21379.0, 37494.0, 62017.0, 95253.0, 130796.0, 154475.0, 152414.0, 128202.0, 92226.0, 59726.0, 35567.0, 20427.0, 11424.0, 6624.0, 3808.0, 2359.0, 1423.0, 977.0, 626.0, 418.0, 257.0, 201.0, 147.0, 97.0, 73.0, 62.0, 30.0, 25.0, 15.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.984375, -5.80279541015625, -5.6212158203125, -5.43963623046875, -5.258056640625, -5.07647705078125, -4.8948974609375, -4.71331787109375, -4.53173828125, -4.35015869140625, -4.1685791015625, -3.98699951171875, -3.805419921875, -3.62384033203125, -3.4422607421875, -3.26068115234375, -3.0791015625, -2.89752197265625, -2.7159423828125, -2.53436279296875, -2.352783203125, -2.17120361328125, -1.9896240234375, -1.80804443359375, -1.62646484375, -1.44488525390625, -1.2633056640625, -1.08172607421875, -0.900146484375, -0.71856689453125, -0.5369873046875, -0.35540771484375, -0.173828125, 0.00775146484375, 0.1893310546875, 0.37091064453125, 0.552490234375, 0.73406982421875, 0.9156494140625, 1.09722900390625, 1.27880859375, 1.46038818359375, 1.6419677734375, 1.82354736328125, 2.005126953125, 2.18670654296875, 2.3682861328125, 2.54986572265625, 2.7314453125, 2.91302490234375, 3.0946044921875, 3.27618408203125, 3.457763671875, 3.63934326171875, 3.8209228515625, 4.00250244140625, 4.18408203125, 4.36566162109375, 4.5472412109375, 4.72882080078125, 4.910400390625, 5.09197998046875, 5.2735595703125, 5.45513916015625, 5.63671875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 7.0, 7.0, 9.0, 9.0, 15.0, 18.0, 18.0, 22.0, 22.0, 14.0, 31.0, 36.0, 32.0, 33.0, 35.0, 41.0, 42.0, 31.0, 47.0, 43.0, 46.0, 33.0, 42.0, 29.0, 40.0, 31.0, 30.0, 45.0, 33.0, 17.0, 25.0, 19.0, 20.0, 8.0, 14.0, 12.0, 5.0, 7.0, 4.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2921600341796875, -1.248382568359375, -1.2046051025390625, -1.16082763671875, -1.1170501708984375, -1.073272705078125, -1.0294952392578125, -0.9857177734375, -0.9419403076171875, -0.898162841796875, -0.8543853759765625, -0.81060791015625, -0.7668304443359375, -0.723052978515625, -0.6792755126953125, -0.635498046875, -0.5917205810546875, -0.547943115234375, -0.5041656494140625, -0.46038818359375, -0.4166107177734375, -0.372833251953125, -0.3290557861328125, -0.2852783203125, -0.2415008544921875, -0.197723388671875, -0.1539459228515625, -0.11016845703125, -0.0663909912109375, -0.022613525390625, 0.0211639404296875, 0.06494140625, 0.1087188720703125, 0.152496337890625, 0.1962738037109375, 0.24005126953125, 0.2838287353515625, 0.327606201171875, 0.3713836669921875, 0.4151611328125, 0.4589385986328125, 0.502716064453125, 0.5464935302734375, 0.59027099609375, 0.6340484619140625, 0.677825927734375, 0.7216033935546875, 0.765380859375, 0.8091583251953125, 0.852935791015625, 0.8967132568359375, 0.94049072265625, 0.9842681884765625, 1.028045654296875, 1.0718231201171875, 1.1156005859375, 1.1593780517578125, 1.203155517578125, 1.2469329833984375, 1.29071044921875, 1.3344879150390625, 1.378265380859375, 1.4220428466796875, 1.4658203125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 9.0, 4.0, 8.0, 11.0, 13.0, 17.0, 31.0, 34.0, 35.0, 32.0, 40.0, 42.0, 57.0, 57.0, 53.0, 61.0, 54.0, 50.0, 53.0, 53.0, 44.0, 34.0, 34.0, 33.0, 25.0, 15.0, 15.0, 12.0, 17.0, 8.0, 11.0, 10.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-27.81768798828125, -26.92951774597168, -26.04134750366211, -25.15317726135254, -24.26500701904297, -23.3768367767334, -22.488666534423828, -21.60049819946289, -20.712326049804688, -19.824155807495117, -18.935985565185547, -18.047815322875977, -17.159645080566406, -16.271474838256836, -15.383305549621582, -14.495135307312012, -13.606966018676758, -12.718795776367188, -11.830625534057617, -10.942455291748047, -10.054285049438477, -9.166114807128906, -8.277945518493652, -7.389775276184082, -6.501605033874512, -5.613434791564941, -4.725264549255371, -3.837094783782959, -2.9489245414733887, -2.0607542991638184, -1.1725845336914062, -0.28441429138183594, 0.6037578582763672, 1.491927981376648, 2.3800981044769287, 3.26826810836792, 4.15643835067749, 5.0446085929870605, 5.932778358459473, 6.820948600769043, 7.709118843078613, 8.597289085388184, 9.485459327697754, 10.373628616333008, 11.261798858642578, 12.149969100952148, 13.038139343261719, 13.926309585571289, 14.81447982788086, 15.70265007019043, 16.5908203125, 17.47899055480957, 18.36716079711914, 19.25533103942871, 20.14350128173828, 21.03166961669922, 21.919841766357422, 22.808012008666992, 23.696182250976562, 24.584352493286133, 25.472522735595703, 26.360692977905273, 27.248863220214844, 28.13703155517578, 29.02520179748535]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 6.0, 8.0, 10.0, 14.0, 15.0, 19.0, 18.0, 35.0, 33.0, 41.0, 26.0, 50.0, 44.0, 44.0, 42.0, 41.0, 47.0, 50.0, 39.0, 48.0, 29.0, 46.0, 35.0, 32.0, 30.0, 23.0, 26.0, 27.0, 13.0, 22.0, 12.0, 10.0, 10.0, 12.0, 5.0, 9.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.49903106689453, -28.445465087890625, -27.39189910888672, -26.338333129882812, -25.284767150878906, -24.231201171875, -23.177635192871094, -22.124069213867188, -21.07050323486328, -20.016937255859375, -18.96337127685547, -17.909805297851562, -16.856239318847656, -15.80267333984375, -14.74910831451416, -13.695542335510254, -12.641977310180664, -11.588411331176758, -10.534845352172852, -9.481279373168945, -8.427713394165039, -7.374147891998291, -6.320582389831543, -5.267016410827637, -4.2134504318237305, -3.159884452819824, -2.106318712234497, -1.05275297164917, 0.0008130073547363281, 1.0543789863586426, 2.1079444885253906, 3.161510467529297, 4.215076446533203, 5.268642425537109, 6.322208404541016, 7.375773906707764, 8.429340362548828, 9.482906341552734, 10.536471366882324, 11.59003734588623, 12.643603324890137, 13.697169303894043, 14.75073528289795, 15.804300308227539, 16.857866287231445, 17.91143226623535, 18.964998245239258, 20.018564224243164, 21.07213020324707, 22.125696182250977, 23.179262161254883, 24.23282814025879, 25.286394119262695, 26.3399600982666, 27.393524169921875, 28.44709014892578, 29.500656127929688, 30.554222106933594, 31.6077880859375, 32.661354064941406, 33.71492004394531, 34.76848602294922, 35.822052001953125, 36.87561798095703, 37.92918395996094]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 8.0, 19.0, 33.0, 42.0, 60.0, 109.0, 129.0, 240.0, 344.0, 443.0, 745.0, 1160.0, 1784.0, 2647.0, 4146.0, 5921.0, 9197.0, 14011.0, 21529.0, 33713.0, 53025.0, 85966.0, 140043.0, 231499.0, 387524.0, 602939.0, 751853.0, 674090.0, 457785.0, 276790.0, 164138.0, 99269.0, 61242.0, 38505.0, 24784.0, 16079.0, 10701.0, 6987.0, 4654.0, 3165.0, 2173.0, 1447.0, 1049.0, 714.0, 494.0, 341.0, 230.0, 155.0, 97.0, 80.0, 55.0, 43.0, 36.0, 17.0, 16.0, 7.0, 5.0, 6.0, 6.0, 2.0, 2.0], "bins": [-25.453125, -24.595458984375, -23.73779296875, -22.880126953125, -22.0224609375, -21.164794921875, -20.30712890625, -19.449462890625, -18.591796875, -17.734130859375, -16.87646484375, -16.018798828125, -15.1611328125, -14.303466796875, -13.44580078125, -12.588134765625, -11.73046875, -10.872802734375, -10.01513671875, -9.157470703125, -8.2998046875, -7.442138671875, -6.58447265625, -5.726806640625, -4.869140625, -4.011474609375, -3.15380859375, -2.296142578125, -1.4384765625, -0.580810546875, 0.27685546875, 1.134521484375, 1.9921875, 2.849853515625, 3.70751953125, 4.565185546875, 5.4228515625, 6.280517578125, 7.13818359375, 7.995849609375, 8.853515625, 9.711181640625, 10.56884765625, 11.426513671875, 12.2841796875, 13.141845703125, 13.99951171875, 14.857177734375, 15.71484375, 16.572509765625, 17.43017578125, 18.287841796875, 19.1455078125, 20.003173828125, 20.86083984375, 21.718505859375, 22.576171875, 23.433837890625, 24.29150390625, 25.149169921875, 26.0068359375, 26.864501953125, 27.72216796875, 28.579833984375, 29.4375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 3.0, 11.0, 7.0, 5.0, 16.0, 17.0, 25.0, 25.0, 20.0, 32.0, 33.0, 29.0, 43.0, 45.0, 36.0, 39.0, 42.0, 45.0, 51.0, 50.0, 45.0, 38.0, 30.0, 33.0, 37.0, 36.0, 23.0, 35.0, 10.0, 23.0, 20.0, 14.0, 13.0, 9.0, 12.0, 11.0, 3.0, 6.0, 1.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-29.421875, -28.424072265625, -27.42626953125, -26.428466796875, -25.4306640625, -24.432861328125, -23.43505859375, -22.437255859375, -21.439453125, -20.441650390625, -19.44384765625, -18.446044921875, -17.4482421875, -16.450439453125, -15.45263671875, -14.454833984375, -13.45703125, -12.459228515625, -11.46142578125, -10.463623046875, -9.4658203125, -8.468017578125, -7.47021484375, -6.472412109375, -5.474609375, -4.476806640625, -3.47900390625, -2.481201171875, -1.4833984375, -0.485595703125, 0.51220703125, 1.510009765625, 2.5078125, 3.505615234375, 4.50341796875, 5.501220703125, 6.4990234375, 7.496826171875, 8.49462890625, 9.492431640625, 10.490234375, 11.488037109375, 12.48583984375, 13.483642578125, 14.4814453125, 15.479248046875, 16.47705078125, 17.474853515625, 18.47265625, 19.470458984375, 20.46826171875, 21.466064453125, 22.4638671875, 23.461669921875, 24.45947265625, 25.457275390625, 26.455078125, 27.452880859375, 28.45068359375, 29.448486328125, 30.4462890625, 31.444091796875, 32.44189453125, 33.439697265625, 34.4375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 5.0, 11.0, 16.0, 25.0, 38.0, 69.0, 85.0, 142.0, 203.0, 352.0, 552.0, 797.0, 1379.0, 2267.0, 3768.0, 6469.0, 11216.0, 19880.0, 34230.0, 60751.0, 107077.0, 187620.0, 325644.0, 530464.0, 750123.0, 769835.0, 562413.0, 347648.0, 203121.0, 115091.0, 65133.0, 36953.0, 21069.0, 12217.0, 7046.0, 4171.0, 2419.0, 1541.0, 912.0, 563.0, 378.0, 209.0, 136.0, 94.0, 62.0, 33.0, 22.0, 15.0, 8.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-37.96875, -36.78466796875, -35.6005859375, -34.41650390625, -33.232421875, -32.04833984375, -30.8642578125, -29.68017578125, -28.49609375, -27.31201171875, -26.1279296875, -24.94384765625, -23.759765625, -22.57568359375, -21.3916015625, -20.20751953125, -19.0234375, -17.83935546875, -16.6552734375, -15.47119140625, -14.287109375, -13.10302734375, -11.9189453125, -10.73486328125, -9.55078125, -8.36669921875, -7.1826171875, -5.99853515625, -4.814453125, -3.63037109375, -2.4462890625, -1.26220703125, -0.078125, 1.10595703125, 2.2900390625, 3.47412109375, 4.658203125, 5.84228515625, 7.0263671875, 8.21044921875, 9.39453125, 10.57861328125, 11.7626953125, 12.94677734375, 14.130859375, 15.31494140625, 16.4990234375, 17.68310546875, 18.8671875, 20.05126953125, 21.2353515625, 22.41943359375, 23.603515625, 24.78759765625, 25.9716796875, 27.15576171875, 28.33984375, 29.52392578125, 30.7080078125, 31.89208984375, 33.076171875, 34.26025390625, 35.4443359375, 36.62841796875, 37.8125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 12.0, 12.0, 20.0, 24.0, 31.0, 43.0, 42.0, 58.0, 79.0, 105.0, 88.0, 126.0, 139.0, 193.0, 220.0, 198.0, 256.0, 241.0, 275.0, 226.0, 260.0, 228.0, 168.0, 152.0, 157.0, 122.0, 121.0, 90.0, 66.0, 52.0, 59.0, 34.0, 33.0, 29.0, 19.0, 16.0, 14.0, 16.0, 6.0, 6.0, 6.0, 9.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-17.265625, -16.7314453125, -16.197265625, -15.6630859375, -15.12890625, -14.5947265625, -14.060546875, -13.5263671875, -12.9921875, -12.4580078125, -11.923828125, -11.3896484375, -10.85546875, -10.3212890625, -9.787109375, -9.2529296875, -8.71875, -8.1845703125, -7.650390625, -7.1162109375, -6.58203125, -6.0478515625, -5.513671875, -4.9794921875, -4.4453125, -3.9111328125, -3.376953125, -2.8427734375, -2.30859375, -1.7744140625, -1.240234375, -0.7060546875, -0.171875, 0.3623046875, 0.896484375, 1.4306640625, 1.96484375, 2.4990234375, 3.033203125, 3.5673828125, 4.1015625, 4.6357421875, 5.169921875, 5.7041015625, 6.23828125, 6.7724609375, 7.306640625, 7.8408203125, 8.375, 8.9091796875, 9.443359375, 9.9775390625, 10.51171875, 11.0458984375, 11.580078125, 12.1142578125, 12.6484375, 13.1826171875, 13.716796875, 14.2509765625, 14.78515625, 15.3193359375, 15.853515625, 16.3876953125, 16.921875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 11.0, 7.0, 12.0, 12.0, 18.0, 17.0, 23.0, 28.0, 30.0, 35.0, 45.0, 43.0, 53.0, 62.0, 56.0, 69.0, 65.0, 64.0, 44.0, 59.0, 38.0, 43.0, 26.0, 25.0, 17.0, 18.0, 14.0, 12.0, 11.0, 13.0, 11.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.579036712646484, -32.98521041870117, -31.391386032104492, -29.79755973815918, -28.2037353515625, -26.609909057617188, -25.016082763671875, -23.422256469726562, -21.828432083129883, -20.23460578918457, -18.64078140258789, -17.046955108642578, -15.453129768371582, -13.859304428100586, -12.265478134155273, -10.671652793884277, -9.077827453613281, -7.484002113342285, -5.890176296234131, -4.296350479125977, -2.7025251388549805, -1.1086997985839844, 0.4851264953613281, 2.078951835632324, 3.6727771759033203, 5.266602516174316, 6.860428333282471, 8.454254150390625, 10.048079490661621, 11.641904830932617, 13.23573112487793, 14.829556465148926, 16.423377990722656, 18.01720428466797, 19.61102867126465, 21.20485496520996, 22.79867935180664, 24.392505645751953, 25.986331939697266, 27.580158233642578, 29.173982620239258, 30.76780891418457, 32.36163330078125, 33.95545959472656, 35.549285888671875, 37.14311218261719, 38.7369384765625, 40.33076095581055, 41.92458724975586, 43.51841354370117, 45.112239837646484, 46.70606231689453, 48.299888610839844, 49.893714904785156, 51.48754119873047, 53.08136749267578, 54.675193786621094, 56.269020080566406, 57.86284637451172, 59.45667266845703, 61.05049514770508, 62.64432144165039, 64.23814392089844, 65.83197021484375, 67.42579650878906]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 9.0, 5.0, 9.0, 16.0, 10.0, 26.0, 16.0, 26.0, 22.0, 34.0, 35.0, 43.0, 28.0, 34.0, 41.0, 38.0, 37.0, 42.0, 35.0, 48.0, 44.0, 38.0, 31.0, 27.0, 37.0, 33.0, 29.0, 27.0, 26.0, 13.0, 25.0, 10.0, 15.0, 13.0, 19.0, 7.0, 7.0, 3.0, 4.0, 10.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-48.175655364990234, -46.591129302978516, -45.00659942626953, -43.42207336425781, -41.837547302246094, -40.253021240234375, -38.66849136352539, -37.08396530151367, -35.49943542480469, -33.91490936279297, -32.330379486083984, -30.745853424072266, -29.161327362060547, -27.576799392700195, -25.992271423339844, -24.407745361328125, -22.823219299316406, -21.238691329956055, -19.654165267944336, -18.069637298583984, -16.485111236572266, -14.900583267211914, -13.316055297851562, -11.731528282165527, -10.147001266479492, -8.562474250793457, -6.977946758270264, -5.39341926574707, -3.808892250061035, -2.224365234375, -0.6398372650146484, 0.9446897506713867, 2.5292205810546875, 4.113747596740723, 5.698275089263916, 7.282802581787109, 8.867329597473145, 10.45185661315918, 12.036384582519531, 13.620911598205566, 15.205438613891602, 16.789966583251953, 18.374492645263672, 19.959020614624023, 21.543548583984375, 23.128074645996094, 24.712602615356445, 26.297130584716797, 27.881656646728516, 29.466184616088867, 31.050710678100586, 32.63523864746094, 34.219764709472656, 35.804290771484375, 37.38882064819336, 38.97334671020508, 40.55787658691406, 42.14240264892578, 43.726932525634766, 45.311458587646484, 46.8959846496582, 48.48051452636719, 50.065040588378906, 51.649566650390625, 53.234092712402344]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 8.0, 12.0, 18.0, 31.0, 42.0, 58.0, 92.0, 131.0, 220.0, 323.0, 509.0, 774.0, 1200.0, 1945.0, 3119.0, 5195.0, 8971.0, 15677.0, 28763.0, 55496.0, 113707.0, 239219.0, 282546.0, 142091.0, 68484.0, 35064.0, 18673.0, 10369.0, 6057.0, 3671.0, 2157.0, 1406.0, 871.0, 573.0, 343.0, 255.0, 162.0, 101.0, 64.0, 52.0, 38.0, 20.0, 12.0, 11.0, 9.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.5625, -9.282470703125, -9.00244140625, -8.722412109375, -8.4423828125, -8.162353515625, -7.88232421875, -7.602294921875, -7.322265625, -7.042236328125, -6.76220703125, -6.482177734375, -6.2021484375, -5.922119140625, -5.64208984375, -5.362060546875, -5.08203125, -4.802001953125, -4.52197265625, -4.241943359375, -3.9619140625, -3.681884765625, -3.40185546875, -3.121826171875, -2.841796875, -2.561767578125, -2.28173828125, -2.001708984375, -1.7216796875, -1.441650390625, -1.16162109375, -0.881591796875, -0.6015625, -0.321533203125, -0.04150390625, 0.238525390625, 0.5185546875, 0.798583984375, 1.07861328125, 1.358642578125, 1.638671875, 1.918701171875, 2.19873046875, 2.478759765625, 2.7587890625, 3.038818359375, 3.31884765625, 3.598876953125, 3.87890625, 4.158935546875, 4.43896484375, 4.718994140625, 4.9990234375, 5.279052734375, 5.55908203125, 5.839111328125, 6.119140625, 6.399169921875, 6.67919921875, 6.959228515625, 7.2392578125, 7.519287109375, 7.79931640625, 8.079345703125, 8.359375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 6.0, 5.0, 12.0, 8.0, 9.0, 14.0, 13.0, 18.0, 27.0, 24.0, 28.0, 36.0, 41.0, 40.0, 35.0, 40.0, 38.0, 47.0, 34.0, 47.0, 46.0, 48.0, 30.0, 39.0, 35.0, 31.0, 36.0, 17.0, 32.0, 30.0, 24.0, 12.0, 12.0, 14.0, 9.0, 9.0, 10.0, 10.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.46875, -49.7666015625, -48.064453125, -46.3623046875, -44.66015625, -42.9580078125, -41.255859375, -39.5537109375, -37.8515625, -36.1494140625, -34.447265625, -32.7451171875, -31.04296875, -29.3408203125, -27.638671875, -25.9365234375, -24.234375, -22.5322265625, -20.830078125, -19.1279296875, -17.42578125, -15.7236328125, -14.021484375, -12.3193359375, -10.6171875, -8.9150390625, -7.212890625, -5.5107421875, -3.80859375, -2.1064453125, -0.404296875, 1.2978515625, 3.0, 4.7021484375, 6.404296875, 8.1064453125, 9.80859375, 11.5107421875, 13.212890625, 14.9150390625, 16.6171875, 18.3193359375, 20.021484375, 21.7236328125, 23.42578125, 25.1279296875, 26.830078125, 28.5322265625, 30.234375, 31.9365234375, 33.638671875, 35.3408203125, 37.04296875, 38.7451171875, 40.447265625, 42.1494140625, 43.8515625, 45.5537109375, 47.255859375, 48.9580078125, 50.66015625, 52.3623046875, 54.064453125, 55.7666015625, 57.46875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 10.0, 13.0, 27.0, 33.0, 40.0, 74.0, 120.0, 204.0, 309.0, 559.0, 1003.0, 1686.0, 2944.0, 5320.0, 9568.0, 17802.0, 33399.0, 65146.0, 128403.0, 259244.0, 258323.0, 127219.0, 64251.0, 33471.0, 17614.0, 9506.0, 5298.0, 2874.0, 1706.0, 943.0, 564.0, 335.0, 184.0, 134.0, 82.0, 52.0, 32.0, 14.0, 9.0, 11.0, 8.0, 5.0, 7.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.6171875, -8.36370849609375, -8.1102294921875, -7.85675048828125, -7.603271484375, -7.34979248046875, -7.0963134765625, -6.84283447265625, -6.58935546875, -6.33587646484375, -6.0823974609375, -5.82891845703125, -5.575439453125, -5.32196044921875, -5.0684814453125, -4.81500244140625, -4.5615234375, -4.30804443359375, -4.0545654296875, -3.80108642578125, -3.547607421875, -3.29412841796875, -3.0406494140625, -2.78717041015625, -2.53369140625, -2.28021240234375, -2.0267333984375, -1.77325439453125, -1.519775390625, -1.26629638671875, -1.0128173828125, -0.75933837890625, -0.505859375, -0.25238037109375, 0.0010986328125, 0.25457763671875, 0.508056640625, 0.76153564453125, 1.0150146484375, 1.26849365234375, 1.52197265625, 1.77545166015625, 2.0289306640625, 2.28240966796875, 2.535888671875, 2.78936767578125, 3.0428466796875, 3.29632568359375, 3.5498046875, 3.80328369140625, 4.0567626953125, 4.31024169921875, 4.563720703125, 4.81719970703125, 5.0706787109375, 5.32415771484375, 5.57763671875, 5.83111572265625, 6.0845947265625, 6.33807373046875, 6.591552734375, 6.84503173828125, 7.0985107421875, 7.35198974609375, 7.60546875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 7.0, 20.0, 16.0, 15.0, 17.0, 26.0, 23.0, 29.0, 43.0, 47.0, 37.0, 35.0, 48.0, 51.0, 46.0, 43.0, 41.0, 54.0, 47.0, 36.0, 31.0, 32.0, 36.0, 34.0, 24.0, 27.0, 15.0, 13.0, 13.0, 15.0, 9.0, 11.0, 4.0, 7.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.75, -27.74462890625, -26.7392578125, -25.73388671875, -24.728515625, -23.72314453125, -22.7177734375, -21.71240234375, -20.70703125, -19.70166015625, -18.6962890625, -17.69091796875, -16.685546875, -15.68017578125, -14.6748046875, -13.66943359375, -12.6640625, -11.65869140625, -10.6533203125, -9.64794921875, -8.642578125, -7.63720703125, -6.6318359375, -5.62646484375, -4.62109375, -3.61572265625, -2.6103515625, -1.60498046875, -0.599609375, 0.40576171875, 1.4111328125, 2.41650390625, 3.421875, 4.42724609375, 5.4326171875, 6.43798828125, 7.443359375, 8.44873046875, 9.4541015625, 10.45947265625, 11.46484375, 12.47021484375, 13.4755859375, 14.48095703125, 15.486328125, 16.49169921875, 17.4970703125, 18.50244140625, 19.5078125, 20.51318359375, 21.5185546875, 22.52392578125, 23.529296875, 24.53466796875, 25.5400390625, 26.54541015625, 27.55078125, 28.55615234375, 29.5615234375, 30.56689453125, 31.572265625, 32.57763671875, 33.5830078125, 34.58837890625, 35.59375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 5.0, 7.0, 8.0, 19.0, 15.0, 17.0, 41.0, 36.0, 78.0, 82.0, 130.0, 185.0, 312.0, 439.0, 687.0, 1055.0, 1750.0, 3015.0, 5976.0, 13951.0, 49767.0, 471314.0, 426221.0, 46326.0, 13598.0, 5647.0, 3067.0, 1723.0, 1088.0, 669.0, 445.0, 251.0, 202.0, 119.0, 104.0, 46.0, 47.0, 38.0, 23.0, 20.0, 8.0, 9.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.5166015625, -1.4719696044921875, -1.427337646484375, -1.3827056884765625, -1.33807373046875, -1.2934417724609375, -1.248809814453125, -1.2041778564453125, -1.1595458984375, -1.1149139404296875, -1.070281982421875, -1.0256500244140625, -0.98101806640625, -0.9363861083984375, -0.891754150390625, -0.8471221923828125, -0.802490234375, -0.7578582763671875, -0.713226318359375, -0.6685943603515625, -0.62396240234375, -0.5793304443359375, -0.534698486328125, -0.4900665283203125, -0.4454345703125, -0.4008026123046875, -0.356170654296875, -0.3115386962890625, -0.26690673828125, -0.2222747802734375, -0.177642822265625, -0.1330108642578125, -0.08837890625, -0.0437469482421875, 0.000885009765625, 0.0455169677734375, 0.09014892578125, 0.1347808837890625, 0.179412841796875, 0.2240447998046875, 0.2686767578125, 0.3133087158203125, 0.357940673828125, 0.4025726318359375, 0.44720458984375, 0.4918365478515625, 0.536468505859375, 0.5811004638671875, 0.625732421875, 0.6703643798828125, 0.714996337890625, 0.7596282958984375, 0.80426025390625, 0.8488922119140625, 0.893524169921875, 0.9381561279296875, 0.9827880859375, 1.0274200439453125, 1.072052001953125, 1.1166839599609375, 1.16131591796875, 1.2059478759765625, 1.250579833984375, 1.2952117919921875, 1.33984375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 12.0, 15.0, 35.0, 53.0, 93.0, 146.0, 170.0, 173.0, 103.0, 75.0, 36.0, 20.0, 14.0, 7.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013446807861328125, -0.00013023801147937775, -0.00012600794434547424, -0.00012177787721157074, -0.00011754781007766724, -0.00011331774294376373, -0.00010908767580986023, -0.00010485760867595673, -0.00010062754154205322, -9.639747440814972e-05, -9.216740727424622e-05, -8.793734014034271e-05, -8.370727300643921e-05, -7.94772058725357e-05, -7.52471387386322e-05, -7.10170716047287e-05, -6.67870044708252e-05, -6.255693733692169e-05, -5.832687020301819e-05, -5.4096803069114685e-05, -4.986673593521118e-05, -4.563666880130768e-05, -4.1406601667404175e-05, -3.717653453350067e-05, -3.294646739959717e-05, -2.8716400265693665e-05, -2.448633313179016e-05, -2.0256265997886658e-05, -1.6026198863983154e-05, -1.1796131730079651e-05, -7.5660645961761475e-06, -3.335997462272644e-06, 8.940696716308594e-07, 5.124136805534363e-06, 9.354203939437866e-06, 1.358427107334137e-05, 1.7814338207244873e-05, 2.2044405341148376e-05, 2.627447247505188e-05, 3.0504539608955383e-05, 3.473460674285889e-05, 3.896467387676239e-05, 4.3194741010665894e-05, 4.74248081445694e-05, 5.16548752784729e-05, 5.5884942412376404e-05, 6.011500954627991e-05, 6.434507668018341e-05, 6.857514381408691e-05, 7.280521094799042e-05, 7.703527808189392e-05, 8.126534521579742e-05, 8.549541234970093e-05, 8.972547948360443e-05, 9.395554661750793e-05, 9.818561375141144e-05, 0.00010241568088531494, 0.00010664574801921844, 0.00011087581515312195, 0.00011510588228702545, 0.00011933594942092896, 0.00012356601655483246, 0.00012779608368873596, 0.00013202615082263947, 0.00013625621795654297]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 4.0, 15.0, 24.0, 42.0, 60.0, 87.0, 111.0, 205.0, 311.0, 452.0, 730.0, 1119.0, 1622.0, 2669.0, 4634.0, 8160.0, 16459.0, 41143.0, 183896.0, 601536.0, 120891.0, 32492.0, 13908.0, 7130.0, 4171.0, 2399.0, 1507.0, 928.0, 615.0, 421.0, 268.0, 194.0, 131.0, 72.0, 54.0, 43.0, 23.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7197265625, -1.6666259765625, -1.613525390625, -1.5604248046875, -1.50732421875, -1.4542236328125, -1.401123046875, -1.3480224609375, -1.294921875, -1.2418212890625, -1.188720703125, -1.1356201171875, -1.08251953125, -1.0294189453125, -0.976318359375, -0.9232177734375, -0.8701171875, -0.8170166015625, -0.763916015625, -0.7108154296875, -0.65771484375, -0.6046142578125, -0.551513671875, -0.4984130859375, -0.4453125, -0.3922119140625, -0.339111328125, -0.2860107421875, -0.23291015625, -0.1798095703125, -0.126708984375, -0.0736083984375, -0.0205078125, 0.0325927734375, 0.085693359375, 0.1387939453125, 0.19189453125, 0.2449951171875, 0.298095703125, 0.3511962890625, 0.404296875, 0.4573974609375, 0.510498046875, 0.5635986328125, 0.61669921875, 0.6697998046875, 0.722900390625, 0.7760009765625, 0.8291015625, 0.8822021484375, 0.935302734375, 0.9884033203125, 1.04150390625, 1.0946044921875, 1.147705078125, 1.2008056640625, 1.25390625, 1.3070068359375, 1.360107421875, 1.4132080078125, 1.46630859375, 1.5194091796875, 1.572509765625, 1.6256103515625, 1.6787109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 7.0, 6.0, 6.0, 13.0, 10.0, 15.0, 20.0, 28.0, 31.0, 32.0, 72.0, 88.0, 148.0, 157.0, 98.0, 64.0, 37.0, 36.0, 26.0, 19.0, 11.0, 7.0, 7.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.346435546875, -0.33527374267578125, -0.3241119384765625, -0.31295013427734375, -0.301788330078125, -0.29062652587890625, -0.2794647216796875, -0.26830291748046875, -0.25714111328125, -0.24597930908203125, -0.2348175048828125, -0.22365570068359375, -0.212493896484375, -0.20133209228515625, -0.1901702880859375, -0.17900848388671875, -0.1678466796875, -0.15668487548828125, -0.1455230712890625, -0.13436126708984375, -0.123199462890625, -0.11203765869140625, -0.1008758544921875, -0.08971405029296875, -0.07855224609375, -0.06739044189453125, -0.0562286376953125, -0.04506683349609375, -0.033905029296875, -0.02274322509765625, -0.0115814208984375, -0.00041961669921875, 0.0107421875, 0.02190399169921875, 0.0330657958984375, 0.04422760009765625, 0.055389404296875, 0.06655120849609375, 0.0777130126953125, 0.08887481689453125, 0.10003662109375, 0.11119842529296875, 0.1223602294921875, 0.13352203369140625, 0.144683837890625, 0.15584564208984375, 0.1670074462890625, 0.17816925048828125, 0.1893310546875, 0.20049285888671875, 0.2116546630859375, 0.22281646728515625, 0.233978271484375, 0.24514007568359375, 0.2563018798828125, 0.26746368408203125, 0.27862548828125, 0.28978729248046875, 0.3009490966796875, 0.31211090087890625, 0.323272705078125, 0.33443450927734375, 0.3455963134765625, 0.35675811767578125, 0.367919921875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 7.0, 10.0, 10.0, 14.0, 17.0, 18.0, 23.0, 28.0, 27.0, 31.0, 46.0, 51.0, 55.0, 57.0, 54.0, 73.0, 56.0, 70.0, 49.0, 56.0, 33.0, 44.0, 29.0, 24.0, 19.0, 18.0, 12.0, 15.0, 8.0, 11.0, 13.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.03831100463867, -33.42974090576172, -31.821170806884766, -30.212602615356445, -28.604032516479492, -26.99546241760254, -25.38689422607422, -23.778324127197266, -22.169754028320312, -20.56118392944336, -18.952613830566406, -17.344045639038086, -15.735475540161133, -14.12690544128418, -12.518336296081543, -10.909767150878906, -9.301197052001953, -7.692627429962158, -6.084057807922363, -4.475488185882568, -2.8669185638427734, -1.2583484649658203, 0.3502206802368164, 1.9587898254394531, 3.5673599243164062, 5.175929546356201, 6.784499168395996, 8.393068313598633, 10.001638412475586, 11.610208511352539, 13.218777656555176, 14.827346801757812, 16.4359130859375, 18.044483184814453, 19.653053283691406, 21.261621475219727, 22.87019157409668, 24.478761672973633, 26.087329864501953, 27.695899963378906, 29.30447006225586, 30.913040161132812, 32.521610260009766, 34.13018035888672, 35.738746643066406, 37.347320556640625, 38.95588684082031, 40.564456939697266, 42.17302703857422, 43.78159713745117, 45.390167236328125, 46.99873733520508, 48.60730743408203, 50.21587371826172, 51.82444381713867, 53.433013916015625, 55.04158401489258, 56.65015411376953, 58.258724212646484, 59.86729431152344, 61.475860595703125, 63.084434509277344, 64.69300079345703, 66.30157470703125, 67.91014099121094]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 2.0, 10.0, 7.0, 8.0, 16.0, 9.0, 26.0, 17.0, 21.0, 27.0, 30.0, 39.0, 40.0, 29.0, 33.0, 41.0, 35.0, 42.0, 38.0, 38.0, 45.0, 45.0, 40.0, 33.0, 26.0, 37.0, 35.0, 27.0, 28.0, 28.0, 11.0, 26.0, 6.0, 19.0, 13.0, 19.0, 7.0, 7.0, 3.0, 3.0, 11.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-48.702945709228516, -47.10239791870117, -45.50185012817383, -43.901302337646484, -42.30075454711914, -40.7002067565918, -39.09965515136719, -37.499107360839844, -35.8985595703125, -34.298011779785156, -32.69746398925781, -31.09691619873047, -29.496368408203125, -27.89582061767578, -26.295270919799805, -24.69472312927246, -23.09417724609375, -21.493629455566406, -19.893081665039062, -18.29253387451172, -16.691986083984375, -15.091437339782715, -13.490888595581055, -11.890340805053711, -10.289793014526367, -8.689245223999023, -7.0886969566345215, -5.4881486892700195, -3.887600898742676, -2.287053108215332, -0.6865043640136719, 0.9140434265136719, 2.51458740234375, 4.115135192871094, 5.715683460235596, 7.316231727600098, 8.916779518127441, 10.517327308654785, 12.117876052856445, 13.718423843383789, 15.318971633911133, 16.919519424438477, 18.52006721496582, 20.120616912841797, 21.72116470336914, 23.321712493896484, 24.922260284423828, 26.522808074951172, 28.123355865478516, 29.72390365600586, 31.324451446533203, 32.92499923706055, 34.52554702758789, 36.126094818115234, 37.726646423339844, 39.32719421386719, 40.92774200439453, 42.528289794921875, 44.12883758544922, 45.72938537597656, 47.329933166503906, 48.93048095703125, 50.531028747558594, 52.13157653808594, 53.73212432861328]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 5.0, 16.0, 16.0, 44.0, 49.0, 95.0, 145.0, 251.0, 352.0, 598.0, 887.0, 1605.0, 2511.0, 4035.0, 7163.0, 12396.0, 23003.0, 46001.0, 105415.0, 257186.0, 311855.0, 148046.0, 60971.0, 29161.0, 15354.0, 8556.0, 4976.0, 2968.0, 1798.0, 1144.0, 734.0, 439.0, 272.0, 179.0, 130.0, 73.0, 40.0, 24.0, 18.0, 10.0, 14.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-71.5625, -69.5283203125, -67.494140625, -65.4599609375, -63.42578125, -61.3916015625, -59.357421875, -57.3232421875, -55.2890625, -53.2548828125, -51.220703125, -49.1865234375, -47.15234375, -45.1181640625, -43.083984375, -41.0498046875, -39.015625, -36.9814453125, -34.947265625, -32.9130859375, -30.87890625, -28.8447265625, -26.810546875, -24.7763671875, -22.7421875, -20.7080078125, -18.673828125, -16.6396484375, -14.60546875, -12.5712890625, -10.537109375, -8.5029296875, -6.46875, -4.4345703125, -2.400390625, -0.3662109375, 1.66796875, 3.7021484375, 5.736328125, 7.7705078125, 9.8046875, 11.8388671875, 13.873046875, 15.9072265625, 17.94140625, 19.9755859375, 22.009765625, 24.0439453125, 26.078125, 28.1123046875, 30.146484375, 32.1806640625, 34.21484375, 36.2490234375, 38.283203125, 40.3173828125, 42.3515625, 44.3857421875, 46.419921875, 48.4541015625, 50.48828125, 52.5224609375, 54.556640625, 56.5908203125, 58.625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 9.0, 4.0, 10.0, 20.0, 17.0, 27.0, 21.0, 36.0, 35.0, 44.0, 43.0, 29.0, 53.0, 52.0, 50.0, 45.0, 48.0, 48.0, 43.0, 30.0, 44.0, 45.0, 35.0, 35.0, 26.0, 25.0, 23.0, 13.0, 13.0, 13.0, 12.0, 8.0, 5.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-67.1875, -65.263671875, -63.33984375, -61.416015625, -59.4921875, -57.568359375, -55.64453125, -53.720703125, -51.796875, -49.873046875, -47.94921875, -46.025390625, -44.1015625, -42.177734375, -40.25390625, -38.330078125, -36.40625, -34.482421875, -32.55859375, -30.634765625, -28.7109375, -26.787109375, -24.86328125, -22.939453125, -21.015625, -19.091796875, -17.16796875, -15.244140625, -13.3203125, -11.396484375, -9.47265625, -7.548828125, -5.625, -3.701171875, -1.77734375, 0.146484375, 2.0703125, 3.994140625, 5.91796875, 7.841796875, 9.765625, 11.689453125, 13.61328125, 15.537109375, 17.4609375, 19.384765625, 21.30859375, 23.232421875, 25.15625, 27.080078125, 29.00390625, 30.927734375, 32.8515625, 34.775390625, 36.69921875, 38.623046875, 40.546875, 42.470703125, 44.39453125, 46.318359375, 48.2421875, 50.166015625, 52.08984375, 54.013671875, 55.9375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 11.0, 17.0, 10.0, 21.0, 27.0, 33.0, 65.0, 83.0, 153.0, 174.0, 313.0, 459.0, 630.0, 1033.0, 1565.0, 2449.0, 3760.0, 5861.0, 9006.0, 13662.0, 21424.0, 34564.0, 60103.0, 115351.0, 233102.0, 250352.0, 127850.0, 64963.0, 37313.0, 22796.0, 14371.0, 9246.0, 6179.0, 4037.0, 2605.0, 1700.0, 1053.0, 737.0, 481.0, 325.0, 223.0, 133.0, 92.0, 68.0, 57.0, 34.0, 32.0, 11.0, 10.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-73.25, -70.9658203125, -68.681640625, -66.3974609375, -64.11328125, -61.8291015625, -59.544921875, -57.2607421875, -54.9765625, -52.6923828125, -50.408203125, -48.1240234375, -45.83984375, -43.5556640625, -41.271484375, -38.9873046875, -36.703125, -34.4189453125, -32.134765625, -29.8505859375, -27.56640625, -25.2822265625, -22.998046875, -20.7138671875, -18.4296875, -16.1455078125, -13.861328125, -11.5771484375, -9.29296875, -7.0087890625, -4.724609375, -2.4404296875, -0.15625, 2.1279296875, 4.412109375, 6.6962890625, 8.98046875, 11.2646484375, 13.548828125, 15.8330078125, 18.1171875, 20.4013671875, 22.685546875, 24.9697265625, 27.25390625, 29.5380859375, 31.822265625, 34.1064453125, 36.390625, 38.6748046875, 40.958984375, 43.2431640625, 45.52734375, 47.8115234375, 50.095703125, 52.3798828125, 54.6640625, 56.9482421875, 59.232421875, 61.5166015625, 63.80078125, 66.0849609375, 68.369140625, 70.6533203125, 72.9375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 8.0, 11.0, 16.0, 13.0, 15.0, 20.0, 17.0, 18.0, 18.0, 21.0, 23.0, 29.0, 34.0, 29.0, 27.0, 35.0, 34.0, 44.0, 48.0, 40.0, 25.0, 40.0, 36.0, 35.0, 42.0, 34.0, 34.0, 29.0, 31.0, 21.0, 30.0, 18.0, 16.0, 10.0, 16.0, 11.0, 11.0, 9.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.4375, -31.434814453125, -30.43212890625, -29.429443359375, -28.4267578125, -27.424072265625, -26.42138671875, -25.418701171875, -24.416015625, -23.413330078125, -22.41064453125, -21.407958984375, -20.4052734375, -19.402587890625, -18.39990234375, -17.397216796875, -16.39453125, -15.391845703125, -14.38916015625, -13.386474609375, -12.3837890625, -11.381103515625, -10.37841796875, -9.375732421875, -8.373046875, -7.370361328125, -6.36767578125, -5.364990234375, -4.3623046875, -3.359619140625, -2.35693359375, -1.354248046875, -0.3515625, 0.651123046875, 1.65380859375, 2.656494140625, 3.6591796875, 4.661865234375, 5.66455078125, 6.667236328125, 7.669921875, 8.672607421875, 9.67529296875, 10.677978515625, 11.6806640625, 12.683349609375, 13.68603515625, 14.688720703125, 15.69140625, 16.694091796875, 17.69677734375, 18.699462890625, 19.7021484375, 20.704833984375, 21.70751953125, 22.710205078125, 23.712890625, 24.715576171875, 25.71826171875, 26.720947265625, 27.7236328125, 28.726318359375, 29.72900390625, 30.731689453125, 31.734375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 9.0, 28.0, 28.0, 45.0, 66.0, 116.0, 165.0, 243.0, 457.0, 718.0, 1083.0, 1757.0, 2857.0, 4704.0, 7818.0, 12775.0, 20094.0, 32222.0, 48957.0, 70768.0, 94843.0, 116598.0, 128030.0, 126179.0, 110582.0, 87198.0, 63612.0, 43112.0, 27985.0, 17569.0, 10827.0, 6664.0, 4033.0, 2452.0, 1462.0, 906.0, 568.0, 399.0, 231.0, 141.0, 82.0, 56.0, 41.0, 23.0, 11.0, 12.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.328125, -6.12939453125, -5.9306640625, -5.73193359375, -5.533203125, -5.33447265625, -5.1357421875, -4.93701171875, -4.73828125, -4.53955078125, -4.3408203125, -4.14208984375, -3.943359375, -3.74462890625, -3.5458984375, -3.34716796875, -3.1484375, -2.94970703125, -2.7509765625, -2.55224609375, -2.353515625, -2.15478515625, -1.9560546875, -1.75732421875, -1.55859375, -1.35986328125, -1.1611328125, -0.96240234375, -0.763671875, -0.56494140625, -0.3662109375, -0.16748046875, 0.03125, 0.22998046875, 0.4287109375, 0.62744140625, 0.826171875, 1.02490234375, 1.2236328125, 1.42236328125, 1.62109375, 1.81982421875, 2.0185546875, 2.21728515625, 2.416015625, 2.61474609375, 2.8134765625, 3.01220703125, 3.2109375, 3.40966796875, 3.6083984375, 3.80712890625, 4.005859375, 4.20458984375, 4.4033203125, 4.60205078125, 4.80078125, 4.99951171875, 5.1982421875, 5.39697265625, 5.595703125, 5.79443359375, 5.9931640625, 6.19189453125, 6.390625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 7.0, 10.0, 18.0, 18.0, 15.0, 28.0, 31.0, 33.0, 30.0, 45.0, 60.0, 55.0, 58.0, 56.0, 69.0, 64.0, 60.0, 41.0, 46.0, 43.0, 39.0, 31.0, 22.0, 22.0, 11.0, 22.0, 12.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011053085327148438, -0.0010730177164077759, -0.001040726900100708, -0.0010084360837936401, -0.0009761452674865723, -0.0009438544511795044, -0.0009115636348724365, -0.0008792728185653687, -0.0008469820022583008, -0.0008146911859512329, -0.000782400369644165, -0.0007501095533370972, -0.0007178187370300293, -0.0006855279207229614, -0.0006532371044158936, -0.0006209462881088257, -0.0005886554718017578, -0.0005563646554946899, -0.0005240738391876221, -0.0004917830228805542, -0.00045949220657348633, -0.00042720139026641846, -0.0003949105739593506, -0.0003626197576522827, -0.00033032894134521484, -0.00029803812503814697, -0.0002657473087310791, -0.00023345649242401123, -0.00020116567611694336, -0.0001688748598098755, -0.00013658404350280762, -0.00010429322719573975, -7.200241088867188e-05, -3.9711594581604004e-05, -7.420778274536133e-06, 2.4870038032531738e-05, 5.716085433959961e-05, 8.945167064666748e-05, 0.00012174248695373535, 0.00015403330326080322, 0.0001863241195678711, 0.00021861493587493896, 0.00025090575218200684, 0.0002831965684890747, 0.0003154873847961426, 0.00034777820110321045, 0.0003800690174102783, 0.0004123598337173462, 0.00044465065002441406, 0.00047694146633148193, 0.0005092322826385498, 0.0005415230989456177, 0.0005738139152526855, 0.0006061047315597534, 0.0006383955478668213, 0.0006706863641738892, 0.000702977180480957, 0.0007352679967880249, 0.0007675588130950928, 0.0007998496294021606, 0.0008321404457092285, 0.0008644312620162964, 0.0008967220783233643, 0.0009290128946304321, 0.0009613037109375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 14.0, 20.0, 28.0, 49.0, 77.0, 159.0, 224.0, 345.0, 647.0, 970.0, 1702.0, 2769.0, 4661.0, 7734.0, 13078.0, 20955.0, 33458.0, 51111.0, 73577.0, 98134.0, 120041.0, 130109.0, 126177.0, 109181.0, 84652.0, 60859.0, 40681.0, 26124.0, 16241.0, 9917.0, 5907.0, 3595.0, 2110.0, 1287.0, 750.0, 467.0, 290.0, 160.0, 111.0, 68.0, 47.0, 24.0, 20.0, 12.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7109375, -5.51214599609375, -5.3133544921875, -5.11456298828125, -4.915771484375, -4.71697998046875, -4.5181884765625, -4.31939697265625, -4.12060546875, -3.92181396484375, -3.7230224609375, -3.52423095703125, -3.325439453125, -3.12664794921875, -2.9278564453125, -2.72906494140625, -2.5302734375, -2.33148193359375, -2.1326904296875, -1.93389892578125, -1.735107421875, -1.53631591796875, -1.3375244140625, -1.13873291015625, -0.93994140625, -0.74114990234375, -0.5423583984375, -0.34356689453125, -0.144775390625, 0.05401611328125, 0.2528076171875, 0.45159912109375, 0.650390625, 0.84918212890625, 1.0479736328125, 1.24676513671875, 1.445556640625, 1.64434814453125, 1.8431396484375, 2.04193115234375, 2.24072265625, 2.43951416015625, 2.6383056640625, 2.83709716796875, 3.035888671875, 3.23468017578125, 3.4334716796875, 3.63226318359375, 3.8310546875, 4.02984619140625, 4.2286376953125, 4.42742919921875, 4.626220703125, 4.82501220703125, 5.0238037109375, 5.22259521484375, 5.42138671875, 5.62017822265625, 5.8189697265625, 6.01776123046875, 6.216552734375, 6.41534423828125, 6.6141357421875, 6.81292724609375, 7.01171875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 8.0, 4.0, 8.0, 5.0, 12.0, 12.0, 15.0, 20.0, 19.0, 18.0, 21.0, 26.0, 23.0, 29.0, 46.0, 45.0, 26.0, 40.0, 36.0, 37.0, 41.0, 34.0, 38.0, 30.0, 39.0, 45.0, 38.0, 27.0, 38.0, 26.0, 26.0, 20.0, 20.0, 20.0, 16.0, 19.0, 12.0, 12.0, 10.0, 10.0, 6.0, 3.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8818359375, -1.8214111328125, -1.760986328125, -1.7005615234375, -1.64013671875, -1.5797119140625, -1.519287109375, -1.4588623046875, -1.3984375, -1.3380126953125, -1.277587890625, -1.2171630859375, -1.15673828125, -1.0963134765625, -1.035888671875, -0.9754638671875, -0.9150390625, -0.8546142578125, -0.794189453125, -0.7337646484375, -0.67333984375, -0.6129150390625, -0.552490234375, -0.4920654296875, -0.431640625, -0.3712158203125, -0.310791015625, -0.2503662109375, -0.18994140625, -0.1295166015625, -0.069091796875, -0.0086669921875, 0.0517578125, 0.1121826171875, 0.172607421875, 0.2330322265625, 0.29345703125, 0.3538818359375, 0.414306640625, 0.4747314453125, 0.53515625, 0.5955810546875, 0.656005859375, 0.7164306640625, 0.77685546875, 0.8372802734375, 0.897705078125, 0.9581298828125, 1.0185546875, 1.0789794921875, 1.139404296875, 1.1998291015625, 1.26025390625, 1.3206787109375, 1.381103515625, 1.4415283203125, 1.501953125, 1.5623779296875, 1.622802734375, 1.6832275390625, 1.74365234375, 1.8040771484375, 1.864501953125, 1.9249267578125, 1.9853515625]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 5.0, 9.0, 9.0, 11.0, 10.0, 16.0, 18.0, 30.0, 25.0, 33.0, 37.0, 51.0, 46.0, 62.0, 51.0, 52.0, 57.0, 54.0, 65.0, 47.0, 32.0, 61.0, 39.0, 29.0, 23.0, 23.0, 15.0, 10.0, 19.0, 9.0, 13.0, 8.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.50895690917969, -39.74360656738281, -37.9782600402832, -36.21290969848633, -34.44756317138672, -32.682212829589844, -30.91686248779297, -29.151514053344727, -27.386165618896484, -25.620817184448242, -23.85546875, -22.090118408203125, -20.324769973754883, -18.55942153930664, -16.794071197509766, -15.028722763061523, -13.263374328613281, -11.498025894165039, -9.73267650604248, -7.96732759475708, -6.20197868347168, -4.4366302490234375, -2.671280860900879, -0.9059314727783203, 0.8594169616699219, 2.6247658729553223, 4.390114784240723, 6.155463695526123, 7.920812606811523, 9.686161041259766, 11.451510429382324, 13.216859817504883, 14.982208251953125, 16.747556686401367, 18.51290512084961, 20.278255462646484, 22.043603897094727, 23.80895233154297, 25.574302673339844, 27.339651107788086, 29.104999542236328, 30.87034797668457, 32.63569641113281, 34.40104675292969, 36.16639709472656, 37.93174362182617, 39.69709396362305, 41.462440490722656, 43.22779083251953, 44.993141174316406, 46.758487701416016, 48.52383804321289, 50.2891845703125, 52.054534912109375, 53.81988525390625, 55.585235595703125, 57.350582122802734, 59.11593246459961, 60.88127899169922, 62.646629333496094, 64.41197967529297, 66.17732238769531, 67.94267272949219, 69.70802307128906, 71.47337341308594]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 7.0, 7.0, 9.0, 6.0, 14.0, 12.0, 19.0, 22.0, 22.0, 17.0, 24.0, 39.0, 37.0, 28.0, 42.0, 37.0, 38.0, 39.0, 34.0, 30.0, 35.0, 33.0, 44.0, 37.0, 47.0, 36.0, 34.0, 42.0, 22.0, 25.0, 21.0, 18.0, 21.0, 11.0, 14.0, 5.0, 10.0, 7.0, 7.0, 10.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-60.36350631713867, -58.35368347167969, -56.34386444091797, -54.334041595458984, -52.32421875, -50.31439971923828, -48.3045768737793, -46.29475402832031, -44.284934997558594, -42.27511215209961, -40.26529312133789, -38.255470275878906, -36.24565124511719, -34.2358283996582, -32.22600555419922, -30.216184616088867, -28.206363677978516, -26.196542739868164, -24.186721801757812, -22.176898956298828, -20.167078018188477, -18.157257080078125, -16.14743423461914, -14.137613296508789, -12.127792358398438, -10.117971420288086, -8.108149528503418, -6.098328113555908, -4.088506698608398, -2.078685760498047, -0.0688638687133789, 1.940958023071289, 3.9507827758789062, 5.960604190826416, 7.970425605773926, 9.980247497558594, 11.990068435668945, 13.999889373779297, 16.00971221923828, 18.019533157348633, 20.029354095458984, 22.039175033569336, 24.048995971679688, 26.058818817138672, 28.068639755249023, 30.078460693359375, 32.08828353881836, 34.098106384277344, 36.10792541503906, 38.11774826049805, 40.127567291259766, 42.13739013671875, 44.14720916748047, 46.15703201293945, 48.16685485839844, 50.176673889160156, 52.18649673461914, 54.196319580078125, 56.206138610839844, 58.21596145629883, 60.22578430175781, 62.23560333251953, 64.24542236328125, 66.2552490234375, 68.26506805419922]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 9.0, 5.0, 8.0, 22.0, 13.0, 26.0, 33.0, 40.0, 61.0, 82.0, 119.0, 134.0, 191.0, 294.0, 393.0, 589.0, 976.0, 1598.0, 2544.0, 4157.0, 6014.0, 481315.0, 9072.0, 5727.0, 3975.0, 2450.0, 1538.0, 954.0, 545.0, 383.0, 276.0, 206.0, 133.0, 108.0, 69.0, 56.0, 40.0, 23.0, 19.0, 15.0, 10.0, 11.0, 10.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-472.74908447265625, -457.4722900390625, -442.1955261230469, -426.9187316894531, -411.6419677734375, -396.36517333984375, -381.08837890625, -365.8116149902344, -350.5348205566406, -335.2580261230469, -319.98126220703125, -304.7044677734375, -289.4277038574219, -274.1509094238281, -258.8741455078125, -243.59735107421875, -228.32057189941406, -213.04379272460938, -197.7670135498047, -182.490234375, -167.21343994140625, -151.93666076660156, -136.65988159179688, -121.38309478759766, -106.10631561279297, -90.82953643798828, -75.55274963378906, -60.275970458984375, -44.99918746948242, -29.72240447998047, -14.445625305175781, 0.8311614990234375, 16.107940673828125, 31.384723663330078, 46.66150665283203, 61.93828582763672, 77.21507263183594, 92.49185180664062, 107.76863098144531, 123.04541778564453, 138.32220458984375, 153.59898376464844, 168.87576293945312, 184.15255737304688, 199.42933654785156, 214.70611572265625, 229.98289489746094, 245.25967407226562, 260.53643798828125, 275.813232421875, 291.0899963378906, 306.3667907714844, 321.6435546875, 336.92034912109375, 352.1971435546875, 367.4739074707031, 382.7507019042969, 398.0274963378906, 413.30426025390625, 428.5810546875, 443.8578186035156, 459.1346130371094, 474.411376953125, 489.68817138671875, 504.9649658203125]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 9.0, 9.0, 5.0, 13.0, 13.0, 18.0, 23.0, 20.0, 17.0, 22.0, 35.0, 42.0, 29.0, 38.0, 41.0, 37.0, 39.0, 38.0, 30.0, 1059.0, 34.0, 43.0, 37.0, 48.0, 34.0, 33.0, 43.0, 24.0, 25.0, 19.0, 19.0, 22.0, 10.0, 13.0, 8.0, 8.0, 8.0, 6.0, 9.0, 9.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1791.1861572265625, -1731.5419921875, -1671.8978271484375, -1612.253662109375, -1552.6094970703125, -1492.96533203125, -1433.3211669921875, -1373.677001953125, -1314.0328369140625, -1254.388671875, -1194.7445068359375, -1135.100341796875, -1075.4561767578125, -1015.81201171875, -956.1678466796875, -896.523681640625, -836.8794555664062, -777.2352905273438, -717.5911254882812, -657.9469604492188, -598.3027954101562, -538.6585693359375, -479.0144348144531, -419.3702697753906, -359.7261047363281, -300.0819396972656, -240.43777465820312, -180.79359436035156, -121.14942932128906, -61.5052490234375, -1.861083984375, 57.7830810546875, 117.42724609375, 177.0714111328125, 236.715576171875, 296.3597412109375, 356.00390625, 415.6481018066406, 475.2922668457031, 534.9364013671875, 594.58056640625, 654.2247314453125, 713.868896484375, 773.5130615234375, 833.1572265625, 892.8013916015625, 952.445556640625, 1012.0897216796875, 1071.73388671875, 1131.3780517578125, 1191.022216796875, 1250.6663818359375, 1310.310546875, 1369.9547119140625, 1429.598876953125, 1489.2430419921875, 1548.8873291015625, 1608.531494140625, 1668.1756591796875, 1727.81982421875, 1787.4639892578125, 1847.108154296875, 1906.7523193359375, 1966.396484375, 2026.0406494140625]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 15.0, 22.0, 26.0, 28.0, 33.0, 61.0, 110.0, 314.0, 323.0, 310.0, 462.0, 688.0, 1177.0, 2230.0, 4754.0, 9678.0, 16920.0, 25266.0, 556778.0, 30550710.0, 56444.0, 15847.0, 6176.0, 2752.0, 1238.0, 826.0, 587.0, 229.0, 123.0, 77.0, 45.0, 37.0, 23.0, 30.0, 19.0, 16.0, 15.0, 13.0, 14.0, 15.0, 8.0, 10.0, 8.0, 8.0, 5.0, 4.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-752.6950073242188, -723.7778930664062, -694.8607788085938, -665.9436645507812, -637.0265502929688, -608.1094360351562, -579.1923828125, -550.2752685546875, -521.358154296875, -492.4410400390625, -463.52392578125, -434.6068115234375, -405.689697265625, -376.7725830078125, -347.8554992675781, -318.9383850097656, -290.021240234375, -261.1041259765625, -232.18701171875, -203.26991271972656, -174.35279846191406, -145.43568420410156, -116.51858520507812, -87.60147094726562, -58.684356689453125, -29.76724624633789, -0.8501358032226562, 28.066970825195312, 56.98408508300781, 85.90119934082031, 114.81829833984375, 143.73541259765625, 172.6524658203125, 201.569580078125, 230.4866943359375, 259.40380859375, 288.3209228515625, 317.238037109375, 346.1551208496094, 375.0722351074219, 403.9893493652344, 432.9064636230469, 461.8235778808594, 490.74066162109375, 519.6577758789062, 548.5748901367188, 577.4920043945312, 606.4091186523438, 635.3262329101562, 664.2433471679688, 693.1604614257812, 722.0775756835938, 750.9946899414062, 779.9118041992188, 808.828857421875, 837.7459716796875, 866.6630859375, 895.5802001953125, 924.497314453125, 953.4144287109375, 982.33154296875, 1011.2486572265625, 1040.165771484375, 1069.0828857421875, 1098.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 8.0, 13.0, 17.0, 31.0, 37.0, 44.0, 70.0, 79.0, 122.0, 174.0, 247.0, 392.0, 576.0, 806.0, 1239.0, 1975.0, 3160.0, 5247.0, 9274.0, 17015.0, 36642.0, 88180.0, 262866.0, 1217379.0, 3898815.0, 496925.0, 142678.0, 53922.0, 23793.0, 12150.0, 6657.0, 3863.0, 2384.0, 1469.0, 998.0, 678.0, 450.0, 312.0, 204.0, 150.0, 113.0, 83.0, 52.0, 43.0, 36.0, 20.0, 10.0, 9.0, 10.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-31.640625, -30.627685546875, -29.61474609375, -28.601806640625, -27.5888671875, -26.575927734375, -25.56298828125, -24.550048828125, -23.537109375, -22.524169921875, -21.51123046875, -20.498291015625, -19.4853515625, -18.472412109375, -17.45947265625, -16.446533203125, -15.43359375, -14.420654296875, -13.40771484375, -12.394775390625, -11.3818359375, -10.368896484375, -9.35595703125, -8.343017578125, -7.330078125, -6.317138671875, -5.30419921875, -4.291259765625, -3.2783203125, -2.265380859375, -1.25244140625, -0.239501953125, 0.7734375, 1.786376953125, 2.79931640625, 3.812255859375, 4.8251953125, 5.838134765625, 6.85107421875, 7.864013671875, 8.876953125, 9.889892578125, 10.90283203125, 11.915771484375, 12.9287109375, 13.941650390625, 14.95458984375, 15.967529296875, 16.98046875, 17.993408203125, 19.00634765625, 20.019287109375, 21.0322265625, 22.045166015625, 23.05810546875, 24.071044921875, 25.083984375, 26.096923828125, 27.10986328125, 28.122802734375, 29.1357421875, 30.148681640625, 31.16162109375, 32.174560546875, 33.1875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 6.0, 5.0, 8.0, 15.0, 16.0, 8.0, 16.0, 21.0, 24.0, 15.0, 21.0, 26.0, 26.0, 44.0, 39.0, 50.0, 64.0, 102.0, 183.0, 523.0, 299.0, 100.0, 36.0, 41.0, 47.0, 36.0, 27.0, 33.0, 29.0, 19.0, 24.0, 14.0, 17.0, 14.0, 15.0, 15.0, 8.0, 12.0, 13.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.9375, -36.71484375, -35.4921875, -34.26953125, -33.046875, -31.82421875, -30.6015625, -29.37890625, -28.15625, -26.93359375, -25.7109375, -24.48828125, -23.265625, -22.04296875, -20.8203125, -19.59765625, -18.375, -17.15234375, -15.9296875, -14.70703125, -13.484375, -12.26171875, -11.0390625, -9.81640625, -8.59375, -7.37109375, -6.1484375, -4.92578125, -3.703125, -2.48046875, -1.2578125, -0.03515625, 1.1875, 2.41015625, 3.6328125, 4.85546875, 6.078125, 7.30078125, 8.5234375, 9.74609375, 10.96875, 12.19140625, 13.4140625, 14.63671875, 15.859375, 17.08203125, 18.3046875, 19.52734375, 20.75, 21.97265625, 23.1953125, 24.41796875, 25.640625, 26.86328125, 28.0859375, 29.30859375, 30.53125, 31.75390625, 32.9765625, 34.19921875, 35.421875, 36.64453125, 37.8671875, 39.08984375, 40.3125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 15.0, 19.0, 33.0, 29.0, 52.0, 54.0, 85.0, 114.0, 174.0, 324.0, 565.0, 875.0, 1368.0, 2208.0, 3546.0, 6213.0, 10844.0, 19801.0, 39158.0, 85129.0, 205483.0, 616665.0, 3895552.0, 920485.0, 271624.0, 108423.0, 48110.0, 24022.0, 12659.0, 6893.0, 4126.0, 2447.0, 1512.0, 1029.0, 645.0, 439.0, 208.0, 137.0, 125.0, 64.0, 77.0, 52.0, 20.0, 18.0, 5.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0], "bins": [-30.75, -29.807861328125, -28.86572265625, -27.923583984375, -26.9814453125, -26.039306640625, -25.09716796875, -24.155029296875, -23.212890625, -22.270751953125, -21.32861328125, -20.386474609375, -19.4443359375, -18.502197265625, -17.56005859375, -16.617919921875, -15.67578125, -14.733642578125, -13.79150390625, -12.849365234375, -11.9072265625, -10.965087890625, -10.02294921875, -9.080810546875, -8.138671875, -7.196533203125, -6.25439453125, -5.312255859375, -4.3701171875, -3.427978515625, -2.48583984375, -1.543701171875, -0.6015625, 0.340576171875, 1.28271484375, 2.224853515625, 3.1669921875, 4.109130859375, 5.05126953125, 5.993408203125, 6.935546875, 7.877685546875, 8.81982421875, 9.761962890625, 10.7041015625, 11.646240234375, 12.58837890625, 13.530517578125, 14.47265625, 15.414794921875, 16.35693359375, 17.299072265625, 18.2412109375, 19.183349609375, 20.12548828125, 21.067626953125, 22.009765625, 22.951904296875, 23.89404296875, 24.836181640625, 25.7783203125, 26.720458984375, 27.66259765625, 28.604736328125, 29.546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 15.0, 13.0, 12.0, 17.0, 14.0, 28.0, 33.0, 37.0, 52.0, 57.0, 50.0, 81.0, 254.0, 728.0, 173.0, 69.0, 59.0, 50.0, 41.0, 39.0, 29.0, 31.0, 29.0, 22.0, 14.0, 11.0, 14.0, 13.0, 3.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.03125, -47.26416015625, -45.4970703125, -43.72998046875, -41.962890625, -40.19580078125, -38.4287109375, -36.66162109375, -34.89453125, -33.12744140625, -31.3603515625, -29.59326171875, -27.826171875, -26.05908203125, -24.2919921875, -22.52490234375, -20.7578125, -18.99072265625, -17.2236328125, -15.45654296875, -13.689453125, -11.92236328125, -10.1552734375, -8.38818359375, -6.62109375, -4.85400390625, -3.0869140625, -1.31982421875, 0.447265625, 2.21435546875, 3.9814453125, 5.74853515625, 7.515625, 9.28271484375, 11.0498046875, 12.81689453125, 14.583984375, 16.35107421875, 18.1181640625, 19.88525390625, 21.65234375, 23.41943359375, 25.1865234375, 26.95361328125, 28.720703125, 30.48779296875, 32.2548828125, 34.02197265625, 35.7890625, 37.55615234375, 39.3232421875, 41.09033203125, 42.857421875, 44.62451171875, 46.3916015625, 48.15869140625, 49.92578125, 51.69287109375, 53.4599609375, 55.22705078125, 56.994140625, 58.76123046875, 60.5283203125, 62.29541015625, 64.0625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 2.0, 9.0, 4.0, 6.0, 2.0, 15.0, 14.0, 3.0, 13.0, 19.0, 31.0, 26.0, 51.0, 55.0, 77.0, 82.0, 95.0, 145.0, 197.0, 355.0, 491.0, 610.0, 1194.0, 2007.0, 3597.0, 8132.0, 21272.0, 85776.0, 5979028.0, 139854.0, 27921.0, 9748.0, 4569.0, 2216.0, 1258.0, 866.0, 505.0, 245.0, 219.0, 170.0, 142.0, 92.0, 46.0, 49.0, 46.0, 38.0, 22.0, 35.0, 23.0, 3.0, 5.0, 7.0, 21.0, 3.0, 5.0, 9.0, 6.0, 4.0, 2.0, 10.0], "bins": [-181.5, -175.935546875, -170.37109375, -164.806640625, -159.2421875, -153.677734375, -148.11328125, -142.548828125, -136.984375, -131.419921875, -125.85546875, -120.291015625, -114.7265625, -109.162109375, -103.59765625, -98.033203125, -92.46875, -86.904296875, -81.33984375, -75.775390625, -70.2109375, -64.646484375, -59.08203125, -53.517578125, -47.953125, -42.388671875, -36.82421875, -31.259765625, -25.6953125, -20.130859375, -14.56640625, -9.001953125, -3.4375, 2.126953125, 7.69140625, 13.255859375, 18.8203125, 24.384765625, 29.94921875, 35.513671875, 41.078125, 46.642578125, 52.20703125, 57.771484375, 63.3359375, 68.900390625, 74.46484375, 80.029296875, 85.59375, 91.158203125, 96.72265625, 102.287109375, 107.8515625, 113.416015625, 118.98046875, 124.544921875, 130.109375, 135.673828125, 141.23828125, 146.802734375, 152.3671875, 157.931640625, 163.49609375, 169.060546875, 174.625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 12.0, 12.0, 13.0, 15.0, 18.0, 18.0, 32.0, 44.0, 39.0, 45.0, 50.0, 84.0, 167.0, 589.0, 411.0, 90.0, 56.0, 53.0, 43.0, 29.0, 39.0, 22.0, 26.0, 16.0, 14.0, 13.0, 11.0, 11.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.625, -84.0810546875, -81.537109375, -78.9931640625, -76.44921875, -73.9052734375, -71.361328125, -68.8173828125, -66.2734375, -63.7294921875, -61.185546875, -58.6416015625, -56.09765625, -53.5537109375, -51.009765625, -48.4658203125, -45.921875, -43.3779296875, -40.833984375, -38.2900390625, -35.74609375, -33.2021484375, -30.658203125, -28.1142578125, -25.5703125, -23.0263671875, -20.482421875, -17.9384765625, -15.39453125, -12.8505859375, -10.306640625, -7.7626953125, -5.21875, -2.6748046875, -0.130859375, 2.4130859375, 4.95703125, 7.5009765625, 10.044921875, 12.5888671875, 15.1328125, 17.6767578125, 20.220703125, 22.7646484375, 25.30859375, 27.8525390625, 30.396484375, 32.9404296875, 35.484375, 38.0283203125, 40.572265625, 43.1162109375, 45.66015625, 48.2041015625, 50.748046875, 53.2919921875, 55.8359375, 58.3798828125, 60.923828125, 63.4677734375, 66.01171875, 68.5556640625, 71.099609375, 73.6435546875, 76.1875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 19.0, 22.0, 46.0, 358.0, 489.0, 33.0, 16.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-527.37109375, -507.8791198730469, -488.3871765136719, -468.89520263671875, -449.40325927734375, -429.9112854003906, -410.4193115234375, -390.9273681640625, -371.4354248046875, -351.9434509277344, -332.4515075683594, -312.95953369140625, -293.46759033203125, -273.9756164550781, -254.48365783691406, -234.99169921875, -215.49972534179688, -196.0077667236328, -176.51580810546875, -157.02383422851562, -137.53189086914062, -118.03992462158203, -98.54795837402344, -79.05599975585938, -59.56404113769531, -40.07208251953125, -20.580120086669922, -1.0881576538085938, 18.40380096435547, 37.89575958251953, 57.387725830078125, 76.87968444824219, 96.37164306640625, 115.86360168457031, 135.35556030273438, 154.8475341796875, 174.3394775390625, 193.83145141601562, 213.3234100341797, 232.81536865234375, 252.3073272705078, 271.7992858886719, 291.291259765625, 310.783203125, 330.2751770019531, 349.7671203613281, 369.25909423828125, 388.75103759765625, 408.2430114746094, 427.7349853515625, 447.2269287109375, 466.7189025878906, 486.2108459472656, 505.70281982421875, 525.1947631835938, 544.686767578125, 564.1787109375, 583.670654296875, 603.1626586914062, 622.6546020507812, 642.1465454101562, 661.6384887695312, 681.1304931640625, 700.6224365234375, 720.1143798828125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 20.0, 13.0, 26.0, 46.0, 93.0, 388.0, 226.0, 56.0, 29.0, 24.0, 13.0, 15.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-446.17327880859375, -431.1522216796875, -416.1311340332031, -401.1100769042969, -386.0890197753906, -371.06793212890625, -356.046875, -341.02581787109375, -326.0047607421875, -310.98370361328125, -295.9626159667969, -280.9415588378906, -265.9205017089844, -250.89942932128906, -235.87835693359375, -220.8572998046875, -205.83621215820312, -190.8151397705078, -175.79408264160156, -160.77301025390625, -145.751953125, -130.7308807373047, -115.70980834960938, -100.6887435913086, -85.66767883300781, -70.64661407470703, -55.625545501708984, -40.60447692871094, -25.583412170410156, -10.562347412109375, 4.4587249755859375, 19.47978973388672, 34.5008544921875, 49.52191925048828, 64.54298400878906, 79.56405639648438, 94.58512115478516, 109.60618591308594, 124.62725830078125, 139.6483154296875, 154.6693878173828, 169.69046020507812, 184.71151733398438, 199.7325897216797, 214.753662109375, 229.77471923828125, 244.79579162597656, 259.8168640136719, 274.8379211425781, 289.8589782714844, 304.88006591796875, 319.901123046875, 334.92218017578125, 349.9432373046875, 364.9643249511719, 379.9853820800781, 395.0064697265625, 410.02752685546875, 425.0486145019531, 440.0696716308594, 455.0907287597656, 470.11181640625, 485.13287353515625, 500.1539306640625, 515.1749877929688]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 4.0, 10.0, 11.0, 32.0, 33.0, 55.0, 74.0, 119.0, 176.0, 255.0, 379.0, 626.0, 1051.0, 2041.0, 4369.0, 11571.0, 48945.0, 3713664.0, 364557.0, 27865.0, 9613.0, 4117.0, 1936.0, 959.0, 583.0, 369.0, 234.0, 160.0, 119.0, 106.0, 72.0, 61.0, 37.0, 26.0, 19.0, 15.0, 8.0, 5.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.705810546875, -8.40380859375, -8.101806640625, -7.7998046875, -7.497802734375, -7.19580078125, -6.893798828125, -6.591796875, -6.289794921875, -5.98779296875, -5.685791015625, -5.3837890625, -5.081787109375, -4.77978515625, -4.477783203125, -4.17578125, -3.873779296875, -3.57177734375, -3.269775390625, -2.9677734375, -2.665771484375, -2.36376953125, -2.061767578125, -1.759765625, -1.457763671875, -1.15576171875, -0.853759765625, -0.5517578125, -0.249755859375, 0.05224609375, 0.354248046875, 0.65625, 0.958251953125, 1.26025390625, 1.562255859375, 1.8642578125, 2.166259765625, 2.46826171875, 2.770263671875, 3.072265625, 3.374267578125, 3.67626953125, 3.978271484375, 4.2802734375, 4.582275390625, 4.88427734375, 5.186279296875, 5.48828125, 5.790283203125, 6.09228515625, 6.394287109375, 6.6962890625, 6.998291015625, 7.30029296875, 7.602294921875, 7.904296875, 8.206298828125, 8.50830078125, 8.810302734375, 9.1123046875, 9.414306640625, 9.71630859375, 10.018310546875, 10.3203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 10.0, 18.0, 30.0, 131.0, 366.0, 274.0, 91.0, 20.0, 13.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6406707763671875, -0.619232177734375, -0.5977935791015625, -0.57635498046875, -0.5549163818359375, -0.533477783203125, -0.5120391845703125, -0.4906005859375, -0.4691619873046875, -0.447723388671875, -0.4262847900390625, -0.40484619140625, -0.3834075927734375, -0.361968994140625, -0.3405303955078125, -0.319091796875, -0.2976531982421875, -0.276214599609375, -0.2547760009765625, -0.23333740234375, -0.2118988037109375, -0.190460205078125, -0.1690216064453125, -0.1475830078125, -0.1261444091796875, -0.104705810546875, -0.0832672119140625, -0.06182861328125, -0.0403900146484375, -0.018951416015625, 0.0024871826171875, 0.02392578125, 0.0453643798828125, 0.066802978515625, 0.0882415771484375, 0.10968017578125, 0.1311187744140625, 0.152557373046875, 0.1739959716796875, 0.1954345703125, 0.2168731689453125, 0.238311767578125, 0.2597503662109375, 0.28118896484375, 0.3026275634765625, 0.324066162109375, 0.3455047607421875, 0.366943359375, 0.3883819580078125, 0.409820556640625, 0.4312591552734375, 0.45269775390625, 0.4741363525390625, 0.495574951171875, 0.5170135498046875, 0.5384521484375, 0.5598907470703125, 0.581329345703125, 0.6027679443359375, 0.62420654296875, 0.6456451416015625, 0.667083740234375, 0.6885223388671875, 0.7099609375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 5.0, 5.0, 8.0, 13.0, 13.0, 20.0, 29.0, 38.0, 55.0, 78.0, 109.0, 129.0, 215.0, 264.0, 422.0, 639.0, 947.0, 1436.0, 2402.0, 4229.0, 7843.0, 16530.0, 44698.0, 176569.0, 3334938.0, 482125.0, 73271.0, 23218.0, 10271.0, 5324.0, 2964.0, 1787.0, 1233.0, 814.0, 523.0, 330.0, 247.0, 159.0, 102.0, 85.0, 57.0, 45.0, 32.0, 24.0, 11.0, 6.0, 8.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.03125, -4.8775634765625, -4.723876953125, -4.5701904296875, -4.41650390625, -4.2628173828125, -4.109130859375, -3.9554443359375, -3.8017578125, -3.6480712890625, -3.494384765625, -3.3406982421875, -3.18701171875, -3.0333251953125, -2.879638671875, -2.7259521484375, -2.572265625, -2.4185791015625, -2.264892578125, -2.1112060546875, -1.95751953125, -1.8038330078125, -1.650146484375, -1.4964599609375, -1.3427734375, -1.1890869140625, -1.035400390625, -0.8817138671875, -0.72802734375, -0.5743408203125, -0.420654296875, -0.2669677734375, -0.11328125, 0.0404052734375, 0.194091796875, 0.3477783203125, 0.50146484375, 0.6551513671875, 0.808837890625, 0.9625244140625, 1.1162109375, 1.2698974609375, 1.423583984375, 1.5772705078125, 1.73095703125, 1.8846435546875, 2.038330078125, 2.1920166015625, 2.345703125, 2.4993896484375, 2.653076171875, 2.8067626953125, 2.96044921875, 3.1141357421875, 3.267822265625, 3.4215087890625, 3.5751953125, 3.7288818359375, 3.882568359375, 4.0362548828125, 4.18994140625, 4.3436279296875, 4.497314453125, 4.6510009765625, 4.8046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 6.0, 8.0, 10.0, 12.0, 22.0, 12.0, 30.0, 23.0, 34.0, 45.0, 53.0, 53.0, 56.0, 88.0, 79.0, 124.0, 158.0, 182.0, 278.0, 1141.0, 586.0, 259.0, 162.0, 142.0, 99.0, 87.0, 79.0, 64.0, 36.0, 29.0, 19.0, 28.0, 14.0, 9.0, 10.0, 9.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.98974609375, -0.96051025390625, -0.9312744140625, -0.90203857421875, -0.872802734375, -0.84356689453125, -0.8143310546875, -0.78509521484375, -0.755859375, -0.72662353515625, -0.6973876953125, -0.66815185546875, -0.638916015625, -0.60968017578125, -0.5804443359375, -0.55120849609375, -0.52197265625, -0.49273681640625, -0.4635009765625, -0.43426513671875, -0.405029296875, -0.37579345703125, -0.3465576171875, -0.31732177734375, -0.2880859375, -0.25885009765625, -0.2296142578125, -0.20037841796875, -0.171142578125, -0.14190673828125, -0.1126708984375, -0.08343505859375, -0.05419921875, -0.02496337890625, 0.0042724609375, 0.03350830078125, 0.062744140625, 0.09197998046875, 0.1212158203125, 0.15045166015625, 0.1796875, 0.20892333984375, 0.2381591796875, 0.26739501953125, 0.296630859375, 0.32586669921875, 0.3551025390625, 0.38433837890625, 0.41357421875, 0.44281005859375, 0.4720458984375, 0.50128173828125, 0.530517578125, 0.55975341796875, 0.5889892578125, 0.61822509765625, 0.6474609375, 0.67669677734375, 0.7059326171875, 0.73516845703125, 0.764404296875, 0.79364013671875, 0.8228759765625, 0.85211181640625, 0.88134765625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 1.0, 5.0, 6.0, 13.0, 8.0, 29.0, 46.0, 96.0, 148.0, 290.0, 224.0, 78.0, 25.0, 10.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.78151512145996, -20.2340030670166, -19.68648910522461, -19.13897705078125, -18.59146499633789, -18.04395294189453, -17.49643898010254, -16.94892692565918, -16.401412963867188, -15.853899955749512, -15.306387901306152, -14.758874893188477, -14.211362838745117, -13.663849830627441, -13.116336822509766, -12.568824768066406, -12.021312713623047, -11.473799705505371, -10.926287651062012, -10.378774642944336, -9.831262588500977, -9.2837495803833, -8.736236572265625, -8.188724517822266, -7.64121150970459, -7.093698978424072, -6.546186447143555, -5.998673439025879, -5.451160907745361, -4.903648376464844, -4.356135368347168, -3.8086228370666504, -3.261110305786133, -2.7135977745056152, -2.1660850048065186, -1.6185723543167114, -1.0710597038269043, -0.5235471725463867, 0.02396559715270996, 0.5714783668518066, 1.1189908981323242, 1.6665035486221313, 2.2140161991119385, 2.761528968811035, 3.3090415000915527, 3.8565540313720703, 4.404067039489746, 4.951579570770264, 5.499092102050781, 6.046604633331299, 6.594117164611816, 7.141630172729492, 7.68914270401001, 8.236655235290527, 8.784168243408203, 9.331680297851562, 9.879193305969238, 10.426706314086914, 10.974218368530273, 11.52173137664795, 12.069244384765625, 12.616756439208984, 13.16426944732666, 13.711782455444336, 14.259294509887695]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 10.0, 11.0, 13.0, 20.0, 14.0, 22.0, 31.0, 31.0, 36.0, 39.0, 68.0, 55.0, 53.0, 59.0, 57.0, 55.0, 66.0, 53.0, 60.0, 49.0, 51.0, 39.0, 30.0, 21.0, 12.0, 11.0, 10.0, 5.0, 8.0, 3.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.891026496887207, -8.604387283325195, -8.317748069763184, -8.031107902526855, -7.744468688964844, -7.457829475402832, -7.17119026184082, -6.884551048278809, -6.597911357879639, -6.311272144317627, -6.024632453918457, -5.737993240356445, -5.451354026794434, -5.164714336395264, -4.878075122833252, -4.591435432434082, -4.30479621887207, -4.018157005310059, -3.7315173149108887, -3.444878101348877, -3.158238649368286, -2.8715991973876953, -2.5849599838256836, -2.2983205318450928, -2.011681079864502, -1.7250416278839111, -1.4384022951126099, -1.1517629623413086, -0.8651235103607178, -0.578484058380127, -0.2918447256088257, -0.005205392837524414, 0.2814350128173828, 0.5680744051933289, 0.8547137975692749, 1.1413531303405762, 1.427992582321167, 1.7146320343017578, 2.0012712478637695, 2.2879106998443604, 2.574550151824951, 2.861189603805542, 3.147829055786133, 3.4344682693481445, 3.7211077213287354, 4.007747173309326, 4.294386386871338, 4.581026077270508, 4.8676652908325195, 5.154304504394531, 5.440944194793701, 5.727583408355713, 6.014223098754883, 6.3008623123168945, 6.587501525878906, 6.874140739440918, 7.160780429840088, 7.4474196434021, 7.7340593338012695, 8.020698547363281, 8.307337760925293, 8.593976974487305, 8.880617141723633, 9.167256355285645, 9.453895568847656]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 7.0, 8.0, 12.0, 16.0, 25.0, 27.0, 39.0, 50.0, 99.0, 143.0, 172.0, 277.0, 430.0, 716.0, 1250.0, 2290.0, 4900.0, 14306.0, 97845.0, 846125.0, 59207.0, 11446.0, 4107.0, 2070.0, 1099.0, 611.0, 426.0, 273.0, 162.0, 117.0, 83.0, 44.0, 46.0, 29.0, 15.0, 17.0, 16.0, 14.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.73046875, -5.56390380859375, -5.3973388671875, -5.23077392578125, -5.064208984375, -4.89764404296875, -4.7310791015625, -4.56451416015625, -4.39794921875, -4.23138427734375, -4.0648193359375, -3.89825439453125, -3.731689453125, -3.56512451171875, -3.3985595703125, -3.23199462890625, -3.0654296875, -2.89886474609375, -2.7322998046875, -2.56573486328125, -2.399169921875, -2.23260498046875, -2.0660400390625, -1.89947509765625, -1.73291015625, -1.56634521484375, -1.3997802734375, -1.23321533203125, -1.066650390625, -0.90008544921875, -0.7335205078125, -0.56695556640625, -0.400390625, -0.23382568359375, -0.0672607421875, 0.09930419921875, 0.265869140625, 0.43243408203125, 0.5989990234375, 0.76556396484375, 0.93212890625, 1.09869384765625, 1.2652587890625, 1.43182373046875, 1.598388671875, 1.76495361328125, 1.9315185546875, 2.09808349609375, 2.2646484375, 2.43121337890625, 2.5977783203125, 2.76434326171875, 2.930908203125, 3.09747314453125, 3.2640380859375, 3.43060302734375, 3.59716796875, 3.76373291015625, 3.9302978515625, 4.09686279296875, 4.263427734375, 4.42999267578125, 4.5965576171875, 4.76312255859375, 4.9296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 16.0, 7.0, 15.0, 32.0, 82.0, 178.0, 241.0, 207.0, 110.0, 50.0, 15.0, 10.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67333984375, -0.6539077758789062, -0.6344757080078125, -0.6150436401367188, -0.595611572265625, -0.5761795043945312, -0.5567474365234375, -0.5373153686523438, -0.51788330078125, -0.49845123291015625, -0.4790191650390625, -0.45958709716796875, -0.440155029296875, -0.42072296142578125, -0.4012908935546875, -0.38185882568359375, -0.3624267578125, -0.34299468994140625, -0.3235626220703125, -0.30413055419921875, -0.284698486328125, -0.26526641845703125, -0.2458343505859375, -0.22640228271484375, -0.20697021484375, -0.18753814697265625, -0.1681060791015625, -0.14867401123046875, -0.129241943359375, -0.10980987548828125, -0.0903778076171875, -0.07094573974609375, -0.051513671875, -0.03208160400390625, -0.0126495361328125, 0.00678253173828125, 0.026214599609375, 0.04564666748046875, 0.0650787353515625, 0.08451080322265625, 0.10394287109375, 0.12337493896484375, 0.1428070068359375, 0.16223907470703125, 0.181671142578125, 0.20110321044921875, 0.2205352783203125, 0.23996734619140625, 0.2593994140625, 0.27883148193359375, 0.2982635498046875, 0.31769561767578125, 0.337127685546875, 0.35655975341796875, 0.3759918212890625, 0.39542388916015625, 0.41485595703125, 0.43428802490234375, 0.4537200927734375, 0.47315216064453125, 0.492584228515625, 0.5120162963867188, 0.5314483642578125, 0.5508804321289062, 0.5703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 11.0, 12.0, 15.0, 19.0, 27.0, 41.0, 35.0, 72.0, 87.0, 135.0, 214.0, 315.0, 552.0, 915.0, 1863.0, 4162.0, 13027.0, 78593.0, 829384.0, 95382.0, 14705.0, 4456.0, 1997.0, 1014.0, 507.0, 313.0, 195.0, 149.0, 96.0, 75.0, 62.0, 32.0, 19.0, 19.0, 7.0, 12.0, 7.0, 3.0, 9.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.93359375, -6.73284912109375, -6.5321044921875, -6.33135986328125, -6.130615234375, -5.92987060546875, -5.7291259765625, -5.52838134765625, -5.32763671875, -5.12689208984375, -4.9261474609375, -4.72540283203125, -4.524658203125, -4.32391357421875, -4.1231689453125, -3.92242431640625, -3.7216796875, -3.52093505859375, -3.3201904296875, -3.11944580078125, -2.918701171875, -2.71795654296875, -2.5172119140625, -2.31646728515625, -2.11572265625, -1.91497802734375, -1.7142333984375, -1.51348876953125, -1.312744140625, -1.11199951171875, -0.9112548828125, -0.71051025390625, -0.509765625, -0.30902099609375, -0.1082763671875, 0.09246826171875, 0.293212890625, 0.49395751953125, 0.6947021484375, 0.89544677734375, 1.09619140625, 1.29693603515625, 1.4976806640625, 1.69842529296875, 1.899169921875, 2.09991455078125, 2.3006591796875, 2.50140380859375, 2.7021484375, 2.90289306640625, 3.1036376953125, 3.30438232421875, 3.505126953125, 3.70587158203125, 3.9066162109375, 4.10736083984375, 4.30810546875, 4.50885009765625, 4.7095947265625, 4.91033935546875, 5.111083984375, 5.31182861328125, 5.5125732421875, 5.71331787109375, 5.9140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 10.0, 5.0, 11.0, 9.0, 15.0, 17.0, 16.0, 22.0, 24.0, 23.0, 21.0, 25.0, 36.0, 39.0, 28.0, 35.0, 37.0, 45.0, 45.0, 50.0, 38.0, 50.0, 47.0, 39.0, 38.0, 29.0, 29.0, 22.0, 22.0, 33.0, 28.0, 17.0, 23.0, 14.0, 15.0, 6.0, 7.0, 9.0, 9.0, 5.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.78125, -1.725067138671875, -1.66888427734375, -1.612701416015625, -1.5565185546875, -1.500335693359375, -1.44415283203125, -1.387969970703125, -1.331787109375, -1.275604248046875, -1.21942138671875, -1.163238525390625, -1.1070556640625, -1.050872802734375, -0.99468994140625, -0.938507080078125, -0.88232421875, -0.826141357421875, -0.76995849609375, -0.713775634765625, -0.6575927734375, -0.601409912109375, -0.54522705078125, -0.489044189453125, -0.432861328125, -0.376678466796875, -0.32049560546875, -0.264312744140625, -0.2081298828125, -0.151947021484375, -0.09576416015625, -0.039581298828125, 0.0166015625, 0.072784423828125, 0.12896728515625, 0.185150146484375, 0.2413330078125, 0.297515869140625, 0.35369873046875, 0.409881591796875, 0.466064453125, 0.522247314453125, 0.57843017578125, 0.634613037109375, 0.6907958984375, 0.746978759765625, 0.80316162109375, 0.859344482421875, 0.91552734375, 0.971710205078125, 1.02789306640625, 1.084075927734375, 1.1402587890625, 1.196441650390625, 1.25262451171875, 1.308807373046875, 1.364990234375, 1.421173095703125, 1.47735595703125, 1.533538818359375, 1.5897216796875, 1.645904541015625, 1.70208740234375, 1.758270263671875, 1.814453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 7.0, 11.0, 10.0, 17.0, 31.0, 43.0, 52.0, 84.0, 146.0, 230.0, 373.0, 817.0, 2318.0, 9905.0, 839987.0, 183795.0, 7243.0, 1834.0, 718.0, 322.0, 209.0, 112.0, 66.0, 54.0, 40.0, 32.0, 16.0, 15.0, 13.0, 9.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.328125, -11.916015625, -11.50390625, -11.091796875, -10.6796875, -10.267578125, -9.85546875, -9.443359375, -9.03125, -8.619140625, -8.20703125, -7.794921875, -7.3828125, -6.970703125, -6.55859375, -6.146484375, -5.734375, -5.322265625, -4.91015625, -4.498046875, -4.0859375, -3.673828125, -3.26171875, -2.849609375, -2.4375, -2.025390625, -1.61328125, -1.201171875, -0.7890625, -0.376953125, 0.03515625, 0.447265625, 0.859375, 1.271484375, 1.68359375, 2.095703125, 2.5078125, 2.919921875, 3.33203125, 3.744140625, 4.15625, 4.568359375, 4.98046875, 5.392578125, 5.8046875, 6.216796875, 6.62890625, 7.041015625, 7.453125, 7.865234375, 8.27734375, 8.689453125, 9.1015625, 9.513671875, 9.92578125, 10.337890625, 10.75, 11.162109375, 11.57421875, 11.986328125, 12.3984375, 12.810546875, 13.22265625, 13.634765625, 14.046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 7.0, 2.0, 2.0, 4.0, 12.0, 11.0, 18.0, 14.0, 20.0, 28.0, 35.0, 42.0, 85.0, 194.0, 239.0, 90.0, 53.0, 29.0, 20.0, 16.0, 11.0, 12.0, 8.0, 6.0, 6.0, 3.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.005733489990234375, -0.005574464797973633, -0.005415439605712891, -0.0052564144134521484, -0.005097389221191406, -0.004938364028930664, -0.004779338836669922, -0.00462031364440918, -0.0044612884521484375, -0.004302263259887695, -0.004143238067626953, -0.003984212875366211, -0.0038251876831054688, -0.0036661624908447266, -0.0035071372985839844, -0.003348112106323242, -0.0031890869140625, -0.003030061721801758, -0.0028710365295410156, -0.0027120113372802734, -0.0025529861450195312, -0.002393960952758789, -0.002234935760498047, -0.0020759105682373047, -0.0019168853759765625, -0.0017578601837158203, -0.0015988349914550781, -0.001439809799194336, -0.0012807846069335938, -0.0011217594146728516, -0.0009627342224121094, -0.0008037090301513672, -0.000644683837890625, -0.0004856586456298828, -0.0003266334533691406, -0.00016760826110839844, -8.58306884765625e-06, 0.00015044212341308594, 0.0003094673156738281, 0.0004684925079345703, 0.0006275177001953125, 0.0007865428924560547, 0.0009455680847167969, 0.001104593276977539, 0.0012636184692382812, 0.0014226436614990234, 0.0015816688537597656, 0.0017406940460205078, 0.00189971923828125, 0.002058744430541992, 0.0022177696228027344, 0.0023767948150634766, 0.0025358200073242188, 0.002694845199584961, 0.002853870391845703, 0.0030128955841064453, 0.0031719207763671875, 0.0033309459686279297, 0.003489971160888672, 0.003648996353149414, 0.0038080215454101562, 0.0039670467376708984, 0.004126071929931641, 0.004285097122192383, 0.004444122314453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 10.0, 4.0, 4.0, 16.0, 20.0, 29.0, 28.0, 49.0, 76.0, 126.0, 254.0, 368.0, 815.0, 2065.0, 8732.0, 938676.0, 88787.0, 5476.0, 1517.0, 689.0, 307.0, 169.0, 108.0, 68.0, 56.0, 22.0, 29.0, 14.0, 9.0, 5.0, 3.0, 6.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.796875, -24.9873046875, -24.177734375, -23.3681640625, -22.55859375, -21.7490234375, -20.939453125, -20.1298828125, -19.3203125, -18.5107421875, -17.701171875, -16.8916015625, -16.08203125, -15.2724609375, -14.462890625, -13.6533203125, -12.84375, -12.0341796875, -11.224609375, -10.4150390625, -9.60546875, -8.7958984375, -7.986328125, -7.1767578125, -6.3671875, -5.5576171875, -4.748046875, -3.9384765625, -3.12890625, -2.3193359375, -1.509765625, -0.7001953125, 0.109375, 0.9189453125, 1.728515625, 2.5380859375, 3.34765625, 4.1572265625, 4.966796875, 5.7763671875, 6.5859375, 7.3955078125, 8.205078125, 9.0146484375, 9.82421875, 10.6337890625, 11.443359375, 12.2529296875, 13.0625, 13.8720703125, 14.681640625, 15.4912109375, 16.30078125, 17.1103515625, 17.919921875, 18.7294921875, 19.5390625, 20.3486328125, 21.158203125, 21.9677734375, 22.77734375, 23.5869140625, 24.396484375, 25.2060546875, 26.015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 2.0, 5.0, 4.0, 8.0, 18.0, 13.0, 15.0, 17.0, 68.0, 216.0, 399.0, 139.0, 27.0, 19.0, 10.0, 11.0, 6.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.125, -8.8338623046875, -8.542724609375, -8.2515869140625, -7.96044921875, -7.6693115234375, -7.378173828125, -7.0870361328125, -6.7958984375, -6.5047607421875, -6.213623046875, -5.9224853515625, -5.63134765625, -5.3402099609375, -5.049072265625, -4.7579345703125, -4.466796875, -4.1756591796875, -3.884521484375, -3.5933837890625, -3.30224609375, -3.0111083984375, -2.719970703125, -2.4288330078125, -2.1376953125, -1.8465576171875, -1.555419921875, -1.2642822265625, -0.97314453125, -0.6820068359375, -0.390869140625, -0.0997314453125, 0.19140625, 0.4825439453125, 0.773681640625, 1.0648193359375, 1.35595703125, 1.6470947265625, 1.938232421875, 2.2293701171875, 2.5205078125, 2.8116455078125, 3.102783203125, 3.3939208984375, 3.68505859375, 3.9761962890625, 4.267333984375, 4.5584716796875, 4.849609375, 5.1407470703125, 5.431884765625, 5.7230224609375, 6.01416015625, 6.3052978515625, 6.596435546875, 6.8875732421875, 7.1787109375, 7.4698486328125, 7.760986328125, 8.0521240234375, 8.34326171875, 8.6343994140625, 8.925537109375, 9.2166748046875, 9.5078125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 5.0, 7.0, 2.0, 4.0, 4.0, 17.0, 22.0, 30.0, 52.0, 69.0, 154.0, 221.0, 195.0, 87.0, 50.0, 24.0, 12.0, 11.0, 4.0, 13.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-45.81078338623047, -44.74501037597656, -43.679237365722656, -42.61346435546875, -41.547691345214844, -40.48191833496094, -39.41614532470703, -38.35037612915039, -37.284603118896484, -36.21883010864258, -35.15305709838867, -34.087284088134766, -33.02151107788086, -31.955739974975586, -30.88996696472168, -29.824193954467773, -28.758420944213867, -27.69264793395996, -26.626874923706055, -25.56110382080078, -24.495330810546875, -23.42955780029297, -22.363784790039062, -21.298011779785156, -20.23223876953125, -19.166465759277344, -18.100692749023438, -17.03491973876953, -15.969148635864258, -14.903375625610352, -13.837602615356445, -12.771829605102539, -11.706060409545898, -10.640287399291992, -9.574515342712402, -8.508742332458496, -7.442969799041748, -6.377197265625, -5.311424255371094, -4.245651721954346, -3.1798791885375977, -2.1141066551208496, -1.0483338832855225, 0.017438888549804688, 1.0832114219665527, 2.148983955383301, 3.214756965637207, 4.280529499053955, 5.346302032470703, 6.412074565887451, 7.477847099304199, 8.543620109558105, 9.609392166137695, 10.675165176391602, 11.740938186645508, 12.806711196899414, 13.872483253479004, 14.93825626373291, 16.0040283203125, 17.069801330566406, 18.135574340820312, 19.20134735107422, 20.267120361328125, 21.3328914642334, 22.398664474487305]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 6.0, 10.0, 14.0, 15.0, 25.0, 29.0, 43.0, 51.0, 53.0, 60.0, 95.0, 86.0, 90.0, 79.0, 63.0, 43.0, 65.0, 41.0, 32.0, 22.0, 15.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.051342010498047, -25.085369110107422, -24.11939811706543, -23.153425216674805, -22.187454223632812, -21.221481323242188, -20.255510330200195, -19.28953742980957, -18.323566436767578, -17.357593536376953, -16.39162254333496, -15.425650596618652, -14.459678649902344, -13.493705749511719, -12.527734756469727, -11.561761856079102, -10.595789909362793, -9.629817962646484, -8.663846015930176, -7.697874069213867, -6.731902122497559, -5.765929698944092, -4.799957752227783, -3.8339858055114746, -2.868013858795166, -1.9020419120788574, -0.9360698461532593, 0.029902219772338867, 0.9958741664886475, 1.9618463516235352, 2.9278182983398438, 3.8937902450561523, 4.859762191772461, 5.8257341384887695, 6.791706085205078, 7.757678031921387, 8.723649978637695, 9.68962287902832, 10.655593872070312, 11.621566772460938, 12.58753776550293, 13.553509712219238, 14.519481658935547, 15.485453605651855, 16.451425552368164, 17.41739845275879, 18.38336944580078, 19.349342346191406, 20.31531524658203, 21.281288146972656, 22.24725914001465, 23.213232040405273, 24.179203033447266, 25.14517593383789, 26.111146926879883, 27.077119827270508, 28.0430908203125, 29.009063720703125, 29.975034713745117, 30.941007614135742, 31.906978607177734, 32.87295150756836, 33.838924407958984, 34.804893493652344, 35.77086639404297]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 11.0, 15.0, 28.0, 89.0, 1164.0, 4155638.0, 36436.0, 667.0, 133.0, 40.0, 20.0, 13.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.5, -51.2578125, -48.015625, -44.7734375, -41.53125, -38.2890625, -35.046875, -31.8046875, -28.5625, -25.3203125, -22.078125, -18.8359375, -15.59375, -12.3515625, -9.109375, -5.8671875, -2.625, 0.6171875, 3.859375, 7.1015625, 10.34375, 13.5859375, 16.828125, 20.0703125, 23.3125, 26.5546875, 29.796875, 33.0390625, 36.28125, 39.5234375, 42.765625, 46.0078125, 49.25, 52.4921875, 55.734375, 58.9765625, 62.21875, 65.4609375, 68.703125, 71.9453125, 75.1875, 78.4296875, 81.671875, 84.9140625, 88.15625, 91.3984375, 94.640625, 97.8828125, 101.125, 104.3671875, 107.609375, 110.8515625, 114.09375, 117.3359375, 120.578125, 123.8203125, 127.0625, 130.3046875, 133.546875, 136.7890625, 140.03125, 143.2734375, 146.515625, 149.7578125, 153.0]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 3.0, 6.0, 2.0, 2.0, 5.0, 10.0, 9.0, 12.0, 22.0, 38.0, 51.0, 88.0, 128.0, 146.0, 142.0, 98.0, 88.0, 58.0, 19.0, 25.0, 8.0, 7.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400146484375, -0.3871498107910156, -0.37415313720703125, -0.3611564636230469, -0.3481597900390625, -0.3351631164550781, -0.32216644287109375, -0.3091697692871094, -0.296173095703125, -0.2831764221191406, -0.27017974853515625, -0.2571830749511719, -0.2441864013671875, -0.23118972778320312, -0.21819305419921875, -0.20519638061523438, -0.19219970703125, -0.17920303344726562, -0.16620635986328125, -0.15320968627929688, -0.1402130126953125, -0.12721633911132812, -0.11421966552734375, -0.10122299194335938, -0.088226318359375, -0.07522964477539062, -0.06223297119140625, -0.049236297607421875, -0.0362396240234375, -0.023242950439453125, -0.01024627685546875, 0.002750396728515625, 0.0157470703125, 0.028743743896484375, 0.04174041748046875, 0.054737091064453125, 0.0677337646484375, 0.08073043823242188, 0.09372711181640625, 0.10672378540039062, 0.119720458984375, 0.13271713256835938, 0.14571380615234375, 0.15871047973632812, 0.1717071533203125, 0.18470382690429688, 0.19770050048828125, 0.21069717407226562, 0.22369384765625, 0.23669052124023438, 0.24968719482421875, 0.2626838684082031, 0.2756805419921875, 0.2886772155761719, 0.30167388916015625, 0.3146705627441406, 0.327667236328125, 0.3406639099121094, 0.35366058349609375, 0.3666572570800781, 0.3796539306640625, 0.3926506042480469, 0.40564727783203125, 0.4186439514160156, 0.431640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 19.0, 25.0, 40.0, 97.0, 198.0, 381.0, 1040.0, 5925.0, 3391820.0, 788594.0, 5169.0, 655.0, 208.0, 61.0, 24.0, 13.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.53125, -42.494140625, -41.45703125, -40.419921875, -39.3828125, -38.345703125, -37.30859375, -36.271484375, -35.234375, -34.197265625, -33.16015625, -32.123046875, -31.0859375, -30.048828125, -29.01171875, -27.974609375, -26.9375, -25.900390625, -24.86328125, -23.826171875, -22.7890625, -21.751953125, -20.71484375, -19.677734375, -18.640625, -17.603515625, -16.56640625, -15.529296875, -14.4921875, -13.455078125, -12.41796875, -11.380859375, -10.34375, -9.306640625, -8.26953125, -7.232421875, -6.1953125, -5.158203125, -4.12109375, -3.083984375, -2.046875, -1.009765625, 0.02734375, 1.064453125, 2.1015625, 3.138671875, 4.17578125, 5.212890625, 6.25, 7.287109375, 8.32421875, 9.361328125, 10.3984375, 11.435546875, 12.47265625, 13.509765625, 14.546875, 15.583984375, 16.62109375, 17.658203125, 18.6953125, 19.732421875, 20.76953125, 21.806640625, 22.84375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 1.0, 7.0, 13.0, 7.0, 12.0, 26.0, 29.0, 35.0, 38.0, 73.0, 136.0, 393.0, 1907.0, 722.0, 209.0, 140.0, 77.0, 65.0, 51.0, 31.0, 20.0, 20.0, 18.0, 14.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.4228515625, -1.3903732299804688, -1.3578948974609375, -1.3254165649414062, -1.292938232421875, -1.2604598999023438, -1.2279815673828125, -1.1955032348632812, -1.16302490234375, -1.1305465698242188, -1.0980682373046875, -1.0655899047851562, -1.033111572265625, -1.0006332397460938, -0.9681549072265625, -0.9356765747070312, -0.9031982421875, -0.8707199096679688, -0.8382415771484375, -0.8057632446289062, -0.773284912109375, -0.7408065795898438, -0.7083282470703125, -0.6758499145507812, -0.64337158203125, -0.6108932495117188, -0.5784149169921875, -0.5459365844726562, -0.513458251953125, -0.48097991943359375, -0.4485015869140625, -0.41602325439453125, -0.383544921875, -0.35106658935546875, -0.3185882568359375, -0.28610992431640625, -0.253631591796875, -0.22115325927734375, -0.1886749267578125, -0.15619659423828125, -0.12371826171875, -0.09123992919921875, -0.0587615966796875, -0.02628326416015625, 0.006195068359375, 0.03867340087890625, 0.0711517333984375, 0.10363006591796875, 0.1361083984375, 0.16858673095703125, 0.2010650634765625, 0.23354339599609375, 0.266021728515625, 0.29850006103515625, 0.3309783935546875, 0.36345672607421875, 0.39593505859375, 0.42841339111328125, 0.4608917236328125, 0.49337005615234375, 0.525848388671875, 0.5583267211914062, 0.5908050537109375, 0.6232833862304688, 0.65576171875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 10.0, 129.0, 808.0, 51.0, 11.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-205.85006713867188, -202.1320343017578, -198.4140167236328, -194.69598388671875, -190.97796630859375, -187.2599334716797, -183.5419158935547, -179.82388305664062, -176.10586547851562, -172.38783264160156, -168.66981506347656, -164.9517822265625, -161.2337646484375, -157.51573181152344, -153.79771423339844, -150.07968139648438, -146.36166381835938, -142.6436309814453, -138.9256134033203, -135.20758056640625, -131.48956298828125, -127.77153778076172, -124.05351257324219, -120.33547973632812, -116.61744689941406, -112.89942169189453, -109.181396484375, -105.46337127685547, -101.74534606933594, -98.0273208618164, -94.30929565429688, -90.59126281738281, -86.87323760986328, -83.15521240234375, -79.43718719482422, -75.71916198730469, -72.00113677978516, -68.28311157226562, -64.56507873535156, -60.8470573425293, -57.129032135009766, -53.411006927490234, -49.6929817199707, -45.974952697753906, -42.256927490234375, -38.538902282714844, -34.82087707519531, -31.10285186767578, -27.38482666015625, -23.66680145263672, -19.948776245117188, -16.230749130249023, -12.512723922729492, -8.794698715209961, -5.076671600341797, -1.3586463928222656, 2.3593788146972656, 6.077404499053955, 9.795430183410645, 13.513456344604492, 17.231481552124023, 20.949506759643555, 24.66753387451172, 28.38555908203125, 32.10358428955078]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 16.0, 26.0, 25.0, 52.0, 46.0, 79.0, 80.0, 103.0, 102.0, 84.0, 82.0, 78.0, 63.0, 43.0, 24.0, 35.0, 15.0, 6.0, 8.0, 8.0, 5.0, 1.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.936280250549316, -11.643210411071777, -11.350141525268555, -11.057071685791016, -10.764002799987793, -10.470932960510254, -10.177864074707031, -9.884794235229492, -9.591724395751953, -9.298654556274414, -9.005585670471191, -8.712515830993652, -8.41944694519043, -8.12637710571289, -7.83330774307251, -7.540238380432129, -7.247169494628906, -6.954100131988525, -6.6610307693481445, -6.367961406707764, -6.074892044067383, -5.781822204589844, -5.488752841949463, -5.195683479309082, -4.902614116668701, -4.60954475402832, -4.3164753913879395, -4.023406028747559, -3.7303364276885986, -3.4372670650482178, -3.144197463989258, -2.851128101348877, -2.558058738708496, -2.2649893760681152, -1.9719198942184448, -1.6788504123687744, -1.3857810497283936, -1.0927116870880127, -0.7996422052383423, -0.5065727233886719, -0.21350336074829102, 0.07956606149673462, 0.37263548374176025, 0.6657049059867859, 0.9587743282318115, 1.2518436908721924, 1.5449131727218628, 1.8379826545715332, 2.131052017211914, 2.424121379852295, 2.717190742492676, 3.0102603435516357, 3.3033297061920166, 3.5963990688323975, 3.8894686698913574, 4.182538032531738, 4.475607395172119, 4.7686767578125, 5.061746120452881, 5.354815483093262, 5.647885322570801, 5.940954208374023, 6.2340240478515625, 6.527093410491943, 6.820162773132324]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 10.0, 8.0, 12.0, 20.0, 17.0, 29.0, 26.0, 36.0, 51.0, 76.0, 124.0, 176.0, 261.0, 397.0, 618.0, 1143.0, 1944.0, 3794.0, 7770.0, 18019.0, 50564.0, 214548.0, 576687.0, 113221.0, 33264.0, 13112.0, 5818.0, 2850.0, 1524.0, 890.0, 476.0, 330.0, 218.0, 143.0, 106.0, 63.0, 48.0, 37.0, 30.0, 17.0, 17.0, 15.0, 12.0, 10.0, 2.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.1640625, -7.9189453125, -7.673828125, -7.4287109375, -7.18359375, -6.9384765625, -6.693359375, -6.4482421875, -6.203125, -5.9580078125, -5.712890625, -5.4677734375, -5.22265625, -4.9775390625, -4.732421875, -4.4873046875, -4.2421875, -3.9970703125, -3.751953125, -3.5068359375, -3.26171875, -3.0166015625, -2.771484375, -2.5263671875, -2.28125, -2.0361328125, -1.791015625, -1.5458984375, -1.30078125, -1.0556640625, -0.810546875, -0.5654296875, -0.3203125, -0.0751953125, 0.169921875, 0.4150390625, 0.66015625, 0.9052734375, 1.150390625, 1.3955078125, 1.640625, 1.8857421875, 2.130859375, 2.3759765625, 2.62109375, 2.8662109375, 3.111328125, 3.3564453125, 3.6015625, 3.8466796875, 4.091796875, 4.3369140625, 4.58203125, 4.8271484375, 5.072265625, 5.3173828125, 5.5625, 5.8076171875, 6.052734375, 6.2978515625, 6.54296875, 6.7880859375, 7.033203125, 7.2783203125, 7.5234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 10.0, 15.0, 21.0, 36.0, 34.0, 56.0, 56.0, 61.0, 79.0, 86.0, 73.0, 58.0, 70.0, 63.0, 53.0, 40.0, 39.0, 28.0, 21.0, 22.0, 14.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3489341735839844, -0.33678436279296875, -0.3246345520019531, -0.3124847412109375, -0.3003349304199219, -0.28818511962890625, -0.2760353088378906, -0.263885498046875, -0.2517356872558594, -0.23958587646484375, -0.22743606567382812, -0.2152862548828125, -0.20313644409179688, -0.19098663330078125, -0.17883682250976562, -0.16668701171875, -0.15453720092773438, -0.14238739013671875, -0.13023757934570312, -0.1180877685546875, -0.10593795776367188, -0.09378814697265625, -0.08163833618164062, -0.069488525390625, -0.057338714599609375, -0.04518890380859375, -0.033039093017578125, -0.0208892822265625, -0.008739471435546875, 0.00341033935546875, 0.015560150146484375, 0.0277099609375, 0.039859771728515625, 0.05200958251953125, 0.06415939331054688, 0.0763092041015625, 0.08845901489257812, 0.10060882568359375, 0.11275863647460938, 0.124908447265625, 0.13705825805664062, 0.14920806884765625, 0.16135787963867188, 0.1735076904296875, 0.18565750122070312, 0.19780731201171875, 0.20995712280273438, 0.22210693359375, 0.23425674438476562, 0.24640655517578125, 0.2585563659667969, 0.2707061767578125, 0.2828559875488281, 0.29500579833984375, 0.3071556091308594, 0.319305419921875, 0.3314552307128906, 0.34360504150390625, 0.3557548522949219, 0.3679046630859375, 0.3800544738769531, 0.39220428466796875, 0.4043540954589844, 0.41650390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 7.0, 8.0, 9.0, 9.0, 11.0, 9.0, 16.0, 15.0, 20.0, 16.0, 50.0, 147.0, 1137.0, 39419.0, 994403.0, 12245.0, 691.0, 122.0, 52.0, 33.0, 18.0, 18.0, 17.0, 11.0, 11.0, 5.0, 12.0, 2.0, 5.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.96875, -19.181640625, -18.39453125, -17.607421875, -16.8203125, -16.033203125, -15.24609375, -14.458984375, -13.671875, -12.884765625, -12.09765625, -11.310546875, -10.5234375, -9.736328125, -8.94921875, -8.162109375, -7.375, -6.587890625, -5.80078125, -5.013671875, -4.2265625, -3.439453125, -2.65234375, -1.865234375, -1.078125, -0.291015625, 0.49609375, 1.283203125, 2.0703125, 2.857421875, 3.64453125, 4.431640625, 5.21875, 6.005859375, 6.79296875, 7.580078125, 8.3671875, 9.154296875, 9.94140625, 10.728515625, 11.515625, 12.302734375, 13.08984375, 13.876953125, 14.6640625, 15.451171875, 16.23828125, 17.025390625, 17.8125, 18.599609375, 19.38671875, 20.173828125, 20.9609375, 21.748046875, 22.53515625, 23.322265625, 24.109375, 24.896484375, 25.68359375, 26.470703125, 27.2578125, 28.044921875, 28.83203125, 29.619140625, 30.40625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 12.0, 7.0, 11.0, 10.0, 12.0, 19.0, 27.0, 26.0, 31.0, 16.0, 28.0, 20.0, 43.0, 38.0, 42.0, 44.0, 49.0, 63.0, 44.0, 40.0, 51.0, 48.0, 36.0, 39.0, 33.0, 29.0, 35.0, 21.0, 17.0, 21.0, 14.0, 8.0, 15.0, 14.0, 4.0, 8.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3876953125, -1.3328094482421875, -1.277923583984375, -1.2230377197265625, -1.16815185546875, -1.1132659912109375, -1.058380126953125, -1.0034942626953125, -0.9486083984375, -0.8937225341796875, -0.838836669921875, -0.7839508056640625, -0.72906494140625, -0.6741790771484375, -0.619293212890625, -0.5644073486328125, -0.509521484375, -0.4546356201171875, -0.399749755859375, -0.3448638916015625, -0.28997802734375, -0.2350921630859375, -0.180206298828125, -0.1253204345703125, -0.0704345703125, -0.0155487060546875, 0.039337158203125, 0.0942230224609375, 0.14910888671875, 0.2039947509765625, 0.258880615234375, 0.3137664794921875, 0.36865234375, 0.4235382080078125, 0.478424072265625, 0.5333099365234375, 0.58819580078125, 0.6430816650390625, 0.697967529296875, 0.7528533935546875, 0.8077392578125, 0.8626251220703125, 0.917510986328125, 0.9723968505859375, 1.02728271484375, 1.0821685791015625, 1.137054443359375, 1.1919403076171875, 1.246826171875, 1.3017120361328125, 1.356597900390625, 1.4114837646484375, 1.46636962890625, 1.5212554931640625, 1.576141357421875, 1.6310272216796875, 1.6859130859375, 1.7407989501953125, 1.795684814453125, 1.8505706787109375, 1.90545654296875, 1.9603424072265625, 2.015228271484375, 2.0701141357421875, 2.125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 4.0, 9.0, 6.0, 18.0, 20.0, 45.0, 171.0, 2090.0, 1040053.0, 5655.0, 332.0, 72.0, 30.0, 13.0, 13.0, 3.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.625, -84.763671875, -81.90234375, -79.041015625, -76.1796875, -73.318359375, -70.45703125, -67.595703125, -64.734375, -61.873046875, -59.01171875, -56.150390625, -53.2890625, -50.427734375, -47.56640625, -44.705078125, -41.84375, -38.982421875, -36.12109375, -33.259765625, -30.3984375, -27.537109375, -24.67578125, -21.814453125, -18.953125, -16.091796875, -13.23046875, -10.369140625, -7.5078125, -4.646484375, -1.78515625, 1.076171875, 3.9375, 6.798828125, 9.66015625, 12.521484375, 15.3828125, 18.244140625, 21.10546875, 23.966796875, 26.828125, 29.689453125, 32.55078125, 35.412109375, 38.2734375, 41.134765625, 43.99609375, 46.857421875, 49.71875, 52.580078125, 55.44140625, 58.302734375, 61.1640625, 64.025390625, 66.88671875, 69.748046875, 72.609375, 75.470703125, 78.33203125, 81.193359375, 84.0546875, 86.916015625, 89.77734375, 92.638671875, 95.5]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 12.0, 17.0, 26.0, 56.0, 82.0, 503.0, 130.0, 50.0, 31.0, 24.0, 19.0, 5.0, 9.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0214385986328125, -0.020802021026611328, -0.020165443420410156, -0.019528865814208984, -0.018892288208007812, -0.01825571060180664, -0.01761913299560547, -0.016982555389404297, -0.016345977783203125, -0.015709400177001953, -0.015072822570800781, -0.01443624496459961, -0.013799667358398438, -0.013163089752197266, -0.012526512145996094, -0.011889934539794922, -0.01125335693359375, -0.010616779327392578, -0.009980201721191406, -0.009343624114990234, -0.008707046508789062, -0.00807046890258789, -0.007433891296386719, -0.006797313690185547, -0.006160736083984375, -0.005524158477783203, -0.004887580871582031, -0.004251003265380859, -0.0036144256591796875, -0.0029778480529785156, -0.0023412704467773438, -0.0017046928405761719, -0.001068115234375, -0.0004315376281738281, 0.00020503997802734375, 0.0008416175842285156, 0.0014781951904296875, 0.0021147727966308594, 0.0027513504028320312, 0.003387928009033203, 0.004024505615234375, 0.004661083221435547, 0.005297660827636719, 0.005934238433837891, 0.0065708160400390625, 0.007207393646240234, 0.007843971252441406, 0.008480548858642578, 0.00911712646484375, 0.009753704071044922, 0.010390281677246094, 0.011026859283447266, 0.011663436889648438, 0.01230001449584961, 0.012936592102050781, 0.013573169708251953, 0.014209747314453125, 0.014846324920654297, 0.015482902526855469, 0.01611948013305664, 0.016756057739257812, 0.017392635345458984, 0.018029212951660156, 0.018665790557861328, 0.0193023681640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 6.0, 8.0, 8.0, 14.0, 18.0, 19.0, 33.0, 36.0, 66.0, 87.0, 123.0, 172.0, 244.0, 397.0, 644.0, 1163.0, 2426.0, 6405.0, 47522.0, 946856.0, 31869.0, 5803.0, 2286.0, 1043.0, 518.0, 291.0, 163.0, 107.0, 75.0, 46.0, 27.0, 29.0, 18.0, 12.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.734375, -18.892333984375, -18.05029296875, -17.208251953125, -16.3662109375, -15.524169921875, -14.68212890625, -13.840087890625, -12.998046875, -12.156005859375, -11.31396484375, -10.471923828125, -9.6298828125, -8.787841796875, -7.94580078125, -7.103759765625, -6.26171875, -5.419677734375, -4.57763671875, -3.735595703125, -2.8935546875, -2.051513671875, -1.20947265625, -0.367431640625, 0.474609375, 1.316650390625, 2.15869140625, 3.000732421875, 3.8427734375, 4.684814453125, 5.52685546875, 6.368896484375, 7.2109375, 8.052978515625, 8.89501953125, 9.737060546875, 10.5791015625, 11.421142578125, 12.26318359375, 13.105224609375, 13.947265625, 14.789306640625, 15.63134765625, 16.473388671875, 17.3154296875, 18.157470703125, 18.99951171875, 19.841552734375, 20.68359375, 21.525634765625, 22.36767578125, 23.209716796875, 24.0517578125, 24.893798828125, 25.73583984375, 26.577880859375, 27.419921875, 28.261962890625, 29.10400390625, 29.946044921875, 30.7880859375, 31.630126953125, 32.47216796875, 33.314208984375, 34.15625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 19.0, 25.0, 63.0, 186.0, 461.0, 139.0, 36.0, 15.0, 15.0, 3.0, 6.0, 4.0, 1.0, 8.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.484375, -21.00048828125, -20.5166015625, -20.03271484375, -19.548828125, -19.06494140625, -18.5810546875, -18.09716796875, -17.61328125, -17.12939453125, -16.6455078125, -16.16162109375, -15.677734375, -15.19384765625, -14.7099609375, -14.22607421875, -13.7421875, -13.25830078125, -12.7744140625, -12.29052734375, -11.806640625, -11.32275390625, -10.8388671875, -10.35498046875, -9.87109375, -9.38720703125, -8.9033203125, -8.41943359375, -7.935546875, -7.45166015625, -6.9677734375, -6.48388671875, -6.0, -5.51611328125, -5.0322265625, -4.54833984375, -4.064453125, -3.58056640625, -3.0966796875, -2.61279296875, -2.12890625, -1.64501953125, -1.1611328125, -0.67724609375, -0.193359375, 0.29052734375, 0.7744140625, 1.25830078125, 1.7421875, 2.22607421875, 2.7099609375, 3.19384765625, 3.677734375, 4.16162109375, 4.6455078125, 5.12939453125, 5.61328125, 6.09716796875, 6.5810546875, 7.06494140625, 7.548828125, 8.03271484375, 8.5166015625, 9.00048828125, 9.484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 10.0, 43.0, 189.0, 557.0, 169.0, 28.0, 9.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.761932373046875, -29.20995330810547, -24.657974243164062, -20.105995178222656, -15.55401611328125, -11.002037048339844, -6.4500579833984375, -1.8980789184570312, 2.653900146484375, 7.205879211425781, 11.757858276367188, 16.309837341308594, 20.86181640625, 25.413795471191406, 29.965774536132812, 34.51775360107422, 39.069732666015625, 43.62171173095703, 48.17369079589844, 52.725669860839844, 57.27764892578125, 61.829627990722656, 66.38160705566406, 70.93358612060547, 75.48556518554688, 80.03754425048828, 84.58952331542969, 89.1415023803711, 93.6934814453125, 98.2454605102539, 102.79743957519531, 107.34941864013672, 111.90139770507812, 116.45337677001953, 121.00535583496094, 125.55733489990234, 130.10931396484375, 134.66128540039062, 139.21327209472656, 143.7652587890625, 148.31723022460938, 152.86920166015625, 157.4211883544922, 161.97317504882812, 166.525146484375, 171.07711791992188, 175.6291046142578, 180.18109130859375, 184.73306274414062, 189.2850341796875, 193.83702087402344, 198.38900756835938, 202.94097900390625, 207.49295043945312, 212.04493713378906, 216.596923828125, 221.14889526367188, 225.70086669921875, 230.2528533935547, 234.80484008789062, 239.3568115234375, 243.90878295898438, 248.4607696533203, 253.01275634765625, 257.5647277832031]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 10.0, 17.0, 20.0, 25.0, 29.0, 40.0, 54.0, 56.0, 76.0, 79.0, 83.0, 66.0, 70.0, 77.0, 64.0, 51.0, 36.0, 38.0, 29.0, 22.0, 20.0, 10.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.944580078125, -24.110794067382812, -23.277008056640625, -22.443222045898438, -21.60943603515625, -20.775650024414062, -19.941862106323242, -19.108076095581055, -18.274290084838867, -17.44050407409668, -16.606718063354492, -15.772931098937988, -14.9391450881958, -14.105359077453613, -13.27157211303711, -12.437786102294922, -11.604000091552734, -10.770214080810547, -9.93642807006836, -9.102641105651855, -8.268855094909668, -7.4350690841674805, -6.601282596588135, -5.767496109008789, -4.933710098266602, -4.099924087524414, -3.2661375999450684, -2.4323513507843018, -1.5985651016235352, -0.7647790908813477, 0.06900739669799805, 0.9027938842773438, 1.7365798950195312, 2.570366144180298, 3.4041523933410645, 4.23793888092041, 5.071724891662598, 5.905510902404785, 6.739297389984131, 7.573083877563477, 8.406869888305664, 9.240655899047852, 10.074441909790039, 10.908228874206543, 11.74201488494873, 12.575800895690918, 13.409587860107422, 14.24337387084961, 15.077159881591797, 15.910945892333984, 16.744731903076172, 17.57851791381836, 18.412303924560547, 19.246089935302734, 20.079877853393555, 20.913663864135742, 21.74744987487793, 22.581235885620117, 23.415021896362305, 24.248807907104492, 25.082595825195312, 25.9163818359375, 26.750167846679688, 27.583953857421875, 28.417739868164062]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 5.0, 4.0, 2.0, 8.0, 2.0, 3.0, 13.0, 11.0, 6.0, 7.0, 7.0, 10.0, 23.0, 26.0, 38.0, 79.0, 183.0, 579.0, 1929.0, 8892.0, 90446.0, 4039914.0, 42835.0, 6376.0, 1643.0, 575.0, 219.0, 132.0, 71.0, 53.0, 35.0, 27.0, 19.0, 20.0, 14.0, 6.0, 13.0, 12.0, 10.0, 12.0, 8.0, 8.0, 1.0, 3.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-24.25, -23.47705078125, -22.7041015625, -21.93115234375, -21.158203125, -20.38525390625, -19.6123046875, -18.83935546875, -18.06640625, -17.29345703125, -16.5205078125, -15.74755859375, -14.974609375, -14.20166015625, -13.4287109375, -12.65576171875, -11.8828125, -11.10986328125, -10.3369140625, -9.56396484375, -8.791015625, -8.01806640625, -7.2451171875, -6.47216796875, -5.69921875, -4.92626953125, -4.1533203125, -3.38037109375, -2.607421875, -1.83447265625, -1.0615234375, -0.28857421875, 0.484375, 1.25732421875, 2.0302734375, 2.80322265625, 3.576171875, 4.34912109375, 5.1220703125, 5.89501953125, 6.66796875, 7.44091796875, 8.2138671875, 8.98681640625, 9.759765625, 10.53271484375, 11.3056640625, 12.07861328125, 12.8515625, 13.62451171875, 14.3974609375, 15.17041015625, 15.943359375, 16.71630859375, 17.4892578125, 18.26220703125, 19.03515625, 19.80810546875, 20.5810546875, 21.35400390625, 22.126953125, 22.89990234375, 23.6728515625, 24.44580078125, 25.21875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 13.0, 8.0, 15.0, 25.0, 28.0, 43.0, 50.0, 80.0, 118.0, 104.0, 108.0, 93.0, 75.0, 73.0, 57.0, 39.0, 25.0, 16.0, 6.0, 13.0, 7.0, 1.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.321044921875, -0.3013801574707031, -0.28171539306640625, -0.2620506286621094, -0.2423858642578125, -0.22272109985351562, -0.20305633544921875, -0.18339157104492188, -0.163726806640625, -0.14406204223632812, -0.12439727783203125, -0.10473251342773438, -0.0850677490234375, -0.06540298461914062, -0.04573822021484375, -0.026073455810546875, -0.00640869140625, 0.013256072998046875, 0.03292083740234375, 0.052585601806640625, 0.0722503662109375, 0.09191513061523438, 0.11157989501953125, 0.13124465942382812, 0.150909423828125, 0.17057418823242188, 0.19023895263671875, 0.20990371704101562, 0.2295684814453125, 0.24923324584960938, 0.26889801025390625, 0.2885627746582031, 0.3082275390625, 0.3278923034667969, 0.34755706787109375, 0.3672218322753906, 0.3868865966796875, 0.4065513610839844, 0.42621612548828125, 0.4458808898925781, 0.465545654296875, 0.4852104187011719, 0.5048751831054688, 0.5245399475097656, 0.5442047119140625, 0.5638694763183594, 0.5835342407226562, 0.6031990051269531, 0.62286376953125, 0.6425285339355469, 0.6621932983398438, 0.6818580627441406, 0.7015228271484375, 0.7211875915527344, 0.7408523559570312, 0.7605171203613281, 0.780181884765625, 0.7998466491699219, 0.8195114135742188, 0.8391761779785156, 0.8588409423828125, 0.8785057067871094, 0.8981704711914062, 0.9178352355957031, 0.9375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 11.0, 24.0, 34.0, 63.0, 298.0, 8749.0, 4182173.0, 2611.0, 203.0, 66.0, 23.0, 6.0, 6.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.03125, -40.55712890625, -38.0830078125, -35.60888671875, -33.134765625, -30.66064453125, -28.1865234375, -25.71240234375, -23.23828125, -20.76416015625, -18.2900390625, -15.81591796875, -13.341796875, -10.86767578125, -8.3935546875, -5.91943359375, -3.4453125, -0.97119140625, 1.5029296875, 3.97705078125, 6.451171875, 8.92529296875, 11.3994140625, 13.87353515625, 16.34765625, 18.82177734375, 21.2958984375, 23.77001953125, 26.244140625, 28.71826171875, 31.1923828125, 33.66650390625, 36.140625, 38.61474609375, 41.0888671875, 43.56298828125, 46.037109375, 48.51123046875, 50.9853515625, 53.45947265625, 55.93359375, 58.40771484375, 60.8818359375, 63.35595703125, 65.830078125, 68.30419921875, 70.7783203125, 73.25244140625, 75.7265625, 78.20068359375, 80.6748046875, 83.14892578125, 85.623046875, 88.09716796875, 90.5712890625, 93.04541015625, 95.51953125, 97.99365234375, 100.4677734375, 102.94189453125, 105.416015625, 107.89013671875, 110.3642578125, 112.83837890625, 115.3125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 6.0, 11.0, 23.0, 20.0, 45.0, 64.0, 103.0, 198.0, 2004.0, 1039.0, 243.0, 126.0, 81.0, 31.0, 28.0, 15.0, 9.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.38671875, -2.328338623046875, -2.26995849609375, -2.211578369140625, -2.1531982421875, -2.094818115234375, -2.03643798828125, -1.978057861328125, -1.919677734375, -1.861297607421875, -1.80291748046875, -1.744537353515625, -1.6861572265625, -1.627777099609375, -1.56939697265625, -1.511016845703125, -1.45263671875, -1.394256591796875, -1.33587646484375, -1.277496337890625, -1.2191162109375, -1.160736083984375, -1.10235595703125, -1.043975830078125, -0.985595703125, -0.927215576171875, -0.86883544921875, -0.810455322265625, -0.7520751953125, -0.693695068359375, -0.63531494140625, -0.576934814453125, -0.5185546875, -0.460174560546875, -0.40179443359375, -0.343414306640625, -0.2850341796875, -0.226654052734375, -0.16827392578125, -0.109893798828125, -0.051513671875, 0.006866455078125, 0.06524658203125, 0.123626708984375, 0.1820068359375, 0.240386962890625, 0.29876708984375, 0.357147216796875, 0.41552734375, 0.473907470703125, 0.53228759765625, 0.590667724609375, 0.6490478515625, 0.707427978515625, 0.76580810546875, 0.824188232421875, 0.882568359375, 0.940948486328125, 0.99932861328125, 1.057708740234375, 1.1160888671875, 1.174468994140625, 1.23284912109375, 1.291229248046875, 1.349609375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 976.0, 27.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.707462310791016, -27.73569107055664, -22.763919830322266, -17.79214859008789, -12.820377349853516, -7.848606109619141, -2.8768348693847656, 2.0949363708496094, 7.066707611083984, 12.03847885131836, 17.010250091552734, 21.98202133178711, 26.953792572021484, 31.92556381225586, 36.897335052490234, 41.86910629272461, 46.840877532958984, 51.81264877319336, 56.784420013427734, 61.75619125366211, 66.72796630859375, 71.69973754882812, 76.6715087890625, 81.64328002929688, 86.61505126953125, 91.58682250976562, 96.55859375, 101.53036499023438, 106.50213623046875, 111.47390747070312, 116.4456787109375, 121.41744995117188, 126.38922119140625, 131.36099243164062, 136.332763671875, 141.30453491210938, 146.27630615234375, 151.24807739257812, 156.2198486328125, 161.19161987304688, 166.16339111328125, 171.13516235351562, 176.10693359375, 181.07870483398438, 186.05047607421875, 191.02224731445312, 195.9940185546875, 200.96578979492188, 205.93756103515625, 210.90933227539062, 215.881103515625, 220.85287475585938, 225.82464599609375, 230.79641723632812, 235.7681884765625, 240.73995971679688, 245.71173095703125, 250.68350219726562, 255.6552734375, 260.6270446777344, 265.59881591796875, 270.5705871582031, 275.5423583984375, 280.5141296386719, 285.48590087890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 3.0, 6.0, 13.0, 18.0, 37.0, 53.0, 61.0, 58.0, 102.0, 94.0, 89.0, 87.0, 76.0, 89.0, 61.0, 51.0, 36.0, 21.0, 16.0, 13.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.612344741821289, -11.241537094116211, -10.87073040008545, -10.499923706054688, -10.12911605834961, -9.758308410644531, -9.38750171661377, -9.016695022583008, -8.64588737487793, -8.275079727172852, -7.90427303314209, -7.53346586227417, -7.16265869140625, -6.79185152053833, -6.42104434967041, -6.05023717880249, -5.67943000793457, -5.30862283706665, -4.9378156661987305, -4.5670084953308105, -4.196201324462891, -3.8253941535949707, -3.454586982727051, -3.083779811859131, -2.712972640991211, -2.342165470123291, -1.971358299255371, -1.6005511283874512, -1.2297439575195312, -0.8589367866516113, -0.4881296157836914, -0.11732244491577148, 0.25348567962646484, 0.6242928504943848, 0.9951000213623047, 1.3659071922302246, 1.7367143630981445, 2.1075215339660645, 2.4783287048339844, 2.8491358757019043, 3.219943046569824, 3.590750217437744, 3.961557388305664, 4.332364559173584, 4.703171730041504, 5.073978900909424, 5.444786071777344, 5.815593242645264, 6.186400413513184, 6.5572075843811035, 6.928014755249023, 7.298821926116943, 7.669629096984863, 8.040435791015625, 8.411243438720703, 8.782051086425781, 9.152857780456543, 9.523664474487305, 9.894472122192383, 10.265279769897461, 10.636086463928223, 11.006893157958984, 11.377700805664062, 11.74850845336914, 12.119315147399902]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 9.0, 5.0, 15.0, 14.0, 5.0, 18.0, 14.0, 21.0, 22.0, 26.0, 30.0, 32.0, 38.0, 61.0, 108.0, 518.0, 23011.0, 995219.0, 28333.0, 566.0, 112.0, 68.0, 41.0, 48.0, 35.0, 18.0, 23.0, 16.0, 28.0, 24.0, 14.0, 6.0, 13.0, 5.0, 7.0, 2.0, 6.0, 1.0, 7.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.390625, -21.72265625, -21.0546875, -20.38671875, -19.71875, -19.05078125, -18.3828125, -17.71484375, -17.046875, -16.37890625, -15.7109375, -15.04296875, -14.375, -13.70703125, -13.0390625, -12.37109375, -11.703125, -11.03515625, -10.3671875, -9.69921875, -9.03125, -8.36328125, -7.6953125, -7.02734375, -6.359375, -5.69140625, -5.0234375, -4.35546875, -3.6875, -3.01953125, -2.3515625, -1.68359375, -1.015625, -0.34765625, 0.3203125, 0.98828125, 1.65625, 2.32421875, 2.9921875, 3.66015625, 4.328125, 4.99609375, 5.6640625, 6.33203125, 7.0, 7.66796875, 8.3359375, 9.00390625, 9.671875, 10.33984375, 11.0078125, 11.67578125, 12.34375, 13.01171875, 13.6796875, 14.34765625, 15.015625, 15.68359375, 16.3515625, 17.01953125, 17.6875, 18.35546875, 19.0234375, 19.69140625, 20.359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 8.0, 19.0, 40.0, 52.0, 87.0, 113.0, 130.0, 135.0, 116.0, 101.0, 82.0, 44.0, 31.0, 29.0, 15.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.474853515625, -0.4443473815917969, -0.41384124755859375, -0.3833351135253906, -0.3528289794921875, -0.3223228454589844, -0.29181671142578125, -0.2613105773925781, -0.230804443359375, -0.20029830932617188, -0.16979217529296875, -0.13928604125976562, -0.1087799072265625, -0.07827377319335938, -0.04776763916015625, -0.017261505126953125, 0.01324462890625, 0.043750762939453125, 0.07425689697265625, 0.10476303100585938, 0.1352691650390625, 0.16577529907226562, 0.19628143310546875, 0.22678756713867188, 0.257293701171875, 0.2877998352050781, 0.31830596923828125, 0.3488121032714844, 0.3793182373046875, 0.4098243713378906, 0.44033050537109375, 0.4708366394042969, 0.5013427734375, 0.5318489074707031, 0.5623550415039062, 0.5928611755371094, 0.6233673095703125, 0.6538734436035156, 0.6843795776367188, 0.7148857116699219, 0.745391845703125, 0.7758979797363281, 0.8064041137695312, 0.8369102478027344, 0.8674163818359375, 0.8979225158691406, 0.9284286499023438, 0.9589347839355469, 0.98944091796875, 1.0199470520019531, 1.0504531860351562, 1.0809593200683594, 1.1114654541015625, 1.1419715881347656, 1.1724777221679688, 1.2029838562011719, 1.233489990234375, 1.2639961242675781, 1.2945022583007812, 1.3250083923339844, 1.3555145263671875, 1.3860206604003906, 1.4165267944335938, 1.4470329284667969, 1.4775390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 4.0, 6.0, 4.0, 4.0, 5.0, 9.0, 10.0, 19.0, 26.0, 33.0, 54.0, 75.0, 127.0, 194.0, 401.0, 891.0, 2116.0, 8533.0, 51396.0, 495479.0, 434274.0, 43955.0, 7356.0, 1946.0, 701.0, 367.0, 208.0, 119.0, 78.0, 47.0, 38.0, 15.0, 18.0, 8.0, 5.0, 8.0, 9.0, 8.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-10.7734375, -10.46533203125, -10.1572265625, -9.84912109375, -9.541015625, -9.23291015625, -8.9248046875, -8.61669921875, -8.30859375, -8.00048828125, -7.6923828125, -7.38427734375, -7.076171875, -6.76806640625, -6.4599609375, -6.15185546875, -5.84375, -5.53564453125, -5.2275390625, -4.91943359375, -4.611328125, -4.30322265625, -3.9951171875, -3.68701171875, -3.37890625, -3.07080078125, -2.7626953125, -2.45458984375, -2.146484375, -1.83837890625, -1.5302734375, -1.22216796875, -0.9140625, -0.60595703125, -0.2978515625, 0.01025390625, 0.318359375, 0.62646484375, 0.9345703125, 1.24267578125, 1.55078125, 1.85888671875, 2.1669921875, 2.47509765625, 2.783203125, 3.09130859375, 3.3994140625, 3.70751953125, 4.015625, 4.32373046875, 4.6318359375, 4.93994140625, 5.248046875, 5.55615234375, 5.8642578125, 6.17236328125, 6.48046875, 6.78857421875, 7.0966796875, 7.40478515625, 7.712890625, 8.02099609375, 8.3291015625, 8.63720703125, 8.9453125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 9.0, 13.0, 16.0, 6.0, 13.0, 24.0, 30.0, 29.0, 21.0, 32.0, 46.0, 48.0, 52.0, 54.0, 56.0, 60.0, 55.0, 62.0, 62.0, 52.0, 41.0, 33.0, 31.0, 27.0, 21.0, 17.0, 19.0, 16.0, 14.0, 7.0, 6.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.296875, -3.20172119140625, -3.1065673828125, -3.01141357421875, -2.916259765625, -2.82110595703125, -2.7259521484375, -2.63079833984375, -2.53564453125, -2.44049072265625, -2.3453369140625, -2.25018310546875, -2.155029296875, -2.05987548828125, -1.9647216796875, -1.86956787109375, -1.7744140625, -1.67926025390625, -1.5841064453125, -1.48895263671875, -1.393798828125, -1.29864501953125, -1.2034912109375, -1.10833740234375, -1.01318359375, -0.91802978515625, -0.8228759765625, -0.72772216796875, -0.632568359375, -0.53741455078125, -0.4422607421875, -0.34710693359375, -0.251953125, -0.15679931640625, -0.0616455078125, 0.03350830078125, 0.128662109375, 0.22381591796875, 0.3189697265625, 0.41412353515625, 0.50927734375, 0.60443115234375, 0.6995849609375, 0.79473876953125, 0.889892578125, 0.98504638671875, 1.0802001953125, 1.17535400390625, 1.2705078125, 1.36566162109375, 1.4608154296875, 1.55596923828125, 1.651123046875, 1.74627685546875, 1.8414306640625, 1.93658447265625, 2.03173828125, 2.12689208984375, 2.2220458984375, 2.31719970703125, 2.412353515625, 2.50750732421875, 2.6026611328125, 2.69781494140625, 2.79296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 6.0, 7.0, 15.0, 26.0, 33.0, 37.0, 63.0, 80.0, 127.0, 209.0, 377.0, 696.0, 1426.0, 3221.0, 9887.0, 46207.0, 411702.0, 500892.0, 55106.0, 11434.0, 3603.0, 1487.0, 772.0, 427.0, 228.0, 159.0, 102.0, 60.0, 31.0, 31.0, 16.0, 20.0, 13.0, 8.0, 4.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.68359375, -7.45794677734375, -7.2322998046875, -7.00665283203125, -6.781005859375, -6.55535888671875, -6.3297119140625, -6.10406494140625, -5.87841796875, -5.65277099609375, -5.4271240234375, -5.20147705078125, -4.975830078125, -4.75018310546875, -4.5245361328125, -4.29888916015625, -4.0732421875, -3.84759521484375, -3.6219482421875, -3.39630126953125, -3.170654296875, -2.94500732421875, -2.7193603515625, -2.49371337890625, -2.26806640625, -2.04241943359375, -1.8167724609375, -1.59112548828125, -1.365478515625, -1.13983154296875, -0.9141845703125, -0.68853759765625, -0.462890625, -0.23724365234375, -0.0115966796875, 0.21405029296875, 0.439697265625, 0.66534423828125, 0.8909912109375, 1.11663818359375, 1.34228515625, 1.56793212890625, 1.7935791015625, 2.01922607421875, 2.244873046875, 2.47052001953125, 2.6961669921875, 2.92181396484375, 3.1474609375, 3.37310791015625, 3.5987548828125, 3.82440185546875, 4.050048828125, 4.27569580078125, 4.5013427734375, 4.72698974609375, 4.95263671875, 5.17828369140625, 5.4039306640625, 5.62957763671875, 5.855224609375, 6.08087158203125, 6.3065185546875, 6.53216552734375, 6.7578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 4.0, 7.0, 8.0, 7.0, 9.0, 17.0, 13.0, 20.0, 25.0, 28.0, 61.0, 83.0, 142.0, 167.0, 126.0, 72.0, 52.0, 37.0, 29.0, 12.0, 14.0, 14.0, 12.0, 8.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013303756713867188, -0.0012777894735336304, -0.001225203275680542, -0.0011726170778274536, -0.0011200308799743652, -0.0010674446821212769, -0.0010148584842681885, -0.0009622722864151001, -0.0009096860885620117, -0.0008570998907089233, -0.000804513692855835, -0.0007519274950027466, -0.0006993412971496582, -0.0006467550992965698, -0.0005941689014434814, -0.0005415827035903931, -0.0004889965057373047, -0.0004364103078842163, -0.00038382411003112793, -0.00033123791217803955, -0.00027865171432495117, -0.0002260655164718628, -0.00017347931861877441, -0.00012089312076568604, -6.830692291259766e-05, -1.5720725059509277e-05, 3.68654727935791e-05, 8.945167064666748e-05, 0.00014203786849975586, 0.00019462406635284424, 0.0002472102642059326, 0.000299796462059021, 0.0003523826599121094, 0.00040496885776519775, 0.00045755505561828613, 0.0005101412534713745, 0.0005627274513244629, 0.0006153136491775513, 0.0006678998470306396, 0.000720486044883728, 0.0007730722427368164, 0.0008256584405899048, 0.0008782446384429932, 0.0009308308362960815, 0.00098341703414917, 0.0010360032320022583, 0.0010885894298553467, 0.001141175627708435, 0.0011937618255615234, 0.0012463480234146118, 0.0012989342212677002, 0.0013515204191207886, 0.001404106616973877, 0.0014566928148269653, 0.0015092790126800537, 0.001561865210533142, 0.0016144514083862305, 0.0016670376062393188, 0.0017196238040924072, 0.0017722100019454956, 0.001824796199798584, 0.0018773823976516724, 0.0019299685955047607, 0.001982554793357849, 0.0020351409912109375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 0.0, 9.0, 8.0, 14.0, 13.0, 18.0, 23.0, 44.0, 64.0, 111.0, 183.0, 444.0, 1238.0, 4694.0, 34716.0, 850894.0, 143627.0, 9160.0, 1949.0, 593.0, 280.0, 168.0, 85.0, 44.0, 42.0, 36.0, 29.0, 23.0, 14.0, 10.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.4609375, -13.0616455078125, -12.662353515625, -12.2630615234375, -11.86376953125, -11.4644775390625, -11.065185546875, -10.6658935546875, -10.2666015625, -9.8673095703125, -9.468017578125, -9.0687255859375, -8.66943359375, -8.2701416015625, -7.870849609375, -7.4715576171875, -7.072265625, -6.6729736328125, -6.273681640625, -5.8743896484375, -5.47509765625, -5.0758056640625, -4.676513671875, -4.2772216796875, -3.8779296875, -3.4786376953125, -3.079345703125, -2.6800537109375, -2.28076171875, -1.8814697265625, -1.482177734375, -1.0828857421875, -0.68359375, -0.2843017578125, 0.114990234375, 0.5142822265625, 0.91357421875, 1.3128662109375, 1.712158203125, 2.1114501953125, 2.5107421875, 2.9100341796875, 3.309326171875, 3.7086181640625, 4.10791015625, 4.5072021484375, 4.906494140625, 5.3057861328125, 5.705078125, 6.1043701171875, 6.503662109375, 6.9029541015625, 7.30224609375, 7.7015380859375, 8.100830078125, 8.5001220703125, 8.8994140625, 9.2987060546875, 9.697998046875, 10.0972900390625, 10.49658203125, 10.8958740234375, 11.295166015625, 11.6944580078125, 12.09375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 10.0, 16.0, 30.0, 66.0, 108.0, 144.0, 180.0, 173.0, 124.0, 65.0, 37.0, 21.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.744415283203125, -2.58062744140625, -2.416839599609375, -2.2530517578125, -2.089263916015625, -1.92547607421875, -1.761688232421875, -1.597900390625, -1.434112548828125, -1.27032470703125, -1.106536865234375, -0.9427490234375, -0.778961181640625, -0.61517333984375, -0.451385498046875, -0.28759765625, -0.123809814453125, 0.03997802734375, 0.203765869140625, 0.3675537109375, 0.531341552734375, 0.69512939453125, 0.858917236328125, 1.022705078125, 1.186492919921875, 1.35028076171875, 1.514068603515625, 1.6778564453125, 1.841644287109375, 2.00543212890625, 2.169219970703125, 2.3330078125, 2.496795654296875, 2.66058349609375, 2.824371337890625, 2.9881591796875, 3.151947021484375, 3.31573486328125, 3.479522705078125, 3.643310546875, 3.807098388671875, 3.97088623046875, 4.134674072265625, 4.2984619140625, 4.462249755859375, 4.62603759765625, 4.789825439453125, 4.95361328125, 5.117401123046875, 5.28118896484375, 5.444976806640625, 5.6087646484375, 5.772552490234375, 5.93634033203125, 6.100128173828125, 6.263916015625, 6.427703857421875, 6.59149169921875, 6.755279541015625, 6.9190673828125, 7.082855224609375, 7.24664306640625, 7.410430908203125, 7.57421875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 12.0, 101.0, 628.0, 230.0, 30.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-303.68780517578125, -298.2363586425781, -292.784912109375, -287.3334655761719, -281.88201904296875, -276.4305725097656, -270.9791259765625, -265.5276794433594, -260.07623291015625, -254.62478637695312, -249.17333984375, -243.72189331054688, -238.27044677734375, -232.81900024414062, -227.3675537109375, -221.91610717773438, -216.4646759033203, -211.0132293701172, -205.56178283691406, -200.11033630371094, -194.6588897705078, -189.2074432373047, -183.75601196289062, -178.3045654296875, -172.85311889648438, -167.40167236328125, -161.95022583007812, -156.498779296875, -151.04733276367188, -145.59588623046875, -140.14443969726562, -134.6929931640625, -129.24154663085938, -123.79010009765625, -118.33865356445312, -112.88720703125, -107.43576049804688, -101.98431396484375, -96.53287506103516, -91.08142852783203, -85.62998962402344, -80.17854309082031, -74.72709655761719, -69.27565002441406, -63.8242073059082, -58.37276077270508, -52.92131805419922, -47.469871520996094, -42.01842498779297, -36.566978454589844, -31.11553382873535, -25.66408920288086, -20.212642669677734, -14.76119613647461, -9.30975341796875, -3.858306884765625, 1.5931396484375, 7.044585227966309, 12.496030807495117, 17.94747543334961, 23.398921966552734, 28.85036849975586, 34.30181121826172, 39.753257751464844, 45.20470428466797]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 18.0, 28.0, 21.0, 61.0, 64.0, 68.0, 127.0, 112.0, 117.0, 107.0, 74.0, 64.0, 48.0, 37.0, 20.0, 11.0, 10.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.36689758300781, -45.920982360839844, -44.475067138671875, -43.029151916503906, -41.58323669433594, -40.13732147216797, -38.69140625, -37.24549102783203, -35.79957580566406, -34.353660583496094, -32.907745361328125, -31.461830139160156, -30.015914916992188, -28.56999969482422, -27.124082565307617, -25.67816734313965, -24.232250213623047, -22.786334991455078, -21.34041976928711, -19.89450454711914, -18.448589324951172, -17.002674102783203, -15.556756973266602, -14.110841751098633, -12.664926528930664, -11.219011306762695, -9.773096084594727, -8.327179908752441, -6.881264686584473, -5.435349464416504, -3.9894332885742188, -2.54351806640625, -1.0976028442382812, 0.3483126163482666, 1.7942280769348145, 3.2401437759399414, 4.68605899810791, 6.131974220275879, 7.577890396118164, 9.023805618286133, 10.469720840454102, 11.91563606262207, 13.361551284790039, 14.807467460632324, 16.25338363647461, 17.699298858642578, 19.145214080810547, 20.591129302978516, 22.037044525146484, 23.482959747314453, 24.928874969482422, 26.37479019165039, 27.82070541381836, 29.266620635986328, 30.71253776550293, 32.15845489501953, 33.6043701171875, 35.05028533935547, 36.49620056152344, 37.942115783691406, 39.388031005859375, 40.833946228027344, 42.27986145019531, 43.72577667236328, 45.17169189453125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 8.0, 19.0, 14.0, 25.0, 75.0, 124.0, 450.0, 4098.0, 4116718.0, 71104.0, 1280.0, 214.0, 87.0, 39.0, 17.0, 8.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.953125, -25.129638671875, -23.30615234375, -21.482666015625, -19.6591796875, -17.835693359375, -16.01220703125, -14.188720703125, -12.365234375, -10.541748046875, -8.71826171875, -6.894775390625, -5.0712890625, -3.247802734375, -1.42431640625, 0.399169921875, 2.22265625, 4.046142578125, 5.86962890625, 7.693115234375, 9.5166015625, 11.340087890625, 13.16357421875, 14.987060546875, 16.810546875, 18.634033203125, 20.45751953125, 22.281005859375, 24.1044921875, 25.927978515625, 27.75146484375, 29.574951171875, 31.3984375, 33.221923828125, 35.04541015625, 36.868896484375, 38.6923828125, 40.515869140625, 42.33935546875, 44.162841796875, 45.986328125, 47.809814453125, 49.63330078125, 51.456787109375, 53.2802734375, 55.103759765625, 56.92724609375, 58.750732421875, 60.57421875, 62.397705078125, 64.22119140625, 66.044677734375, 67.8681640625, 69.691650390625, 71.51513671875, 73.338623046875, 75.162109375, 76.985595703125, 78.80908203125, 80.632568359375, 82.4560546875, 84.279541015625, 86.10302734375, 87.926513671875, 89.75]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 11.0, 19.0, 33.0, 54.0, 82.0, 95.0, 126.0, 113.0, 122.0, 89.0, 76.0, 66.0, 58.0, 28.0, 8.0, 10.0, 12.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.806640625, -0.77130126953125, -0.7359619140625, -0.70062255859375, -0.665283203125, -0.62994384765625, -0.5946044921875, -0.55926513671875, -0.52392578125, -0.48858642578125, -0.4532470703125, -0.41790771484375, -0.382568359375, -0.34722900390625, -0.3118896484375, -0.27655029296875, -0.2412109375, -0.20587158203125, -0.1705322265625, -0.13519287109375, -0.099853515625, -0.06451416015625, -0.0291748046875, 0.00616455078125, 0.04150390625, 0.07684326171875, 0.1121826171875, 0.14752197265625, 0.182861328125, 0.21820068359375, 0.2535400390625, 0.28887939453125, 0.32421875, 0.35955810546875, 0.3948974609375, 0.43023681640625, 0.465576171875, 0.50091552734375, 0.5362548828125, 0.57159423828125, 0.60693359375, 0.64227294921875, 0.6776123046875, 0.71295166015625, 0.748291015625, 0.78363037109375, 0.8189697265625, 0.85430908203125, 0.8896484375, 0.92498779296875, 0.9603271484375, 0.99566650390625, 1.031005859375, 1.06634521484375, 1.1016845703125, 1.13702392578125, 1.17236328125, 1.20770263671875, 1.2430419921875, 1.27838134765625, 1.313720703125, 1.34906005859375, 1.3843994140625, 1.41973876953125, 1.455078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 6.0, 30.0, 82.0, 118.0, 185.0, 378.0, 4050698.0, 141771.0, 440.0, 210.0, 156.0, 97.0, 57.0, 18.0, 15.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.375, -96.025390625, -90.67578125, -85.326171875, -79.9765625, -74.626953125, -69.27734375, -63.927734375, -58.578125, -53.228515625, -47.87890625, -42.529296875, -37.1796875, -31.830078125, -26.48046875, -21.130859375, -15.78125, -10.431640625, -5.08203125, 0.267578125, 5.6171875, 10.966796875, 16.31640625, 21.666015625, 27.015625, 32.365234375, 37.71484375, 43.064453125, 48.4140625, 53.763671875, 59.11328125, 64.462890625, 69.8125, 75.162109375, 80.51171875, 85.861328125, 91.2109375, 96.560546875, 101.91015625, 107.259765625, 112.609375, 117.958984375, 123.30859375, 128.658203125, 134.0078125, 139.357421875, 144.70703125, 150.056640625, 155.40625, 160.755859375, 166.10546875, 171.455078125, 176.8046875, 182.154296875, 187.50390625, 192.853515625, 198.203125, 203.552734375, 208.90234375, 214.251953125, 219.6015625, 224.951171875, 230.30078125, 235.650390625, 241.0]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 18.0, 72.0, 906.0, 2889.0, 155.0, 31.0, 14.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -0.923309326171875, -0.62591552734375, -0.328521728515625, -0.0311279296875, 0.266265869140625, 0.56365966796875, 0.861053466796875, 1.158447265625, 1.455841064453125, 1.75323486328125, 2.050628662109375, 2.3480224609375, 2.645416259765625, 2.94281005859375, 3.240203857421875, 3.53759765625, 3.834991455078125, 4.13238525390625, 4.429779052734375, 4.7271728515625, 5.024566650390625, 5.32196044921875, 5.619354248046875, 5.916748046875, 6.214141845703125, 6.51153564453125, 6.808929443359375, 7.1063232421875, 7.403717041015625, 7.70111083984375, 7.998504638671875, 8.2958984375, 8.593292236328125, 8.89068603515625, 9.188079833984375, 9.4854736328125, 9.782867431640625, 10.08026123046875, 10.377655029296875, 10.675048828125, 10.972442626953125, 11.26983642578125, 11.567230224609375, 11.8646240234375, 12.162017822265625, 12.45941162109375, 12.756805419921875, 13.05419921875, 13.351593017578125, 13.64898681640625, 13.946380615234375, 14.2437744140625, 14.541168212890625, 14.83856201171875, 15.135955810546875, 15.433349609375, 15.730743408203125, 16.02813720703125, 16.325531005859375, 16.6229248046875, 16.920318603515625, 17.21771240234375, 17.515106201171875, 17.8125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 47.0, 806.0, 125.0, 20.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.08822631835938, -120.81544494628906, -113.54267120361328, -106.26988983154297, -98.99710845947266, -91.72433471679688, -84.45155334472656, -77.17877197265625, -69.90599060058594, -62.63321304321289, -55.36043167114258, -48.08765411376953, -40.81487274169922, -33.54209518432617, -26.269317626953125, -18.996536254882812, -11.723762512207031, -4.45098352432251, 2.8217954635620117, 10.094573974609375, 17.367353439331055, 24.640132904052734, 31.91291046142578, 39.185691833496094, 46.45846939086914, 53.73124694824219, 61.0040283203125, 68.27680969238281, 75.5495834350586, 82.8223648071289, 90.09513854980469, 97.367919921875, 104.64070129394531, 111.91348266601562, 119.1862564086914, 126.45903778076172, 133.7318115234375, 141.0045928955078, 148.27737426757812, 155.55015563964844, 162.82293701171875, 170.09571838378906, 177.36849975585938, 184.64126586914062, 191.91404724121094, 199.18682861328125, 206.45960998535156, 213.73239135742188, 221.00515747070312, 228.27793884277344, 235.55072021484375, 242.823486328125, 250.0962677001953, 257.3690490722656, 264.641845703125, 271.91461181640625, 279.1874084472656, 286.4601745605469, 293.73297119140625, 301.0057373046875, 308.2785339355469, 315.5513000488281, 322.8240966796875, 330.09686279296875, 337.36962890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 10.0, 25.0, 65.0, 82.0, 124.0, 167.0, 158.0, 163.0, 94.0, 53.0, 37.0, 14.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.031982421875, -66.29344177246094, -64.55490112304688, -62.81636047363281, -61.07781982421875, -59.33927917480469, -57.600738525390625, -55.86219787597656, -54.1236572265625, -52.38511657714844, -50.646575927734375, -48.90803527832031, -47.16949462890625, -45.43095397949219, -43.692413330078125, -41.95387268066406, -40.215328216552734, -38.47678756713867, -36.73824691772461, -34.99970626831055, -33.261165618896484, -31.522624969482422, -29.784082412719727, -28.045541763305664, -26.3070011138916, -24.56846046447754, -22.829919815063477, -21.09137725830078, -19.35283660888672, -17.614295959472656, -15.875755310058594, -14.137214660644531, -12.398674011230469, -10.660133361816406, -8.921592712402344, -7.183051109313965, -5.444510459899902, -3.70596981048584, -1.967428207397461, -0.22888755798339844, 1.509653091430664, 3.2481939792633057, 4.986734867095947, 6.725275993347168, 8.46381664276123, 10.202357292175293, 11.940898895263672, 13.679439544677734, 15.417980194091797, 17.15652084350586, 18.895061492919922, 20.633602142333984, 22.372142791748047, 24.11068344116211, 25.849225997924805, 27.587766647338867, 29.32630729675293, 31.064847946166992, 32.80339050292969, 34.54193115234375, 36.28047180175781, 38.019012451171875, 39.75755310058594, 41.49609375, 43.23463439941406]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 11.0, 10.0, 6.0, 14.0, 14.0, 15.0, 18.0, 34.0, 41.0, 71.0, 97.0, 166.0, 289.0, 519.0, 992.0, 2838.0, 14084.0, 131316.0, 795798.0, 87279.0, 10484.0, 2306.0, 926.0, 489.0, 258.0, 144.0, 104.0, 50.0, 41.0, 30.0, 20.0, 16.0, 22.0, 5.0, 11.0, 5.0, 8.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.78125, -21.014892578125, -20.24853515625, -19.482177734375, -18.7158203125, -17.949462890625, -17.18310546875, -16.416748046875, -15.650390625, -14.884033203125, -14.11767578125, -13.351318359375, -12.5849609375, -11.818603515625, -11.05224609375, -10.285888671875, -9.51953125, -8.753173828125, -7.98681640625, -7.220458984375, -6.4541015625, -5.687744140625, -4.92138671875, -4.155029296875, -3.388671875, -2.622314453125, -1.85595703125, -1.089599609375, -0.3232421875, 0.443115234375, 1.20947265625, 1.975830078125, 2.7421875, 3.508544921875, 4.27490234375, 5.041259765625, 5.8076171875, 6.573974609375, 7.34033203125, 8.106689453125, 8.873046875, 9.639404296875, 10.40576171875, 11.172119140625, 11.9384765625, 12.704833984375, 13.47119140625, 14.237548828125, 15.00390625, 15.770263671875, 16.53662109375, 17.302978515625, 18.0693359375, 18.835693359375, 19.60205078125, 20.368408203125, 21.134765625, 21.901123046875, 22.66748046875, 23.433837890625, 24.2001953125, 24.966552734375, 25.73291015625, 26.499267578125, 27.265625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 12.0, 19.0, 17.0, 38.0, 59.0, 97.0, 125.0, 123.0, 134.0, 98.0, 82.0, 79.0, 51.0, 24.0, 20.0, 9.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.34625244140625, -1.2882080078125, -1.23016357421875, -1.172119140625, -1.11407470703125, -1.0560302734375, -0.99798583984375, -0.93994140625, -0.88189697265625, -0.8238525390625, -0.76580810546875, -0.707763671875, -0.64971923828125, -0.5916748046875, -0.53363037109375, -0.4755859375, -0.41754150390625, -0.3594970703125, -0.30145263671875, -0.243408203125, -0.18536376953125, -0.1273193359375, -0.06927490234375, -0.01123046875, 0.04681396484375, 0.1048583984375, 0.16290283203125, 0.220947265625, 0.27899169921875, 0.3370361328125, 0.39508056640625, 0.453125, 0.51116943359375, 0.5692138671875, 0.62725830078125, 0.685302734375, 0.74334716796875, 0.8013916015625, 0.85943603515625, 0.91748046875, 0.97552490234375, 1.0335693359375, 1.09161376953125, 1.149658203125, 1.20770263671875, 1.2657470703125, 1.32379150390625, 1.3818359375, 1.43988037109375, 1.4979248046875, 1.55596923828125, 1.614013671875, 1.67205810546875, 1.7301025390625, 1.78814697265625, 1.84619140625, 1.90423583984375, 1.9622802734375, 2.02032470703125, 2.078369140625, 2.13641357421875, 2.1944580078125, 2.25250244140625, 2.310546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 2.0, 16.0, 23.0, 19.0, 33.0, 53.0, 75.0, 135.0, 214.0, 379.0, 784.0, 1881.0, 6858.0, 39554.0, 435810.0, 504966.0, 46340.0, 7465.0, 2081.0, 819.0, 402.0, 219.0, 132.0, 92.0, 54.0, 25.0, 22.0, 16.0, 14.0, 11.0, 6.0, 10.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.9296875, -11.4884033203125, -11.047119140625, -10.6058349609375, -10.16455078125, -9.7232666015625, -9.281982421875, -8.8406982421875, -8.3994140625, -7.9581298828125, -7.516845703125, -7.0755615234375, -6.63427734375, -6.1929931640625, -5.751708984375, -5.3104248046875, -4.869140625, -4.4278564453125, -3.986572265625, -3.5452880859375, -3.10400390625, -2.6627197265625, -2.221435546875, -1.7801513671875, -1.3388671875, -0.8975830078125, -0.456298828125, -0.0150146484375, 0.42626953125, 0.8675537109375, 1.308837890625, 1.7501220703125, 2.19140625, 2.6326904296875, 3.073974609375, 3.5152587890625, 3.95654296875, 4.3978271484375, 4.839111328125, 5.2803955078125, 5.7216796875, 6.1629638671875, 6.604248046875, 7.0455322265625, 7.48681640625, 7.9281005859375, 8.369384765625, 8.8106689453125, 9.251953125, 9.6932373046875, 10.134521484375, 10.5758056640625, 11.01708984375, 11.4583740234375, 11.899658203125, 12.3409423828125, 12.7822265625, 13.2235107421875, 13.664794921875, 14.1060791015625, 14.54736328125, 14.9886474609375, 15.429931640625, 15.8712158203125, 16.3125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 2.0, 8.0, 6.0, 14.0, 7.0, 24.0, 21.0, 15.0, 24.0, 27.0, 38.0, 36.0, 40.0, 46.0, 41.0, 43.0, 61.0, 49.0, 50.0, 43.0, 62.0, 46.0, 45.0, 38.0, 35.0, 31.0, 27.0, 16.0, 15.0, 11.0, 13.0, 10.0, 8.0, 8.0, 10.0, 2.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6484375, -3.5146484375, -3.380859375, -3.2470703125, -3.11328125, -2.9794921875, -2.845703125, -2.7119140625, -2.578125, -2.4443359375, -2.310546875, -2.1767578125, -2.04296875, -1.9091796875, -1.775390625, -1.6416015625, -1.5078125, -1.3740234375, -1.240234375, -1.1064453125, -0.97265625, -0.8388671875, -0.705078125, -0.5712890625, -0.4375, -0.3037109375, -0.169921875, -0.0361328125, 0.09765625, 0.2314453125, 0.365234375, 0.4990234375, 0.6328125, 0.7666015625, 0.900390625, 1.0341796875, 1.16796875, 1.3017578125, 1.435546875, 1.5693359375, 1.703125, 1.8369140625, 1.970703125, 2.1044921875, 2.23828125, 2.3720703125, 2.505859375, 2.6396484375, 2.7734375, 2.9072265625, 3.041015625, 3.1748046875, 3.30859375, 3.4423828125, 3.576171875, 3.7099609375, 3.84375, 3.9775390625, 4.111328125, 4.2451171875, 4.37890625, 4.5126953125, 4.646484375, 4.7802734375, 4.9140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 18.0, 16.0, 25.0, 36.0, 57.0, 76.0, 134.0, 238.0, 436.0, 860.0, 2010.0, 5919.0, 24928.0, 297511.0, 662986.0, 40071.0, 8229.0, 2642.0, 1113.0, 507.0, 250.0, 171.0, 107.0, 50.0, 32.0, 29.0, 22.0, 14.0, 7.0, 11.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.484375, -11.115478515625, -10.74658203125, -10.377685546875, -10.0087890625, -9.639892578125, -9.27099609375, -8.902099609375, -8.533203125, -8.164306640625, -7.79541015625, -7.426513671875, -7.0576171875, -6.688720703125, -6.31982421875, -5.950927734375, -5.58203125, -5.213134765625, -4.84423828125, -4.475341796875, -4.1064453125, -3.737548828125, -3.36865234375, -2.999755859375, -2.630859375, -2.261962890625, -1.89306640625, -1.524169921875, -1.1552734375, -0.786376953125, -0.41748046875, -0.048583984375, 0.3203125, 0.689208984375, 1.05810546875, 1.427001953125, 1.7958984375, 2.164794921875, 2.53369140625, 2.902587890625, 3.271484375, 3.640380859375, 4.00927734375, 4.378173828125, 4.7470703125, 5.115966796875, 5.48486328125, 5.853759765625, 6.22265625, 6.591552734375, 6.96044921875, 7.329345703125, 7.6982421875, 8.067138671875, 8.43603515625, 8.804931640625, 9.173828125, 9.542724609375, 9.91162109375, 10.280517578125, 10.6494140625, 11.018310546875, 11.38720703125, 11.756103515625, 12.125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 5.0, 12.0, 8.0, 13.0, 10.0, 15.0, 28.0, 17.0, 37.0, 28.0, 55.0, 43.0, 67.0, 84.0, 101.0, 95.0, 77.0, 53.0, 52.0, 37.0, 25.0, 20.0, 18.0, 25.0, 10.0, 13.0, 8.0, 9.0, 12.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0016117095947265625, -0.001567944884300232, -0.0015241801738739014, -0.0014804154634475708, -0.0014366507530212402, -0.0013928860425949097, -0.001349121332168579, -0.0013053566217422485, -0.001261591911315918, -0.0012178272008895874, -0.0011740624904632568, -0.0011302977800369263, -0.0010865330696105957, -0.0010427683591842651, -0.0009990036487579346, -0.000955238938331604, -0.0009114742279052734, -0.0008677095174789429, -0.0008239448070526123, -0.0007801800966262817, -0.0007364153861999512, -0.0006926506757736206, -0.00064888596534729, -0.0006051212549209595, -0.0005613565444946289, -0.0005175918340682983, -0.0004738271236419678, -0.0004300624132156372, -0.00038629770278930664, -0.0003425329923629761, -0.0002987682819366455, -0.00025500357151031494, -0.00021123886108398438, -0.0001674741506576538, -0.00012370944023132324, -7.994472980499268e-05, -3.618001937866211e-05, 7.584691047668457e-06, 5.1349401473999023e-05, 9.511411190032959e-05, 0.00013887882232666016, 0.00018264353275299072, 0.0002264082431793213, 0.00027017295360565186, 0.0003139376640319824, 0.000357702374458313, 0.00040146708488464355, 0.0004452317953109741, 0.0004889965057373047, 0.0005327612161636353, 0.0005765259265899658, 0.0006202906370162964, 0.000664055347442627, 0.0007078200578689575, 0.0007515847682952881, 0.0007953494787216187, 0.0008391141891479492, 0.0008828788995742798, 0.0009266436100006104, 0.0009704083204269409, 0.0010141730308532715, 0.001057937741279602, 0.0011017024517059326, 0.0011454671621322632, 0.0011892318725585938]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 7.0, 6.0, 10.0, 20.0, 51.0, 92.0, 281.0, 1069.0, 10069.0, 966234.0, 67215.0, 2639.0, 517.0, 208.0, 69.0, 32.0, 16.0, 9.0, 10.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5234375, -14.5958251953125, -13.668212890625, -12.7406005859375, -11.81298828125, -10.8853759765625, -9.957763671875, -9.0301513671875, -8.1025390625, -7.1749267578125, -6.247314453125, -5.3197021484375, -4.39208984375, -3.4644775390625, -2.536865234375, -1.6092529296875, -0.681640625, 0.2459716796875, 1.173583984375, 2.1011962890625, 3.02880859375, 3.9564208984375, 4.884033203125, 5.8116455078125, 6.7392578125, 7.6668701171875, 8.594482421875, 9.5220947265625, 10.44970703125, 11.3773193359375, 12.304931640625, 13.2325439453125, 14.16015625, 15.0877685546875, 16.015380859375, 16.9429931640625, 17.87060546875, 18.7982177734375, 19.725830078125, 20.6534423828125, 21.5810546875, 22.5086669921875, 23.436279296875, 24.3638916015625, 25.29150390625, 26.2191162109375, 27.146728515625, 28.0743408203125, 29.001953125, 29.9295654296875, 30.857177734375, 31.7847900390625, 32.71240234375, 33.6400146484375, 34.567626953125, 35.4952392578125, 36.4228515625, 37.3504638671875, 38.278076171875, 39.2056884765625, 40.13330078125, 41.0609130859375, 41.988525390625, 42.9161376953125, 43.84375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 4.0, 3.0, 8.0, 17.0, 23.0, 58.0, 133.0, 260.0, 242.0, 132.0, 49.0, 30.0, 20.0, 9.0, 4.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.63922119140625, -4.3292236328125, -4.01922607421875, -3.709228515625, -3.39923095703125, -3.0892333984375, -2.77923583984375, -2.46923828125, -2.15924072265625, -1.8492431640625, -1.53924560546875, -1.229248046875, -0.91925048828125, -0.6092529296875, -0.29925537109375, 0.0107421875, 0.32073974609375, 0.6307373046875, 0.94073486328125, 1.250732421875, 1.56072998046875, 1.8707275390625, 2.18072509765625, 2.49072265625, 2.80072021484375, 3.1107177734375, 3.42071533203125, 3.730712890625, 4.04071044921875, 4.3507080078125, 4.66070556640625, 4.970703125, 5.28070068359375, 5.5906982421875, 5.90069580078125, 6.210693359375, 6.52069091796875, 6.8306884765625, 7.14068603515625, 7.45068359375, 7.76068115234375, 8.0706787109375, 8.38067626953125, 8.690673828125, 9.00067138671875, 9.3106689453125, 9.62066650390625, 9.9306640625, 10.24066162109375, 10.5506591796875, 10.86065673828125, 11.170654296875, 11.48065185546875, 11.7906494140625, 12.10064697265625, 12.41064453125, 12.72064208984375, 13.0306396484375, 13.34063720703125, 13.650634765625, 13.96063232421875, 14.2706298828125, 14.58062744140625, 14.890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 13.0, 28.0, 275.0, 644.0, 49.0, 6.0], "bins": [-530.3862915039062, -521.7348022460938, -513.0833129882812, -504.4318542480469, -495.7803955078125, -487.12890625, -478.4774169921875, -469.8259582519531, -461.1744689941406, -452.5229797363281, -443.87152099609375, -435.22003173828125, -426.5685729980469, -417.9170837402344, -409.265625, -400.6141357421875, -391.962646484375, -383.3111572265625, -374.6596984863281, -366.0082092285156, -357.35675048828125, -348.70526123046875, -340.05377197265625, -331.4023132324219, -322.7508544921875, -314.099365234375, -305.4479064941406, -296.7964172363281, -288.14495849609375, -279.49346923828125, -270.84197998046875, -262.1905212402344, -253.53904724121094, -244.8875732421875, -236.23609924316406, -227.58462524414062, -218.93313598632812, -210.2816619873047, -201.63018798828125, -192.9787139892578, -184.32723999023438, -175.67576599121094, -167.0242919921875, -158.372802734375, -149.72132873535156, -141.06985473632812, -132.4183807373047, -123.76690673828125, -115.11541748046875, -106.46394348144531, -97.81246185302734, -89.1609878540039, -80.50950622558594, -71.8580322265625, -63.20655822753906, -54.55508041381836, -45.90360641479492, -37.25212860107422, -28.60065269470215, -19.949176788330078, -11.297698974609375, -2.646221160888672, 6.005252838134766, 14.656730651855469, 23.308208465576172]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 6.0, 10.0, 13.0, 14.0, 30.0, 31.0, 52.0, 54.0, 53.0, 65.0, 59.0, 73.0, 71.0, 80.0, 64.0, 69.0, 52.0, 46.0, 50.0, 25.0, 27.0, 12.0, 16.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.724884033203125, -33.39811325073242, -32.07134246826172, -30.744569778442383, -29.417797088623047, -28.091026306152344, -26.76425552368164, -25.437484741210938, -24.1107120513916, -22.7839412689209, -21.457168579101562, -20.13039779663086, -18.803627014160156, -17.47685432434082, -16.150083541870117, -14.823311805725098, -13.496540069580078, -12.169768333435059, -10.842996597290039, -9.516225814819336, -8.189454078674316, -6.862682342529297, -5.5359110832214355, -4.209139823913574, -2.8823680877685547, -1.5555965900421143, -0.22882509231567383, 1.0979464054107666, 2.424717903137207, 3.7514896392822266, 5.078260898590088, 6.405032157897949, 7.731803894042969, 9.058575630187988, 10.385347366333008, 11.712118148803711, 13.03888988494873, 14.36566162109375, 15.692432403564453, 17.019203186035156, 18.345975875854492, 19.672746658325195, 20.99951934814453, 22.326290130615234, 23.653060913085938, 24.979833602905273, 26.306604385375977, 27.633377075195312, 28.960147857666016, 30.28691864013672, 31.613691329956055, 32.94046401977539, 34.267234802246094, 35.5940055847168, 36.9207763671875, 38.2475471496582, 39.574317932128906, 40.90108871459961, 42.22785949707031, 43.55463409423828, 44.881404876708984, 46.20817565917969, 47.53494644165039, 48.861717224121094, 50.18849182128906]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 6.0, 4.0, 7.0, 23.0, 19.0, 57.0, 96.0, 146.0, 406.0, 1503.0, 21429.0, 4090040.0, 76330.0, 3169.0, 617.0, 213.0, 113.0, 52.0, 25.0, 6.0, 6.0, 6.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -20.774658203125, -19.25244140625, -17.730224609375, -16.2080078125, -14.685791015625, -13.16357421875, -11.641357421875, -10.119140625, -8.596923828125, -7.07470703125, -5.552490234375, -4.0302734375, -2.508056640625, -0.98583984375, 0.536376953125, 2.05859375, 3.580810546875, 5.10302734375, 6.625244140625, 8.1474609375, 9.669677734375, 11.19189453125, 12.714111328125, 14.236328125, 15.758544921875, 17.28076171875, 18.802978515625, 20.3251953125, 21.847412109375, 23.36962890625, 24.891845703125, 26.4140625, 27.936279296875, 29.45849609375, 30.980712890625, 32.5029296875, 34.025146484375, 35.54736328125, 37.069580078125, 38.591796875, 40.114013671875, 41.63623046875, 43.158447265625, 44.6806640625, 46.202880859375, 47.72509765625, 49.247314453125, 50.76953125, 52.291748046875, 53.81396484375, 55.336181640625, 56.8583984375, 58.380615234375, 59.90283203125, 61.425048828125, 62.947265625, 64.469482421875, 65.99169921875, 67.513916015625, 69.0361328125, 70.558349609375, 72.08056640625, 73.602783203125, 75.125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 12.0, 18.0, 34.0, 48.0, 43.0, 83.0, 75.0, 79.0, 106.0, 99.0, 83.0, 89.0, 66.0, 55.0, 27.0, 29.0, 17.0, 10.0, 11.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96875, -0.917755126953125, -0.86676025390625, -0.815765380859375, -0.7647705078125, -0.713775634765625, -0.66278076171875, -0.611785888671875, -0.560791015625, -0.509796142578125, -0.45880126953125, -0.407806396484375, -0.3568115234375, -0.305816650390625, -0.25482177734375, -0.203826904296875, -0.15283203125, -0.101837158203125, -0.05084228515625, 0.000152587890625, 0.0511474609375, 0.102142333984375, 0.15313720703125, 0.204132080078125, 0.255126953125, 0.306121826171875, 0.35711669921875, 0.408111572265625, 0.4591064453125, 0.510101318359375, 0.56109619140625, 0.612091064453125, 0.6630859375, 0.714080810546875, 0.76507568359375, 0.816070556640625, 0.8670654296875, 0.918060302734375, 0.96905517578125, 1.020050048828125, 1.071044921875, 1.122039794921875, 1.17303466796875, 1.224029541015625, 1.2750244140625, 1.326019287109375, 1.37701416015625, 1.428009033203125, 1.47900390625, 1.529998779296875, 1.58099365234375, 1.631988525390625, 1.6829833984375, 1.733978271484375, 1.78497314453125, 1.835968017578125, 1.886962890625, 1.937957763671875, 1.98895263671875, 2.039947509765625, 2.0909423828125, 2.141937255859375, 2.19293212890625, 2.243927001953125, 2.294921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 5.0, 8.0, 10.0, 16.0, 31.0, 39.0, 68.0, 113.0, 274.0, 852.0, 6588.0, 4169898.0, 14252.0, 1301.0, 414.0, 181.0, 92.0, 46.0, 32.0, 26.0, 10.0, 13.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.15625, -48.24560546875, -45.3349609375, -42.42431640625, -39.513671875, -36.60302734375, -33.6923828125, -30.78173828125, -27.87109375, -24.96044921875, -22.0498046875, -19.13916015625, -16.228515625, -13.31787109375, -10.4072265625, -7.49658203125, -4.5859375, -1.67529296875, 1.2353515625, 4.14599609375, 7.056640625, 9.96728515625, 12.8779296875, 15.78857421875, 18.69921875, 21.60986328125, 24.5205078125, 27.43115234375, 30.341796875, 33.25244140625, 36.1630859375, 39.07373046875, 41.984375, 44.89501953125, 47.8056640625, 50.71630859375, 53.626953125, 56.53759765625, 59.4482421875, 62.35888671875, 65.26953125, 68.18017578125, 71.0908203125, 74.00146484375, 76.912109375, 79.82275390625, 82.7333984375, 85.64404296875, 88.5546875, 91.46533203125, 94.3759765625, 97.28662109375, 100.197265625, 103.10791015625, 106.0185546875, 108.92919921875, 111.83984375, 114.75048828125, 117.6611328125, 120.57177734375, 123.482421875, 126.39306640625, 129.3037109375, 132.21435546875, 135.125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 33.0, 46.0, 100.0, 310.0, 2480.0, 708.0, 189.0, 73.0, 55.0, 27.0, 14.0, 10.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.91363525390625, -3.7335205078125, -3.55340576171875, -3.373291015625, -3.19317626953125, -3.0130615234375, -2.83294677734375, -2.65283203125, -2.47271728515625, -2.2926025390625, -2.11248779296875, -1.932373046875, -1.75225830078125, -1.5721435546875, -1.39202880859375, -1.2119140625, -1.03179931640625, -0.8516845703125, -0.67156982421875, -0.491455078125, -0.31134033203125, -0.1312255859375, 0.04888916015625, 0.22900390625, 0.40911865234375, 0.5892333984375, 0.76934814453125, 0.949462890625, 1.12957763671875, 1.3096923828125, 1.48980712890625, 1.669921875, 1.85003662109375, 2.0301513671875, 2.21026611328125, 2.390380859375, 2.57049560546875, 2.7506103515625, 2.93072509765625, 3.11083984375, 3.29095458984375, 3.4710693359375, 3.65118408203125, 3.831298828125, 4.01141357421875, 4.1915283203125, 4.37164306640625, 4.5517578125, 4.73187255859375, 4.9119873046875, 5.09210205078125, 5.272216796875, 5.45233154296875, 5.6324462890625, 5.81256103515625, 5.99267578125, 6.17279052734375, 6.3529052734375, 6.53302001953125, 6.713134765625, 6.89324951171875, 7.0733642578125, 7.25347900390625, 7.43359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 32.0, 546.0, 381.0, 32.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.22462463378906, -112.91447448730469, -106.60432434082031, -100.29418182373047, -93.9840316772461, -87.67388153076172, -81.36373901367188, -75.0535888671875, -68.74343872070312, -62.43328857421875, -56.12314224243164, -49.81299591064453, -43.502845764160156, -37.19269561767578, -30.882549285888672, -24.572402954101562, -18.262252807617188, -11.952104568481445, -5.641956329345703, 0.6681919097900391, 6.978340148925781, 13.288488388061523, 19.598636627197266, 25.908782958984375, 32.21893310546875, 38.529083251953125, 44.839229583740234, 51.149375915527344, 57.45952606201172, 63.769676208496094, 70.07981872558594, 76.38996887207031, 82.70010375976562, 89.01025390625, 95.32040405273438, 101.63054656982422, 107.9406967163086, 114.25084686279297, 120.56098937988281, 126.87113952636719, 133.18128967285156, 139.49143981933594, 145.8015899658203, 152.1117401123047, 158.421875, 164.73202514648438, 171.04217529296875, 177.35232543945312, 183.6624755859375, 189.97262573242188, 196.28277587890625, 202.59292602539062, 208.903076171875, 215.2132110595703, 221.5233612060547, 227.83351135253906, 234.14366149902344, 240.4538116455078, 246.7639617919922, 253.07411193847656, 259.3842468261719, 265.69439697265625, 272.0045471191406, 278.314697265625, 284.6248474121094]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 10.0, 23.0, 26.0, 36.0, 32.0, 51.0, 69.0, 76.0, 94.0, 77.0, 93.0, 70.0, 69.0, 50.0, 46.0, 46.0, 36.0, 38.0, 17.0, 11.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.123966217041016, -24.456377029418945, -23.788787841796875, -23.121198654174805, -22.453609466552734, -21.786020278930664, -21.118431091308594, -20.450843811035156, -19.783252716064453, -19.115663528442383, -18.448074340820312, -17.780485153198242, -17.112895965576172, -16.4453067779541, -15.777718544006348, -15.110129356384277, -14.442541122436523, -13.774951934814453, -13.107362747192383, -12.439773559570312, -11.772184371948242, -11.104595184326172, -10.437006950378418, -9.769417762756348, -9.101828575134277, -8.434239387512207, -7.766650199890137, -7.099061489105225, -6.431472301483154, -5.763883113861084, -5.096294403076172, -4.428705215454102, -3.7611160278320312, -3.093526840209961, -2.4259378910064697, -1.7583489418029785, -1.0907597541809082, -0.4231705665588379, 0.24441814422607422, 0.9120073318481445, 1.5795965194702148, 2.247185707092285, 2.9147746562957764, 3.5823636054992676, 4.249952793121338, 4.917541980743408, 5.58513069152832, 6.252719879150391, 6.920309066772461, 7.587898254394531, 8.255487442016602, 8.923076629638672, 9.590665817260742, 10.258255004882812, 10.925843238830566, 11.593432426452637, 12.261021614074707, 12.928610801696777, 13.596199989318848, 14.263788223266602, 14.931377410888672, 15.598966598510742, 16.266555786132812, 16.934144973754883, 17.601734161376953]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 9.0, 17.0, 23.0, 28.0, 47.0, 48.0, 91.0, 88.0, 147.0, 207.0, 321.0, 544.0, 1166.0, 3209.0, 12109.0, 64343.0, 534160.0, 371791.0, 46071.0, 9091.0, 2589.0, 1038.0, 503.0, 296.0, 179.0, 131.0, 75.0, 55.0, 42.0, 29.0, 34.0, 19.0, 8.0, 11.0, 5.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 3.0], "bins": [-22.421875, -21.8455810546875, -21.269287109375, -20.6929931640625, -20.11669921875, -19.5404052734375, -18.964111328125, -18.3878173828125, -17.8115234375, -17.2352294921875, -16.658935546875, -16.0826416015625, -15.50634765625, -14.9300537109375, -14.353759765625, -13.7774658203125, -13.201171875, -12.6248779296875, -12.048583984375, -11.4722900390625, -10.89599609375, -10.3197021484375, -9.743408203125, -9.1671142578125, -8.5908203125, -8.0145263671875, -7.438232421875, -6.8619384765625, -6.28564453125, -5.7093505859375, -5.133056640625, -4.5567626953125, -3.98046875, -3.4041748046875, -2.827880859375, -2.2515869140625, -1.67529296875, -1.0989990234375, -0.522705078125, 0.0535888671875, 0.6298828125, 1.2061767578125, 1.782470703125, 2.3587646484375, 2.93505859375, 3.5113525390625, 4.087646484375, 4.6639404296875, 5.240234375, 5.8165283203125, 6.392822265625, 6.9691162109375, 7.54541015625, 8.1217041015625, 8.697998046875, 9.2742919921875, 9.8505859375, 10.4268798828125, 11.003173828125, 11.5794677734375, 12.15576171875, 12.7320556640625, 13.308349609375, 13.8846435546875, 14.4609375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 11.0, 26.0, 25.0, 51.0, 55.0, 82.0, 83.0, 94.0, 100.0, 92.0, 75.0, 69.0, 71.0, 51.0, 29.0, 30.0, 22.0, 5.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0390625, -1.974822998046875, -1.91058349609375, -1.846343994140625, -1.7821044921875, -1.717864990234375, -1.65362548828125, -1.589385986328125, -1.525146484375, -1.460906982421875, -1.39666748046875, -1.332427978515625, -1.2681884765625, -1.203948974609375, -1.13970947265625, -1.075469970703125, -1.01123046875, -0.946990966796875, -0.88275146484375, -0.818511962890625, -0.7542724609375, -0.690032958984375, -0.62579345703125, -0.561553955078125, -0.497314453125, -0.433074951171875, -0.36883544921875, -0.304595947265625, -0.2403564453125, -0.176116943359375, -0.11187744140625, -0.047637939453125, 0.0166015625, 0.080841064453125, 0.14508056640625, 0.209320068359375, 0.2735595703125, 0.337799072265625, 0.40203857421875, 0.466278076171875, 0.530517578125, 0.594757080078125, 0.65899658203125, 0.723236083984375, 0.7874755859375, 0.851715087890625, 0.91595458984375, 0.980194091796875, 1.04443359375, 1.108673095703125, 1.17291259765625, 1.237152099609375, 1.3013916015625, 1.365631103515625, 1.42987060546875, 1.494110107421875, 1.558349609375, 1.622589111328125, 1.68682861328125, 1.751068115234375, 1.8153076171875, 1.879547119140625, 1.94378662109375, 2.008026123046875, 2.072265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 2.0, 8.0, 5.0, 15.0, 17.0, 26.0, 33.0, 60.0, 66.0, 112.0, 185.0, 268.0, 482.0, 816.0, 1481.0, 3391.0, 8359.0, 27554.0, 140587.0, 602970.0, 206849.0, 36997.0, 10239.0, 3898.0, 1821.0, 905.0, 470.0, 314.0, 187.0, 133.0, 97.0, 56.0, 50.0, 25.0, 27.0, 16.0, 15.0, 3.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.53125, -12.1583251953125, -11.785400390625, -11.4124755859375, -11.03955078125, -10.6666259765625, -10.293701171875, -9.9207763671875, -9.5478515625, -9.1749267578125, -8.802001953125, -8.4290771484375, -8.05615234375, -7.6832275390625, -7.310302734375, -6.9373779296875, -6.564453125, -6.1915283203125, -5.818603515625, -5.4456787109375, -5.07275390625, -4.6998291015625, -4.326904296875, -3.9539794921875, -3.5810546875, -3.2081298828125, -2.835205078125, -2.4622802734375, -2.08935546875, -1.7164306640625, -1.343505859375, -0.9705810546875, -0.59765625, -0.2247314453125, 0.148193359375, 0.5211181640625, 0.89404296875, 1.2669677734375, 1.639892578125, 2.0128173828125, 2.3857421875, 2.7586669921875, 3.131591796875, 3.5045166015625, 3.87744140625, 4.2503662109375, 4.623291015625, 4.9962158203125, 5.369140625, 5.7420654296875, 6.114990234375, 6.4879150390625, 6.86083984375, 7.2337646484375, 7.606689453125, 7.9796142578125, 8.3525390625, 8.7254638671875, 9.098388671875, 9.4713134765625, 9.84423828125, 10.2171630859375, 10.590087890625, 10.9630126953125, 11.3359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 5.0, 5.0, 10.0, 12.0, 13.0, 9.0, 20.0, 25.0, 28.0, 33.0, 42.0, 43.0, 53.0, 51.0, 57.0, 47.0, 45.0, 59.0, 53.0, 51.0, 48.0, 46.0, 42.0, 36.0, 30.0, 22.0, 26.0, 18.0, 16.0, 10.0, 10.0, 14.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.41455078125, -6.2158203125, -6.01708984375, -5.818359375, -5.61962890625, -5.4208984375, -5.22216796875, -5.0234375, -4.82470703125, -4.6259765625, -4.42724609375, -4.228515625, -4.02978515625, -3.8310546875, -3.63232421875, -3.43359375, -3.23486328125, -3.0361328125, -2.83740234375, -2.638671875, -2.43994140625, -2.2412109375, -2.04248046875, -1.84375, -1.64501953125, -1.4462890625, -1.24755859375, -1.048828125, -0.85009765625, -0.6513671875, -0.45263671875, -0.25390625, -0.05517578125, 0.1435546875, 0.34228515625, 0.541015625, 0.73974609375, 0.9384765625, 1.13720703125, 1.3359375, 1.53466796875, 1.7333984375, 1.93212890625, 2.130859375, 2.32958984375, 2.5283203125, 2.72705078125, 2.92578125, 3.12451171875, 3.3232421875, 3.52197265625, 3.720703125, 3.91943359375, 4.1181640625, 4.31689453125, 4.515625, 4.71435546875, 4.9130859375, 5.11181640625, 5.310546875, 5.50927734375, 5.7080078125, 5.90673828125, 6.10546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 8.0, 11.0, 25.0, 21.0, 44.0, 55.0, 87.0, 146.0, 228.0, 329.0, 499.0, 836.0, 1364.0, 2392.0, 4237.0, 8618.0, 19274.0, 55400.0, 253636.0, 529885.0, 112489.0, 32430.0, 12853.0, 5939.0, 3093.0, 1808.0, 1001.0, 645.0, 425.0, 263.0, 170.0, 110.0, 85.0, 37.0, 32.0, 32.0, 13.0, 12.0, 8.0, 11.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.412353515625, -4.25048828125, -4.088623046875, -3.9267578125, -3.764892578125, -3.60302734375, -3.441162109375, -3.279296875, -3.117431640625, -2.95556640625, -2.793701171875, -2.6318359375, -2.469970703125, -2.30810546875, -2.146240234375, -1.984375, -1.822509765625, -1.66064453125, -1.498779296875, -1.3369140625, -1.175048828125, -1.01318359375, -0.851318359375, -0.689453125, -0.527587890625, -0.36572265625, -0.203857421875, -0.0419921875, 0.119873046875, 0.28173828125, 0.443603515625, 0.60546875, 0.767333984375, 0.92919921875, 1.091064453125, 1.2529296875, 1.414794921875, 1.57666015625, 1.738525390625, 1.900390625, 2.062255859375, 2.22412109375, 2.385986328125, 2.5478515625, 2.709716796875, 2.87158203125, 3.033447265625, 3.1953125, 3.357177734375, 3.51904296875, 3.680908203125, 3.8427734375, 4.004638671875, 4.16650390625, 4.328369140625, 4.490234375, 4.652099609375, 4.81396484375, 4.975830078125, 5.1376953125, 5.299560546875, 5.46142578125, 5.623291015625, 5.78515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 6.0, 8.0, 9.0, 19.0, 27.0, 35.0, 49.0, 80.0, 129.0, 210.0, 160.0, 95.0, 54.0, 44.0, 24.0, 18.0, 12.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017242431640625, -0.0016758739948272705, -0.001627504825592041, -0.0015791356563568115, -0.001530766487121582, -0.0014823973178863525, -0.001434028148651123, -0.0013856589794158936, -0.001337289810180664, -0.0012889206409454346, -0.001240551471710205, -0.0011921823024749756, -0.001143813133239746, -0.0010954439640045166, -0.0010470747947692871, -0.0009987056255340576, -0.0009503364562988281, -0.0009019672870635986, -0.0008535981178283691, -0.0008052289485931396, -0.0007568597793579102, -0.0007084906101226807, -0.0006601214408874512, -0.0006117522716522217, -0.0005633831024169922, -0.0005150139331817627, -0.0004666447639465332, -0.0004182755947113037, -0.0003699064254760742, -0.0003215372562408447, -0.00027316808700561523, -0.00022479891777038574, -0.00017642974853515625, -0.00012806057929992676, -7.969141006469727e-05, -3.1322240829467773e-05, 1.704692840576172e-05, 6.541609764099121e-05, 0.0001137852668762207, 0.0001621544361114502, 0.0002105236053466797, 0.0002588927745819092, 0.00030726194381713867, 0.00035563111305236816, 0.00040400028228759766, 0.00045236945152282715, 0.0005007386207580566, 0.0005491077899932861, 0.0005974769592285156, 0.0006458461284637451, 0.0006942152976989746, 0.0007425844669342041, 0.0007909536361694336, 0.0008393228054046631, 0.0008876919746398926, 0.0009360611438751221, 0.0009844303131103516, 0.001032799482345581, 0.0010811686515808105, 0.00112953782081604, 0.0011779069900512695, 0.001226276159286499, 0.0012746453285217285, 0.001323014497756958, 0.0013713836669921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 6.0, 11.0, 16.0, 21.0, 43.0, 51.0, 83.0, 116.0, 249.0, 407.0, 841.0, 1810.0, 4503.0, 13811.0, 59730.0, 618651.0, 296199.0, 36045.0, 9507.0, 3401.0, 1430.0, 691.0, 370.0, 197.0, 109.0, 90.0, 54.0, 32.0, 16.0, 22.0, 14.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -6.968505859375, -6.71826171875, -6.468017578125, -6.2177734375, -5.967529296875, -5.71728515625, -5.467041015625, -5.216796875, -4.966552734375, -4.71630859375, -4.466064453125, -4.2158203125, -3.965576171875, -3.71533203125, -3.465087890625, -3.21484375, -2.964599609375, -2.71435546875, -2.464111328125, -2.2138671875, -1.963623046875, -1.71337890625, -1.463134765625, -1.212890625, -0.962646484375, -0.71240234375, -0.462158203125, -0.2119140625, 0.038330078125, 0.28857421875, 0.538818359375, 0.7890625, 1.039306640625, 1.28955078125, 1.539794921875, 1.7900390625, 2.040283203125, 2.29052734375, 2.540771484375, 2.791015625, 3.041259765625, 3.29150390625, 3.541748046875, 3.7919921875, 4.042236328125, 4.29248046875, 4.542724609375, 4.79296875, 5.043212890625, 5.29345703125, 5.543701171875, 5.7939453125, 6.044189453125, 6.29443359375, 6.544677734375, 6.794921875, 7.045166015625, 7.29541015625, 7.545654296875, 7.7958984375, 8.046142578125, 8.29638671875, 8.546630859375, 8.796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 0.0, 3.0, 6.0, 12.0, 9.0, 10.0, 15.0, 15.0, 20.0, 34.0, 37.0, 51.0, 52.0, 67.0, 92.0, 95.0, 93.0, 78.0, 61.0, 43.0, 28.0, 33.0, 27.0, 23.0, 11.0, 15.0, 11.0, 11.0, 13.0, 9.0, 7.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.8760986328125, -2.771728515625, -2.6673583984375, -2.56298828125, -2.4586181640625, -2.354248046875, -2.2498779296875, -2.1455078125, -2.0411376953125, -1.936767578125, -1.8323974609375, -1.72802734375, -1.6236572265625, -1.519287109375, -1.4149169921875, -1.310546875, -1.2061767578125, -1.101806640625, -0.9974365234375, -0.89306640625, -0.7886962890625, -0.684326171875, -0.5799560546875, -0.4755859375, -0.3712158203125, -0.266845703125, -0.1624755859375, -0.05810546875, 0.0462646484375, 0.150634765625, 0.2550048828125, 0.359375, 0.4637451171875, 0.568115234375, 0.6724853515625, 0.77685546875, 0.8812255859375, 0.985595703125, 1.0899658203125, 1.1943359375, 1.2987060546875, 1.403076171875, 1.5074462890625, 1.61181640625, 1.7161865234375, 1.820556640625, 1.9249267578125, 2.029296875, 2.1336669921875, 2.238037109375, 2.3424072265625, 2.44677734375, 2.5511474609375, 2.655517578125, 2.7598876953125, 2.8642578125, 2.9686279296875, 3.072998046875, 3.1773681640625, 3.28173828125, 3.3861083984375, 3.490478515625, 3.5948486328125, 3.69921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 11.0, 26.0, 59.0, 170.0, 309.0, 274.0, 101.0, 31.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-176.0186767578125, -171.81431579589844, -167.60995483398438, -163.40557861328125, -159.2012176513672, -154.99685668945312, -150.79248046875, -146.58811950683594, -142.38375854492188, -138.1793975830078, -133.97503662109375, -129.77066040039062, -125.56629943847656, -121.3619384765625, -117.1575698852539, -112.95320129394531, -108.74884033203125, -104.54447937011719, -100.3401107788086, -96.1357421875, -91.93138122558594, -87.72702026367188, -83.52265167236328, -79.31828308105469, -75.11392211914062, -70.90956115722656, -66.70519256591797, -62.50082778930664, -58.29646301269531, -54.092098236083984, -49.887733459472656, -45.68336868286133, -41.47900390625, -37.27463912963867, -33.070274353027344, -28.865909576416016, -24.661544799804688, -20.45718002319336, -16.25281524658203, -12.048450469970703, -7.844085693359375, -3.639720916748047, 0.5646438598632812, 4.769008636474609, 8.973373413085938, 13.177738189697266, 17.382102966308594, 21.586467742919922, 25.79083251953125, 29.995197296142578, 34.199562072753906, 38.403926849365234, 42.60829162597656, 46.81265640258789, 51.01702117919922, 55.22138595581055, 59.425750732421875, 63.6301155090332, 67.83448028564453, 72.03884887695312, 76.24320983886719, 80.44757080078125, 84.65193939208984, 88.85630798339844, 93.0606689453125]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 6.0, 9.0, 8.0, 20.0, 15.0, 19.0, 30.0, 27.0, 41.0, 38.0, 45.0, 49.0, 56.0, 50.0, 61.0, 49.0, 51.0, 54.0, 56.0, 43.0, 55.0, 41.0, 37.0, 24.0, 25.0, 15.0, 15.0, 14.0, 8.0, 5.0, 12.0, 5.0, 5.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-44.92616653442383, -43.69116973876953, -42.456172943115234, -41.22117614746094, -39.986183166503906, -38.75118637084961, -37.51618957519531, -36.281192779541016, -35.04619598388672, -33.81119918823242, -32.576202392578125, -31.34120750427246, -30.106210708618164, -28.871213912963867, -27.636219024658203, -26.401222229003906, -25.16622543334961, -23.931228637695312, -22.696231842041016, -21.46123695373535, -20.226240158081055, -18.991243362426758, -17.756248474121094, -16.521251678466797, -15.2862548828125, -14.051258087158203, -12.816262245178223, -11.581266403198242, -10.346269607543945, -9.111272811889648, -7.876276969909668, -6.6412811279296875, -5.406284332275391, -4.171288013458252, -2.9362916946411133, -1.7012953758239746, -0.46629905700683594, 0.7686972618103027, 2.0036935806274414, 3.238689422607422, 4.473686218261719, 5.708682537078857, 6.943678855895996, 8.178674697875977, 9.413671493530273, 10.64866828918457, 11.88366413116455, 13.118659973144531, 14.353656768798828, 15.588653564453125, 16.823650360107422, 18.058645248413086, 19.293642044067383, 20.52863883972168, 21.763633728027344, 22.99863052368164, 24.233627319335938, 25.468624114990234, 26.70362091064453, 27.938615798950195, 29.173612594604492, 30.40860939025879, 31.643604278564453, 32.87860107421875, 34.11359786987305]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 8.0, 10.0, 15.0, 24.0, 22.0, 37.0, 53.0, 51.0, 101.0, 147.0, 237.0, 521.0, 1219.0, 3775.0, 15478.0, 222735.0, 3894467.0, 43733.0, 7721.0, 2263.0, 841.0, 375.0, 168.0, 112.0, 51.0, 35.0, 19.0, 15.0, 12.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.234375, -27.358642578125, -26.48291015625, -25.607177734375, -24.7314453125, -23.855712890625, -22.97998046875, -22.104248046875, -21.228515625, -20.352783203125, -19.47705078125, -18.601318359375, -17.7255859375, -16.849853515625, -15.97412109375, -15.098388671875, -14.22265625, -13.346923828125, -12.47119140625, -11.595458984375, -10.7197265625, -9.843994140625, -8.96826171875, -8.092529296875, -7.216796875, -6.341064453125, -5.46533203125, -4.589599609375, -3.7138671875, -2.838134765625, -1.96240234375, -1.086669921875, -0.2109375, 0.664794921875, 1.54052734375, 2.416259765625, 3.2919921875, 4.167724609375, 5.04345703125, 5.919189453125, 6.794921875, 7.670654296875, 8.54638671875, 9.422119140625, 10.2978515625, 11.173583984375, 12.04931640625, 12.925048828125, 13.80078125, 14.676513671875, 15.55224609375, 16.427978515625, 17.3037109375, 18.179443359375, 19.05517578125, 19.930908203125, 20.806640625, 21.682373046875, 22.55810546875, 23.433837890625, 24.3095703125, 25.185302734375, 26.06103515625, 26.936767578125, 27.8125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 9.0, 5.0, 14.0, 25.0, 22.0, 34.0, 48.0, 48.0, 61.0, 72.0, 86.0, 81.0, 78.0, 88.0, 61.0, 57.0, 49.0, 39.0, 36.0, 25.0, 21.0, 10.0, 10.0, 11.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8671875, -1.8070068359375, -1.746826171875, -1.6866455078125, -1.62646484375, -1.5662841796875, -1.506103515625, -1.4459228515625, -1.3857421875, -1.3255615234375, -1.265380859375, -1.2052001953125, -1.14501953125, -1.0848388671875, -1.024658203125, -0.9644775390625, -0.904296875, -0.8441162109375, -0.783935546875, -0.7237548828125, -0.66357421875, -0.6033935546875, -0.543212890625, -0.4830322265625, -0.4228515625, -0.3626708984375, -0.302490234375, -0.2423095703125, -0.18212890625, -0.1219482421875, -0.061767578125, -0.0015869140625, 0.05859375, 0.1187744140625, 0.178955078125, 0.2391357421875, 0.29931640625, 0.3594970703125, 0.419677734375, 0.4798583984375, 0.5400390625, 0.6002197265625, 0.660400390625, 0.7205810546875, 0.78076171875, 0.8409423828125, 0.901123046875, 0.9613037109375, 1.021484375, 1.0816650390625, 1.141845703125, 1.2020263671875, 1.26220703125, 1.3223876953125, 1.382568359375, 1.4427490234375, 1.5029296875, 1.5631103515625, 1.623291015625, 1.6834716796875, 1.74365234375, 1.8038330078125, 1.864013671875, 1.9241943359375, 1.984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 7.0, 15.0, 17.0, 36.0, 54.0, 84.0, 148.0, 335.0, 1494.0, 4166172.0, 24689.0, 812.0, 241.0, 92.0, 38.0, 28.0, 14.0, 9.0, 3.0, 0.0, 0.0, 1.0], "bins": [-241.0, -236.34814453125, -231.6962890625, -227.04443359375, -222.392578125, -217.74072265625, -213.0888671875, -208.43701171875, -203.78515625, -199.13330078125, -194.4814453125, -189.82958984375, -185.177734375, -180.52587890625, -175.8740234375, -171.22216796875, -166.5703125, -161.91845703125, -157.2666015625, -152.61474609375, -147.962890625, -143.31103515625, -138.6591796875, -134.00732421875, -129.35546875, -124.70361328125, -120.0517578125, -115.39990234375, -110.748046875, -106.09619140625, -101.4443359375, -96.79248046875, -92.140625, -87.48876953125, -82.8369140625, -78.18505859375, -73.533203125, -68.88134765625, -64.2294921875, -59.57763671875, -54.92578125, -50.27392578125, -45.6220703125, -40.97021484375, -36.318359375, -31.66650390625, -27.0146484375, -22.36279296875, -17.7109375, -13.05908203125, -8.4072265625, -3.75537109375, 0.896484375, 5.54833984375, 10.2001953125, 14.85205078125, 19.50390625, 24.15576171875, 28.8076171875, 33.45947265625, 38.111328125, 42.76318359375, 47.4150390625, 52.06689453125, 56.71875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 48.0, 1230.0, 2736.0, 56.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.125, -41.330810546875, -40.53662109375, -39.742431640625, -38.9482421875, -38.154052734375, -37.35986328125, -36.565673828125, -35.771484375, -34.977294921875, -34.18310546875, -33.388916015625, -32.5947265625, -31.800537109375, -31.00634765625, -30.212158203125, -29.41796875, -28.623779296875, -27.82958984375, -27.035400390625, -26.2412109375, -25.447021484375, -24.65283203125, -23.858642578125, -23.064453125, -22.270263671875, -21.47607421875, -20.681884765625, -19.8876953125, -19.093505859375, -18.29931640625, -17.505126953125, -16.7109375, -15.916748046875, -15.12255859375, -14.328369140625, -13.5341796875, -12.739990234375, -11.94580078125, -11.151611328125, -10.357421875, -9.563232421875, -8.76904296875, -7.974853515625, -7.1806640625, -6.386474609375, -5.59228515625, -4.798095703125, -4.00390625, -3.209716796875, -2.41552734375, -1.621337890625, -0.8271484375, -0.032958984375, 0.76123046875, 1.555419921875, 2.349609375, 3.143798828125, 3.93798828125, 4.732177734375, 5.5263671875, 6.320556640625, 7.11474609375, 7.908935546875, 8.703125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 9.0, 62.0, 738.0, 188.0, 10.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.77606201171875, -288.9605407714844, -283.14501953125, -277.3294677734375, -271.5139465332031, -265.69842529296875, -259.8829040527344, -254.06736755371094, -248.2518310546875, -242.43630981445312, -236.6207733154297, -230.8052520751953, -224.98971557617188, -219.1741943359375, -213.35865783691406, -207.5431365966797, -201.72760009765625, -195.91207885742188, -190.09654235839844, -184.28102111816406, -178.46548461914062, -172.64996337890625, -166.8344268798828, -161.01890563964844, -155.20338439941406, -149.3878631591797, -143.57232666015625, -137.75680541992188, -131.94126892089844, -126.12574005126953, -120.31021118164062, -114.49468994140625, -108.67914581298828, -102.86361694335938, -97.04808807373047, -91.23255920410156, -85.41703033447266, -79.60150146484375, -73.78598022460938, -67.97044372558594, -62.1549186706543, -56.33938980102539, -50.523860931396484, -44.708335876464844, -38.89280700683594, -33.07727813720703, -27.261749267578125, -21.44622039794922, -15.630691528320312, -9.815162658691406, -3.9996347427368164, 1.8158931732177734, 7.63142204284668, 13.446950912475586, 19.26247787475586, 25.078006744384766, 30.893535614013672, 36.70906448364258, 42.524593353271484, 48.340118408203125, 54.15564727783203, 59.97117614746094, 65.78670501708984, 71.60223388671875, 77.41776275634766]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 12.0, 27.0, 76.0, 151.0, 212.0, 224.0, 159.0, 86.0, 33.0, 12.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.20745849609375, -66.63844299316406, -64.06942749023438, -61.500404357910156, -58.93138885498047, -56.36237335205078, -53.79335403442383, -51.224334716796875, -48.65531921386719, -46.0863037109375, -43.51728439331055, -40.948265075683594, -38.379249572753906, -35.81023406982422, -33.241214752197266, -30.672197341918945, -28.103179931640625, -25.534162521362305, -22.965145111083984, -20.396127700805664, -17.827110290527344, -15.258092880249023, -12.689075469970703, -10.120058059692383, -7.5510406494140625, -4.982023239135742, -2.413005828857422, 0.15601158142089844, 2.7250289916992188, 5.294046401977539, 7.863063812255859, 10.43208122253418, 13.0010986328125, 15.57011604309082, 18.13913345336914, 20.70815086364746, 23.27716827392578, 25.8461856842041, 28.415203094482422, 30.984220504760742, 33.55323791503906, 36.12225341796875, 38.6912727355957, 41.260292053222656, 43.829307556152344, 46.39832305908203, 48.967342376708984, 51.53636169433594, 54.105377197265625, 56.67439270019531, 59.243412017822266, 61.81243133544922, 64.3814468383789, 66.9504623413086, 69.51948547363281, 72.0885009765625, 74.65751647949219, 77.22653198242188, 79.79554748535156, 82.36457061767578, 84.93358612060547, 87.50260162353516, 90.07162475585938, 92.64064025878906, 95.20965576171875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 7.0, 14.0, 12.0, 19.0, 22.0, 35.0, 61.0, 76.0, 101.0, 156.0, 263.0, 505.0, 914.0, 2139.0, 7103.0, 34353.0, 278838.0, 618923.0, 84458.0, 13946.0, 3633.0, 1327.0, 650.0, 321.0, 209.0, 132.0, 93.0, 59.0, 46.0, 41.0, 18.0, 23.0, 9.0, 9.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.447021484375, -17.81591796875, -17.184814453125, -16.5537109375, -15.922607421875, -15.29150390625, -14.660400390625, -14.029296875, -13.398193359375, -12.76708984375, -12.135986328125, -11.5048828125, -10.873779296875, -10.24267578125, -9.611572265625, -8.98046875, -8.349365234375, -7.71826171875, -7.087158203125, -6.4560546875, -5.824951171875, -5.19384765625, -4.562744140625, -3.931640625, -3.300537109375, -2.66943359375, -2.038330078125, -1.4072265625, -0.776123046875, -0.14501953125, 0.486083984375, 1.1171875, 1.748291015625, 2.37939453125, 3.010498046875, 3.6416015625, 4.272705078125, 4.90380859375, 5.534912109375, 6.166015625, 6.797119140625, 7.42822265625, 8.059326171875, 8.6904296875, 9.321533203125, 9.95263671875, 10.583740234375, 11.21484375, 11.845947265625, 12.47705078125, 13.108154296875, 13.7392578125, 14.370361328125, 15.00146484375, 15.632568359375, 16.263671875, 16.894775390625, 17.52587890625, 18.156982421875, 18.7880859375, 19.419189453125, 20.05029296875, 20.681396484375, 21.3125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 6.0, 12.0, 17.0, 19.0, 40.0, 31.0, 47.0, 37.0, 64.0, 57.0, 65.0, 76.0, 74.0, 71.0, 77.0, 65.0, 55.0, 39.0, 32.0, 24.0, 27.0, 18.0, 12.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5439453125, -1.4868927001953125, -1.429840087890625, -1.3727874755859375, -1.31573486328125, -1.2586822509765625, -1.201629638671875, -1.1445770263671875, -1.0875244140625, -1.0304718017578125, -0.973419189453125, -0.9163665771484375, -0.85931396484375, -0.8022613525390625, -0.745208740234375, -0.6881561279296875, -0.631103515625, -0.5740509033203125, -0.516998291015625, -0.4599456787109375, -0.40289306640625, -0.3458404541015625, -0.288787841796875, -0.2317352294921875, -0.1746826171875, -0.1176300048828125, -0.060577392578125, -0.0035247802734375, 0.05352783203125, 0.1105804443359375, 0.167633056640625, 0.2246856689453125, 0.28173828125, 0.3387908935546875, 0.395843505859375, 0.4528961181640625, 0.50994873046875, 0.5670013427734375, 0.624053955078125, 0.6811065673828125, 0.7381591796875, 0.7952117919921875, 0.852264404296875, 0.9093170166015625, 0.96636962890625, 1.0234222412109375, 1.080474853515625, 1.1375274658203125, 1.194580078125, 1.2516326904296875, 1.308685302734375, 1.3657379150390625, 1.42279052734375, 1.4798431396484375, 1.536895751953125, 1.5939483642578125, 1.6510009765625, 1.7080535888671875, 1.765106201171875, 1.8221588134765625, 1.87921142578125, 1.9362640380859375, 1.993316650390625, 2.0503692626953125, 2.107421875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 9.0, 10.0, 11.0, 16.0, 20.0, 35.0, 65.0, 85.0, 141.0, 186.0, 329.0, 605.0, 1061.0, 2259.0, 5280.0, 17093.0, 80529.0, 518474.0, 348444.0, 53212.0, 12335.0, 4225.0, 1837.0, 962.0, 489.0, 314.0, 183.0, 100.0, 65.0, 47.0, 31.0, 21.0, 19.0, 18.0, 11.0, 11.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.453125, -13.999755859375, -13.54638671875, -13.093017578125, -12.6396484375, -12.186279296875, -11.73291015625, -11.279541015625, -10.826171875, -10.372802734375, -9.91943359375, -9.466064453125, -9.0126953125, -8.559326171875, -8.10595703125, -7.652587890625, -7.19921875, -6.745849609375, -6.29248046875, -5.839111328125, -5.3857421875, -4.932373046875, -4.47900390625, -4.025634765625, -3.572265625, -3.118896484375, -2.66552734375, -2.212158203125, -1.7587890625, -1.305419921875, -0.85205078125, -0.398681640625, 0.0546875, 0.508056640625, 0.96142578125, 1.414794921875, 1.8681640625, 2.321533203125, 2.77490234375, 3.228271484375, 3.681640625, 4.135009765625, 4.58837890625, 5.041748046875, 5.4951171875, 5.948486328125, 6.40185546875, 6.855224609375, 7.30859375, 7.761962890625, 8.21533203125, 8.668701171875, 9.1220703125, 9.575439453125, 10.02880859375, 10.482177734375, 10.935546875, 11.388916015625, 11.84228515625, 12.295654296875, 12.7490234375, 13.202392578125, 13.65576171875, 14.109130859375, 14.5625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 9.0, 3.0, 7.0, 9.0, 12.0, 14.0, 20.0, 14.0, 27.0, 20.0, 30.0, 30.0, 35.0, 35.0, 33.0, 30.0, 46.0, 40.0, 40.0, 39.0, 43.0, 50.0, 27.0, 46.0, 41.0, 34.0, 38.0, 41.0, 26.0, 27.0, 26.0, 16.0, 21.0, 17.0, 8.0, 13.0, 6.0, 8.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.40234375, -6.2025146484375, -6.002685546875, -5.8028564453125, -5.60302734375, -5.4031982421875, -5.203369140625, -5.0035400390625, -4.8037109375, -4.6038818359375, -4.404052734375, -4.2042236328125, -4.00439453125, -3.8045654296875, -3.604736328125, -3.4049072265625, -3.205078125, -3.0052490234375, -2.805419921875, -2.6055908203125, -2.40576171875, -2.2059326171875, -2.006103515625, -1.8062744140625, -1.6064453125, -1.4066162109375, -1.206787109375, -1.0069580078125, -0.80712890625, -0.6072998046875, -0.407470703125, -0.2076416015625, -0.0078125, 0.1920166015625, 0.391845703125, 0.5916748046875, 0.79150390625, 0.9913330078125, 1.191162109375, 1.3909912109375, 1.5908203125, 1.7906494140625, 1.990478515625, 2.1903076171875, 2.39013671875, 2.5899658203125, 2.789794921875, 2.9896240234375, 3.189453125, 3.3892822265625, 3.589111328125, 3.7889404296875, 3.98876953125, 4.1885986328125, 4.388427734375, 4.5882568359375, 4.7880859375, 4.9879150390625, 5.187744140625, 5.3875732421875, 5.58740234375, 5.7872314453125, 5.987060546875, 6.1868896484375, 6.38671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 16.0, 18.0, 17.0, 23.0, 41.0, 51.0, 58.0, 76.0, 116.0, 158.0, 200.0, 316.0, 362.0, 509.0, 732.0, 1172.0, 1611.0, 2501.0, 4049.0, 6702.0, 12761.0, 27041.0, 73597.0, 352058.0, 417566.0, 83327.0, 29798.0, 13822.0, 7371.0, 4325.0, 2571.0, 1692.0, 1085.0, 798.0, 526.0, 361.0, 291.0, 201.0, 154.0, 101.0, 93.0, 58.0, 48.0, 50.0, 31.0, 26.0, 10.0, 17.0, 6.0, 5.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0], "bins": [-5.0, -4.8389892578125, -4.677978515625, -4.5169677734375, -4.35595703125, -4.1949462890625, -4.033935546875, -3.8729248046875, -3.7119140625, -3.5509033203125, -3.389892578125, -3.2288818359375, -3.06787109375, -2.9068603515625, -2.745849609375, -2.5848388671875, -2.423828125, -2.2628173828125, -2.101806640625, -1.9407958984375, -1.77978515625, -1.6187744140625, -1.457763671875, -1.2967529296875, -1.1357421875, -0.9747314453125, -0.813720703125, -0.6527099609375, -0.49169921875, -0.3306884765625, -0.169677734375, -0.0086669921875, 0.15234375, 0.3133544921875, 0.474365234375, 0.6353759765625, 0.79638671875, 0.9573974609375, 1.118408203125, 1.2794189453125, 1.4404296875, 1.6014404296875, 1.762451171875, 1.9234619140625, 2.08447265625, 2.2454833984375, 2.406494140625, 2.5675048828125, 2.728515625, 2.8895263671875, 3.050537109375, 3.2115478515625, 3.37255859375, 3.5335693359375, 3.694580078125, 3.8555908203125, 4.0166015625, 4.1776123046875, 4.338623046875, 4.4996337890625, 4.66064453125, 4.8216552734375, 4.982666015625, 5.1436767578125, 5.3046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 6.0, 9.0, 5.0, 10.0, 10.0, 20.0, 33.0, 40.0, 52.0, 94.0, 151.0, 181.0, 138.0, 79.0, 52.0, 31.0, 19.0, 18.0, 10.0, 7.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0018453598022460938, -0.0017995089292526245, -0.0017536580562591553, -0.001707807183265686, -0.0016619563102722168, -0.0016161054372787476, -0.0015702545642852783, -0.001524403691291809, -0.0014785528182983398, -0.0014327019453048706, -0.0013868510723114014, -0.0013410001993179321, -0.0012951493263244629, -0.0012492984533309937, -0.0012034475803375244, -0.0011575967073440552, -0.001111745834350586, -0.0010658949613571167, -0.0010200440883636475, -0.0009741932153701782, -0.000928342342376709, -0.0008824914693832397, -0.0008366405963897705, -0.0007907897233963013, -0.000744938850402832, -0.0006990879774093628, -0.0006532371044158936, -0.0006073862314224243, -0.0005615353584289551, -0.0005156844854354858, -0.0004698336124420166, -0.00042398273944854736, -0.0003781318664550781, -0.0003322809934616089, -0.00028643012046813965, -0.0002405792474746704, -0.00019472837448120117, -0.00014887750148773193, -0.0001030266284942627, -5.717575550079346e-05, -1.1324882507324219e-05, 3.452599048614502e-05, 8.037686347961426e-05, 0.0001262277364730835, 0.00017207860946655273, 0.00021792948246002197, 0.0002637803554534912, 0.00030963122844696045, 0.0003554821014404297, 0.0004013329744338989, 0.00044718384742736816, 0.0004930347204208374, 0.0005388855934143066, 0.0005847364664077759, 0.0006305873394012451, 0.0006764382123947144, 0.0007222890853881836, 0.0007681399583816528, 0.0008139908313751221, 0.0008598417043685913, 0.0009056925773620605, 0.0009515434503555298, 0.000997394323348999, 0.0010432451963424683, 0.0010890960693359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 13.0, 17.0, 18.0, 27.0, 50.0, 77.0, 95.0, 194.0, 311.0, 646.0, 1287.0, 2978.0, 8176.0, 33121.0, 463735.0, 489431.0, 34242.0, 8374.0, 2928.0, 1270.0, 648.0, 382.0, 192.0, 108.0, 81.0, 42.0, 31.0, 14.0, 14.0, 12.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.5379638671875, -10.208740234375, -9.8795166015625, -9.55029296875, -9.2210693359375, -8.891845703125, -8.5626220703125, -8.2333984375, -7.9041748046875, -7.574951171875, -7.2457275390625, -6.91650390625, -6.5872802734375, -6.258056640625, -5.9288330078125, -5.599609375, -5.2703857421875, -4.941162109375, -4.6119384765625, -4.28271484375, -3.9534912109375, -3.624267578125, -3.2950439453125, -2.9658203125, -2.6365966796875, -2.307373046875, -1.9781494140625, -1.64892578125, -1.3197021484375, -0.990478515625, -0.6612548828125, -0.33203125, -0.0028076171875, 0.326416015625, 0.6556396484375, 0.98486328125, 1.3140869140625, 1.643310546875, 1.9725341796875, 2.3017578125, 2.6309814453125, 2.960205078125, 3.2894287109375, 3.61865234375, 3.9478759765625, 4.277099609375, 4.6063232421875, 4.935546875, 5.2647705078125, 5.593994140625, 5.9232177734375, 6.25244140625, 6.5816650390625, 6.910888671875, 7.2401123046875, 7.5693359375, 7.8985595703125, 8.227783203125, 8.5570068359375, 8.88623046875, 9.2154541015625, 9.544677734375, 9.8739013671875, 10.203125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 5.0, 5.0, 4.0, 22.0, 14.0, 24.0, 21.0, 19.0, 32.0, 42.0, 55.0, 67.0, 81.0, 89.0, 82.0, 95.0, 76.0, 56.0, 39.0, 35.0, 22.0, 28.0, 13.0, 15.0, 14.0, 3.0, 9.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55078125, -3.436309814453125, -3.32183837890625, -3.207366943359375, -3.0928955078125, -2.978424072265625, -2.86395263671875, -2.749481201171875, -2.635009765625, -2.520538330078125, -2.40606689453125, -2.291595458984375, -2.1771240234375, -2.062652587890625, -1.94818115234375, -1.833709716796875, -1.71923828125, -1.604766845703125, -1.49029541015625, -1.375823974609375, -1.2613525390625, -1.146881103515625, -1.03240966796875, -0.917938232421875, -0.803466796875, -0.688995361328125, -0.57452392578125, -0.460052490234375, -0.3455810546875, -0.231109619140625, -0.11663818359375, -0.002166748046875, 0.1123046875, 0.226776123046875, 0.34124755859375, 0.455718994140625, 0.5701904296875, 0.684661865234375, 0.79913330078125, 0.913604736328125, 1.028076171875, 1.142547607421875, 1.25701904296875, 1.371490478515625, 1.4859619140625, 1.600433349609375, 1.71490478515625, 1.829376220703125, 1.94384765625, 2.058319091796875, 2.17279052734375, 2.287261962890625, 2.4017333984375, 2.516204833984375, 2.63067626953125, 2.745147705078125, 2.859619140625, 2.974090576171875, 3.08856201171875, 3.203033447265625, 3.3175048828125, 3.431976318359375, 3.54644775390625, 3.660919189453125, 3.775390625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 9.0, 8.0, 38.0, 131.0, 345.0, 303.0, 114.0, 37.0, 12.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.35427856445312, -244.37216186523438, -238.39004516601562, -232.40792846679688, -226.42581176757812, -220.44369506835938, -214.46157836914062, -208.47946166992188, -202.49734497070312, -196.51522827148438, -190.53311157226562, -184.55099487304688, -178.56887817382812, -172.58676147460938, -166.60464477539062, -160.62252807617188, -154.64041137695312, -148.65829467773438, -142.67617797851562, -136.69406127929688, -130.71194458007812, -124.72982788085938, -118.74771118164062, -112.76559448242188, -106.78346252441406, -100.80134582519531, -94.81922912597656, -88.83711242675781, -82.85499572753906, -76.87287902832031, -70.89076232910156, -64.90864562988281, -58.92652893066406, -52.94441223144531, -46.96229553222656, -40.98017883300781, -34.99806213378906, -29.01594352722168, -23.033824920654297, -17.051708221435547, -11.069591522216797, -5.087474346160889, 0.8946428298950195, 6.876760482788086, 12.858877182006836, 18.840993881225586, 24.82311248779297, 30.80522918701172, 36.78734588623047, 42.76946258544922, 48.75157928466797, 54.73369598388672, 60.71581268310547, 66.69792938232422, 72.6800537109375, 78.66217041015625, 84.644287109375, 90.62640380859375, 96.6085205078125, 102.59063720703125, 108.57275390625, 114.55487060546875, 120.5369873046875, 126.51910400390625, 132.501220703125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 9.0, 4.0, 14.0, 19.0, 15.0, 21.0, 33.0, 31.0, 42.0, 51.0, 38.0, 46.0, 50.0, 61.0, 62.0, 52.0, 63.0, 60.0, 49.0, 51.0, 40.0, 42.0, 28.0, 31.0, 15.0, 20.0, 9.0, 10.0, 7.0, 8.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.66419219970703, -54.155635833740234, -52.64707946777344, -51.13852310180664, -49.629966735839844, -48.12140655517578, -46.612850189208984, -45.10429382324219, -43.59573745727539, -42.087181091308594, -40.5786247253418, -39.070068359375, -37.56150817871094, -36.05295181274414, -34.544395446777344, -33.03583908081055, -31.52728271484375, -30.018726348876953, -28.510169982910156, -27.001611709594727, -25.49305534362793, -23.984498977661133, -22.475940704345703, -20.967384338378906, -19.45882797241211, -17.950271606445312, -16.441715240478516, -14.933156967163086, -13.424600601196289, -11.916044235229492, -10.407486915588379, -8.898929595947266, -7.390369415283203, -5.881812572479248, -4.373255729675293, -2.864698886871338, -1.3561420440673828, 0.15241479873657227, 1.6609716415405273, 3.1695289611816406, 4.6780853271484375, 6.186642169952393, 7.695199012756348, 9.203756332397461, 10.712312698364258, 12.220869064331055, 13.729426383972168, 15.237983703613281, 16.746540069580078, 18.255096435546875, 19.763652801513672, 21.2722110748291, 22.7807674407959, 24.289323806762695, 25.797882080078125, 27.306438446044922, 28.81499481201172, 30.323551177978516, 31.832107543945312, 33.34066390991211, 34.849220275878906, 36.35778045654297, 37.866336822509766, 39.37489318847656, 40.88344955444336]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 12.0, 3.0, 3.0, 5.0, 11.0, 7.0, 8.0, 6.0, 12.0, 13.0, 10.0, 20.0, 15.0, 31.0, 44.0, 56.0, 68.0, 111.0, 135.0, 232.0, 349.0, 599.0, 1152.0, 3025.0, 10181.0, 62387.0, 3856397.0, 227975.0, 22247.0, 5349.0, 2031.0, 851.0, 413.0, 200.0, 111.0, 75.0, 46.0, 26.0, 18.0, 13.0, 8.0, 8.0, 8.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-42.25, -41.186279296875, -40.12255859375, -39.058837890625, -37.9951171875, -36.931396484375, -35.86767578125, -34.803955078125, -33.740234375, -32.676513671875, -31.61279296875, -30.549072265625, -29.4853515625, -28.421630859375, -27.35791015625, -26.294189453125, -25.23046875, -24.166748046875, -23.10302734375, -22.039306640625, -20.9755859375, -19.911865234375, -18.84814453125, -17.784423828125, -16.720703125, -15.656982421875, -14.59326171875, -13.529541015625, -12.4658203125, -11.402099609375, -10.33837890625, -9.274658203125, -8.2109375, -7.147216796875, -6.08349609375, -5.019775390625, -3.9560546875, -2.892333984375, -1.82861328125, -0.764892578125, 0.298828125, 1.362548828125, 2.42626953125, 3.489990234375, 4.5537109375, 5.617431640625, 6.68115234375, 7.744873046875, 8.80859375, 9.872314453125, 10.93603515625, 11.999755859375, 13.0634765625, 14.127197265625, 15.19091796875, 16.254638671875, 17.318359375, 18.382080078125, 19.44580078125, 20.509521484375, 21.5732421875, 22.636962890625, 23.70068359375, 24.764404296875, 25.828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 8.0, 6.0, 13.0, 13.0, 14.0, 40.0, 31.0, 39.0, 54.0, 55.0, 57.0, 61.0, 65.0, 61.0, 72.0, 70.0, 61.0, 60.0, 48.0, 35.0, 36.0, 36.0, 10.0, 18.0, 15.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.630859375, -1.57177734375, -1.5126953125, -1.45361328125, -1.39453125, -1.33544921875, -1.2763671875, -1.21728515625, -1.158203125, -1.09912109375, -1.0400390625, -0.98095703125, -0.921875, -0.86279296875, -0.8037109375, -0.74462890625, -0.685546875, -0.62646484375, -0.5673828125, -0.50830078125, -0.44921875, -0.39013671875, -0.3310546875, -0.27197265625, -0.212890625, -0.15380859375, -0.0947265625, -0.03564453125, 0.0234375, 0.08251953125, 0.1416015625, 0.20068359375, 0.259765625, 0.31884765625, 0.3779296875, 0.43701171875, 0.49609375, 0.55517578125, 0.6142578125, 0.67333984375, 0.732421875, 0.79150390625, 0.8505859375, 0.90966796875, 0.96875, 1.02783203125, 1.0869140625, 1.14599609375, 1.205078125, 1.26416015625, 1.3232421875, 1.38232421875, 1.44140625, 1.50048828125, 1.5595703125, 1.61865234375, 1.677734375, 1.73681640625, 1.7958984375, 1.85498046875, 1.9140625, 1.97314453125, 2.0322265625, 2.09130859375, 2.150390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 5.0, 5.0, 7.0, 13.0, 15.0, 18.0, 25.0, 43.0, 59.0, 88.0, 138.0, 237.0, 342.0, 658.0, 1241.0, 2697.0, 7324.0, 27449.0, 338428.0, 3741093.0, 55935.0, 11476.0, 3686.0, 1593.0, 748.0, 371.0, 202.0, 130.0, 82.0, 53.0, 24.0, 33.0, 23.0, 12.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.671875, -27.722412109375, -26.77294921875, -25.823486328125, -24.8740234375, -23.924560546875, -22.97509765625, -22.025634765625, -21.076171875, -20.126708984375, -19.17724609375, -18.227783203125, -17.2783203125, -16.328857421875, -15.37939453125, -14.429931640625, -13.48046875, -12.531005859375, -11.58154296875, -10.632080078125, -9.6826171875, -8.733154296875, -7.78369140625, -6.834228515625, -5.884765625, -4.935302734375, -3.98583984375, -3.036376953125, -2.0869140625, -1.137451171875, -0.18798828125, 0.761474609375, 1.7109375, 2.660400390625, 3.60986328125, 4.559326171875, 5.5087890625, 6.458251953125, 7.40771484375, 8.357177734375, 9.306640625, 10.256103515625, 11.20556640625, 12.155029296875, 13.1044921875, 14.053955078125, 15.00341796875, 15.952880859375, 16.90234375, 17.851806640625, 18.80126953125, 19.750732421875, 20.7001953125, 21.649658203125, 22.59912109375, 23.548583984375, 24.498046875, 25.447509765625, 26.39697265625, 27.346435546875, 28.2958984375, 29.245361328125, 30.19482421875, 31.144287109375, 32.09375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 12.0, 4.0, 11.0, 9.0, 22.0, 25.0, 51.0, 56.0, 89.0, 151.0, 414.0, 1886.0, 755.0, 231.0, 100.0, 75.0, 49.0, 31.0, 16.0, 22.0, 13.0, 7.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.130126953125, -7.90869140625, -7.687255859375, -7.4658203125, -7.244384765625, -7.02294921875, -6.801513671875, -6.580078125, -6.358642578125, -6.13720703125, -5.915771484375, -5.6943359375, -5.472900390625, -5.25146484375, -5.030029296875, -4.80859375, -4.587158203125, -4.36572265625, -4.144287109375, -3.9228515625, -3.701416015625, -3.47998046875, -3.258544921875, -3.037109375, -2.815673828125, -2.59423828125, -2.372802734375, -2.1513671875, -1.929931640625, -1.70849609375, -1.487060546875, -1.265625, -1.044189453125, -0.82275390625, -0.601318359375, -0.3798828125, -0.158447265625, 0.06298828125, 0.284423828125, 0.505859375, 0.727294921875, 0.94873046875, 1.170166015625, 1.3916015625, 1.613037109375, 1.83447265625, 2.055908203125, 2.27734375, 2.498779296875, 2.72021484375, 2.941650390625, 3.1630859375, 3.384521484375, 3.60595703125, 3.827392578125, 4.048828125, 4.270263671875, 4.49169921875, 4.713134765625, 4.9345703125, 5.156005859375, 5.37744140625, 5.598876953125, 5.8203125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 13.0, 17.0, 40.0, 79.0, 177.0, 283.0, 172.0, 91.0, 51.0, 34.0, 13.0, 7.0, 9.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-114.51121520996094, -111.74796295166016, -108.98471069335938, -106.2214584350586, -103.45820617675781, -100.69495391845703, -97.93170166015625, -95.16844177246094, -92.40519714355469, -89.6419448852539, -86.87869262695312, -84.11544036865234, -81.35218811035156, -78.58893585205078, -75.82568359375, -73.06242370605469, -70.2991714477539, -67.53591918945312, -64.77266693115234, -62.00941467285156, -59.24616241455078, -56.48291015625, -53.71965408325195, -50.95640182495117, -48.19314956665039, -45.42989730834961, -42.66664505004883, -39.90338897705078, -37.14013671875, -34.37688446044922, -31.613632202148438, -28.850379943847656, -26.08712387084961, -23.323871612548828, -20.560619354248047, -17.797365188598633, -15.034112930297852, -12.27086067199707, -9.507606506347656, -6.744354248046875, -3.9811019897460938, -1.2178492546081543, 1.5454034805297852, 4.308656692504883, 7.071908950805664, 9.835161209106445, 12.59841537475586, 15.36166763305664, 18.124919891357422, 20.888172149658203, 23.651424407958984, 26.4146785736084, 29.17793083190918, 31.94118309020996, 34.704437255859375, 37.467689514160156, 40.23094177246094, 42.99419403076172, 45.7574462890625, 48.52069854736328, 51.28395080566406, 54.047203063964844, 56.81045913696289, 59.57371139526367, 62.33696365356445]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 16.0, 16.0, 22.0, 41.0, 79.0, 79.0, 99.0, 125.0, 118.0, 108.0, 103.0, 73.0, 53.0, 32.0, 24.0, 6.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.98432159423828, -74.82158660888672, -72.65884399414062, -70.49610900878906, -68.33336639404297, -66.1706314086914, -64.00788879394531, -61.84515380859375, -59.68241500854492, -57.519676208496094, -55.356937408447266, -53.19419860839844, -51.031463623046875, -48.86872100830078, -46.70598602294922, -44.54324722290039, -42.38050842285156, -40.217769622802734, -38.055030822753906, -35.89229202270508, -33.72955322265625, -31.566816329956055, -29.40407943725586, -27.24134063720703, -25.078601837158203, -22.915863037109375, -20.753124237060547, -18.59038734436035, -16.427648544311523, -14.264909744262695, -12.102171897888184, -9.939434051513672, -7.776695251464844, -5.613956928253174, -3.451218605041504, -1.288480281829834, 0.8742580413818359, 3.036996841430664, 5.199734687805176, 7.3624725341796875, 9.525211334228516, 11.687950134277344, 13.850687980651855, 16.013425827026367, 18.176164627075195, 20.338903427124023, 22.50164031982422, 24.664379119873047, 26.827117919921875, 28.989856719970703, 31.15259552001953, 33.31533432006836, 35.47807312011719, 37.64080810546875, 39.80354690551758, 41.966285705566406, 44.129024505615234, 46.29176330566406, 48.45450210571289, 50.61724090576172, 52.77997589111328, 54.942718505859375, 57.10545349121094, 59.268192291259766, 61.430931091308594]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 0.0, 4.0, 7.0, 7.0, 7.0, 9.0, 18.0, 28.0, 50.0, 62.0, 97.0, 168.0, 412.0, 964.0, 3658.0, 30359.0, 762968.0, 234945.0, 11327.0, 2042.0, 656.0, 308.0, 158.0, 92.0, 50.0, 47.0, 22.0, 26.0, 20.0, 7.0, 10.0, 7.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-49.65625, -48.40869140625, -47.1611328125, -45.91357421875, -44.666015625, -43.41845703125, -42.1708984375, -40.92333984375, -39.67578125, -38.42822265625, -37.1806640625, -35.93310546875, -34.685546875, -33.43798828125, -32.1904296875, -30.94287109375, -29.6953125, -28.44775390625, -27.2001953125, -25.95263671875, -24.705078125, -23.45751953125, -22.2099609375, -20.96240234375, -19.71484375, -18.46728515625, -17.2197265625, -15.97216796875, -14.724609375, -13.47705078125, -12.2294921875, -10.98193359375, -9.734375, -8.48681640625, -7.2392578125, -5.99169921875, -4.744140625, -3.49658203125, -2.2490234375, -1.00146484375, 0.24609375, 1.49365234375, 2.7412109375, 3.98876953125, 5.236328125, 6.48388671875, 7.7314453125, 8.97900390625, 10.2265625, 11.47412109375, 12.7216796875, 13.96923828125, 15.216796875, 16.46435546875, 17.7119140625, 18.95947265625, 20.20703125, 21.45458984375, 22.7021484375, 23.94970703125, 25.197265625, 26.44482421875, 27.6923828125, 28.93994140625, 30.1875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 13.0, 15.0, 26.0, 34.0, 49.0, 61.0, 81.0, 83.0, 101.0, 102.0, 93.0, 107.0, 77.0, 56.0, 33.0, 26.0, 18.0, 13.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1875, -3.088470458984375, -2.98944091796875, -2.890411376953125, -2.7913818359375, -2.692352294921875, -2.59332275390625, -2.494293212890625, -2.395263671875, -2.296234130859375, -2.19720458984375, -2.098175048828125, -1.9991455078125, -1.900115966796875, -1.80108642578125, -1.702056884765625, -1.60302734375, -1.503997802734375, -1.40496826171875, -1.305938720703125, -1.2069091796875, -1.107879638671875, -1.00885009765625, -0.909820556640625, -0.810791015625, -0.711761474609375, -0.61273193359375, -0.513702392578125, -0.4146728515625, -0.315643310546875, -0.21661376953125, -0.117584228515625, -0.0185546875, 0.080474853515625, 0.17950439453125, 0.278533935546875, 0.3775634765625, 0.476593017578125, 0.57562255859375, 0.674652099609375, 0.773681640625, 0.872711181640625, 0.97174072265625, 1.070770263671875, 1.1697998046875, 1.268829345703125, 1.36785888671875, 1.466888427734375, 1.56591796875, 1.664947509765625, 1.76397705078125, 1.863006591796875, 1.9620361328125, 2.061065673828125, 2.16009521484375, 2.259124755859375, 2.358154296875, 2.457183837890625, 2.55621337890625, 2.655242919921875, 2.7542724609375, 2.853302001953125, 2.95233154296875, 3.051361083984375, 3.150390625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 10.0, 7.0, 22.0, 26.0, 27.0, 59.0, 79.0, 141.0, 229.0, 369.0, 681.0, 1394.0, 3376.0, 10224.0, 42558.0, 259030.0, 591786.0, 107147.0, 21027.0, 5909.0, 2172.0, 952.0, 510.0, 302.0, 179.0, 109.0, 73.0, 46.0, 30.0, 23.0, 23.0, 11.0, 6.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8984375, -14.4219970703125, -13.945556640625, -13.4691162109375, -12.99267578125, -12.5162353515625, -12.039794921875, -11.5633544921875, -11.0869140625, -10.6104736328125, -10.134033203125, -9.6575927734375, -9.18115234375, -8.7047119140625, -8.228271484375, -7.7518310546875, -7.275390625, -6.7989501953125, -6.322509765625, -5.8460693359375, -5.36962890625, -4.8931884765625, -4.416748046875, -3.9403076171875, -3.4638671875, -2.9874267578125, -2.510986328125, -2.0345458984375, -1.55810546875, -1.0816650390625, -0.605224609375, -0.1287841796875, 0.34765625, 0.8240966796875, 1.300537109375, 1.7769775390625, 2.25341796875, 2.7298583984375, 3.206298828125, 3.6827392578125, 4.1591796875, 4.6356201171875, 5.112060546875, 5.5885009765625, 6.06494140625, 6.5413818359375, 7.017822265625, 7.4942626953125, 7.970703125, 8.4471435546875, 8.923583984375, 9.4000244140625, 9.87646484375, 10.3529052734375, 10.829345703125, 11.3057861328125, 11.7822265625, 12.2586669921875, 12.735107421875, 13.2115478515625, 13.68798828125, 14.1644287109375, 14.640869140625, 15.1173095703125, 15.59375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 11.0, 14.0, 6.0, 16.0, 20.0, 16.0, 23.0, 28.0, 37.0, 56.0, 33.0, 47.0, 50.0, 57.0, 64.0, 53.0, 71.0, 62.0, 56.0, 48.0, 41.0, 26.0, 27.0, 25.0, 23.0, 16.0, 17.0, 13.0, 10.0, 9.0, 7.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5078125, -7.229248046875, -6.95068359375, -6.672119140625, -6.3935546875, -6.114990234375, -5.83642578125, -5.557861328125, -5.279296875, -5.000732421875, -4.72216796875, -4.443603515625, -4.1650390625, -3.886474609375, -3.60791015625, -3.329345703125, -3.05078125, -2.772216796875, -2.49365234375, -2.215087890625, -1.9365234375, -1.657958984375, -1.37939453125, -1.100830078125, -0.822265625, -0.543701171875, -0.26513671875, 0.013427734375, 0.2919921875, 0.570556640625, 0.84912109375, 1.127685546875, 1.40625, 1.684814453125, 1.96337890625, 2.241943359375, 2.5205078125, 2.799072265625, 3.07763671875, 3.356201171875, 3.634765625, 3.913330078125, 4.19189453125, 4.470458984375, 4.7490234375, 5.027587890625, 5.30615234375, 5.584716796875, 5.86328125, 6.141845703125, 6.42041015625, 6.698974609375, 6.9775390625, 7.256103515625, 7.53466796875, 7.813232421875, 8.091796875, 8.370361328125, 8.64892578125, 8.927490234375, 9.2060546875, 9.484619140625, 9.76318359375, 10.041748046875, 10.3203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 14.0, 32.0, 40.0, 65.0, 87.0, 141.0, 222.0, 363.0, 582.0, 931.0, 1461.0, 2674.0, 4944.0, 11276.0, 42263.0, 927414.0, 34589.0, 10255.0, 4805.0, 2511.0, 1444.0, 896.0, 504.0, 376.0, 226.0, 155.0, 110.0, 58.0, 26.0, 20.0, 16.0, 10.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-62.40625, -60.64599609375, -58.8857421875, -57.12548828125, -55.365234375, -53.60498046875, -51.8447265625, -50.08447265625, -48.32421875, -46.56396484375, -44.8037109375, -43.04345703125, -41.283203125, -39.52294921875, -37.7626953125, -36.00244140625, -34.2421875, -32.48193359375, -30.7216796875, -28.96142578125, -27.201171875, -25.44091796875, -23.6806640625, -21.92041015625, -20.16015625, -18.39990234375, -16.6396484375, -14.87939453125, -13.119140625, -11.35888671875, -9.5986328125, -7.83837890625, -6.078125, -4.31787109375, -2.5576171875, -0.79736328125, 0.962890625, 2.72314453125, 4.4833984375, 6.24365234375, 8.00390625, 9.76416015625, 11.5244140625, 13.28466796875, 15.044921875, 16.80517578125, 18.5654296875, 20.32568359375, 22.0859375, 23.84619140625, 25.6064453125, 27.36669921875, 29.126953125, 30.88720703125, 32.6474609375, 34.40771484375, 36.16796875, 37.92822265625, 39.6884765625, 41.44873046875, 43.208984375, 44.96923828125, 46.7294921875, 48.48974609375, 50.25]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 12.0, 15.0, 26.0, 54.0, 259.0, 453.0, 69.0, 34.0, 19.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0060272216796875, -0.005812704563140869, -0.005598187446594238, -0.005383670330047607, -0.0051691532135009766, -0.004954636096954346, -0.004740118980407715, -0.004525601863861084, -0.004311084747314453, -0.004096567630767822, -0.0038820505142211914, -0.0036675333976745605, -0.0034530162811279297, -0.003238499164581299, -0.003023982048034668, -0.002809464931488037, -0.0025949478149414062, -0.0023804306983947754, -0.0021659135818481445, -0.0019513964653015137, -0.0017368793487548828, -0.001522362232208252, -0.001307845115661621, -0.0010933279991149902, -0.0008788108825683594, -0.0006642937660217285, -0.00044977664947509766, -0.0002352595329284668, -2.0742416381835938e-05, 0.00019377470016479492, 0.0004082918167114258, 0.0006228089332580566, 0.0008373260498046875, 0.0010518431663513184, 0.0012663602828979492, 0.00148087739944458, 0.001695394515991211, 0.0019099116325378418, 0.0021244287490844727, 0.0023389458656311035, 0.0025534629821777344, 0.0027679800987243652, 0.002982497215270996, 0.003197014331817627, 0.003411531448364258, 0.0036260485649108887, 0.0038405656814575195, 0.00405508279800415, 0.004269599914550781, 0.004484117031097412, 0.004698634147644043, 0.004913151264190674, 0.005127668380737305, 0.0053421854972839355, 0.005556702613830566, 0.005771219730377197, 0.005985736846923828, 0.006200253963470459, 0.00641477108001709, 0.006629288196563721, 0.0068438053131103516, 0.007058322429656982, 0.007272839546203613, 0.007487356662750244, 0.007701873779296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 6.0, 8.0, 12.0, 17.0, 30.0, 42.0, 67.0, 95.0, 178.0, 285.0, 620.0, 1140.0, 2065.0, 4763.0, 17722.0, 957822.0, 49731.0, 7673.0, 2924.0, 1515.0, 816.0, 396.0, 236.0, 121.0, 80.0, 50.0, 37.0, 22.0, 11.0, 11.0, 5.0, 14.0, 2.0, 2.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-89.0625, -86.3408203125, -83.619140625, -80.8974609375, -78.17578125, -75.4541015625, -72.732421875, -70.0107421875, -67.2890625, -64.5673828125, -61.845703125, -59.1240234375, -56.40234375, -53.6806640625, -50.958984375, -48.2373046875, -45.515625, -42.7939453125, -40.072265625, -37.3505859375, -34.62890625, -31.9072265625, -29.185546875, -26.4638671875, -23.7421875, -21.0205078125, -18.298828125, -15.5771484375, -12.85546875, -10.1337890625, -7.412109375, -4.6904296875, -1.96875, 0.7529296875, 3.474609375, 6.1962890625, 8.91796875, 11.6396484375, 14.361328125, 17.0830078125, 19.8046875, 22.5263671875, 25.248046875, 27.9697265625, 30.69140625, 33.4130859375, 36.134765625, 38.8564453125, 41.578125, 44.2998046875, 47.021484375, 49.7431640625, 52.46484375, 55.1865234375, 57.908203125, 60.6298828125, 63.3515625, 66.0732421875, 68.794921875, 71.5166015625, 74.23828125, 76.9599609375, 79.681640625, 82.4033203125, 85.125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 7.0, 4.0, 12.0, 18.0, 14.0, 58.0, 454.0, 319.0, 38.0, 13.0, 13.0, 16.0, 8.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.8125, -44.37646484375, -42.9404296875, -41.50439453125, -40.068359375, -38.63232421875, -37.1962890625, -35.76025390625, -34.32421875, -32.88818359375, -31.4521484375, -30.01611328125, -28.580078125, -27.14404296875, -25.7080078125, -24.27197265625, -22.8359375, -21.39990234375, -19.9638671875, -18.52783203125, -17.091796875, -15.65576171875, -14.2197265625, -12.78369140625, -11.34765625, -9.91162109375, -8.4755859375, -7.03955078125, -5.603515625, -4.16748046875, -2.7314453125, -1.29541015625, 0.140625, 1.57666015625, 3.0126953125, 4.44873046875, 5.884765625, 7.32080078125, 8.7568359375, 10.19287109375, 11.62890625, 13.06494140625, 14.5009765625, 15.93701171875, 17.373046875, 18.80908203125, 20.2451171875, 21.68115234375, 23.1171875, 24.55322265625, 25.9892578125, 27.42529296875, 28.861328125, 30.29736328125, 31.7333984375, 33.16943359375, 34.60546875, 36.04150390625, 37.4775390625, 38.91357421875, 40.349609375, 41.78564453125, 43.2216796875, 44.65771484375, 46.09375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 11.0, 26.0, 107.0, 421.0, 297.0, 88.0, 28.0, 11.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1025.8223876953125, -1005.6083374023438, -985.394287109375, -965.1802368164062, -944.9661865234375, -924.7521362304688, -904.5380859375, -884.3240966796875, -864.1099853515625, -843.8959350585938, -823.681884765625, -803.4678344726562, -783.2537841796875, -763.0397338867188, -742.82568359375, -722.6116943359375, -702.3976440429688, -682.18359375, -661.9695434570312, -641.7554931640625, -621.5414428710938, -601.327392578125, -581.1133422851562, -560.8992919921875, -540.685302734375, -520.4712524414062, -500.2572021484375, -480.04315185546875, -459.8291015625, -439.61505126953125, -419.4010314941406, -399.1869812011719, -378.972900390625, -358.75885009765625, -338.5447998046875, -318.33074951171875, -298.11669921875, -277.90264892578125, -257.6886291503906, -237.47457885742188, -217.26052856445312, -197.04647827148438, -176.83242797851562, -156.61839294433594, -136.4043426513672, -116.19029235839844, -95.97624969482422, -75.76220703125, -55.54815673828125, -35.334110260009766, -15.120063781738281, 5.093982696533203, 25.308029174804688, 45.52207946777344, 65.73612213134766, 85.95016479492188, 106.16421508789062, 126.37826538085938, 146.59231567382812, 166.8063507080078, 187.02040100097656, 207.2344512939453, 227.448486328125, 247.66253662109375, 267.8765869140625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 10.0, 10.0, 13.0, 10.0, 17.0, 15.0, 19.0, 20.0, 24.0, 29.0, 29.0, 34.0, 40.0, 61.0, 45.0, 47.0, 58.0, 39.0, 50.0, 54.0, 56.0, 55.0, 45.0, 46.0, 29.0, 22.0, 24.0, 18.0, 18.0, 15.0, 12.0, 6.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.64715576171875, -79.73237609863281, -76.81758880615234, -73.9028091430664, -70.98802947998047, -68.0732421875, -65.15846252441406, -62.24367904663086, -59.328895568847656, -56.41411209106445, -53.499332427978516, -50.58454895019531, -47.66976547241211, -44.754981994628906, -41.84020233154297, -38.925418853759766, -36.01063919067383, -33.095855712890625, -30.181074142456055, -27.266292572021484, -24.35150909423828, -21.43672752380371, -18.52194595336914, -15.607162475585938, -12.692380905151367, -9.77759838104248, -6.862816333770752, -3.9480342864990234, -1.0332517623901367, 1.88153076171875, 4.79631233215332, 7.711095809936523, 10.625877380371094, 13.54065990447998, 16.455442428588867, 19.370223999023438, 22.28500747680664, 25.19978904724121, 28.11457061767578, 31.029354095458984, 33.94413757324219, 36.85892105102539, 39.77370071411133, 42.68848419189453, 45.603267669677734, 48.51805114746094, 51.432830810546875, 54.34761428833008, 57.262393951416016, 60.17717742919922, 63.091957092285156, 66.00674438476562, 68.92152404785156, 71.8363037109375, 74.75108337402344, 77.6658706665039, 80.58065032958984, 83.49542999267578, 86.41021728515625, 89.32499694824219, 92.23977661132812, 95.1545639038086, 98.06934356689453, 100.984130859375, 103.89891052246094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 10.0, 10.0, 10.0, 13.0, 19.0, 43.0, 54.0, 60.0, 118.0, 214.0, 393.0, 826.0, 2236.0, 7735.0, 43397.0, 4002352.0, 116488.0, 14194.0, 3674.0, 1304.0, 549.0, 269.0, 128.0, 70.0, 42.0, 20.0, 15.0, 9.0, 4.0, 8.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.625, -55.08154296875, -53.5380859375, -51.99462890625, -50.451171875, -48.90771484375, -47.3642578125, -45.82080078125, -44.27734375, -42.73388671875, -41.1904296875, -39.64697265625, -38.103515625, -36.56005859375, -35.0166015625, -33.47314453125, -31.9296875, -30.38623046875, -28.8427734375, -27.29931640625, -25.755859375, -24.21240234375, -22.6689453125, -21.12548828125, -19.58203125, -18.03857421875, -16.4951171875, -14.95166015625, -13.408203125, -11.86474609375, -10.3212890625, -8.77783203125, -7.234375, -5.69091796875, -4.1474609375, -2.60400390625, -1.060546875, 0.48291015625, 2.0263671875, 3.56982421875, 5.11328125, 6.65673828125, 8.2001953125, 9.74365234375, 11.287109375, 12.83056640625, 14.3740234375, 15.91748046875, 17.4609375, 19.00439453125, 20.5478515625, 22.09130859375, 23.634765625, 25.17822265625, 26.7216796875, 28.26513671875, 29.80859375, 31.35205078125, 32.8955078125, 34.43896484375, 35.982421875, 37.52587890625, 39.0693359375, 40.61279296875, 42.15625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 10.0, 12.0, 13.0, 30.0, 18.0, 39.0, 46.0, 61.0, 58.0, 82.0, 95.0, 71.0, 85.0, 67.0, 52.0, 58.0, 51.0, 34.0, 35.0, 27.0, 22.0, 8.0, 8.0, 13.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.083984375, -2.9761962890625, -2.868408203125, -2.7606201171875, -2.65283203125, -2.5450439453125, -2.437255859375, -2.3294677734375, -2.2216796875, -2.1138916015625, -2.006103515625, -1.8983154296875, -1.79052734375, -1.6827392578125, -1.574951171875, -1.4671630859375, -1.359375, -1.2515869140625, -1.143798828125, -1.0360107421875, -0.92822265625, -0.8204345703125, -0.712646484375, -0.6048583984375, -0.4970703125, -0.3892822265625, -0.281494140625, -0.1737060546875, -0.06591796875, 0.0418701171875, 0.149658203125, 0.2574462890625, 0.365234375, 0.4730224609375, 0.580810546875, 0.6885986328125, 0.79638671875, 0.9041748046875, 1.011962890625, 1.1197509765625, 1.2275390625, 1.3353271484375, 1.443115234375, 1.5509033203125, 1.65869140625, 1.7664794921875, 1.874267578125, 1.9820556640625, 2.08984375, 2.1976318359375, 2.305419921875, 2.4132080078125, 2.52099609375, 2.6287841796875, 2.736572265625, 2.8443603515625, 2.9521484375, 3.0599365234375, 3.167724609375, 3.2755126953125, 3.38330078125, 3.4910888671875, 3.598876953125, 3.7066650390625, 3.814453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 12.0, 7.0, 16.0, 21.0, 30.0, 41.0, 50.0, 109.0, 131.0, 228.0, 351.0, 726.0, 1338.0, 2889.0, 7079.0, 20299.0, 74594.0, 3712671.0, 310228.0, 41304.0, 12859.0, 4850.0, 2078.0, 987.0, 520.0, 347.0, 173.0, 106.0, 76.0, 47.0, 38.0, 20.0, 18.0, 9.0, 9.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.75, -24.82373046875, -23.8974609375, -22.97119140625, -22.044921875, -21.11865234375, -20.1923828125, -19.26611328125, -18.33984375, -17.41357421875, -16.4873046875, -15.56103515625, -14.634765625, -13.70849609375, -12.7822265625, -11.85595703125, -10.9296875, -10.00341796875, -9.0771484375, -8.15087890625, -7.224609375, -6.29833984375, -5.3720703125, -4.44580078125, -3.51953125, -2.59326171875, -1.6669921875, -0.74072265625, 0.185546875, 1.11181640625, 2.0380859375, 2.96435546875, 3.890625, 4.81689453125, 5.7431640625, 6.66943359375, 7.595703125, 8.52197265625, 9.4482421875, 10.37451171875, 11.30078125, 12.22705078125, 13.1533203125, 14.07958984375, 15.005859375, 15.93212890625, 16.8583984375, 17.78466796875, 18.7109375, 19.63720703125, 20.5634765625, 21.48974609375, 22.416015625, 23.34228515625, 24.2685546875, 25.19482421875, 26.12109375, 27.04736328125, 27.9736328125, 28.89990234375, 29.826171875, 30.75244140625, 31.6787109375, 32.60498046875, 33.53125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 5.0, 13.0, 15.0, 9.0, 21.0, 25.0, 30.0, 48.0, 77.0, 161.0, 974.0, 2220.0, 203.0, 91.0, 50.0, 41.0, 15.0, 18.0, 18.0, 11.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.407958984375, -12.07373046875, -11.739501953125, -11.4052734375, -11.071044921875, -10.73681640625, -10.402587890625, -10.068359375, -9.734130859375, -9.39990234375, -9.065673828125, -8.7314453125, -8.397216796875, -8.06298828125, -7.728759765625, -7.39453125, -7.060302734375, -6.72607421875, -6.391845703125, -6.0576171875, -5.723388671875, -5.38916015625, -5.054931640625, -4.720703125, -4.386474609375, -4.05224609375, -3.718017578125, -3.3837890625, -3.049560546875, -2.71533203125, -2.381103515625, -2.046875, -1.712646484375, -1.37841796875, -1.044189453125, -0.7099609375, -0.375732421875, -0.04150390625, 0.292724609375, 0.626953125, 0.961181640625, 1.29541015625, 1.629638671875, 1.9638671875, 2.298095703125, 2.63232421875, 2.966552734375, 3.30078125, 3.635009765625, 3.96923828125, 4.303466796875, 4.6376953125, 4.971923828125, 5.30615234375, 5.640380859375, 5.974609375, 6.308837890625, 6.64306640625, 6.977294921875, 7.3115234375, 7.645751953125, 7.97998046875, 8.314208984375, 8.6484375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 11.0, 12.0, 19.0, 21.0, 29.0, 69.0, 92.0, 131.0, 170.0, 137.0, 106.0, 69.0, 37.0, 28.0, 20.0, 14.0, 11.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.771575927734375, -58.09881591796875, -56.426055908203125, -54.7532958984375, -53.080535888671875, -51.40777587890625, -49.735015869140625, -48.062255859375, -46.389495849609375, -44.71673583984375, -43.043975830078125, -41.3712158203125, -39.698455810546875, -38.02569580078125, -36.352935791015625, -34.68017578125, -33.007415771484375, -31.33465576171875, -29.661895751953125, -27.9891357421875, -26.316375732421875, -24.64361572265625, -22.970855712890625, -21.298095703125, -19.62533950805664, -17.952579498291016, -16.27981948852539, -14.607059478759766, -12.93429946899414, -11.261540412902832, -9.588780403137207, -7.916020393371582, -6.243259429931641, -4.570499420166016, -2.8977396488189697, -1.2249798774719238, 0.44778013229370117, 2.120539665222168, 3.793299674987793, 5.466059684753418, 7.138819694519043, 8.811579704284668, 10.484339714050293, 12.157098770141602, 13.829858779907227, 15.502618789672852, 17.175378799438477, 18.8481388092041, 20.520898818969727, 22.19365882873535, 23.866418838500977, 25.5391788482666, 27.211938858032227, 28.88469696044922, 30.557456970214844, 32.23021697998047, 33.902976989746094, 35.57573699951172, 37.248497009277344, 38.92125701904297, 40.594017028808594, 42.26677703857422, 43.939537048339844, 45.61229705810547, 47.285057067871094]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 9.0, 8.0, 20.0, 14.0, 9.0, 20.0, 21.0, 32.0, 31.0, 26.0, 25.0, 24.0, 36.0, 44.0, 43.0, 32.0, 58.0, 32.0, 47.0, 42.0, 45.0, 39.0, 39.0, 39.0, 31.0, 27.0, 27.0, 17.0, 15.0, 27.0, 17.0, 16.0, 9.0, 10.0, 10.0, 8.0, 7.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.978713989257812, -23.21526336669922, -22.451814651489258, -21.688364028930664, -20.92491340637207, -20.16146469116211, -19.398014068603516, -18.634563446044922, -17.871112823486328, -17.107662200927734, -16.344213485717773, -15.58076286315918, -14.817312240600586, -14.053862571716309, -13.290412902832031, -12.526962280273438, -11.763513565063477, -11.0000638961792, -10.236613273620605, -9.473163604736328, -8.709712982177734, -7.946263313293457, -7.18281364440918, -6.419363498687744, -5.655913352966309, -4.892463207244873, -4.1290130615234375, -3.36556339263916, -2.6021132469177246, -1.838663101196289, -1.0752134323120117, -0.31176328659057617, 0.4516868591308594, 1.2151368856430054, 1.9785869121551514, 2.742036819458008, 3.5054869651794434, 4.268937110900879, 5.032386779785156, 5.795836925506592, 6.559287071228027, 7.322737216949463, 8.086187362670898, 8.849637031555176, 9.613086700439453, 10.376537322998047, 11.139986991882324, 11.903436660766602, 12.666887283325195, 13.430336952209473, 14.193787574768066, 14.957237243652344, 15.720687866210938, 16.48413848876953, 17.247587203979492, 18.011037826538086, 18.774486541748047, 19.53793716430664, 20.3013858795166, 21.064836502075195, 21.82828712463379, 22.59173583984375, 23.355186462402344, 24.118637084960938, 24.88208770751953]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 10.0, 12.0, 13.0, 19.0, 30.0, 66.0, 99.0, 154.0, 289.0, 628.0, 1504.0, 4922.0, 22877.0, 193350.0, 707518.0, 97319.0, 14053.0, 3456.0, 1145.0, 480.0, 241.0, 142.0, 76.0, 53.0, 24.0, 15.0, 22.0, 10.0, 6.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.375, -30.2685546875, -29.162109375, -28.0556640625, -26.94921875, -25.8427734375, -24.736328125, -23.6298828125, -22.5234375, -21.4169921875, -20.310546875, -19.2041015625, -18.09765625, -16.9912109375, -15.884765625, -14.7783203125, -13.671875, -12.5654296875, -11.458984375, -10.3525390625, -9.24609375, -8.1396484375, -7.033203125, -5.9267578125, -4.8203125, -3.7138671875, -2.607421875, -1.5009765625, -0.39453125, 0.7119140625, 1.818359375, 2.9248046875, 4.03125, 5.1376953125, 6.244140625, 7.3505859375, 8.45703125, 9.5634765625, 10.669921875, 11.7763671875, 12.8828125, 13.9892578125, 15.095703125, 16.2021484375, 17.30859375, 18.4150390625, 19.521484375, 20.6279296875, 21.734375, 22.8408203125, 23.947265625, 25.0537109375, 26.16015625, 27.2666015625, 28.373046875, 29.4794921875, 30.5859375, 31.6923828125, 32.798828125, 33.9052734375, 35.01171875, 36.1181640625, 37.224609375, 38.3310546875, 39.4375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 9.0, 9.0, 11.0, 16.0, 26.0, 30.0, 48.0, 44.0, 73.0, 82.0, 93.0, 88.0, 77.0, 68.0, 76.0, 68.0, 42.0, 39.0, 27.0, 25.0, 12.0, 16.0, 8.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.47296142578125, -3.3521728515625, -3.23138427734375, -3.110595703125, -2.98980712890625, -2.8690185546875, -2.74822998046875, -2.62744140625, -2.50665283203125, -2.3858642578125, -2.26507568359375, -2.144287109375, -2.02349853515625, -1.9027099609375, -1.78192138671875, -1.6611328125, -1.54034423828125, -1.4195556640625, -1.29876708984375, -1.177978515625, -1.05718994140625, -0.9364013671875, -0.81561279296875, -0.69482421875, -0.57403564453125, -0.4532470703125, -0.33245849609375, -0.211669921875, -0.09088134765625, 0.0299072265625, 0.15069580078125, 0.271484375, 0.39227294921875, 0.5130615234375, 0.63385009765625, 0.754638671875, 0.87542724609375, 0.9962158203125, 1.11700439453125, 1.23779296875, 1.35858154296875, 1.4793701171875, 1.60015869140625, 1.720947265625, 1.84173583984375, 1.9625244140625, 2.08331298828125, 2.2041015625, 2.32489013671875, 2.4456787109375, 2.56646728515625, 2.687255859375, 2.80804443359375, 2.9288330078125, 3.04962158203125, 3.17041015625, 3.29119873046875, 3.4119873046875, 3.53277587890625, 3.653564453125, 3.77435302734375, 3.8951416015625, 4.01593017578125, 4.13671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 12.0, 14.0, 8.0, 15.0, 24.0, 41.0, 29.0, 49.0, 61.0, 83.0, 124.0, 180.0, 244.0, 384.0, 683.0, 1273.0, 2772.0, 6993.0, 23399.0, 115474.0, 579675.0, 253721.0, 43895.0, 11227.0, 4064.0, 1717.0, 896.0, 468.0, 303.0, 191.0, 131.0, 96.0, 71.0, 43.0, 31.0, 29.0, 22.0, 11.0, 22.0, 13.0, 11.0, 6.0, 10.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-21.421875, -20.746337890625, -20.07080078125, -19.395263671875, -18.7197265625, -18.044189453125, -17.36865234375, -16.693115234375, -16.017578125, -15.342041015625, -14.66650390625, -13.990966796875, -13.3154296875, -12.639892578125, -11.96435546875, -11.288818359375, -10.61328125, -9.937744140625, -9.26220703125, -8.586669921875, -7.9111328125, -7.235595703125, -6.56005859375, -5.884521484375, -5.208984375, -4.533447265625, -3.85791015625, -3.182373046875, -2.5068359375, -1.831298828125, -1.15576171875, -0.480224609375, 0.1953125, 0.870849609375, 1.54638671875, 2.221923828125, 2.8974609375, 3.572998046875, 4.24853515625, 4.924072265625, 5.599609375, 6.275146484375, 6.95068359375, 7.626220703125, 8.3017578125, 8.977294921875, 9.65283203125, 10.328369140625, 11.00390625, 11.679443359375, 12.35498046875, 13.030517578125, 13.7060546875, 14.381591796875, 15.05712890625, 15.732666015625, 16.408203125, 17.083740234375, 17.75927734375, 18.434814453125, 19.1103515625, 19.785888671875, 20.46142578125, 21.136962890625, 21.8125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 2.0, 11.0, 8.0, 5.0, 16.0, 18.0, 16.0, 21.0, 34.0, 28.0, 34.0, 33.0, 36.0, 39.0, 52.0, 38.0, 44.0, 44.0, 41.0, 37.0, 39.0, 40.0, 31.0, 40.0, 39.0, 30.0, 35.0, 29.0, 28.0, 18.0, 18.0, 17.0, 13.0, 10.0, 13.0, 7.0, 8.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.296875, -10.959228515625, -10.62158203125, -10.283935546875, -9.9462890625, -9.608642578125, -9.27099609375, -8.933349609375, -8.595703125, -8.258056640625, -7.92041015625, -7.582763671875, -7.2451171875, -6.907470703125, -6.56982421875, -6.232177734375, -5.89453125, -5.556884765625, -5.21923828125, -4.881591796875, -4.5439453125, -4.206298828125, -3.86865234375, -3.531005859375, -3.193359375, -2.855712890625, -2.51806640625, -2.180419921875, -1.8427734375, -1.505126953125, -1.16748046875, -0.829833984375, -0.4921875, -0.154541015625, 0.18310546875, 0.520751953125, 0.8583984375, 1.196044921875, 1.53369140625, 1.871337890625, 2.208984375, 2.546630859375, 2.88427734375, 3.221923828125, 3.5595703125, 3.897216796875, 4.23486328125, 4.572509765625, 4.91015625, 5.247802734375, 5.58544921875, 5.923095703125, 6.2607421875, 6.598388671875, 6.93603515625, 7.273681640625, 7.611328125, 7.948974609375, 8.28662109375, 8.624267578125, 8.9619140625, 9.299560546875, 9.63720703125, 9.974853515625, 10.3125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 12.0, 15.0, 24.0, 38.0, 56.0, 89.0, 118.0, 192.0, 299.0, 469.0, 749.0, 1342.0, 2161.0, 4247.0, 8687.0, 23420.0, 102314.0, 726218.0, 131032.0, 26742.0, 9725.0, 4550.0, 2414.0, 1423.0, 791.0, 514.0, 331.0, 205.0, 119.0, 88.0, 47.0, 38.0, 20.0, 26.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.203125, -17.64404296875, -17.0849609375, -16.52587890625, -15.966796875, -15.40771484375, -14.8486328125, -14.28955078125, -13.73046875, -13.17138671875, -12.6123046875, -12.05322265625, -11.494140625, -10.93505859375, -10.3759765625, -9.81689453125, -9.2578125, -8.69873046875, -8.1396484375, -7.58056640625, -7.021484375, -6.46240234375, -5.9033203125, -5.34423828125, -4.78515625, -4.22607421875, -3.6669921875, -3.10791015625, -2.548828125, -1.98974609375, -1.4306640625, -0.87158203125, -0.3125, 0.24658203125, 0.8056640625, 1.36474609375, 1.923828125, 2.48291015625, 3.0419921875, 3.60107421875, 4.16015625, 4.71923828125, 5.2783203125, 5.83740234375, 6.396484375, 6.95556640625, 7.5146484375, 8.07373046875, 8.6328125, 9.19189453125, 9.7509765625, 10.31005859375, 10.869140625, 11.42822265625, 11.9873046875, 12.54638671875, 13.10546875, 13.66455078125, 14.2236328125, 14.78271484375, 15.341796875, 15.90087890625, 16.4599609375, 17.01904296875, 17.578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 10.0, 16.0, 23.0, 32.0, 67.0, 190.0, 366.0, 135.0, 56.0, 27.0, 17.0, 23.0, 7.0, 5.0, 6.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004962921142578125, -0.004774570465087891, -0.004586219787597656, -0.004397869110107422, -0.0042095184326171875, -0.004021167755126953, -0.0038328170776367188, -0.0036444664001464844, -0.00345611572265625, -0.0032677650451660156, -0.0030794143676757812, -0.002891063690185547, -0.0027027130126953125, -0.002514362335205078, -0.0023260116577148438, -0.0021376609802246094, -0.001949310302734375, -0.0017609596252441406, -0.0015726089477539062, -0.0013842582702636719, -0.0011959075927734375, -0.0010075569152832031, -0.0008192062377929688, -0.0006308555603027344, -0.0004425048828125, -0.0002541542053222656, -6.580352783203125e-05, 0.00012254714965820312, 0.0003108978271484375, 0.0004992485046386719, 0.0006875991821289062, 0.0008759498596191406, 0.001064300537109375, 0.0012526512145996094, 0.0014410018920898438, 0.0016293525695800781, 0.0018177032470703125, 0.002006053924560547, 0.0021944046020507812, 0.0023827552795410156, 0.00257110595703125, 0.0027594566345214844, 0.0029478073120117188, 0.003136157989501953, 0.0033245086669921875, 0.003512859344482422, 0.0037012100219726562, 0.0038895606994628906, 0.004077911376953125, 0.004266262054443359, 0.004454612731933594, 0.004642963409423828, 0.0048313140869140625, 0.005019664764404297, 0.005208015441894531, 0.005396366119384766, 0.005584716796875, 0.005773067474365234, 0.005961418151855469, 0.006149768829345703, 0.0063381195068359375, 0.006526470184326172, 0.006714820861816406, 0.006903171539306641, 0.007091522216796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 9.0, 8.0, 9.0, 15.0, 19.0, 26.0, 32.0, 42.0, 78.0, 111.0, 196.0, 382.0, 679.0, 1673.0, 4773.0, 17628.0, 127398.0, 818375.0, 59848.0, 11278.0, 3338.0, 1266.0, 590.0, 301.0, 133.0, 115.0, 75.0, 34.0, 36.0, 26.0, 18.0, 5.0, 7.0, 9.0, 4.0, 2.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.09375, -23.348876953125, -22.60400390625, -21.859130859375, -21.1142578125, -20.369384765625, -19.62451171875, -18.879638671875, -18.134765625, -17.389892578125, -16.64501953125, -15.900146484375, -15.1552734375, -14.410400390625, -13.66552734375, -12.920654296875, -12.17578125, -11.430908203125, -10.68603515625, -9.941162109375, -9.1962890625, -8.451416015625, -7.70654296875, -6.961669921875, -6.216796875, -5.471923828125, -4.72705078125, -3.982177734375, -3.2373046875, -2.492431640625, -1.74755859375, -1.002685546875, -0.2578125, 0.487060546875, 1.23193359375, 1.976806640625, 2.7216796875, 3.466552734375, 4.21142578125, 4.956298828125, 5.701171875, 6.446044921875, 7.19091796875, 7.935791015625, 8.6806640625, 9.425537109375, 10.17041015625, 10.915283203125, 11.66015625, 12.405029296875, 13.14990234375, 13.894775390625, 14.6396484375, 15.384521484375, 16.12939453125, 16.874267578125, 17.619140625, 18.364013671875, 19.10888671875, 19.853759765625, 20.5986328125, 21.343505859375, 22.08837890625, 22.833251953125, 23.578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 4.0, 12.0, 11.0, 16.0, 15.0, 22.0, 30.0, 28.0, 35.0, 59.0, 83.0, 99.0, 113.0, 120.0, 76.0, 36.0, 47.0, 29.0, 26.0, 19.0, 20.0, 17.0, 16.0, 10.0, 2.0, 8.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-10.59375, -10.3023681640625, -10.010986328125, -9.7196044921875, -9.42822265625, -9.1368408203125, -8.845458984375, -8.5540771484375, -8.2626953125, -7.9713134765625, -7.679931640625, -7.3885498046875, -7.09716796875, -6.8057861328125, -6.514404296875, -6.2230224609375, -5.931640625, -5.6402587890625, -5.348876953125, -5.0574951171875, -4.76611328125, -4.4747314453125, -4.183349609375, -3.8919677734375, -3.6005859375, -3.3092041015625, -3.017822265625, -2.7264404296875, -2.43505859375, -2.1436767578125, -1.852294921875, -1.5609130859375, -1.26953125, -0.9781494140625, -0.686767578125, -0.3953857421875, -0.10400390625, 0.1873779296875, 0.478759765625, 0.7701416015625, 1.0615234375, 1.3529052734375, 1.644287109375, 1.9356689453125, 2.22705078125, 2.5184326171875, 2.809814453125, 3.1011962890625, 3.392578125, 3.6839599609375, 3.975341796875, 4.2667236328125, 4.55810546875, 4.8494873046875, 5.140869140625, 5.4322509765625, 5.7236328125, 6.0150146484375, 6.306396484375, 6.5977783203125, 6.88916015625, 7.1805419921875, 7.471923828125, 7.7633056640625, 8.0546875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 5.0, 8.0, 28.0, 47.0, 99.0, 168.0, 225.0, 187.0, 105.0, 58.0, 37.0, 11.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.9297790527344, -273.99517822265625, -267.0605773925781, -260.1259460449219, -253.19134521484375, -246.25674438476562, -239.3221435546875, -232.3875274658203, -225.4529266357422, -218.51832580566406, -211.58370971679688, -204.64910888671875, -197.71449279785156, -190.77989196777344, -183.84527587890625, -176.91067504882812, -169.97607421875, -163.04147338867188, -156.1068572998047, -149.17225646972656, -142.23764038085938, -135.30303955078125, -128.36843872070312, -121.43382263183594, -114.49920654296875, -107.5645980834961, -100.62998962402344, -93.69538879394531, -86.76078033447266, -79.826171875, -72.89156341552734, -65.95695495605469, -59.02235412597656, -52.087745666503906, -45.153141021728516, -38.21853256225586, -31.283926010131836, -24.349319458007812, -17.414710998535156, -10.480106353759766, -3.5454978942871094, 3.3891091346740723, 10.323716163635254, 17.258323669433594, 24.192930221557617, 31.12753677368164, 38.0621452331543, 44.99674987792969, 51.931358337402344, 58.865966796875, 65.80057525634766, 72.73518371582031, 79.66978454589844, 86.6043930053711, 93.53900146484375, 100.47360229492188, 107.40821838378906, 114.34282684326172, 121.27743530273438, 128.2120361328125, 135.1466522216797, 142.0812530517578, 149.015869140625, 155.95046997070312, 162.88507080078125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 10.0, 7.0, 12.0, 19.0, 12.0, 28.0, 16.0, 26.0, 23.0, 29.0, 31.0, 27.0, 37.0, 51.0, 39.0, 23.0, 42.0, 45.0, 40.0, 45.0, 43.0, 47.0, 30.0, 33.0, 32.0, 35.0, 33.0, 24.0, 22.0, 17.0, 20.0, 14.0, 6.0, 10.0, 15.0, 11.0, 5.0, 6.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-61.75227355957031, -59.886505126953125, -58.02073669433594, -56.15496826171875, -54.28919982910156, -52.423431396484375, -50.55766296386719, -48.69189453125, -46.82612609863281, -44.960357666015625, -43.09458923339844, -41.22882080078125, -39.36305236816406, -37.497283935546875, -35.63151550292969, -33.7657470703125, -31.899978637695312, -30.034210205078125, -28.168441772460938, -26.30267333984375, -24.436904907226562, -22.571136474609375, -20.705368041992188, -18.839599609375, -16.973831176757812, -15.108062744140625, -13.242294311523438, -11.37652587890625, -9.510757446289062, -7.644989013671875, -5.7792205810546875, -3.9134521484375, -2.0476837158203125, -0.181915283203125, 1.6838531494140625, 3.54962158203125, 5.4153900146484375, 7.281158447265625, 9.146926879882812, 11.0126953125, 12.878463745117188, 14.744232177734375, 16.610000610351562, 18.47576904296875, 20.341537475585938, 22.207305908203125, 24.073074340820312, 25.9388427734375, 27.804611206054688, 29.670379638671875, 31.536148071289062, 33.40191650390625, 35.26768493652344, 37.133453369140625, 38.99922180175781, 40.864990234375, 42.73075866699219, 44.596527099609375, 46.46229553222656, 48.32806396484375, 50.19383239746094, 52.059600830078125, 53.92536926269531, 55.7911376953125, 57.65690612792969]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 8.0, 7.0, 6.0, 12.0, 14.0, 11.0, 26.0, 39.0, 52.0, 69.0, 113.0, 169.0, 302.0, 626.0, 1691.0, 5325.0, 21574.0, 173610.0, 3911314.0, 60951.0, 12398.0, 3594.0, 1254.0, 537.0, 259.0, 129.0, 74.0, 40.0, 34.0, 15.0, 11.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.46875, -53.08251953125, -51.6962890625, -50.31005859375, -48.923828125, -47.53759765625, -46.1513671875, -44.76513671875, -43.37890625, -41.99267578125, -40.6064453125, -39.22021484375, -37.833984375, -36.44775390625, -35.0615234375, -33.67529296875, -32.2890625, -30.90283203125, -29.5166015625, -28.13037109375, -26.744140625, -25.35791015625, -23.9716796875, -22.58544921875, -21.19921875, -19.81298828125, -18.4267578125, -17.04052734375, -15.654296875, -14.26806640625, -12.8818359375, -11.49560546875, -10.109375, -8.72314453125, -7.3369140625, -5.95068359375, -4.564453125, -3.17822265625, -1.7919921875, -0.40576171875, 0.98046875, 2.36669921875, 3.7529296875, 5.13916015625, 6.525390625, 7.91162109375, 9.2978515625, 10.68408203125, 12.0703125, 13.45654296875, 14.8427734375, 16.22900390625, 17.615234375, 19.00146484375, 20.3876953125, 21.77392578125, 23.16015625, 24.54638671875, 25.9326171875, 27.31884765625, 28.705078125, 30.09130859375, 31.4775390625, 32.86376953125, 34.25]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 11.0, 9.0, 22.0, 15.0, 30.0, 31.0, 42.0, 69.0, 80.0, 83.0, 99.0, 82.0, 83.0, 73.0, 68.0, 37.0, 43.0, 34.0, 26.0, 23.0, 13.0, 6.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.729034423828125, -3.59674072265625, -3.464447021484375, -3.3321533203125, -3.199859619140625, -3.06756591796875, -2.935272216796875, -2.802978515625, -2.670684814453125, -2.53839111328125, -2.406097412109375, -2.2738037109375, -2.141510009765625, -2.00921630859375, -1.876922607421875, -1.74462890625, -1.612335205078125, -1.48004150390625, -1.347747802734375, -1.2154541015625, -1.083160400390625, -0.95086669921875, -0.818572998046875, -0.686279296875, -0.553985595703125, -0.42169189453125, -0.289398193359375, -0.1571044921875, -0.024810791015625, 0.10748291015625, 0.239776611328125, 0.3720703125, 0.504364013671875, 0.63665771484375, 0.768951416015625, 0.9012451171875, 1.033538818359375, 1.16583251953125, 1.298126220703125, 1.430419921875, 1.562713623046875, 1.69500732421875, 1.827301025390625, 1.9595947265625, 2.091888427734375, 2.22418212890625, 2.356475830078125, 2.48876953125, 2.621063232421875, 2.75335693359375, 2.885650634765625, 3.0179443359375, 3.150238037109375, 3.28253173828125, 3.414825439453125, 3.547119140625, 3.679412841796875, 3.81170654296875, 3.944000244140625, 4.0762939453125, 4.208587646484375, 4.34088134765625, 4.473175048828125, 4.60546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 12.0, 15.0, 25.0, 13.0, 37.0, 40.0, 70.0, 84.0, 116.0, 196.0, 250.0, 443.0, 636.0, 1067.0, 1991.0, 3956.0, 8305.0, 20075.0, 62033.0, 581554.0, 3373907.0, 92264.0, 26441.0, 10236.0, 4593.0, 2474.0, 1237.0, 736.0, 446.0, 288.0, 231.0, 138.0, 97.0, 82.0, 51.0, 46.0, 29.0, 14.0, 13.0, 14.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-26.46875, -25.669921875, -24.87109375, -24.072265625, -23.2734375, -22.474609375, -21.67578125, -20.876953125, -20.078125, -19.279296875, -18.48046875, -17.681640625, -16.8828125, -16.083984375, -15.28515625, -14.486328125, -13.6875, -12.888671875, -12.08984375, -11.291015625, -10.4921875, -9.693359375, -8.89453125, -8.095703125, -7.296875, -6.498046875, -5.69921875, -4.900390625, -4.1015625, -3.302734375, -2.50390625, -1.705078125, -0.90625, -0.107421875, 0.69140625, 1.490234375, 2.2890625, 3.087890625, 3.88671875, 4.685546875, 5.484375, 6.283203125, 7.08203125, 7.880859375, 8.6796875, 9.478515625, 10.27734375, 11.076171875, 11.875, 12.673828125, 13.47265625, 14.271484375, 15.0703125, 15.869140625, 16.66796875, 17.466796875, 18.265625, 19.064453125, 19.86328125, 20.662109375, 21.4609375, 22.259765625, 23.05859375, 23.857421875, 24.65625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 11.0, 7.0, 6.0, 15.0, 13.0, 18.0, 17.0, 34.0, 42.0, 98.0, 126.0, 367.0, 2297.0, 563.0, 161.0, 90.0, 54.0, 32.0, 37.0, 15.0, 15.0, 17.0, 9.0, 4.0, 4.0, 4.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.1875, -9.819091796875, -9.45068359375, -9.082275390625, -8.7138671875, -8.345458984375, -7.97705078125, -7.608642578125, -7.240234375, -6.871826171875, -6.50341796875, -6.135009765625, -5.7666015625, -5.398193359375, -5.02978515625, -4.661376953125, -4.29296875, -3.924560546875, -3.55615234375, -3.187744140625, -2.8193359375, -2.450927734375, -2.08251953125, -1.714111328125, -1.345703125, -0.977294921875, -0.60888671875, -0.240478515625, 0.1279296875, 0.496337890625, 0.86474609375, 1.233154296875, 1.6015625, 1.969970703125, 2.33837890625, 2.706787109375, 3.0751953125, 3.443603515625, 3.81201171875, 4.180419921875, 4.548828125, 4.917236328125, 5.28564453125, 5.654052734375, 6.0224609375, 6.390869140625, 6.75927734375, 7.127685546875, 7.49609375, 7.864501953125, 8.23291015625, 8.601318359375, 8.9697265625, 9.338134765625, 9.70654296875, 10.074951171875, 10.443359375, 10.811767578125, 11.18017578125, 11.548583984375, 11.9169921875, 12.285400390625, 12.65380859375, 13.022216796875, 13.390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 19.0, 44.0, 113.0, 255.0, 295.0, 138.0, 62.0, 40.0, 6.0, 9.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.23471069335938, -158.2018585205078, -154.1689910888672, -150.13613891601562, -146.103271484375, -142.07041931152344, -138.03756713867188, -134.00469970703125, -129.9718475341797, -125.9389877319336, -121.9061279296875, -117.87327575683594, -113.84041595458984, -109.80755615234375, -105.77470397949219, -101.7418441772461, -97.708984375, -93.6761245727539, -89.64326477050781, -85.61041259765625, -81.57755279541016, -77.54469299316406, -73.5118408203125, -69.4789810180664, -65.44612121582031, -61.41326141357422, -57.38040542602539, -53.34754943847656, -49.31468963623047, -45.281829833984375, -41.24897384643555, -37.21611785888672, -33.18327331542969, -29.150415420532227, -25.117557525634766, -21.084699630737305, -17.051841735839844, -13.018983840942383, -8.986125946044922, -4.953268051147461, -0.92041015625, 3.112447738647461, 7.145305633544922, 11.178163528442383, 15.211021423339844, 19.243879318237305, 23.276737213134766, 27.309595108032227, 31.342453002929688, 35.37531280517578, 39.40816879272461, 43.44102478027344, 47.47388458251953, 51.506744384765625, 55.53960037231445, 59.57245635986328, 63.605316162109375, 67.63817596435547, 71.67103576660156, 75.70388793945312, 79.73674774169922, 83.76960754394531, 87.80245971679688, 91.83531951904297, 95.86817932128906]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 11.0, 11.0, 12.0, 22.0, 24.0, 32.0, 33.0, 40.0, 37.0, 39.0, 49.0, 57.0, 48.0, 72.0, 58.0, 61.0, 68.0, 55.0, 48.0, 40.0, 34.0, 33.0, 20.0, 20.0, 18.0, 11.0, 15.0, 5.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.781578063964844, -31.347618103027344, -29.913658142089844, -28.479700088500977, -27.045740127563477, -25.611780166625977, -24.17782211303711, -22.74386215209961, -21.30990219116211, -19.87594223022461, -18.44198226928711, -17.008024215698242, -15.574064254760742, -14.140104293823242, -12.706145286560059, -11.272186279296875, -9.838226318359375, -8.404266357421875, -6.970307350158691, -5.53634786605835, -4.102388381958008, -2.668428897857666, -1.2344694137573242, 0.19948959350585938, 1.6334495544433594, 3.067409038543701, 4.501368522644043, 5.935328006744385, 7.369287490844727, 8.803247451782227, 10.23720645904541, 11.671165466308594, 13.105125427246094, 14.539085388183594, 15.973044395446777, 17.40700340270996, 18.84096336364746, 20.27492332458496, 21.708881378173828, 23.142841339111328, 24.576801300048828, 26.010761260986328, 27.444721221923828, 28.878679275512695, 30.312639236450195, 31.746599197387695, 33.18055725097656, 34.61451721191406, 36.04847717285156, 37.48243713378906, 38.91639709472656, 40.35035705566406, 41.78431701660156, 43.2182731628418, 44.6522331237793, 46.0861930847168, 47.5201530456543, 48.9541130065918, 50.3880729675293, 51.8220329284668, 53.25598907470703, 54.68994903564453, 56.12390899658203, 57.55786895751953, 58.99182891845703]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 4.0, 12.0, 7.0, 20.0, 20.0, 48.0, 41.0, 78.0, 101.0, 213.0, 361.0, 718.0, 1512.0, 3684.0, 11009.0, 44479.0, 302531.0, 583106.0, 74938.0, 16489.0, 5232.0, 1990.0, 836.0, 457.0, 226.0, 108.0, 107.0, 54.0, 44.0, 21.0, 20.0, 27.0, 16.0, 11.0, 2.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-32.15625, -31.21484375, -30.2734375, -29.33203125, -28.390625, -27.44921875, -26.5078125, -25.56640625, -24.625, -23.68359375, -22.7421875, -21.80078125, -20.859375, -19.91796875, -18.9765625, -18.03515625, -17.09375, -16.15234375, -15.2109375, -14.26953125, -13.328125, -12.38671875, -11.4453125, -10.50390625, -9.5625, -8.62109375, -7.6796875, -6.73828125, -5.796875, -4.85546875, -3.9140625, -2.97265625, -2.03125, -1.08984375, -0.1484375, 0.79296875, 1.734375, 2.67578125, 3.6171875, 4.55859375, 5.5, 6.44140625, 7.3828125, 8.32421875, 9.265625, 10.20703125, 11.1484375, 12.08984375, 13.03125, 13.97265625, 14.9140625, 15.85546875, 16.796875, 17.73828125, 18.6796875, 19.62109375, 20.5625, 21.50390625, 22.4453125, 23.38671875, 24.328125, 25.26953125, 26.2109375, 27.15234375, 28.09375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 6.0, 14.0, 12.0, 11.0, 28.0, 45.0, 34.0, 54.0, 62.0, 80.0, 110.0, 81.0, 73.0, 85.0, 72.0, 55.0, 41.0, 30.0, 28.0, 18.0, 20.0, 16.0, 5.0, 7.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23828125, -4.09967041015625, -3.9610595703125, -3.82244873046875, -3.683837890625, -3.54522705078125, -3.4066162109375, -3.26800537109375, -3.12939453125, -2.99078369140625, -2.8521728515625, -2.71356201171875, -2.574951171875, -2.43634033203125, -2.2977294921875, -2.15911865234375, -2.0205078125, -1.88189697265625, -1.7432861328125, -1.60467529296875, -1.466064453125, -1.32745361328125, -1.1888427734375, -1.05023193359375, -0.91162109375, -0.77301025390625, -0.6343994140625, -0.49578857421875, -0.357177734375, -0.21856689453125, -0.0799560546875, 0.05865478515625, 0.197265625, 0.33587646484375, 0.4744873046875, 0.61309814453125, 0.751708984375, 0.89031982421875, 1.0289306640625, 1.16754150390625, 1.30615234375, 1.44476318359375, 1.5833740234375, 1.72198486328125, 1.860595703125, 1.99920654296875, 2.1378173828125, 2.27642822265625, 2.4150390625, 2.55364990234375, 2.6922607421875, 2.83087158203125, 2.969482421875, 3.10809326171875, 3.2467041015625, 3.38531494140625, 3.52392578125, 3.66253662109375, 3.8011474609375, 3.93975830078125, 4.078369140625, 4.21697998046875, 4.3555908203125, 4.49420166015625, 4.6328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 4.0, 15.0, 20.0, 20.0, 25.0, 35.0, 55.0, 78.0, 142.0, 243.0, 442.0, 963.0, 2986.0, 11587.0, 76765.0, 753140.0, 174805.0, 20089.0, 4396.0, 1393.0, 552.0, 295.0, 155.0, 92.0, 72.0, 52.0, 27.0, 26.0, 22.0, 12.0, 12.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.28125, -39.15185546875, -38.0224609375, -36.89306640625, -35.763671875, -34.63427734375, -33.5048828125, -32.37548828125, -31.24609375, -30.11669921875, -28.9873046875, -27.85791015625, -26.728515625, -25.59912109375, -24.4697265625, -23.34033203125, -22.2109375, -21.08154296875, -19.9521484375, -18.82275390625, -17.693359375, -16.56396484375, -15.4345703125, -14.30517578125, -13.17578125, -12.04638671875, -10.9169921875, -9.78759765625, -8.658203125, -7.52880859375, -6.3994140625, -5.27001953125, -4.140625, -3.01123046875, -1.8818359375, -0.75244140625, 0.376953125, 1.50634765625, 2.6357421875, 3.76513671875, 4.89453125, 6.02392578125, 7.1533203125, 8.28271484375, 9.412109375, 10.54150390625, 11.6708984375, 12.80029296875, 13.9296875, 15.05908203125, 16.1884765625, 17.31787109375, 18.447265625, 19.57666015625, 20.7060546875, 21.83544921875, 22.96484375, 24.09423828125, 25.2236328125, 26.35302734375, 27.482421875, 28.61181640625, 29.7412109375, 30.87060546875, 32.0]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 10.0, 9.0, 12.0, 9.0, 14.0, 16.0, 21.0, 23.0, 21.0, 41.0, 29.0, 30.0, 60.0, 45.0, 56.0, 51.0, 51.0, 54.0, 55.0, 48.0, 50.0, 38.0, 36.0, 29.0, 35.0, 27.0, 32.0, 21.0, 23.0, 10.0, 15.0, 7.0, 5.0, 6.0, 2.0, 5.0, 0.0, 0.0, 2.0, 3.0], "bins": [-18.640625, -18.1822509765625, -17.723876953125, -17.2655029296875, -16.80712890625, -16.3487548828125, -15.890380859375, -15.4320068359375, -14.9736328125, -14.5152587890625, -14.056884765625, -13.5985107421875, -13.14013671875, -12.6817626953125, -12.223388671875, -11.7650146484375, -11.306640625, -10.8482666015625, -10.389892578125, -9.9315185546875, -9.47314453125, -9.0147705078125, -8.556396484375, -8.0980224609375, -7.6396484375, -7.1812744140625, -6.722900390625, -6.2645263671875, -5.80615234375, -5.3477783203125, -4.889404296875, -4.4310302734375, -3.97265625, -3.5142822265625, -3.055908203125, -2.5975341796875, -2.13916015625, -1.6807861328125, -1.222412109375, -0.7640380859375, -0.3056640625, 0.1527099609375, 0.611083984375, 1.0694580078125, 1.52783203125, 1.9862060546875, 2.444580078125, 2.9029541015625, 3.361328125, 3.8197021484375, 4.278076171875, 4.7364501953125, 5.19482421875, 5.6531982421875, 6.111572265625, 6.5699462890625, 7.0283203125, 7.4866943359375, 7.945068359375, 8.4034423828125, 8.86181640625, 9.3201904296875, 9.778564453125, 10.2369384765625, 10.6953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 8.0, 9.0, 8.0, 12.0, 22.0, 40.0, 35.0, 59.0, 99.0, 119.0, 161.0, 247.0, 375.0, 512.0, 764.0, 1227.0, 1857.0, 3180.0, 6324.0, 16728.0, 119685.0, 832494.0, 41885.0, 10812.0, 4676.0, 2538.0, 1516.0, 1013.0, 669.0, 451.0, 299.0, 218.0, 158.0, 91.0, 76.0, 55.0, 39.0, 21.0, 23.0, 13.0, 10.0, 3.0, 10.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.796875, -23.011474609375, -22.22607421875, -21.440673828125, -20.6552734375, -19.869873046875, -19.08447265625, -18.299072265625, -17.513671875, -16.728271484375, -15.94287109375, -15.157470703125, -14.3720703125, -13.586669921875, -12.80126953125, -12.015869140625, -11.23046875, -10.445068359375, -9.65966796875, -8.874267578125, -8.0888671875, -7.303466796875, -6.51806640625, -5.732666015625, -4.947265625, -4.161865234375, -3.37646484375, -2.591064453125, -1.8056640625, -1.020263671875, -0.23486328125, 0.550537109375, 1.3359375, 2.121337890625, 2.90673828125, 3.692138671875, 4.4775390625, 5.262939453125, 6.04833984375, 6.833740234375, 7.619140625, 8.404541015625, 9.18994140625, 9.975341796875, 10.7607421875, 11.546142578125, 12.33154296875, 13.116943359375, 13.90234375, 14.687744140625, 15.47314453125, 16.258544921875, 17.0439453125, 17.829345703125, 18.61474609375, 19.400146484375, 20.185546875, 20.970947265625, 21.75634765625, 22.541748046875, 23.3271484375, 24.112548828125, 24.89794921875, 25.683349609375, 26.46875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 5.0, 8.0, 18.0, 30.0, 74.0, 352.0, 311.0, 68.0, 38.0, 17.0, 12.0, 11.0, 4.0, 9.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 5.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00604248046875, -0.005883276462554932, -0.005724072456359863, -0.005564868450164795, -0.0054056644439697266, -0.005246460437774658, -0.00508725643157959, -0.0049280524253845215, -0.004768848419189453, -0.004609644412994385, -0.004450440406799316, -0.004291236400604248, -0.00413203239440918, -0.003972828388214111, -0.003813624382019043, -0.0036544203758239746, -0.0034952163696289062, -0.003336012363433838, -0.0031768083572387695, -0.003017604351043701, -0.002858400344848633, -0.0026991963386535645, -0.002539992332458496, -0.0023807883262634277, -0.0022215843200683594, -0.002062380313873291, -0.0019031763076782227, -0.0017439723014831543, -0.001584768295288086, -0.0014255642890930176, -0.0012663602828979492, -0.0011071562767028809, -0.0009479522705078125, -0.0007887482643127441, -0.0006295442581176758, -0.0004703402519226074, -0.00031113624572753906, -0.0001519322395324707, 7.271766662597656e-06, 0.00016647577285766602, 0.0003256797790527344, 0.00048488378524780273, 0.0006440877914428711, 0.0008032917976379395, 0.0009624958038330078, 0.0011216998100280762, 0.0012809038162231445, 0.0014401078224182129, 0.0015993118286132812, 0.0017585158348083496, 0.001917719841003418, 0.0020769238471984863, 0.0022361278533935547, 0.002395331859588623, 0.0025545358657836914, 0.0027137398719787598, 0.002872943878173828, 0.0030321478843688965, 0.003191351890563965, 0.003350555896759033, 0.0035097599029541016, 0.00366896390914917, 0.0038281679153442383, 0.003987371921539307, 0.004146575927734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 1.0, 4.0, 1.0, 8.0, 9.0, 14.0, 19.0, 30.0, 61.0, 101.0, 198.0, 399.0, 835.0, 2027.0, 6668.0, 138037.0, 886315.0, 9327.0, 2473.0, 1018.0, 458.0, 259.0, 105.0, 57.0, 35.0, 18.0, 18.0, 13.0, 13.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.5, -56.677734375, -54.85546875, -53.033203125, -51.2109375, -49.388671875, -47.56640625, -45.744140625, -43.921875, -42.099609375, -40.27734375, -38.455078125, -36.6328125, -34.810546875, -32.98828125, -31.166015625, -29.34375, -27.521484375, -25.69921875, -23.876953125, -22.0546875, -20.232421875, -18.41015625, -16.587890625, -14.765625, -12.943359375, -11.12109375, -9.298828125, -7.4765625, -5.654296875, -3.83203125, -2.009765625, -0.1875, 1.634765625, 3.45703125, 5.279296875, 7.1015625, 8.923828125, 10.74609375, 12.568359375, 14.390625, 16.212890625, 18.03515625, 19.857421875, 21.6796875, 23.501953125, 25.32421875, 27.146484375, 28.96875, 30.791015625, 32.61328125, 34.435546875, 36.2578125, 38.080078125, 39.90234375, 41.724609375, 43.546875, 45.369140625, 47.19140625, 49.013671875, 50.8359375, 52.658203125, 54.48046875, 56.302734375, 58.125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 10.0, 15.0, 22.0, 51.0, 149.0, 440.0, 187.0, 36.0, 21.0, 11.0, 9.0, 13.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.484375, -24.676025390625, -23.86767578125, -23.059326171875, -22.2509765625, -21.442626953125, -20.63427734375, -19.825927734375, -19.017578125, -18.209228515625, -17.40087890625, -16.592529296875, -15.7841796875, -14.975830078125, -14.16748046875, -13.359130859375, -12.55078125, -11.742431640625, -10.93408203125, -10.125732421875, -9.3173828125, -8.509033203125, -7.70068359375, -6.892333984375, -6.083984375, -5.275634765625, -4.46728515625, -3.658935546875, -2.8505859375, -2.042236328125, -1.23388671875, -0.425537109375, 0.3828125, 1.191162109375, 1.99951171875, 2.807861328125, 3.6162109375, 4.424560546875, 5.23291015625, 6.041259765625, 6.849609375, 7.657958984375, 8.46630859375, 9.274658203125, 10.0830078125, 10.891357421875, 11.69970703125, 12.508056640625, 13.31640625, 14.124755859375, 14.93310546875, 15.741455078125, 16.5498046875, 17.358154296875, 18.16650390625, 18.974853515625, 19.783203125, 20.591552734375, 21.39990234375, 22.208251953125, 23.0166015625, 23.824951171875, 24.63330078125, 25.441650390625, 26.25]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 12.0, 20.0, 39.0, 140.0, 260.0, 280.0, 149.0, 48.0, 26.0, 13.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-508.55908203125, -497.2115173339844, -485.8639831542969, -474.51641845703125, -463.1688537597656, -451.8212890625, -440.4737548828125, -429.1261901855469, -417.77862548828125, -406.4310607910156, -395.0835266113281, -383.7359619140625, -372.3883972167969, -361.04083251953125, -349.69329833984375, -338.3457336425781, -326.9981994628906, -315.650634765625, -304.3031005859375, -292.9555358886719, -281.60797119140625, -270.26043701171875, -258.9128723144531, -247.5653076171875, -236.21775817871094, -224.87020874023438, -213.52264404296875, -202.1750946044922, -190.82754516601562, -179.47998046875, -168.13243103027344, -156.78488159179688, -145.43734741210938, -134.0897979736328, -122.74223327636719, -111.39468383789062, -100.04712677001953, -88.69956970214844, -77.35202026367188, -66.00446319580078, -54.65690612792969, -43.309349060058594, -31.961795806884766, -20.614242553710938, -9.266685485839844, 2.08087158203125, 13.428421020507812, 24.775978088378906, 36.12353515625, 47.471092224121094, 58.81864547729492, 70.16619873046875, 81.51375579833984, 92.86131286621094, 104.2088623046875, 115.5564193725586, 126.90397644042969, 138.25152587890625, 149.59909057617188, 160.94664001464844, 172.294189453125, 183.64175415039062, 194.9893035888672, 206.33685302734375, 217.68441772460938]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 4.0, 6.0, 6.0, 8.0, 8.0, 13.0, 18.0, 20.0, 15.0, 24.0, 18.0, 31.0, 36.0, 22.0, 36.0, 33.0, 38.0, 33.0, 39.0, 55.0, 37.0, 40.0, 38.0, 35.0, 45.0, 45.0, 33.0, 39.0, 37.0, 24.0, 15.0, 26.0, 17.0, 17.0, 17.0, 13.0, 11.0, 9.0, 6.0, 4.0, 3.0, 4.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-76.69795989990234, -74.50188446044922, -72.30581665039062, -70.1097412109375, -67.91366577148438, -65.71759033203125, -63.521522521972656, -61.32544708251953, -59.12937545776367, -56.93330383300781, -54.73722839355469, -52.54115676879883, -50.34508514404297, -48.149009704589844, -45.952938079833984, -43.756866455078125, -41.560791015625, -39.36471939086914, -37.168643951416016, -34.972572326660156, -32.77649688720703, -30.580425262451172, -28.384353637695312, -26.18828010559082, -23.992206573486328, -21.796133041381836, -19.600059509277344, -17.403987884521484, -15.207914352416992, -13.0118408203125, -10.815768241882324, -8.619695663452148, -6.423618316650391, -4.227545261383057, -2.0314722061157227, 0.16460084915161133, 2.3606739044189453, 4.5567474365234375, 6.752820014953613, 8.948892593383789, 11.144966125488281, 13.341039657592773, 15.53711223602295, 17.733184814453125, 19.929258346557617, 22.12533187866211, 24.32140350341797, 26.51747703552246, 28.713550567626953, 30.909624099731445, 33.10569763183594, 35.3017692565918, 37.497840881347656, 39.69391632080078, 41.88998794555664, 44.0860595703125, 46.282135009765625, 48.478206634521484, 50.67428207397461, 52.87035369873047, 55.066429138183594, 57.26250076293945, 59.45857238769531, 61.65464782714844, 63.8507194519043]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 1.0, 4.0, 4.0, 7.0, 8.0, 21.0, 28.0, 23.0, 39.0, 70.0, 123.0, 202.0, 377.0, 841.0, 2031.0, 6689.0, 34331.0, 4020702.0, 111008.0, 12238.0, 3233.0, 1151.0, 524.0, 253.0, 149.0, 78.0, 68.0, 17.0, 18.0, 8.0, 11.0, 10.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5, -64.52734375, -62.5546875, -60.58203125, -58.609375, -56.63671875, -54.6640625, -52.69140625, -50.71875, -48.74609375, -46.7734375, -44.80078125, -42.828125, -40.85546875, -38.8828125, -36.91015625, -34.9375, -32.96484375, -30.9921875, -29.01953125, -27.046875, -25.07421875, -23.1015625, -21.12890625, -19.15625, -17.18359375, -15.2109375, -13.23828125, -11.265625, -9.29296875, -7.3203125, -5.34765625, -3.375, -1.40234375, 0.5703125, 2.54296875, 4.515625, 6.48828125, 8.4609375, 10.43359375, 12.40625, 14.37890625, 16.3515625, 18.32421875, 20.296875, 22.26953125, 24.2421875, 26.21484375, 28.1875, 30.16015625, 32.1328125, 34.10546875, 36.078125, 38.05078125, 40.0234375, 41.99609375, 43.96875, 45.94140625, 47.9140625, 49.88671875, 51.859375, 53.83203125, 55.8046875, 57.77734375, 59.75]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 9.0, 17.0, 13.0, 26.0, 22.0, 26.0, 54.0, 47.0, 61.0, 73.0, 67.0, 61.0, 72.0, 87.0, 71.0, 63.0, 47.0, 49.0, 35.0, 20.0, 13.0, 18.0, 15.0, 11.0, 5.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.043212890625, -3.89892578125, -3.754638671875, -3.6103515625, -3.466064453125, -3.32177734375, -3.177490234375, -3.033203125, -2.888916015625, -2.74462890625, -2.600341796875, -2.4560546875, -2.311767578125, -2.16748046875, -2.023193359375, -1.87890625, -1.734619140625, -1.59033203125, -1.446044921875, -1.3017578125, -1.157470703125, -1.01318359375, -0.868896484375, -0.724609375, -0.580322265625, -0.43603515625, -0.291748046875, -0.1474609375, -0.003173828125, 0.14111328125, 0.285400390625, 0.4296875, 0.573974609375, 0.71826171875, 0.862548828125, 1.0068359375, 1.151123046875, 1.29541015625, 1.439697265625, 1.583984375, 1.728271484375, 1.87255859375, 2.016845703125, 2.1611328125, 2.305419921875, 2.44970703125, 2.593994140625, 2.73828125, 2.882568359375, 3.02685546875, 3.171142578125, 3.3154296875, 3.459716796875, 3.60400390625, 3.748291015625, 3.892578125, 4.036865234375, 4.18115234375, 4.325439453125, 4.4697265625, 4.614013671875, 4.75830078125, 4.902587890625, 5.046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 10.0, 17.0, 23.0, 24.0, 23.0, 58.0, 80.0, 141.0, 245.0, 406.0, 764.0, 1398.0, 2782.0, 6103.0, 15829.0, 64005.0, 3658078.0, 385809.0, 38300.0, 10973.0, 4580.0, 2033.0, 1055.0, 616.0, 368.0, 179.0, 151.0, 82.0, 40.0, 40.0, 22.0, 17.0, 12.0, 9.0, 1.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.53125, -33.44677734375, -32.3623046875, -31.27783203125, -30.193359375, -29.10888671875, -28.0244140625, -26.93994140625, -25.85546875, -24.77099609375, -23.6865234375, -22.60205078125, -21.517578125, -20.43310546875, -19.3486328125, -18.26416015625, -17.1796875, -16.09521484375, -15.0107421875, -13.92626953125, -12.841796875, -11.75732421875, -10.6728515625, -9.58837890625, -8.50390625, -7.41943359375, -6.3349609375, -5.25048828125, -4.166015625, -3.08154296875, -1.9970703125, -0.91259765625, 0.171875, 1.25634765625, 2.3408203125, 3.42529296875, 4.509765625, 5.59423828125, 6.6787109375, 7.76318359375, 8.84765625, 9.93212890625, 11.0166015625, 12.10107421875, 13.185546875, 14.27001953125, 15.3544921875, 16.43896484375, 17.5234375, 18.60791015625, 19.6923828125, 20.77685546875, 21.861328125, 22.94580078125, 24.0302734375, 25.11474609375, 26.19921875, 27.28369140625, 28.3681640625, 29.45263671875, 30.537109375, 31.62158203125, 32.7060546875, 33.79052734375, 34.875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 9.0, 5.0, 4.0, 7.0, 9.0, 18.0, 20.0, 26.0, 39.0, 67.0, 147.0, 676.0, 2578.0, 235.0, 80.0, 60.0, 32.0, 28.0, 10.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.421875, -15.9273681640625, -15.432861328125, -14.9383544921875, -14.44384765625, -13.9493408203125, -13.454833984375, -12.9603271484375, -12.4658203125, -11.9713134765625, -11.476806640625, -10.9822998046875, -10.48779296875, -9.9932861328125, -9.498779296875, -9.0042724609375, -8.509765625, -8.0152587890625, -7.520751953125, -7.0262451171875, -6.53173828125, -6.0372314453125, -5.542724609375, -5.0482177734375, -4.5537109375, -4.0592041015625, -3.564697265625, -3.0701904296875, -2.57568359375, -2.0811767578125, -1.586669921875, -1.0921630859375, -0.59765625, -0.1031494140625, 0.391357421875, 0.8858642578125, 1.38037109375, 1.8748779296875, 2.369384765625, 2.8638916015625, 3.3583984375, 3.8529052734375, 4.347412109375, 4.8419189453125, 5.33642578125, 5.8309326171875, 6.325439453125, 6.8199462890625, 7.314453125, 7.8089599609375, 8.303466796875, 8.7979736328125, 9.29248046875, 9.7869873046875, 10.281494140625, 10.7760009765625, 11.2705078125, 11.7650146484375, 12.259521484375, 12.7540283203125, 13.24853515625, 13.7430419921875, 14.237548828125, 14.7320556640625, 15.2265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 11.0, 8.0, 15.0, 34.0, 71.0, 172.0, 364.0, 215.0, 69.0, 28.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.1160125732422, -159.08926391601562, -154.06251525878906, -149.0357666015625, -144.00901794433594, -138.98226928710938, -133.95550537109375, -128.9287567138672, -123.90200805664062, -118.87525939941406, -113.8485107421875, -108.82176208496094, -103.79500579833984, -98.76825714111328, -93.74150848388672, -88.71475219726562, -83.6880111694336, -78.66126251220703, -73.63451385498047, -68.60775756835938, -63.58100891113281, -58.55426025390625, -53.52751159667969, -48.50075912475586, -43.4740104675293, -38.447261810302734, -33.420509338378906, -28.393760681152344, -23.36701011657715, -18.340259552001953, -13.31351089477539, -8.286758422851562, -3.260009765625, 1.766740322113037, 6.793490409851074, 11.820240020751953, 16.84699058532715, 21.873741149902344, 26.900489807128906, 31.927242279052734, 36.9539909362793, 41.98073959350586, 47.00749206542969, 52.03424072265625, 57.06098937988281, 62.08774185180664, 67.11448669433594, 72.14124298095703, 77.1679916381836, 82.19474029541016, 87.22148895263672, 92.24824523925781, 97.27499389648438, 102.30174255371094, 107.3284912109375, 112.35523986816406, 117.38198852539062, 122.40873718261719, 127.43548583984375, 132.4622344970703, 137.48898315429688, 142.5157470703125, 147.54248046875, 152.56924438476562, 157.5959930419922]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 11.0, 3.0, 13.0, 10.0, 11.0, 14.0, 15.0, 25.0, 23.0, 20.0, 31.0, 37.0, 30.0, 38.0, 44.0, 52.0, 39.0, 31.0, 49.0, 52.0, 43.0, 50.0, 38.0, 37.0, 48.0, 29.0, 40.0, 24.0, 28.0, 22.0, 15.0, 13.0, 10.0, 12.0, 12.0, 5.0, 6.0, 3.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.308349609375, -32.210975646972656, -31.113605499267578, -30.016233444213867, -28.918861389160156, -27.821487426757812, -26.7241153717041, -25.62674331665039, -24.52937126159668, -23.43199920654297, -22.334627151489258, -21.237255096435547, -20.139881134033203, -19.042510986328125, -17.94513702392578, -16.84776496887207, -15.75039291381836, -14.653020858764648, -13.555648803710938, -12.45827579498291, -11.3609037399292, -10.263531684875488, -9.166158676147461, -8.06878662109375, -6.971414566040039, -5.874042510986328, -4.776669979095459, -3.679297685623169, -2.581925392150879, -1.484553337097168, -0.38718080520629883, 0.7101917266845703, 1.8075637817382812, 2.9049360752105713, 4.002308368682861, 5.0996809005737305, 6.197052955627441, 7.294425010681152, 8.39179801940918, 9.48917007446289, 10.586542129516602, 11.683914184570312, 12.781286239624023, 13.87865924835205, 14.976031303405762, 16.073402404785156, 17.1707763671875, 18.26814842224121, 19.365520477294922, 20.462892532348633, 21.560264587402344, 22.657636642456055, 23.755008697509766, 24.85238265991211, 25.94975471496582, 27.04712677001953, 28.144498825073242, 29.241870880126953, 30.339242935180664, 31.436614990234375, 32.53398895263672, 33.6313591003418, 34.72873306274414, 35.82610321044922, 36.92347717285156]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 5.0, 4.0, 8.0, 2.0, 11.0, 15.0, 17.0, 26.0, 45.0, 46.0, 58.0, 109.0, 199.0, 276.0, 518.0, 966.0, 2065.0, 5119.0, 13825.0, 43829.0, 170860.0, 550840.0, 187538.0, 47091.0, 14963.0, 5515.0, 2264.0, 1001.0, 502.0, 275.0, 173.0, 106.0, 69.0, 61.0, 35.0, 25.0, 21.0, 14.0, 15.0, 6.0, 13.0, 12.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.859375, -17.2333984375, -16.607421875, -15.9814453125, -15.35546875, -14.7294921875, -14.103515625, -13.4775390625, -12.8515625, -12.2255859375, -11.599609375, -10.9736328125, -10.34765625, -9.7216796875, -9.095703125, -8.4697265625, -7.84375, -7.2177734375, -6.591796875, -5.9658203125, -5.33984375, -4.7138671875, -4.087890625, -3.4619140625, -2.8359375, -2.2099609375, -1.583984375, -0.9580078125, -0.33203125, 0.2939453125, 0.919921875, 1.5458984375, 2.171875, 2.7978515625, 3.423828125, 4.0498046875, 4.67578125, 5.3017578125, 5.927734375, 6.5537109375, 7.1796875, 7.8056640625, 8.431640625, 9.0576171875, 9.68359375, 10.3095703125, 10.935546875, 11.5615234375, 12.1875, 12.8134765625, 13.439453125, 14.0654296875, 14.69140625, 15.3173828125, 15.943359375, 16.5693359375, 17.1953125, 17.8212890625, 18.447265625, 19.0732421875, 19.69921875, 20.3251953125, 20.951171875, 21.5771484375, 22.203125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 16.0, 14.0, 11.0, 24.0, 35.0, 39.0, 48.0, 57.0, 62.0, 56.0, 70.0, 63.0, 72.0, 64.0, 67.0, 59.0, 50.0, 44.0, 31.0, 33.0, 21.0, 12.0, 15.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.9173583984375, -3.776123046875, -3.6348876953125, -3.49365234375, -3.3524169921875, -3.211181640625, -3.0699462890625, -2.9287109375, -2.7874755859375, -2.646240234375, -2.5050048828125, -2.36376953125, -2.2225341796875, -2.081298828125, -1.9400634765625, -1.798828125, -1.6575927734375, -1.516357421875, -1.3751220703125, -1.23388671875, -1.0926513671875, -0.951416015625, -0.8101806640625, -0.6689453125, -0.5277099609375, -0.386474609375, -0.2452392578125, -0.10400390625, 0.0372314453125, 0.178466796875, 0.3197021484375, 0.4609375, 0.6021728515625, 0.743408203125, 0.8846435546875, 1.02587890625, 1.1671142578125, 1.308349609375, 1.4495849609375, 1.5908203125, 1.7320556640625, 1.873291015625, 2.0145263671875, 2.15576171875, 2.2969970703125, 2.438232421875, 2.5794677734375, 2.720703125, 2.8619384765625, 3.003173828125, 3.1444091796875, 3.28564453125, 3.4268798828125, 3.568115234375, 3.7093505859375, 3.8505859375, 3.9918212890625, 4.133056640625, 4.2742919921875, 4.41552734375, 4.5567626953125, 4.697998046875, 4.8392333984375, 4.98046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 4.0, 8.0, 9.0, 12.0, 16.0, 24.0, 24.0, 35.0, 75.0, 102.0, 163.0, 329.0, 649.0, 1395.0, 4075.0, 14591.0, 70768.0, 532733.0, 355727.0, 50981.0, 11015.0, 3342.0, 1196.0, 517.0, 294.0, 154.0, 110.0, 62.0, 35.0, 27.0, 28.0, 13.0, 15.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.859375, -25.0966796875, -24.333984375, -23.5712890625, -22.80859375, -22.0458984375, -21.283203125, -20.5205078125, -19.7578125, -18.9951171875, -18.232421875, -17.4697265625, -16.70703125, -15.9443359375, -15.181640625, -14.4189453125, -13.65625, -12.8935546875, -12.130859375, -11.3681640625, -10.60546875, -9.8427734375, -9.080078125, -8.3173828125, -7.5546875, -6.7919921875, -6.029296875, -5.2666015625, -4.50390625, -3.7412109375, -2.978515625, -2.2158203125, -1.453125, -0.6904296875, 0.072265625, 0.8349609375, 1.59765625, 2.3603515625, 3.123046875, 3.8857421875, 4.6484375, 5.4111328125, 6.173828125, 6.9365234375, 7.69921875, 8.4619140625, 9.224609375, 9.9873046875, 10.75, 11.5126953125, 12.275390625, 13.0380859375, 13.80078125, 14.5634765625, 15.326171875, 16.0888671875, 16.8515625, 17.6142578125, 18.376953125, 19.1396484375, 19.90234375, 20.6650390625, 21.427734375, 22.1904296875, 22.953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 15.0, 6.0, 20.0, 13.0, 29.0, 22.0, 30.0, 37.0, 39.0, 31.0, 46.0, 49.0, 48.0, 61.0, 63.0, 60.0, 44.0, 41.0, 48.0, 46.0, 42.0, 35.0, 39.0, 30.0, 28.0, 14.0, 13.0, 11.0, 12.0, 6.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.875, -16.391357421875, -15.90771484375, -15.424072265625, -14.9404296875, -14.456787109375, -13.97314453125, -13.489501953125, -13.005859375, -12.522216796875, -12.03857421875, -11.554931640625, -11.0712890625, -10.587646484375, -10.10400390625, -9.620361328125, -9.13671875, -8.653076171875, -8.16943359375, -7.685791015625, -7.2021484375, -6.718505859375, -6.23486328125, -5.751220703125, -5.267578125, -4.783935546875, -4.30029296875, -3.816650390625, -3.3330078125, -2.849365234375, -2.36572265625, -1.882080078125, -1.3984375, -0.914794921875, -0.43115234375, 0.052490234375, 0.5361328125, 1.019775390625, 1.50341796875, 1.987060546875, 2.470703125, 2.954345703125, 3.43798828125, 3.921630859375, 4.4052734375, 4.888916015625, 5.37255859375, 5.856201171875, 6.33984375, 6.823486328125, 7.30712890625, 7.790771484375, 8.2744140625, 8.758056640625, 9.24169921875, 9.725341796875, 10.208984375, 10.692626953125, 11.17626953125, 11.659912109375, 12.1435546875, 12.627197265625, 13.11083984375, 13.594482421875, 14.078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 9.0, 9.0, 20.0, 27.0, 43.0, 47.0, 86.0, 123.0, 161.0, 318.0, 474.0, 875.0, 1616.0, 3269.0, 7842.0, 25833.0, 188650.0, 730113.0, 64225.0, 14212.0, 5219.0, 2394.0, 1208.0, 698.0, 371.0, 233.0, 143.0, 87.0, 74.0, 51.0, 32.0, 19.0, 17.0, 12.0, 8.0, 4.0, 7.0, 3.0, 2.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.609375, -11.260498046875, -10.91162109375, -10.562744140625, -10.2138671875, -9.864990234375, -9.51611328125, -9.167236328125, -8.818359375, -8.469482421875, -8.12060546875, -7.771728515625, -7.4228515625, -7.073974609375, -6.72509765625, -6.376220703125, -6.02734375, -5.678466796875, -5.32958984375, -4.980712890625, -4.6318359375, -4.282958984375, -3.93408203125, -3.585205078125, -3.236328125, -2.887451171875, -2.53857421875, -2.189697265625, -1.8408203125, -1.491943359375, -1.14306640625, -0.794189453125, -0.4453125, -0.096435546875, 0.25244140625, 0.601318359375, 0.9501953125, 1.299072265625, 1.64794921875, 1.996826171875, 2.345703125, 2.694580078125, 3.04345703125, 3.392333984375, 3.7412109375, 4.090087890625, 4.43896484375, 4.787841796875, 5.13671875, 5.485595703125, 5.83447265625, 6.183349609375, 6.5322265625, 6.881103515625, 7.22998046875, 7.578857421875, 7.927734375, 8.276611328125, 8.62548828125, 8.974365234375, 9.3232421875, 9.672119140625, 10.02099609375, 10.369873046875, 10.71875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 9.0, 15.0, 27.0, 54.0, 221.0, 473.0, 74.0, 37.0, 28.0, 12.0, 8.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005374908447265625, -0.0052412450313568115, -0.005107581615447998, -0.004973918199539185, -0.004840254783630371, -0.004706591367721558, -0.004572927951812744, -0.004439264535903931, -0.004305601119995117, -0.004171937704086304, -0.00403827428817749, -0.0039046108722686768, -0.0037709474563598633, -0.00363728404045105, -0.0035036206245422363, -0.003369957208633423, -0.0032362937927246094, -0.003102630376815796, -0.0029689669609069824, -0.002835303544998169, -0.0027016401290893555, -0.002567976713180542, -0.0024343132972717285, -0.002300649881362915, -0.0021669864654541016, -0.002033323049545288, -0.0018996596336364746, -0.0017659962177276611, -0.0016323328018188477, -0.0014986693859100342, -0.0013650059700012207, -0.0012313425540924072, -0.0010976791381835938, -0.0009640157222747803, -0.0008303523063659668, -0.0006966888904571533, -0.0005630254745483398, -0.00042936205863952637, -0.0002956986427307129, -0.00016203522682189941, -2.8371810913085938e-05, 0.00010529160499572754, 0.00023895502090454102, 0.0003726184368133545, 0.000506281852722168, 0.0006399452686309814, 0.0007736086845397949, 0.0009072721004486084, 0.0010409355163574219, 0.0011745989322662354, 0.0013082623481750488, 0.0014419257640838623, 0.0015755891799926758, 0.0017092525959014893, 0.0018429160118103027, 0.001976579427719116, 0.0021102428436279297, 0.002243906259536743, 0.0023775696754455566, 0.00251123309135437, 0.0026448965072631836, 0.002778559923171997, 0.0029122233390808105, 0.003045886754989624, 0.0031795501708984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 10.0, 4.0, 7.0, 6.0, 5.0, 11.0, 20.0, 18.0, 22.0, 45.0, 92.0, 164.0, 290.0, 535.0, 1051.0, 2113.0, 4417.0, 13470.0, 105322.0, 856660.0, 47990.0, 9077.0, 3637.0, 1669.0, 874.0, 443.0, 232.0, 150.0, 71.0, 40.0, 32.0, 12.0, 17.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.046875, -14.581787109375, -14.11669921875, -13.651611328125, -13.1865234375, -12.721435546875, -12.25634765625, -11.791259765625, -11.326171875, -10.861083984375, -10.39599609375, -9.930908203125, -9.4658203125, -9.000732421875, -8.53564453125, -8.070556640625, -7.60546875, -7.140380859375, -6.67529296875, -6.210205078125, -5.7451171875, -5.280029296875, -4.81494140625, -4.349853515625, -3.884765625, -3.419677734375, -2.95458984375, -2.489501953125, -2.0244140625, -1.559326171875, -1.09423828125, -0.629150390625, -0.1640625, 0.301025390625, 0.76611328125, 1.231201171875, 1.6962890625, 2.161376953125, 2.62646484375, 3.091552734375, 3.556640625, 4.021728515625, 4.48681640625, 4.951904296875, 5.4169921875, 5.882080078125, 6.34716796875, 6.812255859375, 7.27734375, 7.742431640625, 8.20751953125, 8.672607421875, 9.1376953125, 9.602783203125, 10.06787109375, 10.532958984375, 10.998046875, 11.463134765625, 11.92822265625, 12.393310546875, 12.8583984375, 13.323486328125, 13.78857421875, 14.253662109375, 14.71875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 6.0, 2.0, 8.0, 4.0, 11.0, 15.0, 17.0, 20.0, 25.0, 47.0, 91.0, 146.0, 215.0, 161.0, 94.0, 45.0, 19.0, 15.0, 12.0, 12.0, 7.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.46875, -10.1649169921875, -9.861083984375, -9.5572509765625, -9.25341796875, -8.9495849609375, -8.645751953125, -8.3419189453125, -8.0380859375, -7.7342529296875, -7.430419921875, -7.1265869140625, -6.82275390625, -6.5189208984375, -6.215087890625, -5.9112548828125, -5.607421875, -5.3035888671875, -4.999755859375, -4.6959228515625, -4.39208984375, -4.0882568359375, -3.784423828125, -3.4805908203125, -3.1767578125, -2.8729248046875, -2.569091796875, -2.2652587890625, -1.96142578125, -1.6575927734375, -1.353759765625, -1.0499267578125, -0.74609375, -0.4422607421875, -0.138427734375, 0.1654052734375, 0.46923828125, 0.7730712890625, 1.076904296875, 1.3807373046875, 1.6845703125, 1.9884033203125, 2.292236328125, 2.5960693359375, 2.89990234375, 3.2037353515625, 3.507568359375, 3.8114013671875, 4.115234375, 4.4190673828125, 4.722900390625, 5.0267333984375, 5.33056640625, 5.6343994140625, 5.938232421875, 6.2420654296875, 6.5458984375, 6.8497314453125, 7.153564453125, 7.4573974609375, 7.76123046875, 8.0650634765625, 8.368896484375, 8.6727294921875, 8.9765625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 21.0, 72.0, 191.0, 317.0, 251.0, 96.0, 35.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.5274200439453, -141.41905212402344, -132.31068420410156, -123.20231628417969, -114.09394836425781, -104.98558044433594, -95.87721252441406, -86.76884460449219, -77.66047668457031, -68.55210876464844, -59.44374084472656, -50.33537292480469, -41.22700500488281, -32.11863708496094, -23.010269165039062, -13.901901245117188, -4.7935333251953125, 4.3148345947265625, 13.423202514648438, 22.531570434570312, 31.639938354492188, 40.74830627441406, 49.85667419433594, 58.96504211425781, 68.07341003417969, 77.18177795410156, 86.29014587402344, 95.39851379394531, 104.50688171386719, 113.61524963378906, 122.72361755371094, 131.8319854736328, 140.94036865234375, 150.04873657226562, 159.1571044921875, 168.26547241210938, 177.37384033203125, 186.48220825195312, 195.590576171875, 204.69894409179688, 213.80731201171875, 222.91567993164062, 232.0240478515625, 241.13241577148438, 250.24078369140625, 259.3491516113281, 268.45751953125, 277.5658874511719, 286.67425537109375, 295.7826232910156, 304.8909912109375, 313.9993591308594, 323.10772705078125, 332.2160949707031, 341.324462890625, 350.4328308105469, 359.54119873046875, 368.6495666503906, 377.7579345703125, 386.8663024902344, 395.97467041015625, 405.0830383300781, 414.19140625, 423.2997741699219, 432.40814208984375]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 5.0, 7.0, 21.0, 18.0, 18.0, 14.0, 18.0, 25.0, 34.0, 46.0, 38.0, 42.0, 45.0, 35.0, 37.0, 54.0, 47.0, 45.0, 47.0, 48.0, 48.0, 38.0, 41.0, 36.0, 31.0, 27.0, 26.0, 18.0, 18.0, 16.0, 14.0, 6.0, 11.0, 2.0, 9.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.576663970947266, -59.508697509765625, -57.44073486328125, -55.37276840209961, -53.304805755615234, -51.236839294433594, -49.16887664794922, -47.10091018676758, -45.03294372558594, -42.9649772644043, -40.89701461791992, -38.82904815673828, -36.761085510253906, -34.693119049072266, -32.625152587890625, -30.55718994140625, -28.489227294921875, -26.421262741088867, -24.35329818725586, -22.28533172607422, -20.217369079589844, -18.149402618408203, -16.081438064575195, -14.013473510742188, -11.94550895690918, -9.877544403076172, -7.809579372406006, -5.74161434173584, -3.673649787902832, -1.6056852340698242, 0.4622802734375, 2.530244827270508, 4.59820556640625, 6.666170120239258, 8.734134674072266, 10.80210018157959, 12.870064735412598, 14.938029289245605, 17.00599479675293, 19.073959350585938, 21.141923904418945, 23.209888458251953, 25.27785301208496, 27.34581756591797, 29.41378402709961, 31.481746673583984, 33.549713134765625, 35.61767578125, 37.68564224243164, 39.75360870361328, 41.821571350097656, 43.8895378112793, 45.95750045776367, 48.02546691894531, 50.09342956542969, 52.16139602661133, 54.22936248779297, 56.29732894897461, 58.365291595458984, 60.433258056640625, 62.501220703125, 64.56918334960938, 66.63715362548828, 68.70511627197266, 70.77307891845703]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 5.0, 9.0, 5.0, 16.0, 20.0, 30.0, 44.0, 66.0, 85.0, 155.0, 257.0, 382.0, 682.0, 1541.0, 4333.0, 13610.0, 64309.0, 3991183.0, 92637.0, 16318.0, 4909.0, 1785.0, 837.0, 398.0, 228.0, 147.0, 101.0, 68.0, 36.0, 33.0, 17.0, 11.0, 13.0, 10.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.15625, -56.521484375, -54.88671875, -53.251953125, -51.6171875, -49.982421875, -48.34765625, -46.712890625, -45.078125, -43.443359375, -41.80859375, -40.173828125, -38.5390625, -36.904296875, -35.26953125, -33.634765625, -32.0, -30.365234375, -28.73046875, -27.095703125, -25.4609375, -23.826171875, -22.19140625, -20.556640625, -18.921875, -17.287109375, -15.65234375, -14.017578125, -12.3828125, -10.748046875, -9.11328125, -7.478515625, -5.84375, -4.208984375, -2.57421875, -0.939453125, 0.6953125, 2.330078125, 3.96484375, 5.599609375, 7.234375, 8.869140625, 10.50390625, 12.138671875, 13.7734375, 15.408203125, 17.04296875, 18.677734375, 20.3125, 21.947265625, 23.58203125, 25.216796875, 26.8515625, 28.486328125, 30.12109375, 31.755859375, 33.390625, 35.025390625, 36.66015625, 38.294921875, 39.9296875, 41.564453125, 43.19921875, 44.833984375, 46.46875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 10.0, 9.0, 12.0, 12.0, 26.0, 20.0, 37.0, 41.0, 55.0, 56.0, 64.0, 72.0, 67.0, 64.0, 64.0, 81.0, 57.0, 50.0, 44.0, 47.0, 23.0, 16.0, 17.0, 20.0, 13.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.08880615234375, -3.9432373046875, -3.79766845703125, -3.652099609375, -3.50653076171875, -3.3609619140625, -3.21539306640625, -3.06982421875, -2.92425537109375, -2.7786865234375, -2.63311767578125, -2.487548828125, -2.34197998046875, -2.1964111328125, -2.05084228515625, -1.9052734375, -1.75970458984375, -1.6141357421875, -1.46856689453125, -1.322998046875, -1.17742919921875, -1.0318603515625, -0.88629150390625, -0.74072265625, -0.59515380859375, -0.4495849609375, -0.30401611328125, -0.158447265625, -0.01287841796875, 0.1326904296875, 0.27825927734375, 0.423828125, 0.56939697265625, 0.7149658203125, 0.86053466796875, 1.006103515625, 1.15167236328125, 1.2972412109375, 1.44281005859375, 1.58837890625, 1.73394775390625, 1.8795166015625, 2.02508544921875, 2.170654296875, 2.31622314453125, 2.4617919921875, 2.60736083984375, 2.7529296875, 2.89849853515625, 3.0440673828125, 3.18963623046875, 3.335205078125, 3.48077392578125, 3.6263427734375, 3.77191162109375, 3.91748046875, 4.06304931640625, 4.2086181640625, 4.35418701171875, 4.499755859375, 4.64532470703125, 4.7908935546875, 4.93646240234375, 5.08203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 11.0, 15.0, 21.0, 28.0, 44.0, 40.0, 64.0, 115.0, 160.0, 239.0, 374.0, 548.0, 1015.0, 1721.0, 3329.0, 7324.0, 19590.0, 80245.0, 3800617.0, 224401.0, 33194.0, 11002.0, 4639.0, 2286.0, 1290.0, 708.0, 454.0, 262.0, 185.0, 104.0, 76.0, 56.0, 48.0, 21.0, 15.0, 12.0, 6.0, 11.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.96875, -31.859375, -30.75, -29.640625, -28.53125, -27.421875, -26.3125, -25.203125, -24.09375, -22.984375, -21.875, -20.765625, -19.65625, -18.546875, -17.4375, -16.328125, -15.21875, -14.109375, -13.0, -11.890625, -10.78125, -9.671875, -8.5625, -7.453125, -6.34375, -5.234375, -4.125, -3.015625, -1.90625, -0.796875, 0.3125, 1.421875, 2.53125, 3.640625, 4.75, 5.859375, 6.96875, 8.078125, 9.1875, 10.296875, 11.40625, 12.515625, 13.625, 14.734375, 15.84375, 16.953125, 18.0625, 19.171875, 20.28125, 21.390625, 22.5, 23.609375, 24.71875, 25.828125, 26.9375, 28.046875, 29.15625, 30.265625, 31.375, 32.484375, 33.59375, 34.703125, 35.8125, 36.921875, 38.03125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 4.0, 2.0, 9.0, 12.0, 22.0, 26.0, 31.0, 52.0, 79.0, 231.0, 2797.0, 474.0, 118.0, 70.0, 34.0, 32.0, 20.0, 12.0, 8.0, 4.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.921875, -15.4637451171875, -15.005615234375, -14.5474853515625, -14.08935546875, -13.6312255859375, -13.173095703125, -12.7149658203125, -12.2568359375, -11.7987060546875, -11.340576171875, -10.8824462890625, -10.42431640625, -9.9661865234375, -9.508056640625, -9.0499267578125, -8.591796875, -8.1336669921875, -7.675537109375, -7.2174072265625, -6.75927734375, -6.3011474609375, -5.843017578125, -5.3848876953125, -4.9267578125, -4.4686279296875, -4.010498046875, -3.5523681640625, -3.09423828125, -2.6361083984375, -2.177978515625, -1.7198486328125, -1.26171875, -0.8035888671875, -0.345458984375, 0.1126708984375, 0.57080078125, 1.0289306640625, 1.487060546875, 1.9451904296875, 2.4033203125, 2.8614501953125, 3.319580078125, 3.7777099609375, 4.23583984375, 4.6939697265625, 5.152099609375, 5.6102294921875, 6.068359375, 6.5264892578125, 6.984619140625, 7.4427490234375, 7.90087890625, 8.3590087890625, 8.817138671875, 9.2752685546875, 9.7333984375, 10.1915283203125, 10.649658203125, 11.1077880859375, 11.56591796875, 12.0240478515625, 12.482177734375, 12.9403076171875, 13.3984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 11.0, 21.0, 52.0, 88.0, 187.0, 284.0, 203.0, 90.0, 36.0, 8.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.13389587402344, -117.53886413574219, -113.9438247680664, -110.34879302978516, -106.75375366210938, -103.15872192382812, -99.56369018554688, -95.9686508178711, -92.37361145019531, -88.77857971191406, -85.18354034423828, -81.58850860595703, -77.99346923828125, -74.3984375, -70.80340576171875, -67.20836639404297, -63.61333465576172, -60.0182991027832, -56.42326354980469, -52.82823181152344, -49.233192443847656, -45.638160705566406, -42.04312515258789, -38.448089599609375, -34.85305404663086, -31.258018493652344, -27.662982940673828, -24.067949295043945, -20.47291374206543, -16.877878189086914, -13.282844543457031, -9.687808990478516, -6.092765808105469, -2.4977307319641113, 1.097304344177246, 4.692338943481445, 8.287374496459961, 11.882410049438477, 15.47744369506836, 19.072479248046875, 22.66751480102539, 26.262550354003906, 29.857585906982422, 33.45262145996094, 37.04765319824219, 40.64269256591797, 44.23772430419922, 47.832759857177734, 51.42779541015625, 55.022830963134766, 58.61786651611328, 62.21289825439453, 65.80793762207031, 69.40296936035156, 72.99800109863281, 76.5930404663086, 80.18807983398438, 83.78311157226562, 87.3781509399414, 90.97318267822266, 94.56822204589844, 98.16325378417969, 101.75828552246094, 105.35332489013672, 108.94835662841797]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 27.0, 22.0, 39.0, 65.0, 58.0, 76.0, 90.0, 91.0, 110.0, 69.0, 75.0, 68.0, 67.0, 36.0, 40.0, 17.0, 20.0, 11.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.3806381225586, -64.32205963134766, -62.26347351074219, -60.204891204833984, -58.14630889892578, -56.087730407714844, -54.02914810180664, -51.97056579589844, -49.911983489990234, -47.85340118408203, -45.79481887817383, -43.736236572265625, -41.67765808105469, -39.61907196044922, -37.56049346923828, -35.50191116333008, -33.443328857421875, -31.384746551513672, -29.32616424560547, -27.2675838470459, -25.209001541137695, -23.150419235229492, -21.091838836669922, -19.03325653076172, -16.974674224853516, -14.916091918945312, -12.857510566711426, -10.798929214477539, -8.740346908569336, -6.681764602661133, -4.623183250427246, -2.5646018981933594, -0.506011962890625, 1.55256986618042, 3.611151695251465, 5.66973352432251, 7.728315353393555, 9.786897659301758, 11.845479011535645, 13.904060363769531, 15.962642669677734, 18.021224975585938, 20.07980728149414, 22.13838768005371, 24.196969985961914, 26.255552291870117, 28.314132690429688, 30.37271499633789, 32.431297302246094, 34.4898796081543, 36.5484619140625, 38.6070442199707, 40.665626525878906, 42.724205017089844, 44.78278732299805, 46.84136962890625, 48.89995193481445, 50.958534240722656, 53.01711654663086, 55.07569885253906, 57.13427734375, 59.19286346435547, 61.251441955566406, 63.31002426147461, 65.36860656738281]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 6.0, 6.0, 12.0, 16.0, 27.0, 33.0, 43.0, 98.0, 115.0, 185.0, 326.0, 625.0, 1127.0, 2262.0, 5712.0, 16012.0, 55044.0, 211082.0, 506661.0, 178178.0, 47268.0, 14162.0, 5037.0, 2126.0, 987.0, 563.0, 279.0, 198.0, 123.0, 69.0, 50.0, 26.0, 29.0, 22.0, 13.0, 5.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.875, -26.0712890625, -25.267578125, -24.4638671875, -23.66015625, -22.8564453125, -22.052734375, -21.2490234375, -20.4453125, -19.6416015625, -18.837890625, -18.0341796875, -17.23046875, -16.4267578125, -15.623046875, -14.8193359375, -14.015625, -13.2119140625, -12.408203125, -11.6044921875, -10.80078125, -9.9970703125, -9.193359375, -8.3896484375, -7.5859375, -6.7822265625, -5.978515625, -5.1748046875, -4.37109375, -3.5673828125, -2.763671875, -1.9599609375, -1.15625, -0.3525390625, 0.451171875, 1.2548828125, 2.05859375, 2.8623046875, 3.666015625, 4.4697265625, 5.2734375, 6.0771484375, 6.880859375, 7.6845703125, 8.48828125, 9.2919921875, 10.095703125, 10.8994140625, 11.703125, 12.5068359375, 13.310546875, 14.1142578125, 14.91796875, 15.7216796875, 16.525390625, 17.3291015625, 18.1328125, 18.9365234375, 19.740234375, 20.5439453125, 21.34765625, 22.1513671875, 22.955078125, 23.7587890625, 24.5625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 11.0, 7.0, 6.0, 14.0, 19.0, 21.0, 16.0, 30.0, 50.0, 61.0, 61.0, 82.0, 75.0, 64.0, 77.0, 78.0, 60.0, 52.0, 52.0, 43.0, 32.0, 22.0, 26.0, 28.0, 5.0, 5.0, 10.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.58795166015625, -5.4063720703125, -5.22479248046875, -5.043212890625, -4.86163330078125, -4.6800537109375, -4.49847412109375, -4.31689453125, -4.13531494140625, -3.9537353515625, -3.77215576171875, -3.590576171875, -3.40899658203125, -3.2274169921875, -3.04583740234375, -2.8642578125, -2.68267822265625, -2.5010986328125, -2.31951904296875, -2.137939453125, -1.95635986328125, -1.7747802734375, -1.59320068359375, -1.41162109375, -1.23004150390625, -1.0484619140625, -0.86688232421875, -0.685302734375, -0.50372314453125, -0.3221435546875, -0.14056396484375, 0.041015625, 0.22259521484375, 0.4041748046875, 0.58575439453125, 0.767333984375, 0.94891357421875, 1.1304931640625, 1.31207275390625, 1.49365234375, 1.67523193359375, 1.8568115234375, 2.03839111328125, 2.219970703125, 2.40155029296875, 2.5831298828125, 2.76470947265625, 2.9462890625, 3.12786865234375, 3.3094482421875, 3.49102783203125, 3.672607421875, 3.85418701171875, 4.0357666015625, 4.21734619140625, 4.39892578125, 4.58050537109375, 4.7620849609375, 4.94366455078125, 5.125244140625, 5.30682373046875, 5.4884033203125, 5.66998291015625, 5.8515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 10.0, 10.0, 11.0, 13.0, 20.0, 40.0, 45.0, 48.0, 59.0, 89.0, 119.0, 149.0, 205.0, 370.0, 654.0, 1545.0, 5275.0, 28110.0, 270267.0, 657773.0, 68968.0, 9956.0, 2438.0, 865.0, 468.0, 253.0, 203.0, 134.0, 102.0, 69.0, 58.0, 39.0, 33.0, 33.0, 31.0, 20.0, 10.0, 11.0, 9.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-35.3125, -34.18115234375, -33.0498046875, -31.91845703125, -30.787109375, -29.65576171875, -28.5244140625, -27.39306640625, -26.26171875, -25.13037109375, -23.9990234375, -22.86767578125, -21.736328125, -20.60498046875, -19.4736328125, -18.34228515625, -17.2109375, -16.07958984375, -14.9482421875, -13.81689453125, -12.685546875, -11.55419921875, -10.4228515625, -9.29150390625, -8.16015625, -7.02880859375, -5.8974609375, -4.76611328125, -3.634765625, -2.50341796875, -1.3720703125, -0.24072265625, 0.890625, 2.02197265625, 3.1533203125, 4.28466796875, 5.416015625, 6.54736328125, 7.6787109375, 8.81005859375, 9.94140625, 11.07275390625, 12.2041015625, 13.33544921875, 14.466796875, 15.59814453125, 16.7294921875, 17.86083984375, 18.9921875, 20.12353515625, 21.2548828125, 22.38623046875, 23.517578125, 24.64892578125, 25.7802734375, 26.91162109375, 28.04296875, 29.17431640625, 30.3056640625, 31.43701171875, 32.568359375, 33.69970703125, 34.8310546875, 35.96240234375, 37.09375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 7.0, 3.0, 7.0, 8.0, 11.0, 16.0, 12.0, 17.0, 25.0, 24.0, 23.0, 28.0, 32.0, 46.0, 34.0, 43.0, 39.0, 40.0, 46.0, 49.0, 56.0, 49.0, 57.0, 27.0, 47.0, 32.0, 41.0, 23.0, 22.0, 22.0, 27.0, 15.0, 13.0, 8.0, 18.0, 6.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.609375, -17.068115234375, -16.52685546875, -15.985595703125, -15.4443359375, -14.903076171875, -14.36181640625, -13.820556640625, -13.279296875, -12.738037109375, -12.19677734375, -11.655517578125, -11.1142578125, -10.572998046875, -10.03173828125, -9.490478515625, -8.94921875, -8.407958984375, -7.86669921875, -7.325439453125, -6.7841796875, -6.242919921875, -5.70166015625, -5.160400390625, -4.619140625, -4.077880859375, -3.53662109375, -2.995361328125, -2.4541015625, -1.912841796875, -1.37158203125, -0.830322265625, -0.2890625, 0.252197265625, 0.79345703125, 1.334716796875, 1.8759765625, 2.417236328125, 2.95849609375, 3.499755859375, 4.041015625, 4.582275390625, 5.12353515625, 5.664794921875, 6.2060546875, 6.747314453125, 7.28857421875, 7.829833984375, 8.37109375, 8.912353515625, 9.45361328125, 9.994873046875, 10.5361328125, 11.077392578125, 11.61865234375, 12.159912109375, 12.701171875, 13.242431640625, 13.78369140625, 14.324951171875, 14.8662109375, 15.407470703125, 15.94873046875, 16.489990234375, 17.03125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 16.0, 19.0, 25.0, 52.0, 51.0, 97.0, 158.0, 205.0, 376.0, 672.0, 1289.0, 2537.0, 6209.0, 17925.0, 75611.0, 672962.0, 217570.0, 34507.0, 10302.0, 3884.0, 1763.0, 918.0, 511.0, 330.0, 175.0, 99.0, 77.0, 48.0, 40.0, 22.0, 18.0, 12.0, 12.0, 6.0, 5.0, 5.0, 6.0, 4.0, 3.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0390625, -11.6343994140625, -11.229736328125, -10.8250732421875, -10.42041015625, -10.0157470703125, -9.611083984375, -9.2064208984375, -8.8017578125, -8.3970947265625, -7.992431640625, -7.5877685546875, -7.18310546875, -6.7784423828125, -6.373779296875, -5.9691162109375, -5.564453125, -5.1597900390625, -4.755126953125, -4.3504638671875, -3.94580078125, -3.5411376953125, -3.136474609375, -2.7318115234375, -2.3271484375, -1.9224853515625, -1.517822265625, -1.1131591796875, -0.70849609375, -0.3038330078125, 0.100830078125, 0.5054931640625, 0.91015625, 1.3148193359375, 1.719482421875, 2.1241455078125, 2.52880859375, 2.9334716796875, 3.338134765625, 3.7427978515625, 4.1474609375, 4.5521240234375, 4.956787109375, 5.3614501953125, 5.76611328125, 6.1707763671875, 6.575439453125, 6.9801025390625, 7.384765625, 7.7894287109375, 8.194091796875, 8.5987548828125, 9.00341796875, 9.4080810546875, 9.812744140625, 10.2174072265625, 10.6220703125, 11.0267333984375, 11.431396484375, 11.8360595703125, 12.24072265625, 12.6453857421875, 13.050048828125, 13.4547119140625, 13.859375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 7.0, 11.0, 10.0, 9.0, 18.0, 26.0, 32.0, 36.0, 40.0, 59.0, 83.0, 183.0, 157.0, 90.0, 57.0, 47.0, 29.0, 21.0, 16.0, 12.0, 8.0, 4.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0028285980224609375, -0.0027540922164916992, -0.002679586410522461, -0.0026050806045532227, -0.0025305747985839844, -0.002456068992614746, -0.002381563186645508, -0.0023070573806762695, -0.0022325515747070312, -0.002158045768737793, -0.0020835399627685547, -0.0020090341567993164, -0.0019345283508300781, -0.0018600225448608398, -0.0017855167388916016, -0.0017110109329223633, -0.001636505126953125, -0.0015619993209838867, -0.0014874935150146484, -0.0014129877090454102, -0.0013384819030761719, -0.0012639760971069336, -0.0011894702911376953, -0.001114964485168457, -0.0010404586791992188, -0.0009659528732299805, -0.0008914470672607422, -0.0008169412612915039, -0.0007424354553222656, -0.0006679296493530273, -0.0005934238433837891, -0.0005189180374145508, -0.0004444122314453125, -0.0003699064254760742, -0.00029540061950683594, -0.00022089481353759766, -0.00014638900756835938, -7.18832015991211e-05, 2.6226043701171875e-06, 7.712841033935547e-05, 0.00015163421630859375, 0.00022614002227783203, 0.0003006458282470703, 0.0003751516342163086, 0.0004496574401855469, 0.0005241632461547852, 0.0005986690521240234, 0.0006731748580932617, 0.0007476806640625, 0.0008221864700317383, 0.0008966922760009766, 0.0009711980819702148, 0.0010457038879394531, 0.0011202096939086914, 0.0011947154998779297, 0.001269221305847168, 0.0013437271118164062, 0.0014182329177856445, 0.0014927387237548828, 0.001567244529724121, 0.0016417503356933594, 0.0017162561416625977, 0.001790761947631836, 0.0018652677536010742, 0.0019397735595703125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 8.0, 7.0, 6.0, 11.0, 21.0, 13.0, 19.0, 18.0, 41.0, 47.0, 54.0, 68.0, 107.0, 203.0, 433.0, 1041.0, 2827.0, 9851.0, 55841.0, 792314.0, 160179.0, 18036.0, 4500.0, 1488.0, 616.0, 244.0, 150.0, 100.0, 70.0, 60.0, 34.0, 29.0, 23.0, 10.0, 7.0, 13.0, 10.0, 6.0, 9.0, 13.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.640625, -17.046630859375, -16.45263671875, -15.858642578125, -15.2646484375, -14.670654296875, -14.07666015625, -13.482666015625, -12.888671875, -12.294677734375, -11.70068359375, -11.106689453125, -10.5126953125, -9.918701171875, -9.32470703125, -8.730712890625, -8.13671875, -7.542724609375, -6.94873046875, -6.354736328125, -5.7607421875, -5.166748046875, -4.57275390625, -3.978759765625, -3.384765625, -2.790771484375, -2.19677734375, -1.602783203125, -1.0087890625, -0.414794921875, 0.17919921875, 0.773193359375, 1.3671875, 1.961181640625, 2.55517578125, 3.149169921875, 3.7431640625, 4.337158203125, 4.93115234375, 5.525146484375, 6.119140625, 6.713134765625, 7.30712890625, 7.901123046875, 8.4951171875, 9.089111328125, 9.68310546875, 10.277099609375, 10.87109375, 11.465087890625, 12.05908203125, 12.653076171875, 13.2470703125, 13.841064453125, 14.43505859375, 15.029052734375, 15.623046875, 16.217041015625, 16.81103515625, 17.405029296875, 17.9990234375, 18.593017578125, 19.18701171875, 19.781005859375, 20.375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 0.0, 5.0, 7.0, 7.0, 9.0, 10.0, 14.0, 18.0, 20.0, 39.0, 33.0, 63.0, 79.0, 98.0, 115.0, 121.0, 89.0, 60.0, 48.0, 29.0, 22.0, 26.0, 19.0, 9.0, 8.0, 4.0, 5.0, 8.0, 9.0, 1.0, 4.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.715576171875, -7.41552734375, -7.115478515625, -6.8154296875, -6.515380859375, -6.21533203125, -5.915283203125, -5.615234375, -5.315185546875, -5.01513671875, -4.715087890625, -4.4150390625, -4.114990234375, -3.81494140625, -3.514892578125, -3.21484375, -2.914794921875, -2.61474609375, -2.314697265625, -2.0146484375, -1.714599609375, -1.41455078125, -1.114501953125, -0.814453125, -0.514404296875, -0.21435546875, 0.085693359375, 0.3857421875, 0.685791015625, 0.98583984375, 1.285888671875, 1.5859375, 1.885986328125, 2.18603515625, 2.486083984375, 2.7861328125, 3.086181640625, 3.38623046875, 3.686279296875, 3.986328125, 4.286376953125, 4.58642578125, 4.886474609375, 5.1865234375, 5.486572265625, 5.78662109375, 6.086669921875, 6.38671875, 6.686767578125, 6.98681640625, 7.286865234375, 7.5869140625, 7.886962890625, 8.18701171875, 8.487060546875, 8.787109375, 9.087158203125, 9.38720703125, 9.687255859375, 9.9873046875, 10.287353515625, 10.58740234375, 10.887451171875, 11.1875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 13.0, 20.0, 55.0, 124.0, 295.0, 253.0, 143.0, 59.0, 22.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-380.28985595703125, -369.3919372558594, -358.4940185546875, -347.5960998535156, -336.69818115234375, -325.8002624511719, -314.90234375, -304.00445556640625, -293.10650634765625, -282.2085876464844, -271.3106689453125, -260.4127502441406, -249.51483154296875, -238.61691284179688, -227.71900939941406, -216.8210906982422, -205.92318725585938, -195.0252685546875, -184.12734985351562, -173.22943115234375, -162.33151245117188, -151.43359375, -140.5356903076172, -129.6377716064453, -118.73985290527344, -107.84193420410156, -96.94401550292969, -86.04610443115234, -75.14818572998047, -64.2502670288086, -53.35235595703125, -42.454437255859375, -31.556488037109375, -20.658571243286133, -9.76065444946289, 1.1372604370117188, 12.035179138183594, 22.93309783935547, 33.83100891113281, 44.72892761230469, 55.62684631347656, 66.52476501464844, 77.42268371582031, 88.32059478759766, 99.21851348876953, 110.1164321899414, 121.01434326171875, 131.91226196289062, 142.8101806640625, 153.70809936523438, 164.60601806640625, 175.50393676757812, 186.40185546875, 197.29977416992188, 208.1976776123047, 219.09559631347656, 229.99351501464844, 240.8914337158203, 251.7893524169922, 262.687255859375, 273.5851745605469, 284.48309326171875, 295.3810119628906, 306.2789306640625, 317.1768493652344]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 5.0, 16.0, 7.0, 17.0, 16.0, 17.0, 22.0, 20.0, 22.0, 28.0, 25.0, 29.0, 40.0, 38.0, 35.0, 33.0, 44.0, 40.0, 41.0, 43.0, 39.0, 31.0, 40.0, 37.0, 39.0, 33.0, 31.0, 33.0, 19.0, 27.0, 17.0, 14.0, 10.0, 9.0, 17.0, 9.0, 6.0, 5.0, 7.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.5389404296875, -80.88429260253906, -78.2296371459961, -75.57498931884766, -72.92034149169922, -70.26568603515625, -67.61103820800781, -64.95639038085938, -62.30173873901367, -59.64708709716797, -56.99243927001953, -54.33778762817383, -51.683135986328125, -49.02848815917969, -46.373836517333984, -43.71918487548828, -41.064537048339844, -38.40988540649414, -35.7552375793457, -33.1005859375, -30.44593620300293, -27.79128646850586, -25.136634826660156, -22.481985092163086, -19.827335357666016, -17.172685623168945, -14.518034934997559, -11.863384246826172, -9.208734512329102, -6.554084777832031, -3.8994340896606445, -1.2447834014892578, 1.4098663330078125, 4.064516544342041, 6.7191667556762695, 9.373817443847656, 12.028467178344727, 14.683116912841797, 17.3377685546875, 19.99241828918457, 22.64706802368164, 25.30171775817871, 27.95636749267578, 30.611019134521484, 33.26567077636719, 35.920318603515625, 38.57497024536133, 41.22962188720703, 43.88426971435547, 46.53892135620117, 49.19356918334961, 51.84822082519531, 54.50286865234375, 57.15752029418945, 59.812171936035156, 62.466819763183594, 65.12147521972656, 67.776123046875, 70.43077850341797, 73.0854263305664, 75.74007415771484, 78.39472961425781, 81.04937744140625, 83.70402526855469, 86.35867309570312]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 3.0, 16.0, 18.0, 17.0, 26.0, 47.0, 64.0, 84.0, 117.0, 187.0, 324.0, 575.0, 1090.0, 2193.0, 5722.0, 19024.0, 174963.0, 3924711.0, 48191.0, 10092.0, 3484.0, 1485.0, 752.0, 395.0, 232.0, 134.0, 97.0, 60.0, 45.0, 33.0, 26.0, 15.0, 13.0, 6.0, 11.0, 3.0, 8.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.53125, -52.8916015625, -51.251953125, -49.6123046875, -47.97265625, -46.3330078125, -44.693359375, -43.0537109375, -41.4140625, -39.7744140625, -38.134765625, -36.4951171875, -34.85546875, -33.2158203125, -31.576171875, -29.9365234375, -28.296875, -26.6572265625, -25.017578125, -23.3779296875, -21.73828125, -20.0986328125, -18.458984375, -16.8193359375, -15.1796875, -13.5400390625, -11.900390625, -10.2607421875, -8.62109375, -6.9814453125, -5.341796875, -3.7021484375, -2.0625, -0.4228515625, 1.216796875, 2.8564453125, 4.49609375, 6.1357421875, 7.775390625, 9.4150390625, 11.0546875, 12.6943359375, 14.333984375, 15.9736328125, 17.61328125, 19.2529296875, 20.892578125, 22.5322265625, 24.171875, 25.8115234375, 27.451171875, 29.0908203125, 30.73046875, 32.3701171875, 34.009765625, 35.6494140625, 37.2890625, 38.9287109375, 40.568359375, 42.2080078125, 43.84765625, 45.4873046875, 47.126953125, 48.7666015625, 50.40625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 4.0, 14.0, 19.0, 15.0, 32.0, 31.0, 51.0, 68.0, 61.0, 54.0, 71.0, 51.0, 99.0, 77.0, 78.0, 53.0, 47.0, 42.0, 35.0, 24.0, 18.0, 19.0, 18.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.9422607421875, -5.743896484375, -5.5455322265625, -5.34716796875, -5.1488037109375, -4.950439453125, -4.7520751953125, -4.5537109375, -4.3553466796875, -4.156982421875, -3.9586181640625, -3.76025390625, -3.5618896484375, -3.363525390625, -3.1651611328125, -2.966796875, -2.7684326171875, -2.570068359375, -2.3717041015625, -2.17333984375, -1.9749755859375, -1.776611328125, -1.5782470703125, -1.3798828125, -1.1815185546875, -0.983154296875, -0.7847900390625, -0.58642578125, -0.3880615234375, -0.189697265625, 0.0086669921875, 0.20703125, 0.4053955078125, 0.603759765625, 0.8021240234375, 1.00048828125, 1.1988525390625, 1.397216796875, 1.5955810546875, 1.7939453125, 1.9923095703125, 2.190673828125, 2.3890380859375, 2.58740234375, 2.7857666015625, 2.984130859375, 3.1824951171875, 3.380859375, 3.5792236328125, 3.777587890625, 3.9759521484375, 4.17431640625, 4.3726806640625, 4.571044921875, 4.7694091796875, 4.9677734375, 5.1661376953125, 5.364501953125, 5.5628662109375, 5.76123046875, 5.9595947265625, 6.157958984375, 6.3563232421875, 6.5546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 15.0, 24.0, 33.0, 64.0, 88.0, 142.0, 303.0, 579.0, 1224.0, 3040.0, 8879.0, 32088.0, 341224.0, 3721804.0, 63056.0, 13914.0, 4493.0, 1704.0, 760.0, 419.0, 170.0, 102.0, 52.0, 35.0, 15.0, 11.0, 16.0, 12.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.28125, -48.8525390625, -47.423828125, -45.9951171875, -44.56640625, -43.1376953125, -41.708984375, -40.2802734375, -38.8515625, -37.4228515625, -35.994140625, -34.5654296875, -33.13671875, -31.7080078125, -30.279296875, -28.8505859375, -27.421875, -25.9931640625, -24.564453125, -23.1357421875, -21.70703125, -20.2783203125, -18.849609375, -17.4208984375, -15.9921875, -14.5634765625, -13.134765625, -11.7060546875, -10.27734375, -8.8486328125, -7.419921875, -5.9912109375, -4.5625, -3.1337890625, -1.705078125, -0.2763671875, 1.15234375, 2.5810546875, 4.009765625, 5.4384765625, 6.8671875, 8.2958984375, 9.724609375, 11.1533203125, 12.58203125, 14.0107421875, 15.439453125, 16.8681640625, 18.296875, 19.7255859375, 21.154296875, 22.5830078125, 24.01171875, 25.4404296875, 26.869140625, 28.2978515625, 29.7265625, 31.1552734375, 32.583984375, 34.0126953125, 35.44140625, 36.8701171875, 38.298828125, 39.7275390625, 41.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 7.0, 11.0, 5.0, 12.0, 21.0, 25.0, 34.0, 61.0, 91.0, 217.0, 1768.0, 1303.0, 242.0, 94.0, 64.0, 30.0, 21.0, 17.0, 11.0, 6.0, 4.0, 9.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.40625, -18.77978515625, -18.1533203125, -17.52685546875, -16.900390625, -16.27392578125, -15.6474609375, -15.02099609375, -14.39453125, -13.76806640625, -13.1416015625, -12.51513671875, -11.888671875, -11.26220703125, -10.6357421875, -10.00927734375, -9.3828125, -8.75634765625, -8.1298828125, -7.50341796875, -6.876953125, -6.25048828125, -5.6240234375, -4.99755859375, -4.37109375, -3.74462890625, -3.1181640625, -2.49169921875, -1.865234375, -1.23876953125, -0.6123046875, 0.01416015625, 0.640625, 1.26708984375, 1.8935546875, 2.52001953125, 3.146484375, 3.77294921875, 4.3994140625, 5.02587890625, 5.65234375, 6.27880859375, 6.9052734375, 7.53173828125, 8.158203125, 8.78466796875, 9.4111328125, 10.03759765625, 10.6640625, 11.29052734375, 11.9169921875, 12.54345703125, 13.169921875, 13.79638671875, 14.4228515625, 15.04931640625, 15.67578125, 16.30224609375, 16.9287109375, 17.55517578125, 18.181640625, 18.80810546875, 19.4345703125, 20.06103515625, 20.6875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 5.0, 8.0, 11.0, 19.0, 19.0, 31.0, 53.0, 94.0, 117.0, 179.0, 177.0, 123.0, 66.0, 40.0, 19.0, 9.0, 11.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-150.4306640625, -147.15330505371094, -143.8759307861328, -140.59857177734375, -137.3212127685547, -134.04383850097656, -130.7664794921875, -127.4891128540039, -124.21174621582031, -120.93437957763672, -117.65702056884766, -114.37965393066406, -111.10228729248047, -107.82492065429688, -104.54756164550781, -101.27019500732422, -97.99282836914062, -94.71546173095703, -91.43810272216797, -88.16073608398438, -84.88336944580078, -81.60600280761719, -78.32864379882812, -75.05127716064453, -71.77391815185547, -68.49655151367188, -65.21919250488281, -61.94182586669922, -58.664459228515625, -55.3870964050293, -52.10973358154297, -48.832366943359375, -45.55500411987305, -42.27764129638672, -39.000274658203125, -35.7229118347168, -32.4455451965332, -29.168182373046875, -25.890817642211914, -22.613452911376953, -19.336088180541992, -16.05872344970703, -12.78135871887207, -9.503994941711426, -6.226630210876465, -2.9492664337158203, 0.3280982971191406, 3.6054630279541016, 6.8828277587890625, 10.160192489624023, 13.437557220458984, 16.714920043945312, 19.992286682128906, 23.269649505615234, 26.547014236450195, 29.824378967285156, 33.10174560546875, 36.37910842895508, 39.65647506713867, 42.933837890625, 46.211204528808594, 49.48856735229492, 52.76593017578125, 56.043296813964844, 59.32065963745117]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 10.0, 12.0, 15.0, 19.0, 17.0, 28.0, 21.0, 23.0, 26.0, 34.0, 24.0, 40.0, 42.0, 46.0, 46.0, 60.0, 60.0, 40.0, 47.0, 46.0, 45.0, 33.0, 48.0, 31.0, 25.0, 23.0, 29.0, 22.0, 21.0, 11.0, 10.0, 7.0, 8.0, 4.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-61.08249282836914, -59.318843841552734, -57.55519104003906, -55.791542053222656, -54.02789306640625, -52.26424026489258, -50.50059127807617, -48.7369384765625, -46.973289489746094, -45.20964050292969, -43.445987701416016, -41.68233871459961, -39.9186897277832, -38.15503692626953, -36.391387939453125, -34.62773895263672, -32.86408996582031, -31.100439071655273, -29.336790084838867, -27.573139190673828, -25.80948829650879, -24.04583740234375, -22.282188415527344, -20.518537521362305, -18.754886627197266, -16.991235733032227, -15.227585792541504, -13.463935852050781, -11.700284957885742, -9.93663501739502, -8.172985076904297, -6.409334182739258, -4.645683288574219, -2.882032871246338, -1.1183826923370361, 0.6452674865722656, 2.4089179039001465, 4.172568321228027, 5.93621826171875, 7.699869155883789, 9.463519096374512, 11.227169036865234, 12.990819931030273, 14.754469871520996, 16.51811981201172, 18.281770706176758, 20.045421600341797, 21.809070587158203, 23.572721481323242, 25.33637237548828, 27.100021362304688, 28.863672256469727, 30.627323150634766, 32.39097213745117, 34.154624938964844, 35.91827392578125, 37.681922912597656, 39.44557189941406, 41.209224700927734, 42.97287368774414, 44.73652267456055, 46.50017547607422, 48.263824462890625, 50.02747344970703, 51.7911262512207]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 5.0, 12.0, 18.0, 20.0, 25.0, 58.0, 72.0, 104.0, 195.0, 364.0, 712.0, 1456.0, 3169.0, 7973.0, 21534.0, 66715.0, 257736.0, 472321.0, 149922.0, 41849.0, 14140.0, 5533.0, 2306.0, 1071.0, 494.0, 273.0, 164.0, 99.0, 68.0, 43.0, 26.0, 24.0, 15.0, 10.0, 9.0, 5.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.03125, -22.217529296875, -21.40380859375, -20.590087890625, -19.7763671875, -18.962646484375, -18.14892578125, -17.335205078125, -16.521484375, -15.707763671875, -14.89404296875, -14.080322265625, -13.2666015625, -12.452880859375, -11.63916015625, -10.825439453125, -10.01171875, -9.197998046875, -8.38427734375, -7.570556640625, -6.7568359375, -5.943115234375, -5.12939453125, -4.315673828125, -3.501953125, -2.688232421875, -1.87451171875, -1.060791015625, -0.2470703125, 0.566650390625, 1.38037109375, 2.194091796875, 3.0078125, 3.821533203125, 4.63525390625, 5.448974609375, 6.2626953125, 7.076416015625, 7.89013671875, 8.703857421875, 9.517578125, 10.331298828125, 11.14501953125, 11.958740234375, 12.7724609375, 13.586181640625, 14.39990234375, 15.213623046875, 16.02734375, 16.841064453125, 17.65478515625, 18.468505859375, 19.2822265625, 20.095947265625, 20.90966796875, 21.723388671875, 22.537109375, 23.350830078125, 24.16455078125, 24.978271484375, 25.7919921875, 26.605712890625, 27.41943359375, 28.233154296875, 29.046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 11.0, 8.0, 14.0, 16.0, 23.0, 27.0, 35.0, 44.0, 55.0, 61.0, 70.0, 67.0, 70.0, 75.0, 76.0, 75.0, 63.0, 39.0, 46.0, 35.0, 30.0, 14.0, 18.0, 13.0, 11.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4140625, -7.18115234375, -6.9482421875, -6.71533203125, -6.482421875, -6.24951171875, -6.0166015625, -5.78369140625, -5.55078125, -5.31787109375, -5.0849609375, -4.85205078125, -4.619140625, -4.38623046875, -4.1533203125, -3.92041015625, -3.6875, -3.45458984375, -3.2216796875, -2.98876953125, -2.755859375, -2.52294921875, -2.2900390625, -2.05712890625, -1.82421875, -1.59130859375, -1.3583984375, -1.12548828125, -0.892578125, -0.65966796875, -0.4267578125, -0.19384765625, 0.0390625, 0.27197265625, 0.5048828125, 0.73779296875, 0.970703125, 1.20361328125, 1.4365234375, 1.66943359375, 1.90234375, 2.13525390625, 2.3681640625, 2.60107421875, 2.833984375, 3.06689453125, 3.2998046875, 3.53271484375, 3.765625, 3.99853515625, 4.2314453125, 4.46435546875, 4.697265625, 4.93017578125, 5.1630859375, 5.39599609375, 5.62890625, 5.86181640625, 6.0947265625, 6.32763671875, 6.560546875, 6.79345703125, 7.0263671875, 7.25927734375, 7.4921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 15.0, 15.0, 17.0, 30.0, 40.0, 47.0, 61.0, 81.0, 103.0, 147.0, 221.0, 355.0, 583.0, 1239.0, 4257.0, 27456.0, 419118.0, 551578.0, 35058.0, 4888.0, 1398.0, 598.0, 374.0, 225.0, 141.0, 129.0, 83.0, 57.0, 49.0, 29.0, 38.0, 23.0, 16.0, 6.0, 14.0, 6.0, 3.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.78125, -50.11376953125, -48.4462890625, -46.77880859375, -45.111328125, -43.44384765625, -41.7763671875, -40.10888671875, -38.44140625, -36.77392578125, -35.1064453125, -33.43896484375, -31.771484375, -30.10400390625, -28.4365234375, -26.76904296875, -25.1015625, -23.43408203125, -21.7666015625, -20.09912109375, -18.431640625, -16.76416015625, -15.0966796875, -13.42919921875, -11.76171875, -10.09423828125, -8.4267578125, -6.75927734375, -5.091796875, -3.42431640625, -1.7568359375, -0.08935546875, 1.578125, 3.24560546875, 4.9130859375, 6.58056640625, 8.248046875, 9.91552734375, 11.5830078125, 13.25048828125, 14.91796875, 16.58544921875, 18.2529296875, 19.92041015625, 21.587890625, 23.25537109375, 24.9228515625, 26.59033203125, 28.2578125, 29.92529296875, 31.5927734375, 33.26025390625, 34.927734375, 36.59521484375, 38.2626953125, 39.93017578125, 41.59765625, 43.26513671875, 44.9326171875, 46.60009765625, 48.267578125, 49.93505859375, 51.6025390625, 53.27001953125, 54.9375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 10.0, 7.0, 5.0, 9.0, 13.0, 12.0, 26.0, 19.0, 19.0, 27.0, 35.0, 23.0, 41.0, 39.0, 38.0, 34.0, 41.0, 55.0, 37.0, 46.0, 47.0, 36.0, 45.0, 30.0, 47.0, 29.0, 35.0, 33.0, 23.0, 18.0, 25.0, 16.0, 17.0, 10.0, 10.0, 16.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.15625, -23.38330078125, -22.6103515625, -21.83740234375, -21.064453125, -20.29150390625, -19.5185546875, -18.74560546875, -17.97265625, -17.19970703125, -16.4267578125, -15.65380859375, -14.880859375, -14.10791015625, -13.3349609375, -12.56201171875, -11.7890625, -11.01611328125, -10.2431640625, -9.47021484375, -8.697265625, -7.92431640625, -7.1513671875, -6.37841796875, -5.60546875, -4.83251953125, -4.0595703125, -3.28662109375, -2.513671875, -1.74072265625, -0.9677734375, -0.19482421875, 0.578125, 1.35107421875, 2.1240234375, 2.89697265625, 3.669921875, 4.44287109375, 5.2158203125, 5.98876953125, 6.76171875, 7.53466796875, 8.3076171875, 9.08056640625, 9.853515625, 10.62646484375, 11.3994140625, 12.17236328125, 12.9453125, 13.71826171875, 14.4912109375, 15.26416015625, 16.037109375, 16.81005859375, 17.5830078125, 18.35595703125, 19.12890625, 19.90185546875, 20.6748046875, 21.44775390625, 22.220703125, 22.99365234375, 23.7666015625, 24.53955078125, 25.3125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 5.0, 5.0, 15.0, 7.0, 19.0, 17.0, 20.0, 36.0, 50.0, 68.0, 109.0, 141.0, 257.0, 472.0, 795.0, 1281.0, 2784.0, 6420.0, 19391.0, 109294.0, 712339.0, 156797.0, 23914.0, 7630.0, 3078.0, 1487.0, 792.0, 478.0, 270.0, 160.0, 118.0, 79.0, 42.0, 31.0, 34.0, 25.0, 23.0, 14.0, 14.0, 9.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.125, -19.525634765625, -18.92626953125, -18.326904296875, -17.7275390625, -17.128173828125, -16.52880859375, -15.929443359375, -15.330078125, -14.730712890625, -14.13134765625, -13.531982421875, -12.9326171875, -12.333251953125, -11.73388671875, -11.134521484375, -10.53515625, -9.935791015625, -9.33642578125, -8.737060546875, -8.1376953125, -7.538330078125, -6.93896484375, -6.339599609375, -5.740234375, -5.140869140625, -4.54150390625, -3.942138671875, -3.3427734375, -2.743408203125, -2.14404296875, -1.544677734375, -0.9453125, -0.345947265625, 0.25341796875, 0.852783203125, 1.4521484375, 2.051513671875, 2.65087890625, 3.250244140625, 3.849609375, 4.448974609375, 5.04833984375, 5.647705078125, 6.2470703125, 6.846435546875, 7.44580078125, 8.045166015625, 8.64453125, 9.243896484375, 9.84326171875, 10.442626953125, 11.0419921875, 11.641357421875, 12.24072265625, 12.840087890625, 13.439453125, 14.038818359375, 14.63818359375, 15.237548828125, 15.8369140625, 16.436279296875, 17.03564453125, 17.635009765625, 18.234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 3.0, 13.0, 14.0, 12.0, 19.0, 23.0, 34.0, 61.0, 97.0, 144.0, 173.0, 114.0, 79.0, 59.0, 30.0, 24.0, 17.0, 10.0, 14.0, 10.0, 8.0, 4.0, 1.0, 2.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.00334930419921875, -0.003263711929321289, -0.003178119659423828, -0.003092527389526367, -0.0030069351196289062, -0.0029213428497314453, -0.0028357505798339844, -0.0027501583099365234, -0.0026645660400390625, -0.0025789737701416016, -0.0024933815002441406, -0.0024077892303466797, -0.0023221969604492188, -0.002236604690551758, -0.002151012420654297, -0.002065420150756836, -0.001979827880859375, -0.001894235610961914, -0.0018086433410644531, -0.0017230510711669922, -0.0016374588012695312, -0.0015518665313720703, -0.0014662742614746094, -0.0013806819915771484, -0.0012950897216796875, -0.0012094974517822266, -0.0011239051818847656, -0.0010383129119873047, -0.0009527206420898438, -0.0008671283721923828, -0.0007815361022949219, -0.0006959438323974609, -0.0006103515625, -0.0005247592926025391, -0.0004391670227050781, -0.0003535747528076172, -0.00026798248291015625, -0.0001823902130126953, -9.679794311523438e-05, -1.1205673217773438e-05, 7.43865966796875e-05, 0.00015997886657714844, 0.0002455711364746094, 0.0003311634063720703, 0.00041675567626953125, 0.0005023479461669922, 0.0005879402160644531, 0.0006735324859619141, 0.000759124755859375, 0.0008447170257568359, 0.0009303092956542969, 0.0010159015655517578, 0.0011014938354492188, 0.0011870861053466797, 0.0012726783752441406, 0.0013582706451416016, 0.0014438629150390625, 0.0015294551849365234, 0.0016150474548339844, 0.0017006397247314453, 0.0017862319946289062, 0.0018718242645263672, 0.001957416534423828, 0.002043008804321289, 0.00212860107421875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 7.0, 8.0, 15.0, 19.0, 27.0, 38.0, 54.0, 69.0, 93.0, 200.0, 480.0, 1341.0, 5880.0, 55713.0, 915459.0, 60498.0, 6193.0, 1437.0, 430.0, 214.0, 111.0, 73.0, 51.0, 28.0, 21.0, 20.0, 12.0, 11.0, 10.0, 7.0, 6.0, 7.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.25927734375, -34.1748046875, -33.09033203125, -32.005859375, -30.92138671875, -29.8369140625, -28.75244140625, -27.66796875, -26.58349609375, -25.4990234375, -24.41455078125, -23.330078125, -22.24560546875, -21.1611328125, -20.07666015625, -18.9921875, -17.90771484375, -16.8232421875, -15.73876953125, -14.654296875, -13.56982421875, -12.4853515625, -11.40087890625, -10.31640625, -9.23193359375, -8.1474609375, -7.06298828125, -5.978515625, -4.89404296875, -3.8095703125, -2.72509765625, -1.640625, -0.55615234375, 0.5283203125, 1.61279296875, 2.697265625, 3.78173828125, 4.8662109375, 5.95068359375, 7.03515625, 8.11962890625, 9.2041015625, 10.28857421875, 11.373046875, 12.45751953125, 13.5419921875, 14.62646484375, 15.7109375, 16.79541015625, 17.8798828125, 18.96435546875, 20.048828125, 21.13330078125, 22.2177734375, 23.30224609375, 24.38671875, 25.47119140625, 26.5556640625, 27.64013671875, 28.724609375, 29.80908203125, 30.8935546875, 31.97802734375, 33.0625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 7.0, 5.0, 6.0, 7.0, 10.0, 11.0, 20.0, 19.0, 32.0, 55.0, 59.0, 86.0, 97.0, 105.0, 76.0, 91.0, 88.0, 57.0, 40.0, 35.0, 23.0, 10.0, 13.0, 8.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.859375, -14.4058837890625, -13.952392578125, -13.4989013671875, -13.04541015625, -12.5919189453125, -12.138427734375, -11.6849365234375, -11.2314453125, -10.7779541015625, -10.324462890625, -9.8709716796875, -9.41748046875, -8.9639892578125, -8.510498046875, -8.0570068359375, -7.603515625, -7.1500244140625, -6.696533203125, -6.2430419921875, -5.78955078125, -5.3360595703125, -4.882568359375, -4.4290771484375, -3.9755859375, -3.5220947265625, -3.068603515625, -2.6151123046875, -2.16162109375, -1.7081298828125, -1.254638671875, -0.8011474609375, -0.34765625, 0.1058349609375, 0.559326171875, 1.0128173828125, 1.46630859375, 1.9197998046875, 2.373291015625, 2.8267822265625, 3.2802734375, 3.7337646484375, 4.187255859375, 4.6407470703125, 5.09423828125, 5.5477294921875, 6.001220703125, 6.4547119140625, 6.908203125, 7.3616943359375, 7.815185546875, 8.2686767578125, 8.72216796875, 9.1756591796875, 9.629150390625, 10.0826416015625, 10.5361328125, 10.9896240234375, 11.443115234375, 11.8966064453125, 12.35009765625, 12.8035888671875, 13.257080078125, 13.7105712890625, 14.1640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 13.0, 19.0, 63.0, 130.0, 227.0, 228.0, 176.0, 82.0, 37.0, 20.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-320.11517333984375, -307.8360900878906, -295.5569763183594, -283.27789306640625, -270.9988098144531, -258.7196960449219, -246.44061279296875, -234.16151428222656, -221.88241577148438, -209.6033172607422, -197.32423400878906, -185.04513549804688, -172.7660369873047, -160.4869384765625, -148.20785522460938, -135.9287567138672, -123.64967346191406, -111.3705825805664, -99.09148406982422, -86.81239318847656, -74.53329467773438, -62.25420379638672, -49.97511291503906, -37.696014404296875, -25.41692352294922, -13.137829780578613, -0.8587360382080078, 11.420356750488281, 23.699451446533203, 35.978546142578125, 48.25763702392578, 60.53673553466797, 72.81582641601562, 85.09491729736328, 97.37401580810547, 109.65310668945312, 121.93220520019531, 134.2113037109375, 146.49038696289062, 158.7694854736328, 171.048583984375, 183.3276824951172, 195.6067657470703, 207.8858642578125, 220.1649627685547, 232.44406127929688, 244.72314453125, 257.00225830078125, 269.28131103515625, 281.5603942871094, 293.8395080566406, 306.11859130859375, 318.3976745605469, 330.6767883300781, 342.95587158203125, 355.2349853515625, 367.5140686035156, 379.79315185546875, 392.072265625, 404.3513488769531, 416.63043212890625, 428.9095458984375, 441.1886291503906, 453.46771240234375, 465.746826171875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 7.0, 12.0, 6.0, 8.0, 15.0, 23.0, 22.0, 29.0, 21.0, 29.0, 32.0, 33.0, 36.0, 39.0, 38.0, 58.0, 45.0, 43.0, 49.0, 49.0, 45.0, 42.0, 43.0, 44.0, 32.0, 27.0, 28.0, 23.0, 13.0, 19.0, 16.0, 9.0, 12.0, 8.0, 6.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.15899658203125, -124.89854431152344, -120.63809204101562, -116.37763214111328, -112.11717987060547, -107.85672760009766, -103.59626770019531, -99.3358154296875, -95.07536315917969, -90.81491088867188, -86.55445861816406, -82.29399871826172, -78.0335464477539, -73.7730941772461, -69.51263427734375, -65.25218200683594, -60.991729736328125, -56.73127746582031, -52.470821380615234, -48.210365295410156, -43.949913024902344, -39.68946075439453, -35.42900466918945, -31.168550491333008, -26.908096313476562, -22.647642135620117, -18.387187957763672, -14.126733779907227, -9.866279602050781, -5.605825424194336, -1.3453712463378906, 2.9150829315185547, 7.175537109375, 11.435991287231445, 15.69644546508789, 19.956899642944336, 24.21735382080078, 28.477807998657227, 32.73826217651367, 36.99871826171875, 41.25917053222656, 45.519622802734375, 49.78007888793945, 54.04053497314453, 58.300987243652344, 62.561439514160156, 66.8218994140625, 71.08235168457031, 75.34280395507812, 79.60325622558594, 83.86370849609375, 88.1241683959961, 92.3846206665039, 96.64507293701172, 100.90553283691406, 105.16598510742188, 109.42643737792969, 113.6868896484375, 117.94734191894531, 122.20780181884766, 126.46825408935547, 130.7287139892578, 134.98916625976562, 139.24961853027344, 143.51007080078125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 5.0, 11.0, 14.0, 23.0, 36.0, 102.0, 145.0, 275.0, 641.0, 1827.0, 10886.0, 4168204.0, 9183.0, 1744.0, 604.0, 294.0, 132.0, 66.0, 37.0, 19.0, 14.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.1875, -91.1943359375, -88.201171875, -85.2080078125, -82.21484375, -79.2216796875, -76.228515625, -73.2353515625, -70.2421875, -67.2490234375, -64.255859375, -61.2626953125, -58.26953125, -55.2763671875, -52.283203125, -49.2900390625, -46.296875, -43.3037109375, -40.310546875, -37.3173828125, -34.32421875, -31.3310546875, -28.337890625, -25.3447265625, -22.3515625, -19.3583984375, -16.365234375, -13.3720703125, -10.37890625, -7.3857421875, -4.392578125, -1.3994140625, 1.59375, 4.5869140625, 7.580078125, 10.5732421875, 13.56640625, 16.5595703125, 19.552734375, 22.5458984375, 25.5390625, 28.5322265625, 31.525390625, 34.5185546875, 37.51171875, 40.5048828125, 43.498046875, 46.4912109375, 49.484375, 52.4775390625, 55.470703125, 58.4638671875, 61.45703125, 64.4501953125, 67.443359375, 70.4365234375, 73.4296875, 76.4228515625, 79.416015625, 82.4091796875, 85.40234375, 88.3955078125, 91.388671875, 94.3818359375, 97.375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 9.0, 5.0, 5.0, 8.0, 10.0, 23.0, 19.0, 20.0, 27.0, 28.0, 57.0, 49.0, 51.0, 49.0, 72.0, 67.0, 81.0, 60.0, 66.0, 44.0, 53.0, 39.0, 27.0, 27.0, 28.0, 18.0, 19.0, 18.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.57421875, -7.33538818359375, -7.0965576171875, -6.85772705078125, -6.618896484375, -6.38006591796875, -6.1412353515625, -5.90240478515625, -5.66357421875, -5.42474365234375, -5.1859130859375, -4.94708251953125, -4.708251953125, -4.46942138671875, -4.2305908203125, -3.99176025390625, -3.7529296875, -3.51409912109375, -3.2752685546875, -3.03643798828125, -2.797607421875, -2.55877685546875, -2.3199462890625, -2.08111572265625, -1.84228515625, -1.60345458984375, -1.3646240234375, -1.12579345703125, -0.886962890625, -0.64813232421875, -0.4093017578125, -0.17047119140625, 0.068359375, 0.30718994140625, 0.5460205078125, 0.78485107421875, 1.023681640625, 1.26251220703125, 1.5013427734375, 1.74017333984375, 1.97900390625, 2.21783447265625, 2.4566650390625, 2.69549560546875, 2.934326171875, 3.17315673828125, 3.4119873046875, 3.65081787109375, 3.8896484375, 4.12847900390625, 4.3673095703125, 4.60614013671875, 4.844970703125, 5.08380126953125, 5.3226318359375, 5.56146240234375, 5.80029296875, 6.03912353515625, 6.2779541015625, 6.51678466796875, 6.755615234375, 6.99444580078125, 7.2332763671875, 7.47210693359375, 7.7109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 10.0, 7.0, 11.0, 19.0, 19.0, 20.0, 29.0, 53.0, 69.0, 90.0, 103.0, 143.0, 221.0, 316.0, 499.0, 799.0, 1273.0, 2362.0, 4789.0, 13329.0, 160348.0, 3977003.0, 19676.0, 6101.0, 2759.0, 1548.0, 887.0, 557.0, 367.0, 238.0, 181.0, 102.0, 82.0, 64.0, 48.0, 30.0, 31.0, 18.0, 15.0, 13.0, 9.0, 12.0, 5.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-38.65625, -37.453125, -36.25, -35.046875, -33.84375, -32.640625, -31.4375, -30.234375, -29.03125, -27.828125, -26.625, -25.421875, -24.21875, -23.015625, -21.8125, -20.609375, -19.40625, -18.203125, -17.0, -15.796875, -14.59375, -13.390625, -12.1875, -10.984375, -9.78125, -8.578125, -7.375, -6.171875, -4.96875, -3.765625, -2.5625, -1.359375, -0.15625, 1.046875, 2.25, 3.453125, 4.65625, 5.859375, 7.0625, 8.265625, 9.46875, 10.671875, 11.875, 13.078125, 14.28125, 15.484375, 16.6875, 17.890625, 19.09375, 20.296875, 21.5, 22.703125, 23.90625, 25.109375, 26.3125, 27.515625, 28.71875, 29.921875, 31.125, 32.328125, 33.53125, 34.734375, 35.9375, 37.140625, 38.34375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 6.0, 6.0, 13.0, 25.0, 64.0, 3155.0, 677.0, 62.0, 26.0, 6.0, 10.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.387939453125, -8.06494140625, -7.741943359375, -7.4189453125, -7.095947265625, -6.77294921875, -6.449951171875, -6.126953125, -5.803955078125, -5.48095703125, -5.157958984375, -4.8349609375, -4.511962890625, -4.18896484375, -3.865966796875, -3.54296875, -3.219970703125, -2.89697265625, -2.573974609375, -2.2509765625, -1.927978515625, -1.60498046875, -1.281982421875, -0.958984375, -0.635986328125, -0.31298828125, 0.010009765625, 0.3330078125, 0.656005859375, 0.97900390625, 1.302001953125, 1.625, 1.947998046875, 2.27099609375, 2.593994140625, 2.9169921875, 3.239990234375, 3.56298828125, 3.885986328125, 4.208984375, 4.531982421875, 4.85498046875, 5.177978515625, 5.5009765625, 5.823974609375, 6.14697265625, 6.469970703125, 6.79296875, 7.115966796875, 7.43896484375, 7.761962890625, 8.0849609375, 8.407958984375, 8.73095703125, 9.053955078125, 9.376953125, 9.699951171875, 10.02294921875, 10.345947265625, 10.6689453125, 10.991943359375, 11.31494140625, 11.637939453125, 11.9609375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 12.0, 20.0, 36.0, 64.0, 98.0, 159.0, 204.0, 164.0, 100.0, 60.0, 40.0, 16.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.77932357788086, -44.521324157714844, -43.26332473754883, -42.00532531738281, -40.74732971191406, -39.48933029174805, -38.23133087158203, -36.973331451416016, -35.71533203125, -34.457332611083984, -33.19933319091797, -31.941335678100586, -30.68333625793457, -29.425338745117188, -28.167339324951172, -26.909339904785156, -25.651342391967773, -24.393342971801758, -23.135345458984375, -21.87734603881836, -20.619346618652344, -19.361347198486328, -18.103349685668945, -16.84535026550293, -15.58735179901123, -14.329353332519531, -13.071353912353516, -11.813355445861816, -10.555356979370117, -9.297357559204102, -8.039359092712402, -6.781359672546387, -5.5233612060546875, -4.26536226272583, -3.0073635578155518, -1.7493648529052734, -0.491365909576416, 0.7666330337524414, 2.0246315002441406, 3.2826309204101562, 4.5406293869018555, 5.798628330230713, 7.05662727355957, 8.31462574005127, 9.572624206542969, 10.830623626708984, 12.088622093200684, 13.3466215133667, 14.604619979858398, 15.862618446350098, 17.120616912841797, 18.378616333007812, 19.636615753173828, 20.894615173339844, 22.152612686157227, 23.410612106323242, 24.668609619140625, 25.92660903930664, 27.184606552124023, 28.44260597229004, 29.700605392456055, 30.958602905273438, 32.21660232543945, 33.47460174560547, 34.732601165771484]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 4.0, 9.0, 8.0, 7.0, 4.0, 10.0, 12.0, 11.0, 18.0, 22.0, 26.0, 25.0, 25.0, 22.0, 40.0, 49.0, 37.0, 35.0, 37.0, 51.0, 35.0, 39.0, 49.0, 35.0, 57.0, 38.0, 42.0, 51.0, 26.0, 27.0, 20.0, 25.0, 24.0, 17.0, 7.0, 16.0, 9.0, 11.0, 8.0, 8.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.897716522216797, -12.425738334655762, -11.953760147094727, -11.481782913208008, -11.009804725646973, -10.537826538085938, -10.065848350524902, -9.593870162963867, -9.121892929077148, -8.649914741516113, -8.177936553955078, -7.705958843231201, -7.233981132507324, -6.762002944946289, -6.290024757385254, -5.818046569824219, -5.346068382263184, -4.874090194702148, -4.4021124839782715, -3.9301342964172363, -3.4581563472747803, -2.986178398132324, -2.514200210571289, -2.042222261428833, -1.570244312286377, -1.098266363143921, -0.6262882947921753, -0.1543102264404297, 0.31766772270202637, 0.7896456718444824, 1.2616238594055176, 1.7336018085479736, 2.2055797576904297, 2.6775577068328857, 3.149535655975342, 3.621513843536377, 4.093491554260254, 4.565469741821289, 5.037447929382324, 5.509426116943359, 5.981403827667236, 6.4533820152282715, 6.925359725952148, 7.397337913513184, 7.869316101074219, 8.341293334960938, 8.813272476196289, 9.285249710083008, 9.757227897644043, 10.229206085205078, 10.701184272766113, 11.173162460327148, 11.645139694213867, 12.117117881774902, 12.589096069335938, 13.061074256896973, 13.533052444458008, 14.005030632019043, 14.477008819580078, 14.948986053466797, 15.420964241027832, 15.892942428588867, 16.36492156982422, 16.836898803710938, 17.308876037597656]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 13.0, 16.0, 26.0, 34.0, 58.0, 96.0, 159.0, 265.0, 581.0, 1106.0, 2532.0, 6165.0, 16490.0, 49701.0, 163778.0, 419189.0, 264608.0, 81730.0, 26022.0, 9232.0, 3551.0, 1499.0, 762.0, 368.0, 209.0, 138.0, 66.0, 54.0, 29.0, 21.0, 19.0, 8.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.484375, -23.73583984375, -22.9873046875, -22.23876953125, -21.490234375, -20.74169921875, -19.9931640625, -19.24462890625, -18.49609375, -17.74755859375, -16.9990234375, -16.25048828125, -15.501953125, -14.75341796875, -14.0048828125, -13.25634765625, -12.5078125, -11.75927734375, -11.0107421875, -10.26220703125, -9.513671875, -8.76513671875, -8.0166015625, -7.26806640625, -6.51953125, -5.77099609375, -5.0224609375, -4.27392578125, -3.525390625, -2.77685546875, -2.0283203125, -1.27978515625, -0.53125, 0.21728515625, 0.9658203125, 1.71435546875, 2.462890625, 3.21142578125, 3.9599609375, 4.70849609375, 5.45703125, 6.20556640625, 6.9541015625, 7.70263671875, 8.451171875, 9.19970703125, 9.9482421875, 10.69677734375, 11.4453125, 12.19384765625, 12.9423828125, 13.69091796875, 14.439453125, 15.18798828125, 15.9365234375, 16.68505859375, 17.43359375, 18.18212890625, 18.9306640625, 19.67919921875, 20.427734375, 21.17626953125, 21.9248046875, 22.67333984375, 23.421875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 4.0, 4.0, 6.0, 13.0, 13.0, 17.0, 18.0, 31.0, 29.0, 33.0, 44.0, 51.0, 34.0, 47.0, 53.0, 66.0, 71.0, 65.0, 53.0, 55.0, 42.0, 41.0, 43.0, 28.0, 28.0, 15.0, 24.0, 20.0, 17.0, 11.0, 12.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.57421875, -7.33135986328125, -7.0885009765625, -6.84564208984375, -6.602783203125, -6.35992431640625, -6.1170654296875, -5.87420654296875, -5.63134765625, -5.38848876953125, -5.1456298828125, -4.90277099609375, -4.659912109375, -4.41705322265625, -4.1741943359375, -3.93133544921875, -3.6884765625, -3.44561767578125, -3.2027587890625, -2.95989990234375, -2.717041015625, -2.47418212890625, -2.2313232421875, -1.98846435546875, -1.74560546875, -1.50274658203125, -1.2598876953125, -1.01702880859375, -0.774169921875, -0.53131103515625, -0.2884521484375, -0.04559326171875, 0.197265625, 0.44012451171875, 0.6829833984375, 0.92584228515625, 1.168701171875, 1.41156005859375, 1.6544189453125, 1.89727783203125, 2.14013671875, 2.38299560546875, 2.6258544921875, 2.86871337890625, 3.111572265625, 3.35443115234375, 3.5972900390625, 3.84014892578125, 4.0830078125, 4.32586669921875, 4.5687255859375, 4.81158447265625, 5.054443359375, 5.29730224609375, 5.5401611328125, 5.78302001953125, 6.02587890625, 6.26873779296875, 6.5115966796875, 6.75445556640625, 6.997314453125, 7.24017333984375, 7.4830322265625, 7.72589111328125, 7.96875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 2.0, 4.0, 6.0, 13.0, 9.0, 13.0, 19.0, 17.0, 27.0, 53.0, 55.0, 83.0, 109.0, 139.0, 164.0, 286.0, 416.0, 718.0, 1776.0, 9574.0, 155299.0, 817367.0, 54221.0, 5024.0, 1250.0, 607.0, 362.0, 250.0, 189.0, 132.0, 78.0, 71.0, 47.0, 38.0, 39.0, 25.0, 11.0, 15.0, 11.0, 12.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-63.125, -61.1728515625, -59.220703125, -57.2685546875, -55.31640625, -53.3642578125, -51.412109375, -49.4599609375, -47.5078125, -45.5556640625, -43.603515625, -41.6513671875, -39.69921875, -37.7470703125, -35.794921875, -33.8427734375, -31.890625, -29.9384765625, -27.986328125, -26.0341796875, -24.08203125, -22.1298828125, -20.177734375, -18.2255859375, -16.2734375, -14.3212890625, -12.369140625, -10.4169921875, -8.46484375, -6.5126953125, -4.560546875, -2.6083984375, -0.65625, 1.2958984375, 3.248046875, 5.2001953125, 7.15234375, 9.1044921875, 11.056640625, 13.0087890625, 14.9609375, 16.9130859375, 18.865234375, 20.8173828125, 22.76953125, 24.7216796875, 26.673828125, 28.6259765625, 30.578125, 32.5302734375, 34.482421875, 36.4345703125, 38.38671875, 40.3388671875, 42.291015625, 44.2431640625, 46.1953125, 48.1474609375, 50.099609375, 52.0517578125, 54.00390625, 55.9560546875, 57.908203125, 59.8603515625, 61.8125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 5.0, 6.0, 11.0, 8.0, 16.0, 16.0, 23.0, 27.0, 30.0, 21.0, 29.0, 40.0, 39.0, 40.0, 40.0, 44.0, 54.0, 41.0, 52.0, 48.0, 47.0, 37.0, 43.0, 42.0, 28.0, 39.0, 27.0, 25.0, 28.0, 18.0, 10.0, 10.0, 12.0, 10.0, 10.0, 0.0, 6.0, 1.0, 6.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.4375, -30.44140625, -29.4453125, -28.44921875, -27.453125, -26.45703125, -25.4609375, -24.46484375, -23.46875, -22.47265625, -21.4765625, -20.48046875, -19.484375, -18.48828125, -17.4921875, -16.49609375, -15.5, -14.50390625, -13.5078125, -12.51171875, -11.515625, -10.51953125, -9.5234375, -8.52734375, -7.53125, -6.53515625, -5.5390625, -4.54296875, -3.546875, -2.55078125, -1.5546875, -0.55859375, 0.4375, 1.43359375, 2.4296875, 3.42578125, 4.421875, 5.41796875, 6.4140625, 7.41015625, 8.40625, 9.40234375, 10.3984375, 11.39453125, 12.390625, 13.38671875, 14.3828125, 15.37890625, 16.375, 17.37109375, 18.3671875, 19.36328125, 20.359375, 21.35546875, 22.3515625, 23.34765625, 24.34375, 25.33984375, 26.3359375, 27.33203125, 28.328125, 29.32421875, 30.3203125, 31.31640625, 32.3125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 14.0, 16.0, 21.0, 43.0, 58.0, 103.0, 139.0, 220.0, 428.0, 704.0, 1301.0, 2835.0, 6416.0, 17495.0, 64162.0, 332388.0, 486468.0, 96386.0, 23973.0, 8317.0, 3435.0, 1617.0, 842.0, 457.0, 267.0, 148.0, 90.0, 61.0, 51.0, 34.0, 16.0, 8.0, 12.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3828125, -11.028564453125, -10.67431640625, -10.320068359375, -9.9658203125, -9.611572265625, -9.25732421875, -8.903076171875, -8.548828125, -8.194580078125, -7.84033203125, -7.486083984375, -7.1318359375, -6.777587890625, -6.42333984375, -6.069091796875, -5.71484375, -5.360595703125, -5.00634765625, -4.652099609375, -4.2978515625, -3.943603515625, -3.58935546875, -3.235107421875, -2.880859375, -2.526611328125, -2.17236328125, -1.818115234375, -1.4638671875, -1.109619140625, -0.75537109375, -0.401123046875, -0.046875, 0.307373046875, 0.66162109375, 1.015869140625, 1.3701171875, 1.724365234375, 2.07861328125, 2.432861328125, 2.787109375, 3.141357421875, 3.49560546875, 3.849853515625, 4.2041015625, 4.558349609375, 4.91259765625, 5.266845703125, 5.62109375, 5.975341796875, 6.32958984375, 6.683837890625, 7.0380859375, 7.392333984375, 7.74658203125, 8.100830078125, 8.455078125, 8.809326171875, 9.16357421875, 9.517822265625, 9.8720703125, 10.226318359375, 10.58056640625, 10.934814453125, 11.2890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 10.0, 13.0, 12.0, 12.0, 15.0, 21.0, 32.0, 47.0, 74.0, 79.0, 88.0, 95.0, 75.0, 76.0, 80.0, 50.0, 40.0, 42.0, 20.0, 18.0, 15.0, 16.0, 15.0, 5.0, 7.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0019330978393554688, -0.0018727779388427734, -0.0018124580383300781, -0.0017521381378173828, -0.0016918182373046875, -0.0016314983367919922, -0.0015711784362792969, -0.0015108585357666016, -0.0014505386352539062, -0.001390218734741211, -0.0013298988342285156, -0.0012695789337158203, -0.001209259033203125, -0.0011489391326904297, -0.0010886192321777344, -0.001028299331665039, -0.0009679794311523438, -0.0009076595306396484, -0.0008473396301269531, -0.0007870197296142578, -0.0007266998291015625, -0.0006663799285888672, -0.0006060600280761719, -0.0005457401275634766, -0.00048542022705078125, -0.00042510032653808594, -0.0003647804260253906, -0.0003044605255126953, -0.000244140625, -0.0001838207244873047, -0.00012350082397460938, -6.318092346191406e-05, -2.86102294921875e-06, 5.745887756347656e-05, 0.00011777877807617188, 0.0001780986785888672, 0.0002384185791015625, 0.0002987384796142578, 0.0003590583801269531, 0.00041937828063964844, 0.00047969818115234375, 0.0005400180816650391, 0.0006003379821777344, 0.0006606578826904297, 0.000720977783203125, 0.0007812976837158203, 0.0008416175842285156, 0.0009019374847412109, 0.0009622573852539062, 0.0010225772857666016, 0.0010828971862792969, 0.0011432170867919922, 0.0012035369873046875, 0.0012638568878173828, 0.0013241767883300781, 0.0013844966888427734, 0.0014448165893554688, 0.001505136489868164, 0.0015654563903808594, 0.0016257762908935547, 0.00168609619140625, 0.0017464160919189453, 0.0018067359924316406, 0.001867055892944336, 0.0019273757934570312]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 6.0, 7.0, 16.0, 11.0, 18.0, 26.0, 60.0, 88.0, 151.0, 241.0, 529.0, 1172.0, 3606.0, 22614.0, 703027.0, 299908.0, 12556.0, 2646.0, 931.0, 432.0, 203.0, 95.0, 71.0, 41.0, 30.0, 16.0, 11.0, 3.0, 10.0, 4.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.8251953125, -23.994140625, -23.1630859375, -22.33203125, -21.5009765625, -20.669921875, -19.8388671875, -19.0078125, -18.1767578125, -17.345703125, -16.5146484375, -15.68359375, -14.8525390625, -14.021484375, -13.1904296875, -12.359375, -11.5283203125, -10.697265625, -9.8662109375, -9.03515625, -8.2041015625, -7.373046875, -6.5419921875, -5.7109375, -4.8798828125, -4.048828125, -3.2177734375, -2.38671875, -1.5556640625, -0.724609375, 0.1064453125, 0.9375, 1.7685546875, 2.599609375, 3.4306640625, 4.26171875, 5.0927734375, 5.923828125, 6.7548828125, 7.5859375, 8.4169921875, 9.248046875, 10.0791015625, 10.91015625, 11.7412109375, 12.572265625, 13.4033203125, 14.234375, 15.0654296875, 15.896484375, 16.7275390625, 17.55859375, 18.3896484375, 19.220703125, 20.0517578125, 20.8828125, 21.7138671875, 22.544921875, 23.3759765625, 24.20703125, 25.0380859375, 25.869140625, 26.7001953125, 27.53125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 3.0, 8.0, 9.0, 10.0, 21.0, 26.0, 43.0, 61.0, 77.0, 91.0, 107.0, 95.0, 112.0, 99.0, 80.0, 48.0, 40.0, 26.0, 14.0, 12.0, 8.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.0625, -17.5823974609375, -17.102294921875, -16.6221923828125, -16.14208984375, -15.6619873046875, -15.181884765625, -14.7017822265625, -14.2216796875, -13.7415771484375, -13.261474609375, -12.7813720703125, -12.30126953125, -11.8211669921875, -11.341064453125, -10.8609619140625, -10.380859375, -9.9007568359375, -9.420654296875, -8.9405517578125, -8.46044921875, -7.9803466796875, -7.500244140625, -7.0201416015625, -6.5400390625, -6.0599365234375, -5.579833984375, -5.0997314453125, -4.61962890625, -4.1395263671875, -3.659423828125, -3.1793212890625, -2.69921875, -2.2191162109375, -1.739013671875, -1.2589111328125, -0.77880859375, -0.2987060546875, 0.181396484375, 0.6614990234375, 1.1416015625, 1.6217041015625, 2.101806640625, 2.5819091796875, 3.06201171875, 3.5421142578125, 4.022216796875, 4.5023193359375, 4.982421875, 5.4625244140625, 5.942626953125, 6.4227294921875, 6.90283203125, 7.3829345703125, 7.863037109375, 8.3431396484375, 8.8232421875, 9.3033447265625, 9.783447265625, 10.2635498046875, 10.74365234375, 11.2237548828125, 11.703857421875, 12.1839599609375, 12.6640625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 7.0, 10.0, 31.0, 105.0, 176.0, 257.0, 216.0, 118.0, 49.0, 20.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.95567321777344, -97.13306427001953, -84.31045532226562, -71.48785400390625, -58.66524124145508, -45.84263610839844, -33.02002716064453, -20.197418212890625, -7.374809265136719, 5.447798728942871, 18.27040672302246, 31.093013763427734, 43.91562271118164, 56.73822784423828, 69.56083679199219, 82.3834457397461, 95.2060546875, 108.0286636352539, 120.85127258300781, 133.6738739013672, 146.49649047851562, 159.319091796875, 172.14169311523438, 184.9643096923828, 197.78692626953125, 210.60952758789062, 223.43214416503906, 236.25474548339844, 249.07736206054688, 261.89996337890625, 274.7225646972656, 287.545166015625, 300.3677673339844, 313.19036865234375, 326.0129699707031, 338.8356018066406, 351.658203125, 364.4808044433594, 377.30340576171875, 390.12603759765625, 402.9486389160156, 415.771240234375, 428.5938415527344, 441.4164733886719, 454.23907470703125, 467.0616760253906, 479.88427734375, 492.7069091796875, 505.52947998046875, 518.3521118164062, 531.1746826171875, 543.997314453125, 556.8198852539062, 569.6425170898438, 582.4651489257812, 595.2877197265625, 608.1103515625, 620.9329833984375, 633.7555541992188, 646.5781860351562, 659.4007568359375, 672.223388671875, 685.0460205078125, 697.8685913085938, 710.6912231445312]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 5.0, 9.0, 14.0, 9.0, 20.0, 12.0, 11.0, 20.0, 19.0, 26.0, 24.0, 42.0, 44.0, 42.0, 41.0, 44.0, 51.0, 54.0, 51.0, 51.0, 60.0, 46.0, 37.0, 34.0, 21.0, 33.0, 28.0, 22.0, 27.0, 22.0, 14.0, 15.0, 12.0, 6.0, 5.0, 6.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-145.62461853027344, -140.9709014892578, -136.3171844482422, -131.66348266601562, -127.009765625, -122.35604858398438, -117.70233154296875, -113.04861450195312, -108.39490509033203, -103.7411880493164, -99.08747863769531, -94.43376159667969, -89.78004455566406, -85.12633514404297, -80.47261810302734, -75.81890869140625, -71.16519165039062, -66.511474609375, -61.857765197753906, -57.20404815673828, -52.55033493041992, -47.89662170410156, -43.24290466308594, -38.58919143676758, -33.93547821044922, -29.28176498413086, -24.628049850463867, -19.974334716796875, -15.320621490478516, -10.666908264160156, -6.013193130493164, -1.3594779968261719, 3.29425048828125, 7.947964668273926, 12.601678848266602, 17.255393981933594, 21.909107208251953, 26.562820434570312, 31.216535568237305, 35.8702507019043, 40.523963928222656, 45.177677154541016, 49.831390380859375, 54.485107421875, 59.13882064819336, 63.79253387451172, 68.44625091552734, 73.09996032714844, 77.75367736816406, 82.40739440917969, 87.06110382080078, 91.7148208618164, 96.3685302734375, 101.02224731445312, 105.67596435546875, 110.32968139648438, 114.98339080810547, 119.6371078491211, 124.29081726074219, 128.9445343017578, 133.59825134277344, 138.251953125, 142.90567016601562, 147.55938720703125, 152.21310424804688]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 10.0, 8.0, 15.0, 20.0, 32.0, 52.0, 63.0, 127.0, 214.0, 440.0, 1117.0, 4092.0, 34338.0, 4139180.0, 10822.0, 2298.0, 723.0, 309.0, 154.0, 99.0, 51.0, 46.0, 30.0, 15.0, 6.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-76.0, -74.11328125, -72.2265625, -70.33984375, -68.453125, -66.56640625, -64.6796875, -62.79296875, -60.90625, -59.01953125, -57.1328125, -55.24609375, -53.359375, -51.47265625, -49.5859375, -47.69921875, -45.8125, -43.92578125, -42.0390625, -40.15234375, -38.265625, -36.37890625, -34.4921875, -32.60546875, -30.71875, -28.83203125, -26.9453125, -25.05859375, -23.171875, -21.28515625, -19.3984375, -17.51171875, -15.625, -13.73828125, -11.8515625, -9.96484375, -8.078125, -6.19140625, -4.3046875, -2.41796875, -0.53125, 1.35546875, 3.2421875, 5.12890625, 7.015625, 8.90234375, 10.7890625, 12.67578125, 14.5625, 16.44921875, 18.3359375, 20.22265625, 22.109375, 23.99609375, 25.8828125, 27.76953125, 29.65625, 31.54296875, 33.4296875, 35.31640625, 37.203125, 39.08984375, 40.9765625, 42.86328125, 44.75]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 6.0, 5.0, 3.0, 12.0, 7.0, 9.0, 11.0, 24.0, 28.0, 29.0, 30.0, 48.0, 47.0, 43.0, 47.0, 41.0, 51.0, 65.0, 68.0, 56.0, 49.0, 39.0, 54.0, 48.0, 36.0, 26.0, 22.0, 27.0, 27.0, 6.0, 8.0, 4.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.82843017578125, -7.5787353515625, -7.32904052734375, -7.079345703125, -6.82965087890625, -6.5799560546875, -6.33026123046875, -6.08056640625, -5.83087158203125, -5.5811767578125, -5.33148193359375, -5.081787109375, -4.83209228515625, -4.5823974609375, -4.33270263671875, -4.0830078125, -3.83331298828125, -3.5836181640625, -3.33392333984375, -3.084228515625, -2.83453369140625, -2.5848388671875, -2.33514404296875, -2.08544921875, -1.83575439453125, -1.5860595703125, -1.33636474609375, -1.086669921875, -0.83697509765625, -0.5872802734375, -0.33758544921875, -0.087890625, 0.16180419921875, 0.4114990234375, 0.66119384765625, 0.910888671875, 1.16058349609375, 1.4102783203125, 1.65997314453125, 1.90966796875, 2.15936279296875, 2.4090576171875, 2.65875244140625, 2.908447265625, 3.15814208984375, 3.4078369140625, 3.65753173828125, 3.9072265625, 4.15692138671875, 4.4066162109375, 4.65631103515625, 4.906005859375, 5.15570068359375, 5.4053955078125, 5.65509033203125, 5.90478515625, 6.15447998046875, 6.4041748046875, 6.65386962890625, 6.903564453125, 7.15325927734375, 7.4029541015625, 7.65264892578125, 7.90234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 14.0, 16.0, 21.0, 41.0, 48.0, 49.0, 67.0, 98.0, 125.0, 191.0, 400.0, 815.0, 1553.0, 3984.0, 13552.0, 3560815.0, 591981.0, 13060.0, 3997.0, 1609.0, 770.0, 369.0, 198.0, 145.0, 78.0, 61.0, 50.0, 39.0, 32.0, 25.0, 16.0, 15.0, 8.0, 8.0, 6.0, 8.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.84375, -57.1123046875, -55.380859375, -53.6494140625, -51.91796875, -50.1865234375, -48.455078125, -46.7236328125, -44.9921875, -43.2607421875, -41.529296875, -39.7978515625, -38.06640625, -36.3349609375, -34.603515625, -32.8720703125, -31.140625, -29.4091796875, -27.677734375, -25.9462890625, -24.21484375, -22.4833984375, -20.751953125, -19.0205078125, -17.2890625, -15.5576171875, -13.826171875, -12.0947265625, -10.36328125, -8.6318359375, -6.900390625, -5.1689453125, -3.4375, -1.7060546875, 0.025390625, 1.7568359375, 3.48828125, 5.2197265625, 6.951171875, 8.6826171875, 10.4140625, 12.1455078125, 13.876953125, 15.6083984375, 17.33984375, 19.0712890625, 20.802734375, 22.5341796875, 24.265625, 25.9970703125, 27.728515625, 29.4599609375, 31.19140625, 32.9228515625, 34.654296875, 36.3857421875, 38.1171875, 39.8486328125, 41.580078125, 43.3115234375, 45.04296875, 46.7744140625, 48.505859375, 50.2373046875, 51.96875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 6.0, 17.0, 21.0, 40.0, 103.0, 3679.0, 132.0, 22.0, 13.0, 8.0, 11.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -9.966796875, -9.54296875, -9.119140625, -8.6953125, -8.271484375, -7.84765625, -7.423828125, -7.0, -6.576171875, -6.15234375, -5.728515625, -5.3046875, -4.880859375, -4.45703125, -4.033203125, -3.609375, -3.185546875, -2.76171875, -2.337890625, -1.9140625, -1.490234375, -1.06640625, -0.642578125, -0.21875, 0.205078125, 0.62890625, 1.052734375, 1.4765625, 1.900390625, 2.32421875, 2.748046875, 3.171875, 3.595703125, 4.01953125, 4.443359375, 4.8671875, 5.291015625, 5.71484375, 6.138671875, 6.5625, 6.986328125, 7.41015625, 7.833984375, 8.2578125, 8.681640625, 9.10546875, 9.529296875, 9.953125, 10.376953125, 10.80078125, 11.224609375, 11.6484375, 12.072265625, 12.49609375, 12.919921875, 13.34375, 13.767578125, 14.19140625, 14.615234375, 15.0390625, 15.462890625, 15.88671875, 16.310546875, 16.734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 5.0, 8.0, 14.0, 16.0, 31.0, 49.0, 95.0, 112.0, 170.0, 194.0, 132.0, 79.0, 35.0, 19.0, 12.0, 8.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.79228973388672, -53.18091583251953, -51.56954574584961, -49.95817184448242, -48.3468017578125, -46.73542785644531, -45.12405776977539, -43.5126838684082, -41.90131378173828, -40.289939880371094, -38.67856979370117, -37.067195892333984, -35.45582580566406, -33.844451904296875, -32.23308181762695, -30.621707916259766, -29.01033592224121, -27.398963928222656, -25.7875919342041, -24.176219940185547, -22.564847946166992, -20.953475952148438, -19.34210205078125, -17.730731964111328, -16.11935806274414, -14.507986068725586, -12.896614074707031, -11.285242080688477, -9.673870086669922, -8.06249713897705, -6.451125144958496, -4.839753150939941, -3.228382110595703, -1.6170099973678589, -0.0056378841400146484, 1.6057343482971191, 3.217106342315674, 4.828478813171387, 6.439850807189941, 8.051222801208496, 9.66259479522705, 11.273966789245605, 12.88533878326416, 14.496711730957031, 16.108083724975586, 17.71945571899414, 19.330827713012695, 20.94219970703125, 22.553571701049805, 24.16494369506836, 25.776315689086914, 27.38768768310547, 28.999059677124023, 30.610431671142578, 32.221805572509766, 33.83317565917969, 35.444549560546875, 37.05592346191406, 38.667293548583984, 40.27866744995117, 41.890037536621094, 43.50141143798828, 45.1127815246582, 46.72415542602539, 48.33552551269531]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 12.0, 7.0, 13.0, 12.0, 11.0, 22.0, 28.0, 34.0, 33.0, 39.0, 48.0, 46.0, 45.0, 63.0, 63.0, 54.0, 72.0, 41.0, 48.0, 43.0, 44.0, 34.0, 32.0, 40.0, 22.0, 26.0, 11.0, 15.0, 13.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.289989471435547, -24.426227569580078, -23.56246566772461, -22.69870376586914, -21.834941864013672, -20.971179962158203, -20.107418060302734, -19.243656158447266, -18.379894256591797, -17.516132354736328, -16.65237045288086, -15.78860855102539, -14.924846649169922, -14.061084747314453, -13.197322845458984, -12.333560943603516, -11.469799995422363, -10.606038093566895, -9.742276191711426, -8.878514289855957, -8.014752388000488, -7.150990962982178, -6.287229061126709, -5.42346715927124, -4.5597052574157715, -3.6959433555603027, -2.832181453704834, -1.9684197902679443, -1.1046578884124756, -0.24089622497558594, 0.6228656768798828, 1.4866275787353516, 2.3503894805908203, 3.214151382446289, 4.077913284301758, 4.941675186157227, 5.805437088012695, 6.669198513031006, 7.532960414886475, 8.396722793579102, 9.26048469543457, 10.124246597290039, 10.988008499145508, 11.851770401000977, 12.715532302856445, 13.579294204711914, 14.443056106567383, 15.306818008422852, 16.170578002929688, 17.034339904785156, 17.898101806640625, 18.761863708496094, 19.625625610351562, 20.48938751220703, 21.3531494140625, 22.21691131591797, 23.080673217773438, 23.944435119628906, 24.808197021484375, 25.671958923339844, 26.535720825195312, 27.39948272705078, 28.26324462890625, 29.12700653076172, 29.990768432617188]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 9.0, 9.0, 12.0, 17.0, 27.0, 35.0, 57.0, 68.0, 128.0, 197.0, 306.0, 443.0, 729.0, 1199.0, 2012.0, 3658.0, 6690.0, 13043.0, 27190.0, 62234.0, 152200.0, 317701.0, 260592.0, 110478.0, 45890.0, 20644.0, 10262.0, 5367.0, 2976.0, 1662.0, 998.0, 595.0, 375.0, 234.0, 164.0, 98.0, 63.0, 50.0, 44.0, 32.0, 19.0, 8.0, 7.0, 11.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-17.78125, -17.239501953125, -16.69775390625, -16.156005859375, -15.6142578125, -15.072509765625, -14.53076171875, -13.989013671875, -13.447265625, -12.905517578125, -12.36376953125, -11.822021484375, -11.2802734375, -10.738525390625, -10.19677734375, -9.655029296875, -9.11328125, -8.571533203125, -8.02978515625, -7.488037109375, -6.9462890625, -6.404541015625, -5.86279296875, -5.321044921875, -4.779296875, -4.237548828125, -3.69580078125, -3.154052734375, -2.6123046875, -2.070556640625, -1.52880859375, -0.987060546875, -0.4453125, 0.096435546875, 0.63818359375, 1.179931640625, 1.7216796875, 2.263427734375, 2.80517578125, 3.346923828125, 3.888671875, 4.430419921875, 4.97216796875, 5.513916015625, 6.0556640625, 6.597412109375, 7.13916015625, 7.680908203125, 8.22265625, 8.764404296875, 9.30615234375, 9.847900390625, 10.3896484375, 10.931396484375, 11.47314453125, 12.014892578125, 12.556640625, 13.098388671875, 13.64013671875, 14.181884765625, 14.7236328125, 15.265380859375, 15.80712890625, 16.348876953125, 16.890625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 5.0, 4.0, 12.0, 10.0, 9.0, 19.0, 12.0, 16.0, 36.0, 37.0, 36.0, 31.0, 46.0, 37.0, 48.0, 53.0, 47.0, 72.0, 58.0, 51.0, 45.0, 39.0, 33.0, 27.0, 48.0, 39.0, 23.0, 26.0, 12.0, 14.0, 16.0, 12.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.21875, -7.9625244140625, -7.706298828125, -7.4500732421875, -7.19384765625, -6.9376220703125, -6.681396484375, -6.4251708984375, -6.1689453125, -5.9127197265625, -5.656494140625, -5.4002685546875, -5.14404296875, -4.8878173828125, -4.631591796875, -4.3753662109375, -4.119140625, -3.8629150390625, -3.606689453125, -3.3504638671875, -3.09423828125, -2.8380126953125, -2.581787109375, -2.3255615234375, -2.0693359375, -1.8131103515625, -1.556884765625, -1.3006591796875, -1.04443359375, -0.7882080078125, -0.531982421875, -0.2757568359375, -0.01953125, 0.2366943359375, 0.492919921875, 0.7491455078125, 1.00537109375, 1.2615966796875, 1.517822265625, 1.7740478515625, 2.0302734375, 2.2864990234375, 2.542724609375, 2.7989501953125, 3.05517578125, 3.3114013671875, 3.567626953125, 3.8238525390625, 4.080078125, 4.3363037109375, 4.592529296875, 4.8487548828125, 5.10498046875, 5.3612060546875, 5.617431640625, 5.8736572265625, 6.1298828125, 6.3861083984375, 6.642333984375, 6.8985595703125, 7.15478515625, 7.4110107421875, 7.667236328125, 7.9234619140625, 8.1796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 5.0, 6.0, 10.0, 12.0, 13.0, 17.0, 21.0, 20.0, 46.0, 40.0, 69.0, 87.0, 123.0, 207.0, 228.0, 339.0, 556.0, 1077.0, 2544.0, 13607.0, 226559.0, 754367.0, 40282.0, 4687.0, 1455.0, 689.0, 432.0, 334.0, 175.0, 148.0, 105.0, 63.0, 57.0, 39.0, 30.0, 19.0, 22.0, 18.0, 10.0, 7.0, 12.0, 10.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.71875, -55.8701171875, -54.021484375, -52.1728515625, -50.32421875, -48.4755859375, -46.626953125, -44.7783203125, -42.9296875, -41.0810546875, -39.232421875, -37.3837890625, -35.53515625, -33.6865234375, -31.837890625, -29.9892578125, -28.140625, -26.2919921875, -24.443359375, -22.5947265625, -20.74609375, -18.8974609375, -17.048828125, -15.2001953125, -13.3515625, -11.5029296875, -9.654296875, -7.8056640625, -5.95703125, -4.1083984375, -2.259765625, -0.4111328125, 1.4375, 3.2861328125, 5.134765625, 6.9833984375, 8.83203125, 10.6806640625, 12.529296875, 14.3779296875, 16.2265625, 18.0751953125, 19.923828125, 21.7724609375, 23.62109375, 25.4697265625, 27.318359375, 29.1669921875, 31.015625, 32.8642578125, 34.712890625, 36.5615234375, 38.41015625, 40.2587890625, 42.107421875, 43.9560546875, 45.8046875, 47.6533203125, 49.501953125, 51.3505859375, 53.19921875, 55.0478515625, 56.896484375, 58.7451171875, 60.59375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 8.0, 3.0, 3.0, 7.0, 6.0, 8.0, 8.0, 17.0, 10.0, 10.0, 12.0, 30.0, 24.0, 27.0, 32.0, 38.0, 27.0, 43.0, 43.0, 47.0, 56.0, 51.0, 36.0, 50.0, 39.0, 37.0, 38.0, 48.0, 41.0, 35.0, 29.0, 16.0, 17.0, 20.0, 19.0, 14.0, 12.0, 8.0, 8.0, 9.0, 5.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.5, -37.38330078125, -36.2666015625, -35.14990234375, -34.033203125, -32.91650390625, -31.7998046875, -30.68310546875, -29.56640625, -28.44970703125, -27.3330078125, -26.21630859375, -25.099609375, -23.98291015625, -22.8662109375, -21.74951171875, -20.6328125, -19.51611328125, -18.3994140625, -17.28271484375, -16.166015625, -15.04931640625, -13.9326171875, -12.81591796875, -11.69921875, -10.58251953125, -9.4658203125, -8.34912109375, -7.232421875, -6.11572265625, -4.9990234375, -3.88232421875, -2.765625, -1.64892578125, -0.5322265625, 0.58447265625, 1.701171875, 2.81787109375, 3.9345703125, 5.05126953125, 6.16796875, 7.28466796875, 8.4013671875, 9.51806640625, 10.634765625, 11.75146484375, 12.8681640625, 13.98486328125, 15.1015625, 16.21826171875, 17.3349609375, 18.45166015625, 19.568359375, 20.68505859375, 21.8017578125, 22.91845703125, 24.03515625, 25.15185546875, 26.2685546875, 27.38525390625, 28.501953125, 29.61865234375, 30.7353515625, 31.85205078125, 32.96875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 7.0, 6.0, 5.0, 7.0, 7.0, 8.0, 16.0, 17.0, 32.0, 50.0, 70.0, 171.0, 551.0, 2258.0, 19909.0, 966189.0, 54383.0, 3589.0, 783.0, 230.0, 91.0, 55.0, 30.0, 22.0, 17.0, 11.0, 8.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.21875, -52.697265625, -51.17578125, -49.654296875, -48.1328125, -46.611328125, -45.08984375, -43.568359375, -42.046875, -40.525390625, -39.00390625, -37.482421875, -35.9609375, -34.439453125, -32.91796875, -31.396484375, -29.875, -28.353515625, -26.83203125, -25.310546875, -23.7890625, -22.267578125, -20.74609375, -19.224609375, -17.703125, -16.181640625, -14.66015625, -13.138671875, -11.6171875, -10.095703125, -8.57421875, -7.052734375, -5.53125, -4.009765625, -2.48828125, -0.966796875, 0.5546875, 2.076171875, 3.59765625, 5.119140625, 6.640625, 8.162109375, 9.68359375, 11.205078125, 12.7265625, 14.248046875, 15.76953125, 17.291015625, 18.8125, 20.333984375, 21.85546875, 23.376953125, 24.8984375, 26.419921875, 27.94140625, 29.462890625, 30.984375, 32.505859375, 34.02734375, 35.548828125, 37.0703125, 38.591796875, 40.11328125, 41.634765625, 43.15625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 13.0, 11.0, 6.0, 13.0, 22.0, 29.0, 46.0, 60.0, 76.0, 128.0, 136.0, 131.0, 101.0, 60.0, 42.0, 23.0, 25.0, 10.0, 11.0, 11.0, 11.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020732879638671875, -0.001995474100112915, -0.0019176602363586426, -0.0018398463726043701, -0.0017620325088500977, -0.0016842186450958252, -0.0016064047813415527, -0.0015285909175872803, -0.0014507770538330078, -0.0013729631900787354, -0.0012951493263244629, -0.0012173354625701904, -0.001139521598815918, -0.0010617077350616455, -0.000983893871307373, -0.0009060800075531006, -0.0008282661437988281, -0.0007504522800445557, -0.0006726384162902832, -0.0005948245525360107, -0.0005170106887817383, -0.0004391968250274658, -0.00036138296127319336, -0.0002835690975189209, -0.00020575523376464844, -0.00012794137001037598, -5.0127506256103516e-05, 2.7686357498168945e-05, 0.0001055002212524414, 0.00018331408500671387, 0.00026112794876098633, 0.0003389418125152588, 0.00041675567626953125, 0.0004945695400238037, 0.0005723834037780762, 0.0006501972675323486, 0.0007280111312866211, 0.0008058249950408936, 0.000883638858795166, 0.0009614527225494385, 0.001039266586303711, 0.0011170804500579834, 0.0011948943138122559, 0.0012727081775665283, 0.0013505220413208008, 0.0014283359050750732, 0.0015061497688293457, 0.0015839636325836182, 0.0016617774963378906, 0.001739591360092163, 0.0018174052238464355, 0.001895219087600708, 0.0019730329513549805, 0.002050846815109253, 0.0021286606788635254, 0.002206474542617798, 0.0022842884063720703, 0.0023621022701263428, 0.0024399161338806152, 0.0025177299976348877, 0.00259554386138916, 0.0026733577251434326, 0.002751171588897705, 0.0028289854526519775, 0.00290679931640625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 12.0, 28.0, 48.0, 160.0, 461.0, 3631.0, 952421.0, 89432.0, 1853.0, 309.0, 101.0, 44.0, 21.0, 12.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.9375, -70.3193359375, -67.701171875, -65.0830078125, -62.46484375, -59.8466796875, -57.228515625, -54.6103515625, -51.9921875, -49.3740234375, -46.755859375, -44.1376953125, -41.51953125, -38.9013671875, -36.283203125, -33.6650390625, -31.046875, -28.4287109375, -25.810546875, -23.1923828125, -20.57421875, -17.9560546875, -15.337890625, -12.7197265625, -10.1015625, -7.4833984375, -4.865234375, -2.2470703125, 0.37109375, 2.9892578125, 5.607421875, 8.2255859375, 10.84375, 13.4619140625, 16.080078125, 18.6982421875, 21.31640625, 23.9345703125, 26.552734375, 29.1708984375, 31.7890625, 34.4072265625, 37.025390625, 39.6435546875, 42.26171875, 44.8798828125, 47.498046875, 50.1162109375, 52.734375, 55.3525390625, 57.970703125, 60.5888671875, 63.20703125, 65.8251953125, 68.443359375, 71.0615234375, 73.6796875, 76.2978515625, 78.916015625, 81.5341796875, 84.15234375, 86.7705078125, 89.388671875, 92.0068359375, 94.625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 18.0, 16.0, 29.0, 52.0, 116.0, 190.0, 222.0, 151.0, 103.0, 43.0, 24.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.015625, -16.029052734375, -15.04248046875, -14.055908203125, -13.0693359375, -12.082763671875, -11.09619140625, -10.109619140625, -9.123046875, -8.136474609375, -7.14990234375, -6.163330078125, -5.1767578125, -4.190185546875, -3.20361328125, -2.217041015625, -1.23046875, -0.243896484375, 0.74267578125, 1.729248046875, 2.7158203125, 3.702392578125, 4.68896484375, 5.675537109375, 6.662109375, 7.648681640625, 8.63525390625, 9.621826171875, 10.6083984375, 11.594970703125, 12.58154296875, 13.568115234375, 14.5546875, 15.541259765625, 16.52783203125, 17.514404296875, 18.5009765625, 19.487548828125, 20.47412109375, 21.460693359375, 22.447265625, 23.433837890625, 24.42041015625, 25.406982421875, 26.3935546875, 27.380126953125, 28.36669921875, 29.353271484375, 30.33984375, 31.326416015625, 32.31298828125, 33.299560546875, 34.2861328125, 35.272705078125, 36.25927734375, 37.245849609375, 38.232421875, 39.218994140625, 40.20556640625, 41.192138671875, 42.1787109375, 43.165283203125, 44.15185546875, 45.138427734375, 46.125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 11.0, 14.0, 33.0, 65.0, 174.0, 256.0, 210.0, 129.0, 58.0, 29.0, 11.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-494.0264892578125, -479.7998352050781, -465.57318115234375, -451.3465270996094, -437.119873046875, -422.8932189941406, -408.66656494140625, -394.43994140625, -380.2132568359375, -365.9866027832031, -351.75994873046875, -337.5332946777344, -323.306640625, -309.0799865722656, -294.85333251953125, -280.626708984375, -266.4000549316406, -252.17340087890625, -237.94674682617188, -223.7200927734375, -209.49343872070312, -195.26678466796875, -181.04014587402344, -166.81349182128906, -152.5868377685547, -138.3601837158203, -124.13352966308594, -109.9068832397461, -95.68022918701172, -81.45357513427734, -67.2269287109375, -53.000274658203125, -38.773651123046875, -24.546998977661133, -10.32034683227539, 3.9063034057617188, 18.132957458496094, 32.35961151123047, 46.58625793457031, 60.81291198730469, 75.03956604003906, 89.26622009277344, 103.49287414550781, 117.71952056884766, 131.9461669921875, 146.17282104492188, 160.39947509765625, 174.62612915039062, 188.852783203125, 203.07943725585938, 217.30609130859375, 231.53274536132812, 245.7593994140625, 259.9860534667969, 274.21270751953125, 288.4393310546875, 302.666015625, 316.8926696777344, 331.11932373046875, 345.3459777832031, 359.5726318359375, 373.7992858886719, 388.02593994140625, 402.2525634765625, 416.4792175292969]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 11.0, 5.0, 15.0, 10.0, 7.0, 15.0, 14.0, 21.0, 29.0, 30.0, 45.0, 35.0, 50.0, 49.0, 62.0, 51.0, 63.0, 59.0, 56.0, 50.0, 38.0, 41.0, 41.0, 27.0, 27.0, 33.0, 15.0, 19.0, 19.0, 16.0, 11.0, 7.0, 3.0, 5.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.06375122070312, -173.07479858398438, -167.08584594726562, -161.09689331054688, -155.10794067382812, -149.11898803710938, -143.13003540039062, -137.14108276367188, -131.15213012695312, -125.16317749023438, -119.17422485351562, -113.18527221679688, -107.19631958007812, -101.20736694335938, -95.21841430664062, -89.22946166992188, -83.24050903320312, -77.25155639648438, -71.26260375976562, -65.27365112304688, -59.284698486328125, -53.295745849609375, -47.306793212890625, -41.317840576171875, -35.328887939453125, -29.339935302734375, -23.350982666015625, -17.362030029296875, -11.373077392578125, -5.384124755859375, 0.604827880859375, 6.593780517578125, 12.582733154296875, 18.571685791015625, 24.560638427734375, 30.549591064453125, 36.538543701171875, 42.527496337890625, 48.516448974609375, 54.505401611328125, 60.494354248046875, 66.48330688476562, 72.47225952148438, 78.46121215820312, 84.45016479492188, 90.43911743164062, 96.42807006835938, 102.41702270507812, 108.40597534179688, 114.39492797851562, 120.38388061523438, 126.37283325195312, 132.36178588867188, 138.35073852539062, 144.33969116210938, 150.32864379882812, 156.31759643554688, 162.30654907226562, 168.29550170898438, 174.28445434570312, 180.27340698242188, 186.26235961914062, 192.25131225585938, 198.24026489257812, 204.22921752929688]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 11.0, 16.0, 17.0, 34.0, 48.0, 81.0, 145.0, 265.0, 449.0, 978.0, 2256.0, 9919.0, 4162332.0, 12992.0, 2476.0, 1076.0, 513.0, 268.0, 171.0, 85.0, 49.0, 30.0, 17.0, 18.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.875, -70.703125, -68.53125, -66.359375, -64.1875, -62.015625, -59.84375, -57.671875, -55.5, -53.328125, -51.15625, -48.984375, -46.8125, -44.640625, -42.46875, -40.296875, -38.125, -35.953125, -33.78125, -31.609375, -29.4375, -27.265625, -25.09375, -22.921875, -20.75, -18.578125, -16.40625, -14.234375, -12.0625, -9.890625, -7.71875, -5.546875, -3.375, -1.203125, 0.96875, 3.140625, 5.3125, 7.484375, 9.65625, 11.828125, 14.0, 16.171875, 18.34375, 20.515625, 22.6875, 24.859375, 27.03125, 29.203125, 31.375, 33.546875, 35.71875, 37.890625, 40.0625, 42.234375, 44.40625, 46.578125, 48.75, 50.921875, 53.09375, 55.265625, 57.4375, 59.609375, 61.78125, 63.953125, 66.125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 9.0, 13.0, 14.0, 22.0, 22.0, 32.0, 44.0, 64.0, 60.0, 79.0, 68.0, 71.0, 98.0, 89.0, 67.0, 56.0, 44.0, 38.0, 33.0, 24.0, 14.0, 10.0, 7.0, 8.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.6640625, -14.240478515625, -13.81689453125, -13.393310546875, -12.9697265625, -12.546142578125, -12.12255859375, -11.698974609375, -11.275390625, -10.851806640625, -10.42822265625, -10.004638671875, -9.5810546875, -9.157470703125, -8.73388671875, -8.310302734375, -7.88671875, -7.463134765625, -7.03955078125, -6.615966796875, -6.1923828125, -5.768798828125, -5.34521484375, -4.921630859375, -4.498046875, -4.074462890625, -3.65087890625, -3.227294921875, -2.8037109375, -2.380126953125, -1.95654296875, -1.532958984375, -1.109375, -0.685791015625, -0.26220703125, 0.161376953125, 0.5849609375, 1.008544921875, 1.43212890625, 1.855712890625, 2.279296875, 2.702880859375, 3.12646484375, 3.550048828125, 3.9736328125, 4.397216796875, 4.82080078125, 5.244384765625, 5.66796875, 6.091552734375, 6.51513671875, 6.938720703125, 7.3623046875, 7.785888671875, 8.20947265625, 8.633056640625, 9.056640625, 9.480224609375, 9.90380859375, 10.327392578125, 10.7509765625, 11.174560546875, 11.59814453125, 12.021728515625, 12.4453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 13.0, 15.0, 22.0, 24.0, 56.0, 70.0, 100.0, 136.0, 176.0, 268.0, 427.0, 645.0, 1069.0, 1902.0, 3974.0, 16108.0, 4148345.0, 12711.0, 3579.0, 1753.0, 1026.0, 593.0, 397.0, 268.0, 166.0, 113.0, 81.0, 43.0, 44.0, 35.0, 23.0, 17.0, 17.0, 14.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.40625, -57.5751953125, -55.744140625, -53.9130859375, -52.08203125, -50.2509765625, -48.419921875, -46.5888671875, -44.7578125, -42.9267578125, -41.095703125, -39.2646484375, -37.43359375, -35.6025390625, -33.771484375, -31.9404296875, -30.109375, -28.2783203125, -26.447265625, -24.6162109375, -22.78515625, -20.9541015625, -19.123046875, -17.2919921875, -15.4609375, -13.6298828125, -11.798828125, -9.9677734375, -8.13671875, -6.3056640625, -4.474609375, -2.6435546875, -0.8125, 1.0185546875, 2.849609375, 4.6806640625, 6.51171875, 8.3427734375, 10.173828125, 12.0048828125, 13.8359375, 15.6669921875, 17.498046875, 19.3291015625, 21.16015625, 22.9912109375, 24.822265625, 26.6533203125, 28.484375, 30.3154296875, 32.146484375, 33.9775390625, 35.80859375, 37.6396484375, 39.470703125, 41.3017578125, 43.1328125, 44.9638671875, 46.794921875, 48.6259765625, 50.45703125, 52.2880859375, 54.119140625, 55.9501953125, 57.78125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 9.0, 18.0, 3120.0, 880.0, 22.0, 3.0, 6.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2109375, -13.7032470703125, -13.195556640625, -12.6878662109375, -12.18017578125, -11.6724853515625, -11.164794921875, -10.6571044921875, -10.1494140625, -9.6417236328125, -9.134033203125, -8.6263427734375, -8.11865234375, -7.6109619140625, -7.103271484375, -6.5955810546875, -6.087890625, -5.5802001953125, -5.072509765625, -4.5648193359375, -4.05712890625, -3.5494384765625, -3.041748046875, -2.5340576171875, -2.0263671875, -1.5186767578125, -1.010986328125, -0.5032958984375, 0.00439453125, 0.5120849609375, 1.019775390625, 1.5274658203125, 2.03515625, 2.5428466796875, 3.050537109375, 3.5582275390625, 4.06591796875, 4.5736083984375, 5.081298828125, 5.5889892578125, 6.0966796875, 6.6043701171875, 7.112060546875, 7.6197509765625, 8.12744140625, 8.6351318359375, 9.142822265625, 9.6505126953125, 10.158203125, 10.6658935546875, 11.173583984375, 11.6812744140625, 12.18896484375, 12.6966552734375, 13.204345703125, 13.7120361328125, 14.2197265625, 14.7274169921875, 15.235107421875, 15.7427978515625, 16.25048828125, 16.7581787109375, 17.265869140625, 17.7735595703125, 18.28125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 8.0, 12.0, 19.0, 19.0, 58.0, 81.0, 123.0, 198.0, 178.0, 124.0, 79.0, 33.0, 22.0, 22.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.01927185058594, -55.553951263427734, -54.08863067626953, -52.62331008911133, -51.157989501953125, -49.69267272949219, -48.227352142333984, -46.76203155517578, -45.29671096801758, -43.831390380859375, -42.36606979370117, -40.90074920654297, -39.43543243408203, -37.97011184692383, -36.504791259765625, -35.03947067260742, -33.57415008544922, -32.108829498291016, -30.643508911132812, -29.178190231323242, -27.71286964416504, -26.247549057006836, -24.782230377197266, -23.316909790039062, -21.85158920288086, -20.386268615722656, -18.920948028564453, -17.455629348754883, -15.99030876159668, -14.524988174438477, -13.05966854095459, -11.594348907470703, -10.129032135009766, -8.663711547851562, -7.198391914367676, -5.733071804046631, -4.267751693725586, -2.802431583404541, -1.337111473083496, 0.12820816040039062, 1.5935287475585938, 3.0588488578796387, 4.524168968200684, 5.9894890785217285, 7.454809188842773, 8.920129776000977, 10.385449409484863, 11.85076904296875, 13.316089630126953, 14.781410217285156, 16.24673080444336, 17.71204948425293, 19.177370071411133, 20.642690658569336, 22.108009338378906, 23.57332992553711, 25.038650512695312, 26.503971099853516, 27.96929168701172, 29.43461036682129, 30.899930953979492, 32.36524963378906, 33.830570220947266, 35.29589080810547, 36.76121139526367]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 9.0, 12.0, 13.0, 14.0, 21.0, 19.0, 28.0, 38.0, 34.0, 29.0, 31.0, 42.0, 43.0, 51.0, 48.0, 47.0, 49.0, 60.0, 63.0, 43.0, 38.0, 42.0, 31.0, 29.0, 24.0, 26.0, 13.0, 18.0, 19.0, 6.0, 11.0, 9.0, 4.0, 5.0, 8.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.803924560546875, -18.190902709960938, -17.577880859375, -16.964860916137695, -16.351839065551758, -15.73881721496582, -15.1257963180542, -14.512775421142578, -13.89975357055664, -13.286731719970703, -12.673710823059082, -12.060689926147461, -11.447668075561523, -10.834646224975586, -10.221625328063965, -9.608604431152344, -8.995582580566406, -8.382560729980469, -7.769539833068848, -7.156518459320068, -6.543497085571289, -5.93047571182251, -5.3174543380737305, -4.704432964324951, -4.091411590576172, -3.4783902168273926, -2.8653688430786133, -2.252347469329834, -1.6393260955810547, -1.0263047218322754, -0.4132833480834961, 0.1997380256652832, 0.8127574920654297, 1.425778865814209, 2.0388002395629883, 2.6518216133117676, 3.264842987060547, 3.877864360809326, 4.4908857345581055, 5.103907108306885, 5.716928482055664, 6.329949855804443, 6.942971229553223, 7.555992603302002, 8.169013977050781, 8.782035827636719, 9.39505672454834, 10.008077621459961, 10.621099472045898, 11.234121322631836, 11.847142219543457, 12.460163116455078, 13.073184967041016, 13.686206817626953, 14.299227714538574, 14.912248611450195, 15.525270462036133, 16.13829231262207, 16.751312255859375, 17.364334106445312, 17.97735595703125, 18.590377807617188, 19.203399658203125, 19.81641960144043, 20.429441452026367]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 14.0, 20.0, 20.0, 45.0, 60.0, 92.0, 154.0, 220.0, 391.0, 780.0, 1631.0, 3895.0, 10113.0, 33657.0, 144276.0, 532986.0, 243260.0, 52845.0, 14680.0, 5128.0, 2058.0, 998.0, 477.0, 289.0, 166.0, 100.0, 54.0, 36.0, 25.0, 17.0, 17.0, 10.0, 3.0, 9.0, 4.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0], "bins": [-39.125, -38.086181640625, -37.04736328125, -36.008544921875, -34.9697265625, -33.930908203125, -32.89208984375, -31.853271484375, -30.814453125, -29.775634765625, -28.73681640625, -27.697998046875, -26.6591796875, -25.620361328125, -24.58154296875, -23.542724609375, -22.50390625, -21.465087890625, -20.42626953125, -19.387451171875, -18.3486328125, -17.309814453125, -16.27099609375, -15.232177734375, -14.193359375, -13.154541015625, -12.11572265625, -11.076904296875, -10.0380859375, -8.999267578125, -7.96044921875, -6.921630859375, -5.8828125, -4.843994140625, -3.80517578125, -2.766357421875, -1.7275390625, -0.688720703125, 0.35009765625, 1.388916015625, 2.427734375, 3.466552734375, 4.50537109375, 5.544189453125, 6.5830078125, 7.621826171875, 8.66064453125, 9.699462890625, 10.73828125, 11.777099609375, 12.81591796875, 13.854736328125, 14.8935546875, 15.932373046875, 16.97119140625, 18.010009765625, 19.048828125, 20.087646484375, 21.12646484375, 22.165283203125, 23.2041015625, 24.242919921875, 25.28173828125, 26.320556640625, 27.359375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 3.0, 11.0, 18.0, 31.0, 20.0, 37.0, 47.0, 66.0, 71.0, 65.0, 79.0, 82.0, 94.0, 80.0, 68.0, 44.0, 48.0, 30.0, 32.0, 26.0, 10.0, 10.0, 3.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.6834716796875, -15.226318359375, -14.7691650390625, -14.31201171875, -13.8548583984375, -13.397705078125, -12.9405517578125, -12.4833984375, -12.0262451171875, -11.569091796875, -11.1119384765625, -10.65478515625, -10.1976318359375, -9.740478515625, -9.2833251953125, -8.826171875, -8.3690185546875, -7.911865234375, -7.4547119140625, -6.99755859375, -6.5404052734375, -6.083251953125, -5.6260986328125, -5.1689453125, -4.7117919921875, -4.254638671875, -3.7974853515625, -3.34033203125, -2.8831787109375, -2.426025390625, -1.9688720703125, -1.51171875, -1.0545654296875, -0.597412109375, -0.1402587890625, 0.31689453125, 0.7740478515625, 1.231201171875, 1.6883544921875, 2.1455078125, 2.6026611328125, 3.059814453125, 3.5169677734375, 3.97412109375, 4.4312744140625, 4.888427734375, 5.3455810546875, 5.802734375, 6.2598876953125, 6.717041015625, 7.1741943359375, 7.63134765625, 8.0885009765625, 8.545654296875, 9.0028076171875, 9.4599609375, 9.9171142578125, 10.374267578125, 10.8314208984375, 11.28857421875, 11.7457275390625, 12.202880859375, 12.6600341796875, 13.1171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 8.0, 8.0, 14.0, 14.0, 31.0, 30.0, 53.0, 72.0, 90.0, 138.0, 204.0, 384.0, 644.0, 1410.0, 5122.0, 39340.0, 736455.0, 243251.0, 15979.0, 2881.0, 1057.0, 519.0, 286.0, 167.0, 121.0, 82.0, 56.0, 35.0, 26.0, 18.0, 13.0, 6.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-69.125, -67.1943359375, -65.263671875, -63.3330078125, -61.40234375, -59.4716796875, -57.541015625, -55.6103515625, -53.6796875, -51.7490234375, -49.818359375, -47.8876953125, -45.95703125, -44.0263671875, -42.095703125, -40.1650390625, -38.234375, -36.3037109375, -34.373046875, -32.4423828125, -30.51171875, -28.5810546875, -26.650390625, -24.7197265625, -22.7890625, -20.8583984375, -18.927734375, -16.9970703125, -15.06640625, -13.1357421875, -11.205078125, -9.2744140625, -7.34375, -5.4130859375, -3.482421875, -1.5517578125, 0.37890625, 2.3095703125, 4.240234375, 6.1708984375, 8.1015625, 10.0322265625, 11.962890625, 13.8935546875, 15.82421875, 17.7548828125, 19.685546875, 21.6162109375, 23.546875, 25.4775390625, 27.408203125, 29.3388671875, 31.26953125, 33.2001953125, 35.130859375, 37.0615234375, 38.9921875, 40.9228515625, 42.853515625, 44.7841796875, 46.71484375, 48.6455078125, 50.576171875, 52.5068359375, 54.4375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 6.0, 5.0, 4.0, 11.0, 15.0, 7.0, 13.0, 21.0, 22.0, 16.0, 31.0, 38.0, 24.0, 32.0, 29.0, 46.0, 41.0, 42.0, 36.0, 42.0, 36.0, 45.0, 40.0, 39.0, 21.0, 37.0, 31.0, 34.0, 21.0, 29.0, 15.0, 22.0, 30.0, 27.0, 8.0, 12.0, 13.0, 6.0, 8.0, 5.0, 7.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.0625, -34.88427734375, -33.7060546875, -32.52783203125, -31.349609375, -30.17138671875, -28.9931640625, -27.81494140625, -26.63671875, -25.45849609375, -24.2802734375, -23.10205078125, -21.923828125, -20.74560546875, -19.5673828125, -18.38916015625, -17.2109375, -16.03271484375, -14.8544921875, -13.67626953125, -12.498046875, -11.31982421875, -10.1416015625, -8.96337890625, -7.78515625, -6.60693359375, -5.4287109375, -4.25048828125, -3.072265625, -1.89404296875, -0.7158203125, 0.46240234375, 1.640625, 2.81884765625, 3.9970703125, 5.17529296875, 6.353515625, 7.53173828125, 8.7099609375, 9.88818359375, 11.06640625, 12.24462890625, 13.4228515625, 14.60107421875, 15.779296875, 16.95751953125, 18.1357421875, 19.31396484375, 20.4921875, 21.67041015625, 22.8486328125, 24.02685546875, 25.205078125, 26.38330078125, 27.5615234375, 28.73974609375, 29.91796875, 31.09619140625, 32.2744140625, 33.45263671875, 34.630859375, 35.80908203125, 36.9873046875, 38.16552734375, 39.34375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 6.0, 7.0, 4.0, 8.0, 13.0, 20.0, 22.0, 32.0, 65.0, 91.0, 214.0, 507.0, 1810.0, 13253.0, 702174.0, 318609.0, 9298.0, 1489.0, 478.0, 191.0, 92.0, 51.0, 35.0, 15.0, 13.0, 14.0, 8.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.6875, -48.341796875, -46.99609375, -45.650390625, -44.3046875, -42.958984375, -41.61328125, -40.267578125, -38.921875, -37.576171875, -36.23046875, -34.884765625, -33.5390625, -32.193359375, -30.84765625, -29.501953125, -28.15625, -26.810546875, -25.46484375, -24.119140625, -22.7734375, -21.427734375, -20.08203125, -18.736328125, -17.390625, -16.044921875, -14.69921875, -13.353515625, -12.0078125, -10.662109375, -9.31640625, -7.970703125, -6.625, -5.279296875, -3.93359375, -2.587890625, -1.2421875, 0.103515625, 1.44921875, 2.794921875, 4.140625, 5.486328125, 6.83203125, 8.177734375, 9.5234375, 10.869140625, 12.21484375, 13.560546875, 14.90625, 16.251953125, 17.59765625, 18.943359375, 20.2890625, 21.634765625, 22.98046875, 24.326171875, 25.671875, 27.017578125, 28.36328125, 29.708984375, 31.0546875, 32.400390625, 33.74609375, 35.091796875, 36.4375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 4.0, 5.0, 7.0, 7.0, 14.0, 10.0, 18.0, 24.0, 24.0, 34.0, 42.0, 41.0, 71.0, 73.0, 105.0, 74.0, 93.0, 67.0, 55.0, 43.0, 43.0, 25.0, 19.0, 18.0, 15.0, 10.0, 9.0, 8.0, 7.0, 8.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00244140625, -0.002371877431869507, -0.0023023486137390137, -0.0022328197956085205, -0.0021632909774780273, -0.002093762159347534, -0.002024233341217041, -0.001954704523086548, -0.0018851757049560547, -0.0018156468868255615, -0.0017461180686950684, -0.0016765892505645752, -0.001607060432434082, -0.0015375316143035889, -0.0014680027961730957, -0.0013984739780426025, -0.0013289451599121094, -0.0012594163417816162, -0.001189887523651123, -0.0011203587055206299, -0.0010508298873901367, -0.0009813010692596436, -0.0009117722511291504, -0.0008422434329986572, -0.0007727146148681641, -0.0007031857967376709, -0.0006336569786071777, -0.0005641281604766846, -0.0004945993423461914, -0.00042507052421569824, -0.0003555417060852051, -0.0002860128879547119, -0.00021648406982421875, -0.00014695525169372559, -7.742643356323242e-05, -7.897615432739258e-06, 6.16312026977539e-05, 0.00013116002082824707, 0.00020068883895874023, 0.0002702176570892334, 0.00033974647521972656, 0.0004092752933502197, 0.0004788041114807129, 0.0005483329296112061, 0.0006178617477416992, 0.0006873905658721924, 0.0007569193840026855, 0.0008264482021331787, 0.0008959770202636719, 0.000965505838394165, 0.0010350346565246582, 0.0011045634746551514, 0.0011740922927856445, 0.0012436211109161377, 0.0013131499290466309, 0.001382678747177124, 0.0014522075653076172, 0.0015217363834381104, 0.0015912652015686035, 0.0016607940196990967, 0.0017303228378295898, 0.001799851655960083, 0.0018693804740905762, 0.0019389092922210693, 0.0020084381103515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 14.0, 6.0, 9.0, 10.0, 17.0, 19.0, 37.0, 40.0, 76.0, 108.0, 186.0, 373.0, 667.0, 1418.0, 3396.0, 10880.0, 80122.0, 823789.0, 107556.0, 12947.0, 3570.0, 1600.0, 722.0, 381.0, 200.0, 123.0, 83.0, 51.0, 36.0, 26.0, 17.0, 10.0, 11.0, 15.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0], "bins": [-29.78125, -28.943603515625, -28.10595703125, -27.268310546875, -26.4306640625, -25.593017578125, -24.75537109375, -23.917724609375, -23.080078125, -22.242431640625, -21.40478515625, -20.567138671875, -19.7294921875, -18.891845703125, -18.05419921875, -17.216552734375, -16.37890625, -15.541259765625, -14.70361328125, -13.865966796875, -13.0283203125, -12.190673828125, -11.35302734375, -10.515380859375, -9.677734375, -8.840087890625, -8.00244140625, -7.164794921875, -6.3271484375, -5.489501953125, -4.65185546875, -3.814208984375, -2.9765625, -2.138916015625, -1.30126953125, -0.463623046875, 0.3740234375, 1.211669921875, 2.04931640625, 2.886962890625, 3.724609375, 4.562255859375, 5.39990234375, 6.237548828125, 7.0751953125, 7.912841796875, 8.75048828125, 9.588134765625, 10.42578125, 11.263427734375, 12.10107421875, 12.938720703125, 13.7763671875, 14.614013671875, 15.45166015625, 16.289306640625, 17.126953125, 17.964599609375, 18.80224609375, 19.639892578125, 20.4775390625, 21.315185546875, 22.15283203125, 22.990478515625, 23.828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 12.0, 19.0, 19.0, 41.0, 32.0, 58.0, 53.0, 88.0, 113.0, 105.0, 77.0, 82.0, 81.0, 54.0, 44.0, 30.0, 30.0, 16.0, 9.0, 10.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.53125, -16.93408203125, -16.3369140625, -15.73974609375, -15.142578125, -14.54541015625, -13.9482421875, -13.35107421875, -12.75390625, -12.15673828125, -11.5595703125, -10.96240234375, -10.365234375, -9.76806640625, -9.1708984375, -8.57373046875, -7.9765625, -7.37939453125, -6.7822265625, -6.18505859375, -5.587890625, -4.99072265625, -4.3935546875, -3.79638671875, -3.19921875, -2.60205078125, -2.0048828125, -1.40771484375, -0.810546875, -0.21337890625, 0.3837890625, 0.98095703125, 1.578125, 2.17529296875, 2.7724609375, 3.36962890625, 3.966796875, 4.56396484375, 5.1611328125, 5.75830078125, 6.35546875, 6.95263671875, 7.5498046875, 8.14697265625, 8.744140625, 9.34130859375, 9.9384765625, 10.53564453125, 11.1328125, 11.72998046875, 12.3271484375, 12.92431640625, 13.521484375, 14.11865234375, 14.7158203125, 15.31298828125, 15.91015625, 16.50732421875, 17.1044921875, 17.70166015625, 18.298828125, 18.89599609375, 19.4931640625, 20.09033203125, 20.6875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 10.0, 10.0, 36.0, 135.0, 302.0, 320.0, 132.0, 44.0, 16.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-759.6099853515625, -738.594970703125, -717.5798950195312, -696.5648803710938, -675.5498657226562, -654.5347900390625, -633.519775390625, -612.5047607421875, -591.48974609375, -570.4747314453125, -549.4596557617188, -528.4446411132812, -507.42962646484375, -486.4145812988281, -465.3995361328125, -444.384521484375, -423.36944580078125, -402.3544006347656, -381.3393859863281, -360.3243408203125, -339.309326171875, -318.2942810058594, -297.27923583984375, -276.26422119140625, -255.24917602539062, -234.23414611816406, -213.2191162109375, -192.20407104492188, -171.1890411376953, -150.17401123046875, -129.15896606445312, -108.14393615722656, -87.12896728515625, -66.11393737792969, -45.098899841308594, -24.083866119384766, -3.0688323974609375, 17.946197509765625, 38.96123504638672, 59.97627258300781, 80.99130249023438, 102.00633239746094, 123.02136993408203, 144.03640747070312, 165.0514373779297, 186.06646728515625, 207.08151245117188, 228.09654235839844, 249.111572265625, 270.1266174316406, 291.1416320800781, 312.15667724609375, 333.17169189453125, 354.1867370605469, 375.2017822265625, 396.216796875, 417.2318420410156, 438.24688720703125, 459.26190185546875, 480.2769470214844, 501.2919921875, 522.3070068359375, 543.322021484375, 564.3370971679688, 585.3521118164062]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 6.0, 3.0, 7.0, 4.0, 10.0, 14.0, 12.0, 16.0, 23.0, 19.0, 34.0, 23.0, 36.0, 37.0, 56.0, 36.0, 65.0, 53.0, 54.0, 53.0, 49.0, 53.0, 48.0, 58.0, 32.0, 30.0, 29.0, 31.0, 23.0, 10.0, 13.0, 13.0, 16.0, 4.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-222.26324462890625, -215.46580505371094, -208.66835021972656, -201.87091064453125, -195.07345581054688, -188.27601623535156, -181.4785614013672, -174.68112182617188, -167.8836669921875, -161.0862274169922, -154.2887725830078, -147.4913330078125, -140.69387817382812, -133.8964385986328, -127.09898376464844, -120.30154418945312, -113.50409698486328, -106.70664978027344, -99.9092025756836, -93.11175537109375, -86.3143081665039, -79.51686096191406, -72.71942138671875, -65.92196655273438, -59.1245231628418, -52.32707595825195, -45.52962875366211, -38.73218536376953, -31.934736251831055, -25.137290954589844, -18.33984375, -11.542396545410156, -4.7449493408203125, 2.052497386932373, 8.849944114685059, 15.647390365600586, 22.44483757019043, 29.24228286743164, 36.039730072021484, 42.83717727661133, 49.63462448120117, 56.432071685791016, 63.22951889038086, 70.02696228027344, 76.82440948486328, 83.62185668945312, 90.41930389404297, 97.21675109863281, 104.01419830322266, 110.8116455078125, 117.60909271240234, 124.40653991699219, 131.2039794921875, 138.00143432617188, 144.7988739013672, 151.59632873535156, 158.39376831054688, 165.1912078857422, 171.98866271972656, 178.78610229492188, 185.58355712890625, 192.38099670410156, 199.17845153808594, 205.97589111328125, 212.77334594726562]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 6.0, 18.0, 25.0, 35.0, 38.0, 66.0, 109.0, 161.0, 239.0, 433.0, 768.0, 1492.0, 3630.0, 12038.0, 3429864.0, 726612.0, 11720.0, 3564.0, 1544.0, 749.0, 444.0, 270.0, 147.0, 97.0, 63.0, 37.0, 29.0, 25.0, 19.0, 10.0, 6.0, 7.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-68.5, -66.7431640625, -64.986328125, -63.2294921875, -61.47265625, -59.7158203125, -57.958984375, -56.2021484375, -54.4453125, -52.6884765625, -50.931640625, -49.1748046875, -47.41796875, -45.6611328125, -43.904296875, -42.1474609375, -40.390625, -38.6337890625, -36.876953125, -35.1201171875, -33.36328125, -31.6064453125, -29.849609375, -28.0927734375, -26.3359375, -24.5791015625, -22.822265625, -21.0654296875, -19.30859375, -17.5517578125, -15.794921875, -14.0380859375, -12.28125, -10.5244140625, -8.767578125, -7.0107421875, -5.25390625, -3.4970703125, -1.740234375, 0.0166015625, 1.7734375, 3.5302734375, 5.287109375, 7.0439453125, 8.80078125, 10.5576171875, 12.314453125, 14.0712890625, 15.828125, 17.5849609375, 19.341796875, 21.0986328125, 22.85546875, 24.6123046875, 26.369140625, 28.1259765625, 29.8828125, 31.6396484375, 33.396484375, 35.1533203125, 36.91015625, 38.6669921875, 40.423828125, 42.1806640625, 43.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 8.0, 9.0, 19.0, 30.0, 27.0, 45.0, 49.0, 51.0, 70.0, 84.0, 85.0, 97.0, 89.0, 79.0, 55.0, 42.0, 51.0, 39.0, 13.0, 11.0, 16.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.640625, -14.16943359375, -13.6982421875, -13.22705078125, -12.755859375, -12.28466796875, -11.8134765625, -11.34228515625, -10.87109375, -10.39990234375, -9.9287109375, -9.45751953125, -8.986328125, -8.51513671875, -8.0439453125, -7.57275390625, -7.1015625, -6.63037109375, -6.1591796875, -5.68798828125, -5.216796875, -4.74560546875, -4.2744140625, -3.80322265625, -3.33203125, -2.86083984375, -2.3896484375, -1.91845703125, -1.447265625, -0.97607421875, -0.5048828125, -0.03369140625, 0.4375, 0.90869140625, 1.3798828125, 1.85107421875, 2.322265625, 2.79345703125, 3.2646484375, 3.73583984375, 4.20703125, 4.67822265625, 5.1494140625, 5.62060546875, 6.091796875, 6.56298828125, 7.0341796875, 7.50537109375, 7.9765625, 8.44775390625, 8.9189453125, 9.39013671875, 9.861328125, 10.33251953125, 10.8037109375, 11.27490234375, 11.74609375, 12.21728515625, 12.6884765625, 13.15966796875, 13.630859375, 14.10205078125, 14.5732421875, 15.04443359375, 15.515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 19.0, 8.0, 23.0, 25.0, 33.0, 47.0, 59.0, 84.0, 117.0, 173.0, 279.0, 380.0, 634.0, 1087.0, 2022.0, 5010.0, 16640.0, 580488.0, 3558904.0, 17934.0, 5163.0, 2089.0, 1028.0, 657.0, 402.0, 292.0, 209.0, 116.0, 92.0, 81.0, 57.0, 32.0, 27.0, 22.0, 16.0, 11.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-69.9375, -68.09814453125, -66.2587890625, -64.41943359375, -62.580078125, -60.74072265625, -58.9013671875, -57.06201171875, -55.22265625, -53.38330078125, -51.5439453125, -49.70458984375, -47.865234375, -46.02587890625, -44.1865234375, -42.34716796875, -40.5078125, -38.66845703125, -36.8291015625, -34.98974609375, -33.150390625, -31.31103515625, -29.4716796875, -27.63232421875, -25.79296875, -23.95361328125, -22.1142578125, -20.27490234375, -18.435546875, -16.59619140625, -14.7568359375, -12.91748046875, -11.078125, -9.23876953125, -7.3994140625, -5.56005859375, -3.720703125, -1.88134765625, -0.0419921875, 1.79736328125, 3.63671875, 5.47607421875, 7.3154296875, 9.15478515625, 10.994140625, 12.83349609375, 14.6728515625, 16.51220703125, 18.3515625, 20.19091796875, 22.0302734375, 23.86962890625, 25.708984375, 27.54833984375, 29.3876953125, 31.22705078125, 33.06640625, 34.90576171875, 36.7451171875, 38.58447265625, 40.423828125, 42.26318359375, 44.1025390625, 45.94189453125, 47.78125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 8.0, 4.0, 7.0, 23.0, 39.0, 114.0, 3428.0, 310.0, 53.0, 22.0, 16.0, 13.0, 8.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.4375, -23.6416015625, -22.845703125, -22.0498046875, -21.25390625, -20.4580078125, -19.662109375, -18.8662109375, -18.0703125, -17.2744140625, -16.478515625, -15.6826171875, -14.88671875, -14.0908203125, -13.294921875, -12.4990234375, -11.703125, -10.9072265625, -10.111328125, -9.3154296875, -8.51953125, -7.7236328125, -6.927734375, -6.1318359375, -5.3359375, -4.5400390625, -3.744140625, -2.9482421875, -2.15234375, -1.3564453125, -0.560546875, 0.2353515625, 1.03125, 1.8271484375, 2.623046875, 3.4189453125, 4.21484375, 5.0107421875, 5.806640625, 6.6025390625, 7.3984375, 8.1943359375, 8.990234375, 9.7861328125, 10.58203125, 11.3779296875, 12.173828125, 12.9697265625, 13.765625, 14.5615234375, 15.357421875, 16.1533203125, 16.94921875, 17.7451171875, 18.541015625, 19.3369140625, 20.1328125, 20.9287109375, 21.724609375, 22.5205078125, 23.31640625, 24.1123046875, 24.908203125, 25.7041015625, 26.5]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 2.0, 18.0, 34.0, 42.0, 109.0, 182.0, 177.0, 163.0, 93.0, 57.0, 36.0, 17.0, 12.0, 14.0, 5.0, 8.0, 6.0, 9.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-117.29229736328125, -113.61597442626953, -109.93964385986328, -106.26332092285156, -102.58699798583984, -98.91067504882812, -95.23434448242188, -91.55802154541016, -87.88169860839844, -84.20537567138672, -80.52904510498047, -76.85272216796875, -73.17639923095703, -69.50007629394531, -65.82374572753906, -62.147422790527344, -58.47109603881836, -54.794769287109375, -51.118446350097656, -47.44211959838867, -43.76579666137695, -40.08946990966797, -36.41314697265625, -32.736820220947266, -29.060495376586914, -25.384170532226562, -21.70784568786621, -18.03152084350586, -14.355195045471191, -10.678869247436523, -7.002544403076172, -3.3262195587158203, 0.35010528564453125, 4.026430130004883, 7.702755451202393, 11.379080772399902, 15.055405616760254, 18.731731414794922, 22.408056259155273, 26.084381103515625, 29.760705947875977, 33.43703079223633, 37.11335754394531, 40.78968048095703, 44.466007232666016, 48.142333984375, 51.81865692138672, 55.49497985839844, 59.17130661010742, 62.847633361816406, 66.52395629882812, 70.20027923583984, 73.8766098022461, 77.55293273925781, 81.22925567626953, 84.90557861328125, 88.5819091796875, 92.25823211669922, 95.93456268310547, 99.61088562011719, 103.2872085571289, 106.96353149414062, 110.63986206054688, 114.3161849975586, 117.99250793457031]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 4.0, 10.0, 8.0, 13.0, 14.0, 24.0, 16.0, 19.0, 25.0, 27.0, 34.0, 36.0, 39.0, 33.0, 55.0, 39.0, 33.0, 55.0, 42.0, 49.0, 39.0, 48.0, 48.0, 41.0, 36.0, 26.0, 38.0, 29.0, 16.0, 18.0, 12.0, 14.0, 12.0, 7.0, 8.0, 8.0, 8.0, 3.0, 5.0, 1.0, 2.0, 3.0], "bins": [-69.52024841308594, -67.7821044921875, -66.04396057128906, -64.30581665039062, -62.56767272949219, -60.82952880859375, -59.09138488769531, -57.353240966796875, -55.61509704589844, -53.876953125, -52.13880920410156, -50.400665283203125, -48.66252136230469, -46.92437744140625, -45.18623352050781, -43.448089599609375, -41.70994567871094, -39.9718017578125, -38.23365783691406, -36.495513916015625, -34.75736999511719, -33.01922607421875, -31.281082153320312, -29.542938232421875, -27.804790496826172, -26.066646575927734, -24.328502655029297, -22.59035873413086, -20.852214813232422, -19.114070892333984, -17.375926971435547, -15.637782096862793, -13.899639129638672, -12.161495208740234, -10.423351287841797, -8.68520736694336, -6.947062969207764, -5.208918571472168, -3.4707746505737305, -1.732630729675293, 0.005513191223144531, 1.7436572313308716, 3.4818012714385986, 5.219945430755615, 6.958089351654053, 8.696233749389648, 10.434377670288086, 12.172521591186523, 13.910665512084961, 15.648809432983398, 17.386953353881836, 19.125097274780273, 20.86324119567871, 22.60138702392578, 24.33953094482422, 26.077674865722656, 27.815818786621094, 29.55396270751953, 31.29210662841797, 33.030250549316406, 34.768394470214844, 36.50653839111328, 38.24468231201172, 39.982826232910156, 41.720970153808594]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 10.0, 8.0, 15.0, 27.0, 35.0, 47.0, 74.0, 94.0, 145.0, 241.0, 428.0, 840.0, 1727.0, 4178.0, 11138.0, 35524.0, 141699.0, 530470.0, 239718.0, 55283.0, 16376.0, 5776.0, 2256.0, 1065.0, 536.0, 288.0, 185.0, 104.0, 70.0, 59.0, 36.0, 26.0, 11.0, 15.0, 11.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-39.375, -38.20556640625, -37.0361328125, -35.86669921875, -34.697265625, -33.52783203125, -32.3583984375, -31.18896484375, -30.01953125, -28.85009765625, -27.6806640625, -26.51123046875, -25.341796875, -24.17236328125, -23.0029296875, -21.83349609375, -20.6640625, -19.49462890625, -18.3251953125, -17.15576171875, -15.986328125, -14.81689453125, -13.6474609375, -12.47802734375, -11.30859375, -10.13916015625, -8.9697265625, -7.80029296875, -6.630859375, -5.46142578125, -4.2919921875, -3.12255859375, -1.953125, -0.78369140625, 0.3857421875, 1.55517578125, 2.724609375, 3.89404296875, 5.0634765625, 6.23291015625, 7.40234375, 8.57177734375, 9.7412109375, 10.91064453125, 12.080078125, 13.24951171875, 14.4189453125, 15.58837890625, 16.7578125, 17.92724609375, 19.0966796875, 20.26611328125, 21.435546875, 22.60498046875, 23.7744140625, 24.94384765625, 26.11328125, 27.28271484375, 28.4521484375, 29.62158203125, 30.791015625, 31.96044921875, 33.1298828125, 34.29931640625, 35.46875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 11.0, 15.0, 19.0, 19.0, 38.0, 47.0, 60.0, 71.0, 69.0, 92.0, 91.0, 77.0, 80.0, 59.0, 72.0, 43.0, 41.0, 34.0, 25.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.509765625, -16.95703125, -16.404296875, -15.8515625, -15.298828125, -14.74609375, -14.193359375, -13.640625, -13.087890625, -12.53515625, -11.982421875, -11.4296875, -10.876953125, -10.32421875, -9.771484375, -9.21875, -8.666015625, -8.11328125, -7.560546875, -7.0078125, -6.455078125, -5.90234375, -5.349609375, -4.796875, -4.244140625, -3.69140625, -3.138671875, -2.5859375, -2.033203125, -1.48046875, -0.927734375, -0.375, 0.177734375, 0.73046875, 1.283203125, 1.8359375, 2.388671875, 2.94140625, 3.494140625, 4.046875, 4.599609375, 5.15234375, 5.705078125, 6.2578125, 6.810546875, 7.36328125, 7.916015625, 8.46875, 9.021484375, 9.57421875, 10.126953125, 10.6796875, 11.232421875, 11.78515625, 12.337890625, 12.890625, 13.443359375, 13.99609375, 14.548828125, 15.1015625, 15.654296875, 16.20703125, 16.759765625, 17.3125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 10.0, 12.0, 11.0, 24.0, 23.0, 38.0, 68.0, 111.0, 152.0, 230.0, 360.0, 856.0, 1910.0, 5261.0, 25960.0, 308624.0, 646998.0, 45435.0, 7693.0, 2434.0, 1023.0, 500.0, 269.0, 205.0, 117.0, 82.0, 44.0, 40.0, 14.0, 12.0, 10.0, 4.0, 6.0, 5.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.21875, -50.36279296875, -48.5068359375, -46.65087890625, -44.794921875, -42.93896484375, -41.0830078125, -39.22705078125, -37.37109375, -35.51513671875, -33.6591796875, -31.80322265625, -29.947265625, -28.09130859375, -26.2353515625, -24.37939453125, -22.5234375, -20.66748046875, -18.8115234375, -16.95556640625, -15.099609375, -13.24365234375, -11.3876953125, -9.53173828125, -7.67578125, -5.81982421875, -3.9638671875, -2.10791015625, -0.251953125, 1.60400390625, 3.4599609375, 5.31591796875, 7.171875, 9.02783203125, 10.8837890625, 12.73974609375, 14.595703125, 16.45166015625, 18.3076171875, 20.16357421875, 22.01953125, 23.87548828125, 25.7314453125, 27.58740234375, 29.443359375, 31.29931640625, 33.1552734375, 35.01123046875, 36.8671875, 38.72314453125, 40.5791015625, 42.43505859375, 44.291015625, 46.14697265625, 48.0029296875, 49.85888671875, 51.71484375, 53.57080078125, 55.4267578125, 57.28271484375, 59.138671875, 60.99462890625, 62.8505859375, 64.70654296875, 66.5625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 10.0, 4.0, 13.0, 18.0, 16.0, 25.0, 26.0, 32.0, 27.0, 37.0, 39.0, 49.0, 44.0, 49.0, 46.0, 50.0, 65.0, 43.0, 52.0, 50.0, 46.0, 47.0, 33.0, 37.0, 23.0, 25.0, 14.0, 22.0, 18.0, 7.0, 6.0, 7.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.53125, -44.91845703125, -43.3056640625, -41.69287109375, -40.080078125, -38.46728515625, -36.8544921875, -35.24169921875, -33.62890625, -32.01611328125, -30.4033203125, -28.79052734375, -27.177734375, -25.56494140625, -23.9521484375, -22.33935546875, -20.7265625, -19.11376953125, -17.5009765625, -15.88818359375, -14.275390625, -12.66259765625, -11.0498046875, -9.43701171875, -7.82421875, -6.21142578125, -4.5986328125, -2.98583984375, -1.373046875, 0.23974609375, 1.8525390625, 3.46533203125, 5.078125, 6.69091796875, 8.3037109375, 9.91650390625, 11.529296875, 13.14208984375, 14.7548828125, 16.36767578125, 17.98046875, 19.59326171875, 21.2060546875, 22.81884765625, 24.431640625, 26.04443359375, 27.6572265625, 29.27001953125, 30.8828125, 32.49560546875, 34.1083984375, 35.72119140625, 37.333984375, 38.94677734375, 40.5595703125, 42.17236328125, 43.78515625, 45.39794921875, 47.0107421875, 48.62353515625, 50.236328125, 51.84912109375, 53.4619140625, 55.07470703125, 56.6875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 10.0, 6.0, 13.0, 13.0, 18.0, 28.0, 41.0, 67.0, 122.0, 169.0, 303.0, 526.0, 1055.0, 2130.0, 5130.0, 15467.0, 69889.0, 600049.0, 295519.0, 40232.0, 10384.0, 3806.0, 1639.0, 846.0, 433.0, 236.0, 140.0, 100.0, 53.0, 37.0, 30.0, 19.0, 8.0, 11.0, 5.0, 11.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-16.203125, -15.7509765625, -15.298828125, -14.8466796875, -14.39453125, -13.9423828125, -13.490234375, -13.0380859375, -12.5859375, -12.1337890625, -11.681640625, -11.2294921875, -10.77734375, -10.3251953125, -9.873046875, -9.4208984375, -8.96875, -8.5166015625, -8.064453125, -7.6123046875, -7.16015625, -6.7080078125, -6.255859375, -5.8037109375, -5.3515625, -4.8994140625, -4.447265625, -3.9951171875, -3.54296875, -3.0908203125, -2.638671875, -2.1865234375, -1.734375, -1.2822265625, -0.830078125, -0.3779296875, 0.07421875, 0.5263671875, 0.978515625, 1.4306640625, 1.8828125, 2.3349609375, 2.787109375, 3.2392578125, 3.69140625, 4.1435546875, 4.595703125, 5.0478515625, 5.5, 5.9521484375, 6.404296875, 6.8564453125, 7.30859375, 7.7607421875, 8.212890625, 8.6650390625, 9.1171875, 9.5693359375, 10.021484375, 10.4736328125, 10.92578125, 11.3779296875, 11.830078125, 12.2822265625, 12.734375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 10.0, 16.0, 15.0, 18.0, 23.0, 36.0, 56.0, 79.0, 118.0, 159.0, 125.0, 97.0, 60.0, 29.0, 43.0, 20.0, 16.0, 21.0, 14.0, 4.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002475738525390625, -0.002386629581451416, -0.002297520637512207, -0.002208411693572998, -0.002119302749633789, -0.00203019380569458, -0.001941084861755371, -0.0018519759178161621, -0.0017628669738769531, -0.0016737580299377441, -0.0015846490859985352, -0.0014955401420593262, -0.0014064311981201172, -0.0013173222541809082, -0.0012282133102416992, -0.0011391043663024902, -0.0010499954223632812, -0.0009608864784240723, -0.0008717775344848633, -0.0007826685905456543, -0.0006935596466064453, -0.0006044507026672363, -0.0005153417587280273, -0.00042623281478881836, -0.0003371238708496094, -0.0002480149269104004, -0.0001589059829711914, -6.979703903198242e-05, 1.9311904907226562e-05, 0.00010842084884643555, 0.00019752979278564453, 0.0002866387367248535, 0.0003757476806640625, 0.0004648566246032715, 0.0005539655685424805, 0.0006430745124816895, 0.0007321834564208984, 0.0008212924003601074, 0.0009104013442993164, 0.0009995102882385254, 0.0010886192321777344, 0.0011777281761169434, 0.0012668371200561523, 0.0013559460639953613, 0.0014450550079345703, 0.0015341639518737793, 0.0016232728958129883, 0.0017123818397521973, 0.0018014907836914062, 0.0018905997276306152, 0.0019797086715698242, 0.002068817615509033, 0.002157926559448242, 0.002247035503387451, 0.00233614444732666, 0.002425253391265869, 0.002514362335205078, 0.002603471279144287, 0.002692580223083496, 0.002781689167022705, 0.002870798110961914, 0.002959907054901123, 0.003049015998840332, 0.003138124942779541, 0.00322723388671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 10.0, 18.0, 21.0, 16.0, 30.0, 50.0, 74.0, 119.0, 192.0, 316.0, 530.0, 1115.0, 2428.0, 6648.0, 25828.0, 202136.0, 701028.0, 84669.0, 15049.0, 4512.0, 1732.0, 863.0, 452.0, 264.0, 137.0, 90.0, 46.0, 41.0, 35.0, 25.0, 17.0, 19.0, 7.0, 5.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.4375, -15.91259765625, -15.3876953125, -14.86279296875, -14.337890625, -13.81298828125, -13.2880859375, -12.76318359375, -12.23828125, -11.71337890625, -11.1884765625, -10.66357421875, -10.138671875, -9.61376953125, -9.0888671875, -8.56396484375, -8.0390625, -7.51416015625, -6.9892578125, -6.46435546875, -5.939453125, -5.41455078125, -4.8896484375, -4.36474609375, -3.83984375, -3.31494140625, -2.7900390625, -2.26513671875, -1.740234375, -1.21533203125, -0.6904296875, -0.16552734375, 0.359375, 0.88427734375, 1.4091796875, 1.93408203125, 2.458984375, 2.98388671875, 3.5087890625, 4.03369140625, 4.55859375, 5.08349609375, 5.6083984375, 6.13330078125, 6.658203125, 7.18310546875, 7.7080078125, 8.23291015625, 8.7578125, 9.28271484375, 9.8076171875, 10.33251953125, 10.857421875, 11.38232421875, 11.9072265625, 12.43212890625, 12.95703125, 13.48193359375, 14.0068359375, 14.53173828125, 15.056640625, 15.58154296875, 16.1064453125, 16.63134765625, 17.15625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 4.0, 11.0, 12.0, 15.0, 28.0, 41.0, 84.0, 86.0, 119.0, 123.0, 133.0, 104.0, 87.0, 65.0, 24.0, 19.0, 13.0, 8.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.015625, -16.323486328125, -15.63134765625, -14.939208984375, -14.2470703125, -13.554931640625, -12.86279296875, -12.170654296875, -11.478515625, -10.786376953125, -10.09423828125, -9.402099609375, -8.7099609375, -8.017822265625, -7.32568359375, -6.633544921875, -5.94140625, -5.249267578125, -4.55712890625, -3.864990234375, -3.1728515625, -2.480712890625, -1.78857421875, -1.096435546875, -0.404296875, 0.287841796875, 0.97998046875, 1.672119140625, 2.3642578125, 3.056396484375, 3.74853515625, 4.440673828125, 5.1328125, 5.824951171875, 6.51708984375, 7.209228515625, 7.9013671875, 8.593505859375, 9.28564453125, 9.977783203125, 10.669921875, 11.362060546875, 12.05419921875, 12.746337890625, 13.4384765625, 14.130615234375, 14.82275390625, 15.514892578125, 16.20703125, 16.899169921875, 17.59130859375, 18.283447265625, 18.9755859375, 19.667724609375, 20.35986328125, 21.052001953125, 21.744140625, 22.436279296875, 23.12841796875, 23.820556640625, 24.5126953125, 25.204833984375, 25.89697265625, 26.589111328125, 27.28125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 5.0, 1.0, 5.0, 11.0, 21.0, 24.0, 23.0, 40.0, 62.0, 91.0, 137.0, 166.0, 138.0, 88.0, 67.0, 49.0, 21.0, 16.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.4237976074219, -279.2752380371094, -270.12664794921875, -260.97808837890625, -251.82949829101562, -242.68093872070312, -233.53236389160156, -224.3837890625, -215.23521423339844, -206.08663940429688, -196.9380645751953, -187.78948974609375, -178.64093017578125, -169.49234008789062, -160.34378051757812, -151.19520568847656, -142.046630859375, -132.89805603027344, -123.74948120117188, -114.60091400146484, -105.45233917236328, -96.30376434326172, -87.15519714355469, -78.00662231445312, -68.85804748535156, -59.70947265625, -50.5609016418457, -41.412330627441406, -32.263755798339844, -23.11518096923828, -13.966609954833984, -4.8180389404296875, 4.33050537109375, 13.47907829284668, 22.62765121459961, 31.77622413635254, 40.92479705810547, 50.07337188720703, 59.22194290161133, 68.37051391601562, 77.51908874511719, 86.66766357421875, 95.81623840332031, 104.96480560302734, 114.1133804321289, 123.26195526123047, 132.4105224609375, 141.55909729003906, 150.70767211914062, 159.8562469482422, 169.00482177734375, 178.1533966064453, 187.30197143554688, 196.45053100585938, 205.59910583496094, 214.7476806640625, 223.89625549316406, 233.04483032226562, 242.1934051513672, 251.34197998046875, 260.49053955078125, 269.6391296386719, 278.7876892089844, 287.936279296875, 297.0848388671875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 4.0, 11.0, 10.0, 17.0, 20.0, 18.0, 29.0, 33.0, 42.0, 33.0, 50.0, 64.0, 64.0, 61.0, 68.0, 66.0, 56.0, 47.0, 62.0, 45.0, 39.0, 51.0, 27.0, 15.0, 13.0, 16.0, 7.0, 5.0, 4.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-245.83233642578125, -237.46595764160156, -229.0995635986328, -220.73318481445312, -212.36679077148438, -204.0004119873047, -195.634033203125, -187.26763916015625, -178.90126037597656, -170.53488159179688, -162.16848754882812, -153.80210876464844, -145.43572998046875, -137.0693359375, -128.7029571533203, -120.3365707397461, -111.97018432617188, -103.60379791259766, -95.23741149902344, -86.87103271484375, -78.50464630126953, -70.13825988769531, -61.77187728881836, -53.405494689941406, -45.03910827636719, -36.67272186279297, -28.306339263916016, -19.93995475769043, -11.573570251464844, -3.207183837890625, 5.159198760986328, 13.525581359863281, 21.8919677734375, 30.258352279663086, 38.62473678588867, 46.991119384765625, 55.357505798339844, 63.72389221191406, 72.09027099609375, 80.45665740966797, 88.82304382324219, 97.1894302368164, 105.55581665039062, 113.92219543457031, 122.28858184814453, 130.65496826171875, 139.02134704589844, 147.38772583007812, 155.75411987304688, 164.12049865722656, 172.4868927001953, 180.853271484375, 189.21966552734375, 197.58604431152344, 205.95242309570312, 214.31881713867188, 222.68519592285156, 231.05157470703125, 239.41796875, 247.7843475341797, 256.1507263183594, 264.5171203613281, 272.8835144042969, 281.2498779296875, 289.61627197265625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 11.0, 41.0, 75.0, 129.0, 295.0, 575.0, 1266.0, 3192.0, 8440.0, 28165.0, 220998.0, 3824497.0, 79194.0, 17401.0, 5721.0, 2200.0, 972.0, 501.0, 236.0, 115.0, 84.0, 59.0, 36.0, 24.0, 11.0, 16.0, 3.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.421875, -25.182861328125, -23.94384765625, -22.704833984375, -21.4658203125, -20.226806640625, -18.98779296875, -17.748779296875, -16.509765625, -15.270751953125, -14.03173828125, -12.792724609375, -11.5537109375, -10.314697265625, -9.07568359375, -7.836669921875, -6.59765625, -5.358642578125, -4.11962890625, -2.880615234375, -1.6416015625, -0.402587890625, 0.83642578125, 2.075439453125, 3.314453125, 4.553466796875, 5.79248046875, 7.031494140625, 8.2705078125, 9.509521484375, 10.74853515625, 11.987548828125, 13.2265625, 14.465576171875, 15.70458984375, 16.943603515625, 18.1826171875, 19.421630859375, 20.66064453125, 21.899658203125, 23.138671875, 24.377685546875, 25.61669921875, 26.855712890625, 28.0947265625, 29.333740234375, 30.57275390625, 31.811767578125, 33.05078125, 34.289794921875, 35.52880859375, 36.767822265625, 38.0068359375, 39.245849609375, 40.48486328125, 41.723876953125, 42.962890625, 44.201904296875, 45.44091796875, 46.679931640625, 47.9189453125, 49.157958984375, 50.39697265625, 51.635986328125, 52.875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 9.0, 7.0, 30.0, 48.0, 57.0, 53.0, 85.0, 106.0, 119.0, 93.0, 96.0, 85.0, 80.0, 47.0, 30.0, 21.0, 8.0, 7.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4375, -10.83349609375, -10.2294921875, -9.62548828125, -9.021484375, -8.41748046875, -7.8134765625, -7.20947265625, -6.60546875, -6.00146484375, -5.3974609375, -4.79345703125, -4.189453125, -3.58544921875, -2.9814453125, -2.37744140625, -1.7734375, -1.16943359375, -0.5654296875, 0.03857421875, 0.642578125, 1.24658203125, 1.8505859375, 2.45458984375, 3.05859375, 3.66259765625, 4.2666015625, 4.87060546875, 5.474609375, 6.07861328125, 6.6826171875, 7.28662109375, 7.890625, 8.49462890625, 9.0986328125, 9.70263671875, 10.306640625, 10.91064453125, 11.5146484375, 12.11865234375, 12.72265625, 13.32666015625, 13.9306640625, 14.53466796875, 15.138671875, 15.74267578125, 16.3466796875, 16.95068359375, 17.5546875, 18.15869140625, 18.7626953125, 19.36669921875, 19.970703125, 20.57470703125, 21.1787109375, 21.78271484375, 22.38671875, 22.99072265625, 23.5947265625, 24.19873046875, 24.802734375, 25.40673828125, 26.0107421875, 26.61474609375, 27.21875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 7.0, 10.0, 21.0, 26.0, 50.0, 51.0, 109.0, 191.0, 334.0, 670.0, 1575.0, 4426.0, 15231.0, 68166.0, 3479665.0, 564684.0, 42521.0, 10366.0, 3388.0, 1398.0, 566.0, 336.0, 180.0, 118.0, 73.0, 35.0, 25.0, 26.0, 12.0, 2.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.375, -49.9013671875, -48.427734375, -46.9541015625, -45.48046875, -44.0068359375, -42.533203125, -41.0595703125, -39.5859375, -38.1123046875, -36.638671875, -35.1650390625, -33.69140625, -32.2177734375, -30.744140625, -29.2705078125, -27.796875, -26.3232421875, -24.849609375, -23.3759765625, -21.90234375, -20.4287109375, -18.955078125, -17.4814453125, -16.0078125, -14.5341796875, -13.060546875, -11.5869140625, -10.11328125, -8.6396484375, -7.166015625, -5.6923828125, -4.21875, -2.7451171875, -1.271484375, 0.2021484375, 1.67578125, 3.1494140625, 4.623046875, 6.0966796875, 7.5703125, 9.0439453125, 10.517578125, 11.9912109375, 13.46484375, 14.9384765625, 16.412109375, 17.8857421875, 19.359375, 20.8330078125, 22.306640625, 23.7802734375, 25.25390625, 26.7275390625, 28.201171875, 29.6748046875, 31.1484375, 32.6220703125, 34.095703125, 35.5693359375, 37.04296875, 38.5166015625, 39.990234375, 41.4638671875, 42.9375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 9.0, 3.0, 9.0, 13.0, 11.0, 17.0, 31.0, 41.0, 33.0, 54.0, 112.0, 290.0, 1316.0, 1519.0, 287.0, 116.0, 59.0, 47.0, 27.0, 16.0, 13.0, 15.0, 7.0, 12.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.7421875, -37.359375, -35.9765625, -34.59375, -33.2109375, -31.828125, -30.4453125, -29.0625, -27.6796875, -26.296875, -24.9140625, -23.53125, -22.1484375, -20.765625, -19.3828125, -18.0, -16.6171875, -15.234375, -13.8515625, -12.46875, -11.0859375, -9.703125, -8.3203125, -6.9375, -5.5546875, -4.171875, -2.7890625, -1.40625, -0.0234375, 1.359375, 2.7421875, 4.125, 5.5078125, 6.890625, 8.2734375, 9.65625, 11.0390625, 12.421875, 13.8046875, 15.1875, 16.5703125, 17.953125, 19.3359375, 20.71875, 22.1015625, 23.484375, 24.8671875, 26.25, 27.6328125, 29.015625, 30.3984375, 31.78125, 33.1640625, 34.546875, 35.9296875, 37.3125, 38.6953125, 40.078125, 41.4609375, 42.84375, 44.2265625, 45.609375, 46.9921875, 48.375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 8.0, 22.0, 26.0, 54.0, 46.0, 101.0, 148.0, 158.0, 157.0, 100.0, 60.0, 37.0, 18.0, 11.0, 12.0, 4.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.23724365234375, -263.87884521484375, -255.5204315185547, -247.16201782226562, -238.80361938476562, -230.44520568847656, -222.0867919921875, -213.7283935546875, -205.3699951171875, -197.01158142089844, -188.65318298339844, -180.29476928710938, -171.93637084960938, -163.5779571533203, -155.21954345703125, -146.86114501953125, -138.5027313232422, -130.14431762695312, -121.78591918945312, -113.42750549316406, -105.06910705566406, -96.710693359375, -88.35228729248047, -79.99388122558594, -71.6354751586914, -63.277069091796875, -54.918663024902344, -46.56025314331055, -38.201847076416016, -29.843441009521484, -21.485031127929688, -13.126625061035156, -4.768218994140625, 3.5901880264282227, 11.94859504699707, 20.307003021240234, 28.665409088134766, 37.0238151550293, 45.382225036621094, 53.740631103515625, 62.099037170410156, 70.45744323730469, 78.81584930419922, 87.17425537109375, 95.53266906738281, 103.89106750488281, 112.24948120117188, 120.6078872680664, 128.96629333496094, 137.32470703125, 145.68310546875, 154.04151916503906, 162.39991760253906, 170.75833129882812, 179.11672973632812, 187.4751434326172, 195.83355712890625, 204.1919708251953, 212.5503692626953, 220.90878295898438, 229.26718139648438, 237.62559509277344, 245.9840087890625, 254.3424072265625, 262.7008056640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 14.0, 8.0, 26.0, 26.0, 26.0, 50.0, 47.0, 53.0, 73.0, 62.0, 63.0, 78.0, 72.0, 65.0, 77.0, 52.0, 40.0, 37.0, 28.0, 17.0, 25.0, 7.0, 13.0, 9.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.37545776367188, -156.95108032226562, -150.52671813964844, -144.1023406982422, -137.67796325683594, -131.25360107421875, -124.8292236328125, -118.40484619140625, -111.98047637939453, -105.55610656738281, -99.13172912597656, -92.70735931396484, -86.28298950195312, -79.85861206054688, -73.43424224853516, -67.00987243652344, -60.58549499511719, -54.1611213684082, -47.73674774169922, -41.3123779296875, -34.888004302978516, -28.46363067626953, -22.039260864257812, -15.614887237548828, -9.190513610839844, -2.766140937805176, 3.658231735229492, 10.082603454589844, 16.506977081298828, 22.931350708007812, 29.35572052001953, 35.780094146728516, 42.2044677734375, 48.628841400146484, 55.05321502685547, 61.47758483886719, 67.90196228027344, 74.32633209228516, 80.75070190429688, 87.17507934570312, 93.59944915771484, 100.02381896972656, 106.44819641113281, 112.87256622314453, 119.29693603515625, 125.7213134765625, 132.14569091796875, 138.57005310058594, 144.9944305419922, 151.41880798339844, 157.84317016601562, 164.26754760742188, 170.69192504882812, 177.11630249023438, 183.54066467285156, 189.9650421142578, 196.389404296875, 202.81378173828125, 209.23814392089844, 215.6625213623047, 222.08689880371094, 228.51126098632812, 234.93563842773438, 241.36001586914062, 247.78439331054688]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 10.0, 2.0, 12.0, 15.0, 19.0, 31.0, 37.0, 57.0, 89.0, 124.0, 172.0, 239.0, 345.0, 569.0, 783.0, 1158.0, 1742.0, 2797.0, 4491.0, 7774.0, 13899.0, 26356.0, 54101.0, 120721.0, 293674.0, 287329.0, 118979.0, 53208.0, 26092.0, 13634.0, 7490.0, 4491.0, 2742.0, 1754.0, 1163.0, 756.0, 502.0, 364.0, 247.0, 184.0, 116.0, 82.0, 73.0, 43.0, 28.0, 17.0, 14.0, 17.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-19.765625, -19.18408203125, -18.6025390625, -18.02099609375, -17.439453125, -16.85791015625, -16.2763671875, -15.69482421875, -15.11328125, -14.53173828125, -13.9501953125, -13.36865234375, -12.787109375, -12.20556640625, -11.6240234375, -11.04248046875, -10.4609375, -9.87939453125, -9.2978515625, -8.71630859375, -8.134765625, -7.55322265625, -6.9716796875, -6.39013671875, -5.80859375, -5.22705078125, -4.6455078125, -4.06396484375, -3.482421875, -2.90087890625, -2.3193359375, -1.73779296875, -1.15625, -0.57470703125, 0.0068359375, 0.58837890625, 1.169921875, 1.75146484375, 2.3330078125, 2.91455078125, 3.49609375, 4.07763671875, 4.6591796875, 5.24072265625, 5.822265625, 6.40380859375, 6.9853515625, 7.56689453125, 8.1484375, 8.72998046875, 9.3115234375, 9.89306640625, 10.474609375, 11.05615234375, 11.6376953125, 12.21923828125, 12.80078125, 13.38232421875, 13.9638671875, 14.54541015625, 15.126953125, 15.70849609375, 16.2900390625, 16.87158203125, 17.453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 5.0, 7.0, 7.0, 10.0, 15.0, 18.0, 18.0, 22.0, 23.0, 31.0, 33.0, 45.0, 61.0, 56.0, 63.0, 63.0, 63.0, 61.0, 54.0, 55.0, 49.0, 43.0, 35.0, 40.0, 31.0, 21.0, 20.0, 8.0, 16.0, 13.0, 2.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.064697265625, -8.70751953125, -8.350341796875, -7.9931640625, -7.635986328125, -7.27880859375, -6.921630859375, -6.564453125, -6.207275390625, -5.85009765625, -5.492919921875, -5.1357421875, -4.778564453125, -4.42138671875, -4.064208984375, -3.70703125, -3.349853515625, -2.99267578125, -2.635498046875, -2.2783203125, -1.921142578125, -1.56396484375, -1.206787109375, -0.849609375, -0.492431640625, -0.13525390625, 0.221923828125, 0.5791015625, 0.936279296875, 1.29345703125, 1.650634765625, 2.0078125, 2.364990234375, 2.72216796875, 3.079345703125, 3.4365234375, 3.793701171875, 4.15087890625, 4.508056640625, 4.865234375, 5.222412109375, 5.57958984375, 5.936767578125, 6.2939453125, 6.651123046875, 7.00830078125, 7.365478515625, 7.72265625, 8.079833984375, 8.43701171875, 8.794189453125, 9.1513671875, 9.508544921875, 9.86572265625, 10.222900390625, 10.580078125, 10.937255859375, 11.29443359375, 11.651611328125, 12.0087890625, 12.365966796875, 12.72314453125, 13.080322265625, 13.4375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 4.0, 5.0, 9.0, 14.0, 11.0, 19.0, 29.0, 46.0, 58.0, 77.0, 124.0, 187.0, 287.0, 529.0, 881.0, 1999.0, 5041.0, 20019.0, 152721.0, 769631.0, 77042.0, 12786.0, 3622.0, 1453.0, 778.0, 400.0, 258.0, 147.0, 108.0, 72.0, 48.0, 44.0, 24.0, 21.0, 11.0, 18.0, 9.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.15625, -49.52490234375, -47.8935546875, -46.26220703125, -44.630859375, -42.99951171875, -41.3681640625, -39.73681640625, -38.10546875, -36.47412109375, -34.8427734375, -33.21142578125, -31.580078125, -29.94873046875, -28.3173828125, -26.68603515625, -25.0546875, -23.42333984375, -21.7919921875, -20.16064453125, -18.529296875, -16.89794921875, -15.2666015625, -13.63525390625, -12.00390625, -10.37255859375, -8.7412109375, -7.10986328125, -5.478515625, -3.84716796875, -2.2158203125, -0.58447265625, 1.046875, 2.67822265625, 4.3095703125, 5.94091796875, 7.572265625, 9.20361328125, 10.8349609375, 12.46630859375, 14.09765625, 15.72900390625, 17.3603515625, 18.99169921875, 20.623046875, 22.25439453125, 23.8857421875, 25.51708984375, 27.1484375, 28.77978515625, 30.4111328125, 32.04248046875, 33.673828125, 35.30517578125, 36.9365234375, 38.56787109375, 40.19921875, 41.83056640625, 43.4619140625, 45.09326171875, 46.724609375, 48.35595703125, 49.9873046875, 51.61865234375, 53.25]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 9.0, 20.0, 14.0, 12.0, 16.0, 22.0, 27.0, 23.0, 24.0, 36.0, 29.0, 42.0, 49.0, 53.0, 57.0, 50.0, 33.0, 46.0, 51.0, 37.0, 45.0, 33.0, 37.0, 24.0, 25.0, 21.0, 25.0, 21.0, 17.0, 17.0, 8.0, 11.0, 14.0, 7.0, 3.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.46875, -41.193359375, -39.91796875, -38.642578125, -37.3671875, -36.091796875, -34.81640625, -33.541015625, -32.265625, -30.990234375, -29.71484375, -28.439453125, -27.1640625, -25.888671875, -24.61328125, -23.337890625, -22.0625, -20.787109375, -19.51171875, -18.236328125, -16.9609375, -15.685546875, -14.41015625, -13.134765625, -11.859375, -10.583984375, -9.30859375, -8.033203125, -6.7578125, -5.482421875, -4.20703125, -2.931640625, -1.65625, -0.380859375, 0.89453125, 2.169921875, 3.4453125, 4.720703125, 5.99609375, 7.271484375, 8.546875, 9.822265625, 11.09765625, 12.373046875, 13.6484375, 14.923828125, 16.19921875, 17.474609375, 18.75, 20.025390625, 21.30078125, 22.576171875, 23.8515625, 25.126953125, 26.40234375, 27.677734375, 28.953125, 30.228515625, 31.50390625, 32.779296875, 34.0546875, 35.330078125, 36.60546875, 37.880859375, 39.15625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 14.0, 10.0, 6.0, 27.0, 29.0, 35.0, 46.0, 68.0, 101.0, 185.0, 301.0, 498.0, 982.0, 2278.0, 6460.0, 27339.0, 306589.0, 648595.0, 41048.0, 8517.0, 2757.0, 1134.0, 598.0, 310.0, 202.0, 111.0, 93.0, 68.0, 29.0, 36.0, 22.0, 8.0, 9.0, 11.0, 9.0, 4.0, 1.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.171875, -25.356689453125, -24.54150390625, -23.726318359375, -22.9111328125, -22.095947265625, -21.28076171875, -20.465576171875, -19.650390625, -18.835205078125, -18.02001953125, -17.204833984375, -16.3896484375, -15.574462890625, -14.75927734375, -13.944091796875, -13.12890625, -12.313720703125, -11.49853515625, -10.683349609375, -9.8681640625, -9.052978515625, -8.23779296875, -7.422607421875, -6.607421875, -5.792236328125, -4.97705078125, -4.161865234375, -3.3466796875, -2.531494140625, -1.71630859375, -0.901123046875, -0.0859375, 0.729248046875, 1.54443359375, 2.359619140625, 3.1748046875, 3.989990234375, 4.80517578125, 5.620361328125, 6.435546875, 7.250732421875, 8.06591796875, 8.881103515625, 9.6962890625, 10.511474609375, 11.32666015625, 12.141845703125, 12.95703125, 13.772216796875, 14.58740234375, 15.402587890625, 16.2177734375, 17.032958984375, 17.84814453125, 18.663330078125, 19.478515625, 20.293701171875, 21.10888671875, 21.924072265625, 22.7392578125, 23.554443359375, 24.36962890625, 25.184814453125, 26.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 30.0, 27.0, 49.0, 94.0, 179.0, 222.0, 124.0, 78.0, 52.0, 31.0, 24.0, 21.0, 11.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005489349365234375, -0.005319178104400635, -0.0051490068435668945, -0.004978835582733154, -0.004808664321899414, -0.004638493061065674, -0.004468321800231934, -0.004298150539398193, -0.004127979278564453, -0.003957808017730713, -0.0037876367568969727, -0.0036174654960632324, -0.003447294235229492, -0.003277122974395752, -0.0031069517135620117, -0.0029367804527282715, -0.0027666091918945312, -0.002596437931060791, -0.0024262666702270508, -0.0022560954093933105, -0.0020859241485595703, -0.00191575288772583, -0.0017455816268920898, -0.0015754103660583496, -0.0014052391052246094, -0.0012350678443908691, -0.001064896583557129, -0.0008947253227233887, -0.0007245540618896484, -0.0005543828010559082, -0.00038421154022216797, -0.00021404027938842773, -4.38690185546875e-05, 0.00012630224227905273, 0.00029647350311279297, 0.0004666447639465332, 0.0006368160247802734, 0.0008069872856140137, 0.000977158546447754, 0.0011473298072814941, 0.0013175010681152344, 0.0014876723289489746, 0.0016578435897827148, 0.001828014850616455, 0.0019981861114501953, 0.0021683573722839355, 0.0023385286331176758, 0.002508699893951416, 0.0026788711547851562, 0.0028490424156188965, 0.0030192136764526367, 0.003189384937286377, 0.003359556198120117, 0.0035297274589538574, 0.0036998987197875977, 0.003870069980621338, 0.004040241241455078, 0.004210412502288818, 0.004380583763122559, 0.004550755023956299, 0.004720926284790039, 0.004891097545623779, 0.0050612688064575195, 0.00523144006729126, 0.005401611328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 5.0, 9.0, 6.0, 11.0, 13.0, 15.0, 20.0, 28.0, 51.0, 59.0, 89.0, 125.0, 186.0, 315.0, 495.0, 885.0, 1886.0, 4603.0, 14463.0, 76920.0, 724554.0, 186513.0, 25036.0, 6673.0, 2638.0, 1227.0, 638.0, 360.0, 220.0, 160.0, 88.0, 72.0, 46.0, 41.0, 23.0, 21.0, 13.0, 14.0, 6.0, 8.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.453125, -20.776123046875, -20.09912109375, -19.422119140625, -18.7451171875, -18.068115234375, -17.39111328125, -16.714111328125, -16.037109375, -15.360107421875, -14.68310546875, -14.006103515625, -13.3291015625, -12.652099609375, -11.97509765625, -11.298095703125, -10.62109375, -9.944091796875, -9.26708984375, -8.590087890625, -7.9130859375, -7.236083984375, -6.55908203125, -5.882080078125, -5.205078125, -4.528076171875, -3.85107421875, -3.174072265625, -2.4970703125, -1.820068359375, -1.14306640625, -0.466064453125, 0.2109375, 0.887939453125, 1.56494140625, 2.241943359375, 2.9189453125, 3.595947265625, 4.27294921875, 4.949951171875, 5.626953125, 6.303955078125, 6.98095703125, 7.657958984375, 8.3349609375, 9.011962890625, 9.68896484375, 10.365966796875, 11.04296875, 11.719970703125, 12.39697265625, 13.073974609375, 13.7509765625, 14.427978515625, 15.10498046875, 15.781982421875, 16.458984375, 17.135986328125, 17.81298828125, 18.489990234375, 19.1669921875, 19.843994140625, 20.52099609375, 21.197998046875, 21.875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 12.0, 11.0, 15.0, 17.0, 20.0, 35.0, 62.0, 62.0, 74.0, 92.0, 105.0, 119.0, 93.0, 77.0, 50.0, 49.0, 29.0, 25.0, 16.0, 10.0, 6.0, 10.0, 8.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.592041015625, -16.82470703125, -16.057373046875, -15.2900390625, -14.522705078125, -13.75537109375, -12.988037109375, -12.220703125, -11.453369140625, -10.68603515625, -9.918701171875, -9.1513671875, -8.384033203125, -7.61669921875, -6.849365234375, -6.08203125, -5.314697265625, -4.54736328125, -3.780029296875, -3.0126953125, -2.245361328125, -1.47802734375, -0.710693359375, 0.056640625, 0.823974609375, 1.59130859375, 2.358642578125, 3.1259765625, 3.893310546875, 4.66064453125, 5.427978515625, 6.1953125, 6.962646484375, 7.72998046875, 8.497314453125, 9.2646484375, 10.031982421875, 10.79931640625, 11.566650390625, 12.333984375, 13.101318359375, 13.86865234375, 14.635986328125, 15.4033203125, 16.170654296875, 16.93798828125, 17.705322265625, 18.47265625, 19.239990234375, 20.00732421875, 20.774658203125, 21.5419921875, 22.309326171875, 23.07666015625, 23.843994140625, 24.611328125, 25.378662109375, 26.14599609375, 26.913330078125, 27.6806640625, 28.447998046875, 29.21533203125, 29.982666015625, 30.75]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 9.0, 26.0, 61.0, 118.0, 249.0, 280.0, 152.0, 62.0, 21.0, 7.0, 8.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-684.4962768554688, -667.06591796875, -649.635498046875, -632.2051391601562, -614.7747802734375, -597.3443603515625, -579.9140014648438, -562.4835815429688, -545.05322265625, -527.6228637695312, -510.19244384765625, -492.7620849609375, -475.3316955566406, -457.90130615234375, -440.470947265625, -423.0405578613281, -405.61016845703125, -388.1797790527344, -370.7493896484375, -353.31903076171875, -335.8886413574219, -318.458251953125, -301.02789306640625, -283.5975036621094, -266.1671142578125, -248.73672485351562, -231.3063507080078, -213.8759765625, -196.44558715820312, -179.01519775390625, -161.58482360839844, -144.15444946289062, -126.72402954101562, -109.29364776611328, -91.86326599121094, -74.4328842163086, -57.00250244140625, -39.572120666503906, -22.141738891601562, -4.711357116699219, 12.719024658203125, 30.14940643310547, 47.57978820800781, 65.01016998291016, 82.4405517578125, 99.87093353271484, 117.30131530761719, 134.731689453125, 152.16207885742188, 169.59246826171875, 187.02284240722656, 204.45321655273438, 221.88360595703125, 239.31399536132812, 256.744384765625, 274.17474365234375, 291.6051330566406, 309.0355224609375, 326.46588134765625, 343.8962707519531, 361.32666015625, 378.7570495605469, 396.18743896484375, 413.6177978515625, 431.0481872558594]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 3.0, 6.0, 15.0, 8.0, 11.0, 14.0, 16.0, 21.0, 25.0, 26.0, 26.0, 33.0, 41.0, 49.0, 44.0, 51.0, 45.0, 60.0, 62.0, 58.0, 43.0, 40.0, 28.0, 38.0, 33.0, 36.0, 37.0, 22.0, 23.0, 14.0, 15.0, 10.0, 7.0, 5.0, 7.0, 8.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-206.066650390625, -200.31167602539062, -194.5567169189453, -188.80174255371094, -183.04678344726562, -177.29180908203125, -171.53684997558594, -165.78187561035156, -160.02691650390625, -154.27194213867188, -148.51698303222656, -142.7620086669922, -137.00704956054688, -131.2520751953125, -125.49711608886719, -119.74214172363281, -113.98717498779297, -108.23220825195312, -102.47724151611328, -96.72227478027344, -90.9673080444336, -85.21234130859375, -79.45736694335938, -73.70240783691406, -67.94743347167969, -62.192466735839844, -56.4375, -50.682533264160156, -44.92756652832031, -39.17259979248047, -33.41762924194336, -27.662662506103516, -21.907699584960938, -16.152732849121094, -10.397765159606934, -4.642797470092773, 1.1121692657470703, 6.867136001586914, 12.62210464477539, 18.377071380615234, 24.132038116455078, 29.887004852294922, 35.641971588134766, 41.396942138671875, 47.15190887451172, 52.90687561035156, 58.661842346191406, 64.41680908203125, 70.1717758178711, 75.92674255371094, 81.68170928955078, 87.43667602539062, 93.19164276123047, 98.94660949707031, 104.70158386230469, 110.45654296875, 116.21151733398438, 121.96648406982422, 127.72145080566406, 133.47642517089844, 139.23138427734375, 144.98635864257812, 150.74131774902344, 156.4962921142578, 162.25125122070312]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 11.0, 14.0, 21.0, 27.0, 59.0, 94.0, 197.0, 323.0, 610.0, 1129.0, 2433.0, 5727.0, 18390.0, 115166.0, 3781952.0, 230278.0, 25016.0, 7181.0, 2848.0, 1299.0, 691.0, 336.0, 177.0, 86.0, 67.0, 46.0, 32.0, 17.0, 12.0, 7.0, 5.0, 1.0, 7.0, 4.0, 6.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.28125, -36.203857421875, -35.12646484375, -34.049072265625, -32.9716796875, -31.894287109375, -30.81689453125, -29.739501953125, -28.662109375, -27.584716796875, -26.50732421875, -25.429931640625, -24.3525390625, -23.275146484375, -22.19775390625, -21.120361328125, -20.04296875, -18.965576171875, -17.88818359375, -16.810791015625, -15.7333984375, -14.656005859375, -13.57861328125, -12.501220703125, -11.423828125, -10.346435546875, -9.26904296875, -8.191650390625, -7.1142578125, -6.036865234375, -4.95947265625, -3.882080078125, -2.8046875, -1.727294921875, -0.64990234375, 0.427490234375, 1.5048828125, 2.582275390625, 3.65966796875, 4.737060546875, 5.814453125, 6.891845703125, 7.96923828125, 9.046630859375, 10.1240234375, 11.201416015625, 12.27880859375, 13.356201171875, 14.43359375, 15.510986328125, 16.58837890625, 17.665771484375, 18.7431640625, 19.820556640625, 20.89794921875, 21.975341796875, 23.052734375, 24.130126953125, 25.20751953125, 26.284912109375, 27.3623046875, 28.439697265625, 29.51708984375, 30.594482421875, 31.671875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 3.0, 7.0, 9.0, 5.0, 15.0, 13.0, 21.0, 29.0, 32.0, 37.0, 34.0, 56.0, 65.0, 61.0, 57.0, 65.0, 61.0, 51.0, 63.0, 66.0, 41.0, 35.0, 33.0, 28.0, 28.0, 26.0, 15.0, 8.0, 13.0, 4.0, 4.0, 6.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.203125, -12.833984375, -12.46484375, -12.095703125, -11.7265625, -11.357421875, -10.98828125, -10.619140625, -10.25, -9.880859375, -9.51171875, -9.142578125, -8.7734375, -8.404296875, -8.03515625, -7.666015625, -7.296875, -6.927734375, -6.55859375, -6.189453125, -5.8203125, -5.451171875, -5.08203125, -4.712890625, -4.34375, -3.974609375, -3.60546875, -3.236328125, -2.8671875, -2.498046875, -2.12890625, -1.759765625, -1.390625, -1.021484375, -0.65234375, -0.283203125, 0.0859375, 0.455078125, 0.82421875, 1.193359375, 1.5625, 1.931640625, 2.30078125, 2.669921875, 3.0390625, 3.408203125, 3.77734375, 4.146484375, 4.515625, 4.884765625, 5.25390625, 5.623046875, 5.9921875, 6.361328125, 6.73046875, 7.099609375, 7.46875, 7.837890625, 8.20703125, 8.576171875, 8.9453125, 9.314453125, 9.68359375, 10.052734375, 10.421875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 1.0, 7.0, 7.0, 10.0, 19.0, 26.0, 24.0, 30.0, 45.0, 48.0, 53.0, 88.0, 140.0, 176.0, 272.0, 402.0, 589.0, 970.0, 1494.0, 2525.0, 4395.0, 8261.0, 17145.0, 41079.0, 127764.0, 1208150.0, 2506472.0, 178060.0, 51214.0, 21135.0, 10309.0, 5330.0, 3039.0, 1782.0, 1154.0, 657.0, 445.0, 288.0, 198.0, 156.0, 85.0, 60.0, 58.0, 42.0, 24.0, 15.0, 13.0, 8.0, 9.0, 7.0, 4.0, 1.0, 1.0, 2.0], "bins": [-23.859375, -23.19873046875, -22.5380859375, -21.87744140625, -21.216796875, -20.55615234375, -19.8955078125, -19.23486328125, -18.57421875, -17.91357421875, -17.2529296875, -16.59228515625, -15.931640625, -15.27099609375, -14.6103515625, -13.94970703125, -13.2890625, -12.62841796875, -11.9677734375, -11.30712890625, -10.646484375, -9.98583984375, -9.3251953125, -8.66455078125, -8.00390625, -7.34326171875, -6.6826171875, -6.02197265625, -5.361328125, -4.70068359375, -4.0400390625, -3.37939453125, -2.71875, -2.05810546875, -1.3974609375, -0.73681640625, -0.076171875, 0.58447265625, 1.2451171875, 1.90576171875, 2.56640625, 3.22705078125, 3.8876953125, 4.54833984375, 5.208984375, 5.86962890625, 6.5302734375, 7.19091796875, 7.8515625, 8.51220703125, 9.1728515625, 9.83349609375, 10.494140625, 11.15478515625, 11.8154296875, 12.47607421875, 13.13671875, 13.79736328125, 14.4580078125, 15.11865234375, 15.779296875, 16.43994140625, 17.1005859375, 17.76123046875, 18.421875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 15.0, 13.0, 13.0, 37.0, 71.0, 76.0, 118.0, 254.0, 530.0, 1290.0, 902.0, 326.0, 143.0, 60.0, 48.0, 41.0, 27.0, 22.0, 14.0, 6.0, 7.0, 8.0, 5.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-43.53125, -42.404296875, -41.27734375, -40.150390625, -39.0234375, -37.896484375, -36.76953125, -35.642578125, -34.515625, -33.388671875, -32.26171875, -31.134765625, -30.0078125, -28.880859375, -27.75390625, -26.626953125, -25.5, -24.373046875, -23.24609375, -22.119140625, -20.9921875, -19.865234375, -18.73828125, -17.611328125, -16.484375, -15.357421875, -14.23046875, -13.103515625, -11.9765625, -10.849609375, -9.72265625, -8.595703125, -7.46875, -6.341796875, -5.21484375, -4.087890625, -2.9609375, -1.833984375, -0.70703125, 0.419921875, 1.546875, 2.673828125, 3.80078125, 4.927734375, 6.0546875, 7.181640625, 8.30859375, 9.435546875, 10.5625, 11.689453125, 12.81640625, 13.943359375, 15.0703125, 16.197265625, 17.32421875, 18.451171875, 19.578125, 20.705078125, 21.83203125, 22.958984375, 24.0859375, 25.212890625, 26.33984375, 27.466796875, 28.59375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 8.0, 7.0, 16.0, 35.0, 72.0, 139.0, 255.0, 235.0, 124.0, 53.0, 27.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-493.7953186035156, -481.5564270019531, -469.3175354003906, -457.0786437988281, -444.8397521972656, -432.6008605957031, -420.3619689941406, -408.1230773925781, -395.8841857910156, -383.6452941894531, -371.4064025878906, -359.1675109863281, -346.9286193847656, -334.6897277832031, -322.4508361816406, -310.2119445800781, -297.9730224609375, -285.734130859375, -273.4952392578125, -261.25634765625, -249.0174560546875, -236.778564453125, -224.5396728515625, -212.30078125, -200.0618896484375, -187.822998046875, -175.5841064453125, -163.34521484375, -151.1063232421875, -138.867431640625, -126.62853240966797, -114.38964080810547, -102.1507568359375, -89.911865234375, -77.6729736328125, -65.43408203125, -53.195186614990234, -40.956295013427734, -28.71739959716797, -16.47850799560547, -4.239616394042969, 7.999276161193848, 20.238168716430664, 32.4770622253418, 44.7159538269043, 56.9548454284668, 69.19374084472656, 81.43263244628906, 93.67152404785156, 105.91041564941406, 118.14930725097656, 130.38819885253906, 142.62709045410156, 154.86598205566406, 167.10488891601562, 179.34378051757812, 191.58267211914062, 203.82156372070312, 216.06045532226562, 228.29934692382812, 240.53823852539062, 252.77713012695312, 265.0160217285156, 277.2549133300781, 289.4938049316406]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 14.0, 17.0, 19.0, 22.0, 27.0, 27.0, 34.0, 58.0, 33.0, 51.0, 50.0, 68.0, 72.0, 60.0, 60.0, 70.0, 58.0, 56.0, 30.0, 32.0, 29.0, 24.0, 17.0, 23.0, 14.0, 9.0, 9.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.53219604492188, -161.57308959960938, -155.61398315429688, -149.65487670898438, -143.69577026367188, -137.73666381835938, -131.77755737304688, -125.81846618652344, -119.85935974121094, -113.90025329589844, -107.94114685058594, -101.98204040527344, -96.02294158935547, -90.06383514404297, -84.10472869873047, -78.1456298828125, -72.18651580810547, -66.22740936279297, -60.268306732177734, -54.309200286865234, -48.35009765625, -42.3909912109375, -36.431884765625, -30.472782135009766, -24.513675689697266, -18.5545711517334, -12.595465660095215, -6.636360168457031, -0.6772556304931641, 5.281848907470703, 11.240955352783203, 17.200057983398438, 23.159164428710938, 29.118268966674805, 35.07737350463867, 41.03647994995117, 46.995582580566406, 52.954689025878906, 58.913795471191406, 64.87289428710938, 70.83200073242188, 76.79110717773438, 82.75021362304688, 88.70932006835938, 94.66841888427734, 100.62752532958984, 106.58663177490234, 112.54573059082031, 118.50484466552734, 124.46395111083984, 130.4230499267578, 136.3821563720703, 142.3412628173828, 148.3003692626953, 154.2594757080078, 160.2185821533203, 166.1776885986328, 172.1367950439453, 178.0959014892578, 184.0550079345703, 190.0141143798828, 195.97320556640625, 201.93231201171875, 207.89141845703125, 213.85052490234375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 22.0, 35.0, 60.0, 83.0, 120.0, 193.0, 342.0, 510.0, 937.0, 1832.0, 3725.0, 7868.0, 18378.0, 47866.0, 146670.0, 437271.0, 255293.0, 77650.0, 27887.0, 11238.0, 5103.0, 2392.0, 1269.0, 713.0, 409.0, 253.0, 141.0, 97.0, 64.0, 40.0, 17.0, 12.0, 15.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-26.59375, -25.827880859375, -25.06201171875, -24.296142578125, -23.5302734375, -22.764404296875, -21.99853515625, -21.232666015625, -20.466796875, -19.700927734375, -18.93505859375, -18.169189453125, -17.4033203125, -16.637451171875, -15.87158203125, -15.105712890625, -14.33984375, -13.573974609375, -12.80810546875, -12.042236328125, -11.2763671875, -10.510498046875, -9.74462890625, -8.978759765625, -8.212890625, -7.447021484375, -6.68115234375, -5.915283203125, -5.1494140625, -4.383544921875, -3.61767578125, -2.851806640625, -2.0859375, -1.320068359375, -0.55419921875, 0.211669921875, 0.9775390625, 1.743408203125, 2.50927734375, 3.275146484375, 4.041015625, 4.806884765625, 5.57275390625, 6.338623046875, 7.1044921875, 7.870361328125, 8.63623046875, 9.402099609375, 10.16796875, 10.933837890625, 11.69970703125, 12.465576171875, 13.2314453125, 13.997314453125, 14.76318359375, 15.529052734375, 16.294921875, 17.060791015625, 17.82666015625, 18.592529296875, 19.3583984375, 20.124267578125, 20.89013671875, 21.656005859375, 22.421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 8.0, 9.0, 11.0, 16.0, 17.0, 19.0, 17.0, 28.0, 27.0, 26.0, 49.0, 50.0, 53.0, 59.0, 50.0, 70.0, 54.0, 51.0, 58.0, 45.0, 42.0, 33.0, 34.0, 33.0, 39.0, 27.0, 15.0, 15.0, 13.0, 10.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9375, -10.55859375, -10.1796875, -9.80078125, -9.421875, -9.04296875, -8.6640625, -8.28515625, -7.90625, -7.52734375, -7.1484375, -6.76953125, -6.390625, -6.01171875, -5.6328125, -5.25390625, -4.875, -4.49609375, -4.1171875, -3.73828125, -3.359375, -2.98046875, -2.6015625, -2.22265625, -1.84375, -1.46484375, -1.0859375, -0.70703125, -0.328125, 0.05078125, 0.4296875, 0.80859375, 1.1875, 1.56640625, 1.9453125, 2.32421875, 2.703125, 3.08203125, 3.4609375, 3.83984375, 4.21875, 4.59765625, 4.9765625, 5.35546875, 5.734375, 6.11328125, 6.4921875, 6.87109375, 7.25, 7.62890625, 8.0078125, 8.38671875, 8.765625, 9.14453125, 9.5234375, 9.90234375, 10.28125, 10.66015625, 11.0390625, 11.41796875, 11.796875, 12.17578125, 12.5546875, 12.93359375, 13.3125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 12.0, 17.0, 20.0, 25.0, 24.0, 55.0, 50.0, 89.0, 135.0, 168.0, 259.0, 410.0, 712.0, 1232.0, 2611.0, 6466.0, 21421.0, 98209.0, 640503.0, 218187.0, 39504.0, 10541.0, 3823.0, 1612.0, 910.0, 559.0, 337.0, 206.0, 131.0, 91.0, 57.0, 40.0, 31.0, 31.0, 19.0, 16.0, 8.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.0, -38.77734375, -37.5546875, -36.33203125, -35.109375, -33.88671875, -32.6640625, -31.44140625, -30.21875, -28.99609375, -27.7734375, -26.55078125, -25.328125, -24.10546875, -22.8828125, -21.66015625, -20.4375, -19.21484375, -17.9921875, -16.76953125, -15.546875, -14.32421875, -13.1015625, -11.87890625, -10.65625, -9.43359375, -8.2109375, -6.98828125, -5.765625, -4.54296875, -3.3203125, -2.09765625, -0.875, 0.34765625, 1.5703125, 2.79296875, 4.015625, 5.23828125, 6.4609375, 7.68359375, 8.90625, 10.12890625, 11.3515625, 12.57421875, 13.796875, 15.01953125, 16.2421875, 17.46484375, 18.6875, 19.91015625, 21.1328125, 22.35546875, 23.578125, 24.80078125, 26.0234375, 27.24609375, 28.46875, 29.69140625, 30.9140625, 32.13671875, 33.359375, 34.58203125, 35.8046875, 37.02734375, 38.25]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 6.0, 7.0, 6.0, 7.0, 12.0, 10.0, 26.0, 13.0, 23.0, 31.0, 25.0, 29.0, 40.0, 36.0, 32.0, 59.0, 50.0, 43.0, 47.0, 49.0, 46.0, 47.0, 39.0, 35.0, 30.0, 40.0, 49.0, 31.0, 19.0, 26.0, 13.0, 11.0, 12.0, 10.0, 6.0, 7.0, 6.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-45.21875, -43.80712890625, -42.3955078125, -40.98388671875, -39.572265625, -38.16064453125, -36.7490234375, -35.33740234375, -33.92578125, -32.51416015625, -31.1025390625, -29.69091796875, -28.279296875, -26.86767578125, -25.4560546875, -24.04443359375, -22.6328125, -21.22119140625, -19.8095703125, -18.39794921875, -16.986328125, -15.57470703125, -14.1630859375, -12.75146484375, -11.33984375, -9.92822265625, -8.5166015625, -7.10498046875, -5.693359375, -4.28173828125, -2.8701171875, -1.45849609375, -0.046875, 1.36474609375, 2.7763671875, 4.18798828125, 5.599609375, 7.01123046875, 8.4228515625, 9.83447265625, 11.24609375, 12.65771484375, 14.0693359375, 15.48095703125, 16.892578125, 18.30419921875, 19.7158203125, 21.12744140625, 22.5390625, 23.95068359375, 25.3623046875, 26.77392578125, 28.185546875, 29.59716796875, 31.0087890625, 32.42041015625, 33.83203125, 35.24365234375, 36.6552734375, 38.06689453125, 39.478515625, 40.89013671875, 42.3017578125, 43.71337890625, 45.125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 8.0, 8.0, 15.0, 25.0, 30.0, 53.0, 91.0, 153.0, 368.0, 941.0, 3564.0, 22397.0, 397506.0, 590731.0, 26812.0, 4002.0, 1035.0, 376.0, 164.0, 88.0, 59.0, 37.0, 17.0, 15.0, 14.0, 10.0, 2.0, 5.0, 5.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.38671875, -19.6328125, -18.87890625, -18.125, -17.37109375, -16.6171875, -15.86328125, -15.109375, -14.35546875, -13.6015625, -12.84765625, -12.09375, -11.33984375, -10.5859375, -9.83203125, -9.078125, -8.32421875, -7.5703125, -6.81640625, -6.0625, -5.30859375, -4.5546875, -3.80078125, -3.046875, -2.29296875, -1.5390625, -0.78515625, -0.03125, 0.72265625, 1.4765625, 2.23046875, 2.984375, 3.73828125, 4.4921875, 5.24609375, 6.0, 6.75390625, 7.5078125, 8.26171875, 9.015625, 9.76953125, 10.5234375, 11.27734375, 12.03125, 12.78515625, 13.5390625, 14.29296875, 15.046875, 15.80078125, 16.5546875, 17.30859375, 18.0625, 18.81640625, 19.5703125, 20.32421875, 21.078125, 21.83203125, 22.5859375, 23.33984375, 24.09375, 24.84765625, 25.6015625, 26.35546875, 27.109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 8.0, 4.0, 10.0, 16.0, 9.0, 17.0, 19.0, 16.0, 26.0, 43.0, 44.0, 53.0, 73.0, 103.0, 110.0, 96.0, 65.0, 57.0, 46.0, 34.0, 31.0, 26.0, 19.0, 13.0, 14.0, 4.0, 7.0, 7.0, 5.0, 1.0, 2.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025615692138671875, -0.0024892985820770264, -0.0024170279502868652, -0.002344757318496704, -0.002272486686706543, -0.002200216054916382, -0.0021279454231262207, -0.0020556747913360596, -0.0019834041595458984, -0.0019111335277557373, -0.0018388628959655762, -0.001766592264175415, -0.001694321632385254, -0.0016220510005950928, -0.0015497803688049316, -0.0014775097370147705, -0.0014052391052246094, -0.0013329684734344482, -0.0012606978416442871, -0.001188427209854126, -0.0011161565780639648, -0.0010438859462738037, -0.0009716153144836426, -0.0008993446826934814, -0.0008270740509033203, -0.0007548034191131592, -0.000682532787322998, -0.0006102621555328369, -0.0005379915237426758, -0.00046572089195251465, -0.0003934502601623535, -0.0003211796283721924, -0.00024890899658203125, -0.00017663836479187012, -0.00010436773300170898, -3.209710121154785e-05, 4.017353057861328e-05, 0.00011244416236877441, 0.00018471479415893555, 0.0002569854259490967, 0.0003292560577392578, 0.00040152668952941895, 0.0004737973213195801, 0.0005460679531097412, 0.0006183385848999023, 0.0006906092166900635, 0.0007628798484802246, 0.0008351504802703857, 0.0009074211120605469, 0.000979691743850708, 0.0010519623756408691, 0.0011242330074310303, 0.0011965036392211914, 0.0012687742710113525, 0.0013410449028015137, 0.0014133155345916748, 0.001485586166381836, 0.001557856798171997, 0.0016301274299621582, 0.0017023980617523193, 0.0017746686935424805, 0.0018469393253326416, 0.0019192099571228027, 0.001991480588912964, 0.002063751220703125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 8.0, 8.0, 6.0, 4.0, 11.0, 17.0, 35.0, 45.0, 65.0, 70.0, 140.0, 233.0, 357.0, 720.0, 1472.0, 3776.0, 12717.0, 74931.0, 671534.0, 242137.0, 28665.0, 6878.0, 2397.0, 1055.0, 522.0, 284.0, 156.0, 109.0, 70.0, 33.0, 29.0, 21.0, 12.0, 8.0, 7.0, 5.0, 7.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5703125, -13.0631103515625, -12.555908203125, -12.0487060546875, -11.54150390625, -11.0343017578125, -10.527099609375, -10.0198974609375, -9.5126953125, -9.0054931640625, -8.498291015625, -7.9910888671875, -7.48388671875, -6.9766845703125, -6.469482421875, -5.9622802734375, -5.455078125, -4.9478759765625, -4.440673828125, -3.9334716796875, -3.42626953125, -2.9190673828125, -2.411865234375, -1.9046630859375, -1.3974609375, -0.8902587890625, -0.383056640625, 0.1241455078125, 0.63134765625, 1.1385498046875, 1.645751953125, 2.1529541015625, 2.66015625, 3.1673583984375, 3.674560546875, 4.1817626953125, 4.68896484375, 5.1961669921875, 5.703369140625, 6.2105712890625, 6.7177734375, 7.2249755859375, 7.732177734375, 8.2393798828125, 8.74658203125, 9.2537841796875, 9.760986328125, 10.2681884765625, 10.775390625, 11.2825927734375, 11.789794921875, 12.2969970703125, 12.80419921875, 13.3114013671875, 13.818603515625, 14.3258056640625, 14.8330078125, 15.3402099609375, 15.847412109375, 16.3546142578125, 16.86181640625, 17.3690185546875, 17.876220703125, 18.3834228515625, 18.890625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 3.0, 9.0, 11.0, 20.0, 18.0, 28.0, 23.0, 41.0, 51.0, 60.0, 73.0, 67.0, 91.0, 80.0, 71.0, 68.0, 50.0, 34.0, 40.0, 33.0, 27.0, 16.0, 15.0, 9.0, 9.0, 7.0, 8.0, 10.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.171875, -11.7847900390625, -11.397705078125, -11.0106201171875, -10.62353515625, -10.2364501953125, -9.849365234375, -9.4622802734375, -9.0751953125, -8.6881103515625, -8.301025390625, -7.9139404296875, -7.52685546875, -7.1397705078125, -6.752685546875, -6.3656005859375, -5.978515625, -5.5914306640625, -5.204345703125, -4.8172607421875, -4.43017578125, -4.0430908203125, -3.656005859375, -3.2689208984375, -2.8818359375, -2.4947509765625, -2.107666015625, -1.7205810546875, -1.33349609375, -0.9464111328125, -0.559326171875, -0.1722412109375, 0.21484375, 0.6019287109375, 0.989013671875, 1.3760986328125, 1.76318359375, 2.1502685546875, 2.537353515625, 2.9244384765625, 3.3115234375, 3.6986083984375, 4.085693359375, 4.4727783203125, 4.85986328125, 5.2469482421875, 5.634033203125, 6.0211181640625, 6.408203125, 6.7952880859375, 7.182373046875, 7.5694580078125, 7.95654296875, 8.3436279296875, 8.730712890625, 9.1177978515625, 9.5048828125, 9.8919677734375, 10.279052734375, 10.6661376953125, 11.05322265625, 11.4403076171875, 11.827392578125, 12.2144775390625, 12.6015625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 10.0, 12.0, 7.0, 29.0, 52.0, 84.0, 151.0, 193.0, 174.0, 111.0, 64.0, 45.0, 20.0, 15.0, 6.0, 7.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-259.2537841796875, -250.2814483642578, -241.30911254882812, -232.33677673339844, -223.36444091796875, -214.39210510253906, -205.41976928710938, -196.44744873046875, -187.47509765625, -178.5027618408203, -169.53042602539062, -160.55809020996094, -151.58575439453125, -142.61341857910156, -133.64108276367188, -124.66875457763672, -115.69642639160156, -106.72409057617188, -97.75175476074219, -88.7794189453125, -79.80708312988281, -70.83474731445312, -61.86241912841797, -52.89008331298828, -43.917747497558594, -34.945411682128906, -25.97307777404785, -17.000743865966797, -8.02840805053711, 0.9439277648925781, 9.916259765625, 18.888595581054688, 27.860931396484375, 36.83326721191406, 45.80560302734375, 54.77793502807617, 63.75027084350586, 72.72261047363281, 81.69493865966797, 90.66727447509766, 99.63961029052734, 108.61194610595703, 117.58428192138672, 126.55661010742188, 135.52894592285156, 144.50128173828125, 153.47361755371094, 162.44595336914062, 171.4182891845703, 180.390625, 189.3629608154297, 198.33529663085938, 207.30763244628906, 216.27996826171875, 225.25228881835938, 234.22463989257812, 243.19696044921875, 252.16929626464844, 261.1416320800781, 270.11395263671875, 279.0863037109375, 288.0586242675781, 297.0309753417969, 306.0032958984375, 314.97564697265625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 1.0, 3.0, 5.0, 8.0, 5.0, 6.0, 9.0, 11.0, 11.0, 16.0, 14.0, 15.0, 28.0, 24.0, 35.0, 28.0, 38.0, 53.0, 40.0, 57.0, 47.0, 46.0, 53.0, 55.0, 39.0, 47.0, 36.0, 40.0, 34.0, 27.0, 22.0, 24.0, 29.0, 22.0, 14.0, 11.0, 12.0, 6.0, 6.0, 9.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-203.80874633789062, -198.2371063232422, -192.66546630859375, -187.09381103515625, -181.5221710205078, -175.95053100585938, -170.37889099121094, -164.8072509765625, -159.235595703125, -153.66395568847656, -148.09231567382812, -142.52066040039062, -136.9490203857422, -131.37738037109375, -125.80574035644531, -120.23410034179688, -114.66246032714844, -109.0908203125, -103.51917266845703, -97.9475326538086, -92.37588500976562, -86.80424499511719, -81.23260498046875, -75.66096496582031, -70.08931732177734, -64.5176773071289, -58.94602966308594, -53.3743896484375, -47.8027458190918, -42.231101989746094, -36.659461975097656, -31.087818145751953, -25.51617431640625, -19.944530487060547, -14.372888565063477, -8.801246643066406, -3.229602813720703, 2.342041015625, 7.9136810302734375, 13.48532485961914, 19.056968688964844, 24.628612518310547, 30.200254440307617, 35.77189636230469, 41.34354019165039, 46.915184020996094, 52.48682403564453, 58.058467864990234, 63.63011169433594, 69.20175170898438, 74.77339935302734, 80.34503936767578, 85.91668701171875, 91.48832702636719, 97.05996704101562, 102.63160705566406, 108.20325469970703, 113.77489471435547, 119.34654235839844, 124.91818237304688, 130.4898223876953, 136.06146240234375, 141.63311767578125, 147.2047576904297, 152.77639770507812]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 3.0, 6.0, 10.0, 9.0, 18.0, 22.0, 27.0, 32.0, 56.0, 74.0, 116.0, 151.0, 257.0, 384.0, 745.0, 1299.0, 2630.0, 5279.0, 11802.0, 30434.0, 110586.0, 934710.0, 2672600.0, 327065.0, 59644.0, 19641.0, 8339.0, 3904.0, 1913.0, 1036.0, 570.0, 341.0, 210.0, 103.0, 77.0, 59.0, 29.0, 36.0, 13.0, 9.0, 13.0, 3.0, 7.0, 1.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -16.0496826171875, -15.552490234375, -15.0552978515625, -14.55810546875, -14.0609130859375, -13.563720703125, -13.0665283203125, -12.5693359375, -12.0721435546875, -11.574951171875, -11.0777587890625, -10.58056640625, -10.0833740234375, -9.586181640625, -9.0889892578125, -8.591796875, -8.0946044921875, -7.597412109375, -7.1002197265625, -6.60302734375, -6.1058349609375, -5.608642578125, -5.1114501953125, -4.6142578125, -4.1170654296875, -3.619873046875, -3.1226806640625, -2.62548828125, -2.1282958984375, -1.631103515625, -1.1339111328125, -0.63671875, -0.1395263671875, 0.357666015625, 0.8548583984375, 1.35205078125, 1.8492431640625, 2.346435546875, 2.8436279296875, 3.3408203125, 3.8380126953125, 4.335205078125, 4.8323974609375, 5.32958984375, 5.8267822265625, 6.323974609375, 6.8211669921875, 7.318359375, 7.8155517578125, 8.312744140625, 8.8099365234375, 9.30712890625, 9.8043212890625, 10.301513671875, 10.7987060546875, 11.2958984375, 11.7930908203125, 12.290283203125, 12.7874755859375, 13.28466796875, 13.7818603515625, 14.279052734375, 14.7762451171875, 15.2734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 10.0, 8.0, 6.0, 11.0, 15.0, 18.0, 31.0, 21.0, 46.0, 44.0, 48.0, 40.0, 53.0, 63.0, 70.0, 52.0, 51.0, 55.0, 55.0, 48.0, 45.0, 33.0, 42.0, 28.0, 33.0, 24.0, 14.0, 9.0, 8.0, 4.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.27978515625, -9.9033203125, -9.52685546875, -9.150390625, -8.77392578125, -8.3974609375, -8.02099609375, -7.64453125, -7.26806640625, -6.8916015625, -6.51513671875, -6.138671875, -5.76220703125, -5.3857421875, -5.00927734375, -4.6328125, -4.25634765625, -3.8798828125, -3.50341796875, -3.126953125, -2.75048828125, -2.3740234375, -1.99755859375, -1.62109375, -1.24462890625, -0.8681640625, -0.49169921875, -0.115234375, 0.26123046875, 0.6376953125, 1.01416015625, 1.390625, 1.76708984375, 2.1435546875, 2.52001953125, 2.896484375, 3.27294921875, 3.6494140625, 4.02587890625, 4.40234375, 4.77880859375, 5.1552734375, 5.53173828125, 5.908203125, 6.28466796875, 6.6611328125, 7.03759765625, 7.4140625, 7.79052734375, 8.1669921875, 8.54345703125, 8.919921875, 9.29638671875, 9.6728515625, 10.04931640625, 10.42578125, 10.80224609375, 11.1787109375, 11.55517578125, 11.931640625, 12.30810546875, 12.6845703125, 13.06103515625, 13.4375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 1.0, 2.0, 5.0, 6.0, 19.0, 18.0, 28.0, 37.0, 53.0, 83.0, 103.0, 158.0, 276.0, 443.0, 805.0, 1682.0, 4374.0, 14412.0, 75352.0, 1585550.0, 2394303.0, 91590.0, 16967.0, 4691.0, 1755.0, 759.0, 369.0, 166.0, 97.0, 64.0, 43.0, 25.0, 16.0, 13.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.21875, -38.099609375, -36.98046875, -35.861328125, -34.7421875, -33.623046875, -32.50390625, -31.384765625, -30.265625, -29.146484375, -28.02734375, -26.908203125, -25.7890625, -24.669921875, -23.55078125, -22.431640625, -21.3125, -20.193359375, -19.07421875, -17.955078125, -16.8359375, -15.716796875, -14.59765625, -13.478515625, -12.359375, -11.240234375, -10.12109375, -9.001953125, -7.8828125, -6.763671875, -5.64453125, -4.525390625, -3.40625, -2.287109375, -1.16796875, -0.048828125, 1.0703125, 2.189453125, 3.30859375, 4.427734375, 5.546875, 6.666015625, 7.78515625, 8.904296875, 10.0234375, 11.142578125, 12.26171875, 13.380859375, 14.5, 15.619140625, 16.73828125, 17.857421875, 18.9765625, 20.095703125, 21.21484375, 22.333984375, 23.453125, 24.572265625, 25.69140625, 26.810546875, 27.9296875, 29.048828125, 30.16796875, 31.287109375, 32.40625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 8.0, 14.0, 22.0, 32.0, 61.0, 81.0, 155.0, 349.0, 1012.0, 1311.0, 496.0, 223.0, 116.0, 72.0, 31.0, 38.0, 16.0, 9.0, 8.0, 3.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.0625, -69.49072265625, -67.9189453125, -66.34716796875, -64.775390625, -63.20361328125, -61.6318359375, -60.06005859375, -58.48828125, -56.91650390625, -55.3447265625, -53.77294921875, -52.201171875, -50.62939453125, -49.0576171875, -47.48583984375, -45.9140625, -44.34228515625, -42.7705078125, -41.19873046875, -39.626953125, -38.05517578125, -36.4833984375, -34.91162109375, -33.33984375, -31.76806640625, -30.1962890625, -28.62451171875, -27.052734375, -25.48095703125, -23.9091796875, -22.33740234375, -20.765625, -19.19384765625, -17.6220703125, -16.05029296875, -14.478515625, -12.90673828125, -11.3349609375, -9.76318359375, -8.19140625, -6.61962890625, -5.0478515625, -3.47607421875, -1.904296875, -0.33251953125, 1.2392578125, 2.81103515625, 4.3828125, 5.95458984375, 7.5263671875, 9.09814453125, 10.669921875, 12.24169921875, 13.8134765625, 15.38525390625, 16.95703125, 18.52880859375, 20.1005859375, 21.67236328125, 23.244140625, 24.81591796875, 26.3876953125, 27.95947265625, 29.53125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 10.0, 12.0, 21.0, 49.0, 146.0, 223.0, 261.0, 148.0, 71.0, 30.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-506.2106628417969, -492.54583740234375, -478.88104248046875, -465.2162170410156, -451.5513916015625, -437.8865661621094, -424.22174072265625, -410.55694580078125, -396.8921203613281, -383.227294921875, -369.5625, -355.8976745605469, -342.23284912109375, -328.5680236816406, -314.9031982421875, -301.2384033203125, -287.5735778808594, -273.90875244140625, -260.24395751953125, -246.57913208007812, -232.914306640625, -219.24948120117188, -205.5846710205078, -191.91986083984375, -178.25503540039062, -164.5902099609375, -150.92539978027344, -137.26058959960938, -123.59576416015625, -109.93094635009766, -96.26612854003906, -82.60131072998047, -68.9365234375, -55.271705627441406, -41.60688781738281, -27.94207000732422, -14.277252197265625, -0.6124343872070312, 13.052383422851562, 26.717201232910156, 40.38201904296875, 54.046836853027344, 67.71165466308594, 81.37647247314453, 95.04129028320312, 108.70610809326172, 122.37092590332031, 136.03573608398438, 149.7005615234375, 163.36538696289062, 177.0301971435547, 190.69500732421875, 204.35983276367188, 218.024658203125, 231.68946838378906, 245.35427856445312, 259.01910400390625, 272.6839294433594, 286.3487548828125, 300.0135498046875, 313.6783752441406, 327.34320068359375, 341.00799560546875, 354.6728210449219, 368.337646484375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 5.0, 1.0, 6.0, 9.0, 11.0, 19.0, 21.0, 18.0, 24.0, 24.0, 28.0, 34.0, 45.0, 39.0, 34.0, 47.0, 52.0, 33.0, 50.0, 44.0, 48.0, 51.0, 40.0, 49.0, 41.0, 33.0, 24.0, 25.0, 33.0, 19.0, 13.0, 15.0, 17.0, 8.0, 6.0, 12.0, 6.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-164.20034790039062, -159.4052734375, -154.6101837158203, -149.81509399414062, -145.02001953125, -140.22494506835938, -135.4298553466797, -130.634765625, -125.83969116210938, -121.04460906982422, -116.24952697753906, -111.4544448852539, -106.65936279296875, -101.8642807006836, -97.06919860839844, -92.27411651611328, -87.47903442382812, -82.68395233154297, -77.88887023925781, -73.09378814697266, -68.2987060546875, -63.503623962402344, -58.70854187011719, -53.91345977783203, -49.118377685546875, -44.32329559326172, -39.52821350097656, -34.733131408691406, -29.93804931640625, -25.142967224121094, -20.347885131835938, -15.552803039550781, -10.757720947265625, -5.962638854980469, -1.1675567626953125, 3.6275253295898438, 8.422607421875, 13.217689514160156, 18.012771606445312, 22.80785369873047, 27.602935791015625, 32.39801788330078, 37.19309997558594, 41.988182067871094, 46.78326416015625, 51.578346252441406, 56.37342834472656, 61.16851043701172, 65.96359252929688, 70.75867462158203, 75.55375671386719, 80.34883880615234, 85.1439208984375, 89.93900299072266, 94.73408508300781, 99.52916717529297, 104.32424926757812, 109.11933135986328, 113.91441345214844, 118.7094955444336, 123.50457763671875, 128.29965209960938, 133.09474182128906, 137.88983154296875, 142.68490600585938]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 8.0, 23.0, 36.0, 53.0, 69.0, 106.0, 178.0, 312.0, 411.0, 737.0, 1197.0, 2232.0, 4188.0, 8176.0, 16533.0, 36004.0, 79223.0, 180558.0, 342068.0, 206616.0, 90839.0, 40551.0, 18640.0, 9207.0, 4637.0, 2478.0, 1412.0, 751.0, 450.0, 289.0, 188.0, 147.0, 73.0, 45.0, 27.0, 27.0, 14.0, 13.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.8125, -18.216796875, -17.62109375, -17.025390625, -16.4296875, -15.833984375, -15.23828125, -14.642578125, -14.046875, -13.451171875, -12.85546875, -12.259765625, -11.6640625, -11.068359375, -10.47265625, -9.876953125, -9.28125, -8.685546875, -8.08984375, -7.494140625, -6.8984375, -6.302734375, -5.70703125, -5.111328125, -4.515625, -3.919921875, -3.32421875, -2.728515625, -2.1328125, -1.537109375, -0.94140625, -0.345703125, 0.25, 0.845703125, 1.44140625, 2.037109375, 2.6328125, 3.228515625, 3.82421875, 4.419921875, 5.015625, 5.611328125, 6.20703125, 6.802734375, 7.3984375, 7.994140625, 8.58984375, 9.185546875, 9.78125, 10.376953125, 10.97265625, 11.568359375, 12.1640625, 12.759765625, 13.35546875, 13.951171875, 14.546875, 15.142578125, 15.73828125, 16.333984375, 16.9296875, 17.525390625, 18.12109375, 18.716796875, 19.3125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 7.0, 9.0, 14.0, 14.0, 17.0, 21.0, 22.0, 25.0, 33.0, 35.0, 44.0, 35.0, 47.0, 41.0, 49.0, 58.0, 38.0, 43.0, 47.0, 53.0, 42.0, 38.0, 44.0, 34.0, 27.0, 25.0, 26.0, 31.0, 17.0, 13.0, 9.0, 8.0, 4.0, 9.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.359375, -11.040283203125, -10.72119140625, -10.402099609375, -10.0830078125, -9.763916015625, -9.44482421875, -9.125732421875, -8.806640625, -8.487548828125, -8.16845703125, -7.849365234375, -7.5302734375, -7.211181640625, -6.89208984375, -6.572998046875, -6.25390625, -5.934814453125, -5.61572265625, -5.296630859375, -4.9775390625, -4.658447265625, -4.33935546875, -4.020263671875, -3.701171875, -3.382080078125, -3.06298828125, -2.743896484375, -2.4248046875, -2.105712890625, -1.78662109375, -1.467529296875, -1.1484375, -0.829345703125, -0.51025390625, -0.191162109375, 0.1279296875, 0.447021484375, 0.76611328125, 1.085205078125, 1.404296875, 1.723388671875, 2.04248046875, 2.361572265625, 2.6806640625, 2.999755859375, 3.31884765625, 3.637939453125, 3.95703125, 4.276123046875, 4.59521484375, 4.914306640625, 5.2333984375, 5.552490234375, 5.87158203125, 6.190673828125, 6.509765625, 6.828857421875, 7.14794921875, 7.467041015625, 7.7861328125, 8.105224609375, 8.42431640625, 8.743408203125, 9.0625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 16.0, 20.0, 32.0, 33.0, 46.0, 61.0, 98.0, 178.0, 233.0, 342.0, 589.0, 988.0, 1818.0, 4264.0, 17402.0, 163222.0, 772622.0, 69690.0, 10108.0, 3123.0, 1384.0, 813.0, 498.0, 337.0, 195.0, 155.0, 81.0, 47.0, 48.0, 24.0, 23.0, 13.0, 15.0, 10.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.09375, -51.34326171875, -49.5927734375, -47.84228515625, -46.091796875, -44.34130859375, -42.5908203125, -40.84033203125, -39.08984375, -37.33935546875, -35.5888671875, -33.83837890625, -32.087890625, -30.33740234375, -28.5869140625, -26.83642578125, -25.0859375, -23.33544921875, -21.5849609375, -19.83447265625, -18.083984375, -16.33349609375, -14.5830078125, -12.83251953125, -11.08203125, -9.33154296875, -7.5810546875, -5.83056640625, -4.080078125, -2.32958984375, -0.5791015625, 1.17138671875, 2.921875, 4.67236328125, 6.4228515625, 8.17333984375, 9.923828125, 11.67431640625, 13.4248046875, 15.17529296875, 16.92578125, 18.67626953125, 20.4267578125, 22.17724609375, 23.927734375, 25.67822265625, 27.4287109375, 29.17919921875, 30.9296875, 32.68017578125, 34.4306640625, 36.18115234375, 37.931640625, 39.68212890625, 41.4326171875, 43.18310546875, 44.93359375, 46.68408203125, 48.4345703125, 50.18505859375, 51.935546875, 53.68603515625, 55.4365234375, 57.18701171875, 58.9375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 4.0, 6.0, 6.0, 14.0, 11.0, 12.0, 13.0, 28.0, 35.0, 29.0, 37.0, 36.0, 45.0, 48.0, 53.0, 50.0, 63.0, 47.0, 58.0, 49.0, 53.0, 61.0, 37.0, 46.0, 33.0, 23.0, 19.0, 17.0, 23.0, 12.0, 6.0, 9.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.34375, -37.63916015625, -35.9345703125, -34.22998046875, -32.525390625, -30.82080078125, -29.1162109375, -27.41162109375, -25.70703125, -24.00244140625, -22.2978515625, -20.59326171875, -18.888671875, -17.18408203125, -15.4794921875, -13.77490234375, -12.0703125, -10.36572265625, -8.6611328125, -6.95654296875, -5.251953125, -3.54736328125, -1.8427734375, -0.13818359375, 1.56640625, 3.27099609375, 4.9755859375, 6.68017578125, 8.384765625, 10.08935546875, 11.7939453125, 13.49853515625, 15.203125, 16.90771484375, 18.6123046875, 20.31689453125, 22.021484375, 23.72607421875, 25.4306640625, 27.13525390625, 28.83984375, 30.54443359375, 32.2490234375, 33.95361328125, 35.658203125, 37.36279296875, 39.0673828125, 40.77197265625, 42.4765625, 44.18115234375, 45.8857421875, 47.59033203125, 49.294921875, 50.99951171875, 52.7041015625, 54.40869140625, 56.11328125, 57.81787109375, 59.5224609375, 61.22705078125, 62.931640625, 64.63623046875, 66.3408203125, 68.04541015625, 69.75]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 8.0, 26.0, 41.0, 117.0, 335.0, 1758.0, 35074.0, 976791.0, 32145.0, 1696.0, 332.0, 112.0, 56.0, 22.0, 16.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.625, -29.37451171875, -28.1240234375, -26.87353515625, -25.623046875, -24.37255859375, -23.1220703125, -21.87158203125, -20.62109375, -19.37060546875, -18.1201171875, -16.86962890625, -15.619140625, -14.36865234375, -13.1181640625, -11.86767578125, -10.6171875, -9.36669921875, -8.1162109375, -6.86572265625, -5.615234375, -4.36474609375, -3.1142578125, -1.86376953125, -0.61328125, 0.63720703125, 1.8876953125, 3.13818359375, 4.388671875, 5.63916015625, 6.8896484375, 8.14013671875, 9.390625, 10.64111328125, 11.8916015625, 13.14208984375, 14.392578125, 15.64306640625, 16.8935546875, 18.14404296875, 19.39453125, 20.64501953125, 21.8955078125, 23.14599609375, 24.396484375, 25.64697265625, 26.8974609375, 28.14794921875, 29.3984375, 30.64892578125, 31.8994140625, 33.14990234375, 34.400390625, 35.65087890625, 36.9013671875, 38.15185546875, 39.40234375, 40.65283203125, 41.9033203125, 43.15380859375, 44.404296875, 45.65478515625, 46.9052734375, 48.15576171875, 49.40625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 10.0, 12.0, 17.0, 14.0, 30.0, 30.0, 56.0, 73.0, 113.0, 141.0, 119.0, 87.0, 72.0, 56.0, 45.0, 24.0, 19.0, 12.0, 10.0, 15.0, 2.0, 4.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.003997802734375, -0.0038862526416778564, -0.003774702548980713, -0.0036631524562835693, -0.0035516023635864258, -0.0034400522708892822, -0.0033285021781921387, -0.003216952085494995, -0.0031054019927978516, -0.002993851900100708, -0.0028823018074035645, -0.002770751714706421, -0.0026592016220092773, -0.002547651529312134, -0.0024361014366149902, -0.0023245513439178467, -0.002213001251220703, -0.0021014511585235596, -0.001989901065826416, -0.0018783509731292725, -0.001766800880432129, -0.0016552507877349854, -0.0015437006950378418, -0.0014321506023406982, -0.0013206005096435547, -0.0012090504169464111, -0.0010975003242492676, -0.000985950231552124, -0.0008744001388549805, -0.0007628500461578369, -0.0006512999534606934, -0.0005397498607635498, -0.00042819976806640625, -0.0003166496753692627, -0.00020509958267211914, -9.354948997497559e-05, 1.800060272216797e-05, 0.00012955069541931152, 0.00024110078811645508, 0.00035265088081359863, 0.0004642009735107422, 0.0005757510662078857, 0.0006873011589050293, 0.0007988512516021729, 0.0009104013442993164, 0.00102195143699646, 0.0011335015296936035, 0.001245051622390747, 0.0013566017150878906, 0.0014681518077850342, 0.0015797019004821777, 0.0016912519931793213, 0.0018028020858764648, 0.0019143521785736084, 0.002025902271270752, 0.0021374523639678955, 0.002249002456665039, 0.0023605525493621826, 0.002472102642059326, 0.0025836527347564697, 0.0026952028274536133, 0.002806752920150757, 0.0029183030128479004, 0.003029853105545044, 0.0031414031982421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 14.0, 18.0, 34.0, 59.0, 94.0, 146.0, 282.0, 518.0, 934.0, 2139.0, 6781.0, 42230.0, 728485.0, 239814.0, 19475.0, 4256.0, 1580.0, 778.0, 369.0, 213.0, 130.0, 74.0, 41.0, 31.0, 20.0, 11.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.28125, -22.6815185546875, -22.081787109375, -21.4820556640625, -20.88232421875, -20.2825927734375, -19.682861328125, -19.0831298828125, -18.4833984375, -17.8836669921875, -17.283935546875, -16.6842041015625, -16.08447265625, -15.4847412109375, -14.885009765625, -14.2852783203125, -13.685546875, -13.0858154296875, -12.486083984375, -11.8863525390625, -11.28662109375, -10.6868896484375, -10.087158203125, -9.4874267578125, -8.8876953125, -8.2879638671875, -7.688232421875, -7.0885009765625, -6.48876953125, -5.8890380859375, -5.289306640625, -4.6895751953125, -4.08984375, -3.4901123046875, -2.890380859375, -2.2906494140625, -1.69091796875, -1.0911865234375, -0.491455078125, 0.1082763671875, 0.7080078125, 1.3077392578125, 1.907470703125, 2.5072021484375, 3.10693359375, 3.7066650390625, 4.306396484375, 4.9061279296875, 5.505859375, 6.1055908203125, 6.705322265625, 7.3050537109375, 7.90478515625, 8.5045166015625, 9.104248046875, 9.7039794921875, 10.3037109375, 10.9034423828125, 11.503173828125, 12.1029052734375, 12.70263671875, 13.3023681640625, 13.902099609375, 14.5018310546875, 15.1015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 5.0, 8.0, 6.0, 5.0, 12.0, 19.0, 17.0, 29.0, 29.0, 32.0, 25.0, 39.0, 43.0, 46.0, 53.0, 71.0, 75.0, 78.0, 62.0, 49.0, 39.0, 53.0, 35.0, 28.0, 30.0, 23.0, 20.0, 12.0, 12.0, 7.0, 5.0, 10.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.9453125, -11.5819091796875, -11.218505859375, -10.8551025390625, -10.49169921875, -10.1282958984375, -9.764892578125, -9.4014892578125, -9.0380859375, -8.6746826171875, -8.311279296875, -7.9478759765625, -7.58447265625, -7.2210693359375, -6.857666015625, -6.4942626953125, -6.130859375, -5.7674560546875, -5.404052734375, -5.0406494140625, -4.67724609375, -4.3138427734375, -3.950439453125, -3.5870361328125, -3.2236328125, -2.8602294921875, -2.496826171875, -2.1334228515625, -1.77001953125, -1.4066162109375, -1.043212890625, -0.6798095703125, -0.31640625, 0.0469970703125, 0.410400390625, 0.7738037109375, 1.13720703125, 1.5006103515625, 1.864013671875, 2.2274169921875, 2.5908203125, 2.9542236328125, 3.317626953125, 3.6810302734375, 4.04443359375, 4.4078369140625, 4.771240234375, 5.1346435546875, 5.498046875, 5.8614501953125, 6.224853515625, 6.5882568359375, 6.95166015625, 7.3150634765625, 7.678466796875, 8.0418701171875, 8.4052734375, 8.7686767578125, 9.132080078125, 9.4954833984375, 9.85888671875, 10.2222900390625, 10.585693359375, 10.9490966796875, 11.3125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 12.0, 37.0, 121.0, 325.0, 330.0, 113.0, 45.0, 9.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-710.5503540039062, -691.8973999023438, -673.244384765625, -654.5914306640625, -635.9384155273438, -617.2854614257812, -598.6324462890625, -579.9794921875, -561.3265380859375, -542.673583984375, -524.0205688476562, -505.3675842285156, -486.714599609375, -468.0616455078125, -449.4086608886719, -430.75567626953125, -412.1026611328125, -393.4496765136719, -374.79669189453125, -356.1437072753906, -337.49072265625, -318.8377685546875, -300.1847839355469, -281.53179931640625, -262.8788146972656, -244.225830078125, -225.57284545898438, -206.9198760986328, -188.2668914794922, -169.61390686035156, -150.9609375, -132.30795288085938, -113.65499877929688, -95.00201416015625, -76.34903717041016, -57.6960563659668, -39.04307556152344, -20.390090942382812, -1.7371139526367188, 16.915863037109375, 35.56884765625, 54.22182846069336, 72.87480926513672, 91.52778625488281, 110.18077087402344, 128.83375549316406, 147.48672485351562, 166.13970947265625, 184.79269409179688, 203.4456787109375, 222.09866333007812, 240.7516326904297, 259.40460205078125, 278.0576171875, 296.7105712890625, 315.3635559082031, 334.01654052734375, 352.6695251464844, 371.322509765625, 389.9754943847656, 408.62847900390625, 427.28143310546875, 445.9344177246094, 464.58740234375, 483.2403869628906]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 5.0, 8.0, 15.0, 8.0, 17.0, 22.0, 26.0, 27.0, 32.0, 39.0, 33.0, 53.0, 70.0, 98.0, 92.0, 72.0, 62.0, 50.0, 53.0, 37.0, 37.0, 24.0, 25.0, 27.0, 19.0, 15.0, 4.0, 10.0, 8.0, 4.0, 2.0, 1.0, 2.0], "bins": [-327.4236145019531, -320.19720458984375, -312.97076416015625, -305.7443542480469, -298.5179443359375, -291.29150390625, -284.0650939941406, -276.83868408203125, -269.61224365234375, -262.3858337402344, -255.15940856933594, -247.9329833984375, -240.70657348632812, -233.4801483154297, -226.25372314453125, -219.02731323242188, -211.8009033203125, -204.57447814941406, -197.3480682373047, -190.12164306640625, -182.89523315429688, -175.66880798339844, -168.4423828125, -161.21597290039062, -153.9895477294922, -146.76312255859375, -139.53671264648438, -132.31028747558594, -125.08386993408203, -117.85745239257812, -110.63102722167969, -103.40460968017578, -96.17819213867188, -88.95177459716797, -81.72535705566406, -74.49893188476562, -67.27251434326172, -60.04609680175781, -52.81967544555664, -45.59325408935547, -38.36683654785156, -31.140417098999023, -23.913997650146484, -16.687578201293945, -9.461158752441406, -2.2347412109375, 4.991680145263672, 12.218101501464844, 19.44451904296875, 26.67093849182129, 33.89735794067383, 41.123779296875, 48.350196838378906, 55.57661437988281, 62.803035736083984, 70.02945709228516, 77.25587463378906, 84.48229217529297, 91.70870971679688, 98.93513488769531, 106.16155242919922, 113.38796997070312, 120.61439514160156, 127.84081268310547, 135.06723022460938]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 12.0, 11.0, 25.0, 26.0, 51.0, 131.0, 298.0, 521.0, 1273.0, 3337.0, 10527.0, 48144.0, 718014.0, 3197017.0, 177730.0, 25618.0, 7138.0, 2663.0, 988.0, 403.0, 173.0, 87.0, 42.0, 16.0, 13.0, 6.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-33.59375, -32.835205078125, -32.07666015625, -31.318115234375, -30.5595703125, -29.801025390625, -29.04248046875, -28.283935546875, -27.525390625, -26.766845703125, -26.00830078125, -25.249755859375, -24.4912109375, -23.732666015625, -22.97412109375, -22.215576171875, -21.45703125, -20.698486328125, -19.93994140625, -19.181396484375, -18.4228515625, -17.664306640625, -16.90576171875, -16.147216796875, -15.388671875, -14.630126953125, -13.87158203125, -13.113037109375, -12.3544921875, -11.595947265625, -10.83740234375, -10.078857421875, -9.3203125, -8.561767578125, -7.80322265625, -7.044677734375, -6.2861328125, -5.527587890625, -4.76904296875, -4.010498046875, -3.251953125, -2.493408203125, -1.73486328125, -0.976318359375, -0.2177734375, 0.540771484375, 1.29931640625, 2.057861328125, 2.81640625, 3.574951171875, 4.33349609375, 5.092041015625, 5.8505859375, 6.609130859375, 7.36767578125, 8.126220703125, 8.884765625, 9.643310546875, 10.40185546875, 11.160400390625, 11.9189453125, 12.677490234375, 13.43603515625, 14.194580078125, 14.953125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 10.0, 17.0, 38.0, 49.0, 63.0, 95.0, 94.0, 112.0, 114.0, 102.0, 81.0, 81.0, 63.0, 46.0, 26.0, 8.0, 9.0, 2.0, 3.0, 1.0], "bins": [-39.96875, -39.202880859375, -38.43701171875, -37.671142578125, -36.9052734375, -36.139404296875, -35.37353515625, -34.607666015625, -33.841796875, -33.075927734375, -32.31005859375, -31.544189453125, -30.7783203125, -30.012451171875, -29.24658203125, -28.480712890625, -27.71484375, -26.948974609375, -26.18310546875, -25.417236328125, -24.6513671875, -23.885498046875, -23.11962890625, -22.353759765625, -21.587890625, -20.822021484375, -20.05615234375, -19.290283203125, -18.5244140625, -17.758544921875, -16.99267578125, -16.226806640625, -15.4609375, -14.695068359375, -13.92919921875, -13.163330078125, -12.3974609375, -11.631591796875, -10.86572265625, -10.099853515625, -9.333984375, -8.568115234375, -7.80224609375, -7.036376953125, -6.2705078125, -5.504638671875, -4.73876953125, -3.972900390625, -3.20703125, -2.441162109375, -1.67529296875, -0.909423828125, -0.1435546875, 0.622314453125, 1.38818359375, 2.154052734375, 2.919921875, 3.685791015625, 4.45166015625, 5.217529296875, 5.9833984375, 6.749267578125, 7.51513671875, 8.281005859375, 9.046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 2.0, 2.0, 1.0, 7.0, 12.0, 8.0, 28.0, 32.0, 43.0, 74.0, 101.0, 179.0, 315.0, 542.0, 1131.0, 2339.0, 5478.0, 14974.0, 49319.0, 252274.0, 3133137.0, 610944.0, 83585.0, 23925.0, 8521.0, 3529.0, 1632.0, 875.0, 440.0, 289.0, 170.0, 110.0, 77.0, 45.0, 40.0, 18.0, 25.0, 14.0, 15.0, 13.0, 8.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.671875, -19.950927734375, -19.22998046875, -18.509033203125, -17.7880859375, -17.067138671875, -16.34619140625, -15.625244140625, -14.904296875, -14.183349609375, -13.46240234375, -12.741455078125, -12.0205078125, -11.299560546875, -10.57861328125, -9.857666015625, -9.13671875, -8.415771484375, -7.69482421875, -6.973876953125, -6.2529296875, -5.531982421875, -4.81103515625, -4.090087890625, -3.369140625, -2.648193359375, -1.92724609375, -1.206298828125, -0.4853515625, 0.235595703125, 0.95654296875, 1.677490234375, 2.3984375, 3.119384765625, 3.84033203125, 4.561279296875, 5.2822265625, 6.003173828125, 6.72412109375, 7.445068359375, 8.166015625, 8.886962890625, 9.60791015625, 10.328857421875, 11.0498046875, 11.770751953125, 12.49169921875, 13.212646484375, 13.93359375, 14.654541015625, 15.37548828125, 16.096435546875, 16.8173828125, 17.538330078125, 18.25927734375, 18.980224609375, 19.701171875, 20.422119140625, 21.14306640625, 21.864013671875, 22.5849609375, 23.305908203125, 24.02685546875, 24.747802734375, 25.46875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 9.0, 9.0, 17.0, 18.0, 41.0, 44.0, 47.0, 100.0, 162.0, 287.0, 567.0, 949.0, 781.0, 417.0, 215.0, 115.0, 68.0, 44.0, 41.0, 32.0, 24.0, 18.0, 13.0, 12.0, 13.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.0625, -22.09228515625, -21.1220703125, -20.15185546875, -19.181640625, -18.21142578125, -17.2412109375, -16.27099609375, -15.30078125, -14.33056640625, -13.3603515625, -12.39013671875, -11.419921875, -10.44970703125, -9.4794921875, -8.50927734375, -7.5390625, -6.56884765625, -5.5986328125, -4.62841796875, -3.658203125, -2.68798828125, -1.7177734375, -0.74755859375, 0.22265625, 1.19287109375, 2.1630859375, 3.13330078125, 4.103515625, 5.07373046875, 6.0439453125, 7.01416015625, 7.984375, 8.95458984375, 9.9248046875, 10.89501953125, 11.865234375, 12.83544921875, 13.8056640625, 14.77587890625, 15.74609375, 16.71630859375, 17.6865234375, 18.65673828125, 19.626953125, 20.59716796875, 21.5673828125, 22.53759765625, 23.5078125, 24.47802734375, 25.4482421875, 26.41845703125, 27.388671875, 28.35888671875, 29.3291015625, 30.29931640625, 31.26953125, 32.23974609375, 33.2099609375, 34.18017578125, 35.150390625, 36.12060546875, 37.0908203125, 38.06103515625, 39.03125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 13.0, 24.0, 51.0, 85.0, 148.0, 210.0, 229.0, 107.0, 53.0, 30.0, 16.0, 10.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.58343505859375, -155.22848510742188, -145.87353515625, -136.5186004638672, -127.16365051269531, -117.80870056152344, -108.4537582397461, -99.09881591796875, -89.74386596679688, -80.388916015625, -71.03397369384766, -61.67902755737305, -52.32408142089844, -42.96913528442383, -33.61418914794922, -24.259246826171875, -14.904296875, -5.549350738525391, 3.8055953979492188, 13.160541534423828, 22.515487670898438, 31.870433807373047, 41.225379943847656, 50.580322265625, 59.935272216796875, 69.29022216796875, 78.6451644897461, 88.00010681152344, 97.35505676269531, 106.71000671386719, 116.06494903564453, 125.41989135742188, 134.77484130859375, 144.12979125976562, 153.4847412109375, 162.8396759033203, 172.1946258544922, 181.54957580566406, 190.90451049804688, 200.25946044921875, 209.61441040039062, 218.9693603515625, 228.32431030273438, 237.6792449951172, 247.03419494628906, 256.3891296386719, 265.74407958984375, 275.0990295410156, 284.4539794921875, 293.8089294433594, 303.16387939453125, 312.5188293457031, 321.873779296875, 331.22869873046875, 340.5836486816406, 349.9385986328125, 359.2935485839844, 368.64849853515625, 378.0034484863281, 387.3583984375, 396.71331787109375, 406.0682678222656, 415.4232177734375, 424.7781677246094, 434.13311767578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 17.0, 11.0, 23.0, 26.0, 29.0, 31.0, 56.0, 54.0, 88.0, 67.0, 85.0, 72.0, 83.0, 56.0, 59.0, 63.0, 32.0, 35.0, 41.0, 18.0, 14.0, 10.0, 8.0, 6.0, 2.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.55867004394531, -110.41510009765625, -104.27153015136719, -98.12796020507812, -91.98439025878906, -85.8408203125, -79.6972427368164, -73.55367279052734, -67.41010284423828, -61.26653289794922, -55.122962951660156, -48.97938919067383, -42.835819244384766, -36.6922492980957, -30.548675537109375, -24.405105590820312, -18.26153564453125, -12.117964744567871, -5.974393844604492, 0.16917800903320312, 6.312747955322266, 12.456317901611328, 18.599891662597656, 24.74346160888672, 30.88703155517578, 37.030601501464844, 43.174171447753906, 49.317745208740234, 55.4613151550293, 61.60488510131836, 67.74845886230469, 73.89202880859375, 80.03558349609375, 86.17915344238281, 92.32272338867188, 98.46629333496094, 104.60986328125, 110.75343322753906, 116.89701080322266, 123.04058074951172, 129.18414306640625, 135.3277130126953, 141.47128295898438, 147.61485290527344, 153.7584228515625, 159.90199279785156, 166.04556274414062, 172.18914794921875, 178.3327178955078, 184.47628784179688, 190.61985778808594, 196.763427734375, 202.90699768066406, 209.05056762695312, 215.19415283203125, 221.33770751953125, 227.48129272460938, 233.62486267089844, 239.7684326171875, 245.91200256347656, 252.05557250976562, 258.19915771484375, 264.34271240234375, 270.4862976074219, 276.6298522949219]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 14.0, 17.0, 27.0, 31.0, 38.0, 47.0, 89.0, 114.0, 186.0, 286.0, 442.0, 777.0, 1277.0, 2087.0, 3967.0, 7794.0, 16096.0, 34399.0, 78570.0, 191619.0, 362787.0, 197440.0, 80943.0, 35753.0, 16058.0, 7962.0, 4104.0, 2293.0, 1261.0, 740.0, 451.0, 315.0, 191.0, 134.0, 65.0, 53.0, 44.0, 27.0, 26.0, 12.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.34375, -15.7900390625, -15.236328125, -14.6826171875, -14.12890625, -13.5751953125, -13.021484375, -12.4677734375, -11.9140625, -11.3603515625, -10.806640625, -10.2529296875, -9.69921875, -9.1455078125, -8.591796875, -8.0380859375, -7.484375, -6.9306640625, -6.376953125, -5.8232421875, -5.26953125, -4.7158203125, -4.162109375, -3.6083984375, -3.0546875, -2.5009765625, -1.947265625, -1.3935546875, -0.83984375, -0.2861328125, 0.267578125, 0.8212890625, 1.375, 1.9287109375, 2.482421875, 3.0361328125, 3.58984375, 4.1435546875, 4.697265625, 5.2509765625, 5.8046875, 6.3583984375, 6.912109375, 7.4658203125, 8.01953125, 8.5732421875, 9.126953125, 9.6806640625, 10.234375, 10.7880859375, 11.341796875, 11.8955078125, 12.44921875, 13.0029296875, 13.556640625, 14.1103515625, 14.6640625, 15.2177734375, 15.771484375, 16.3251953125, 16.87890625, 17.4326171875, 17.986328125, 18.5400390625, 19.09375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 4.0, 7.0, 12.0, 6.0, 15.0, 14.0, 14.0, 14.0, 19.0, 26.0, 20.0, 31.0, 26.0, 39.0, 32.0, 39.0, 51.0, 46.0, 48.0, 48.0, 38.0, 50.0, 36.0, 36.0, 36.0, 37.0, 33.0, 39.0, 28.0, 26.0, 26.0, 19.0, 16.0, 11.0, 12.0, 8.0, 9.0, 6.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.71875, -9.422119140625, -9.12548828125, -8.828857421875, -8.5322265625, -8.235595703125, -7.93896484375, -7.642333984375, -7.345703125, -7.049072265625, -6.75244140625, -6.455810546875, -6.1591796875, -5.862548828125, -5.56591796875, -5.269287109375, -4.97265625, -4.676025390625, -4.37939453125, -4.082763671875, -3.7861328125, -3.489501953125, -3.19287109375, -2.896240234375, -2.599609375, -2.302978515625, -2.00634765625, -1.709716796875, -1.4130859375, -1.116455078125, -0.81982421875, -0.523193359375, -0.2265625, 0.070068359375, 0.36669921875, 0.663330078125, 0.9599609375, 1.256591796875, 1.55322265625, 1.849853515625, 2.146484375, 2.443115234375, 2.73974609375, 3.036376953125, 3.3330078125, 3.629638671875, 3.92626953125, 4.222900390625, 4.51953125, 4.816162109375, 5.11279296875, 5.409423828125, 5.7060546875, 6.002685546875, 6.29931640625, 6.595947265625, 6.892578125, 7.189208984375, 7.48583984375, 7.782470703125, 8.0791015625, 8.375732421875, 8.67236328125, 8.968994140625, 9.265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 10.0, 19.0, 13.0, 29.0, 39.0, 92.0, 138.0, 217.0, 344.0, 656.0, 1240.0, 2951.0, 10338.0, 67252.0, 768166.0, 169099.0, 19718.0, 4486.0, 1757.0, 828.0, 431.0, 261.0, 177.0, 92.0, 66.0, 50.0, 28.0, 22.0, 14.0, 6.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.0, -45.4169921875, -43.833984375, -42.2509765625, -40.66796875, -39.0849609375, -37.501953125, -35.9189453125, -34.3359375, -32.7529296875, -31.169921875, -29.5869140625, -28.00390625, -26.4208984375, -24.837890625, -23.2548828125, -21.671875, -20.0888671875, -18.505859375, -16.9228515625, -15.33984375, -13.7568359375, -12.173828125, -10.5908203125, -9.0078125, -7.4248046875, -5.841796875, -4.2587890625, -2.67578125, -1.0927734375, 0.490234375, 2.0732421875, 3.65625, 5.2392578125, 6.822265625, 8.4052734375, 9.98828125, 11.5712890625, 13.154296875, 14.7373046875, 16.3203125, 17.9033203125, 19.486328125, 21.0693359375, 22.65234375, 24.2353515625, 25.818359375, 27.4013671875, 28.984375, 30.5673828125, 32.150390625, 33.7333984375, 35.31640625, 36.8994140625, 38.482421875, 40.0654296875, 41.6484375, 43.2314453125, 44.814453125, 46.3974609375, 47.98046875, 49.5634765625, 51.146484375, 52.7294921875, 54.3125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 10.0, 15.0, 13.0, 16.0, 11.0, 22.0, 35.0, 36.0, 42.0, 44.0, 35.0, 45.0, 66.0, 42.0, 57.0, 46.0, 52.0, 56.0, 42.0, 33.0, 40.0, 33.0, 35.0, 28.0, 22.0, 22.0, 16.0, 11.0, 9.0, 14.0, 10.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0], "bins": [-49.5625, -48.236328125, -46.91015625, -45.583984375, -44.2578125, -42.931640625, -41.60546875, -40.279296875, -38.953125, -37.626953125, -36.30078125, -34.974609375, -33.6484375, -32.322265625, -30.99609375, -29.669921875, -28.34375, -27.017578125, -25.69140625, -24.365234375, -23.0390625, -21.712890625, -20.38671875, -19.060546875, -17.734375, -16.408203125, -15.08203125, -13.755859375, -12.4296875, -11.103515625, -9.77734375, -8.451171875, -7.125, -5.798828125, -4.47265625, -3.146484375, -1.8203125, -0.494140625, 0.83203125, 2.158203125, 3.484375, 4.810546875, 6.13671875, 7.462890625, 8.7890625, 10.115234375, 11.44140625, 12.767578125, 14.09375, 15.419921875, 16.74609375, 18.072265625, 19.3984375, 20.724609375, 22.05078125, 23.376953125, 24.703125, 26.029296875, 27.35546875, 28.681640625, 30.0078125, 31.333984375, 32.66015625, 33.986328125, 35.3125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 0.0, 4.0, 4.0, 4.0, 8.0, 12.0, 5.0, 18.0, 14.0, 18.0, 28.0, 37.0, 52.0, 107.0, 164.0, 277.0, 467.0, 968.0, 2405.0, 6532.0, 23475.0, 124856.0, 692501.0, 156693.0, 27442.0, 7467.0, 2630.0, 1091.0, 486.0, 277.0, 159.0, 103.0, 72.0, 48.0, 29.0, 24.0, 24.0, 6.0, 12.0, 8.0, 6.0, 1.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.5228271484375, -10.178466796875, -9.8341064453125, -9.48974609375, -9.1453857421875, -8.801025390625, -8.4566650390625, -8.1123046875, -7.7679443359375, -7.423583984375, -7.0792236328125, -6.73486328125, -6.3905029296875, -6.046142578125, -5.7017822265625, -5.357421875, -5.0130615234375, -4.668701171875, -4.3243408203125, -3.97998046875, -3.6356201171875, -3.291259765625, -2.9468994140625, -2.6025390625, -2.2581787109375, -1.913818359375, -1.5694580078125, -1.22509765625, -0.8807373046875, -0.536376953125, -0.1920166015625, 0.15234375, 0.4967041015625, 0.841064453125, 1.1854248046875, 1.52978515625, 1.8741455078125, 2.218505859375, 2.5628662109375, 2.9072265625, 3.2515869140625, 3.595947265625, 3.9403076171875, 4.28466796875, 4.6290283203125, 4.973388671875, 5.3177490234375, 5.662109375, 6.0064697265625, 6.350830078125, 6.6951904296875, 7.03955078125, 7.3839111328125, 7.728271484375, 8.0726318359375, 8.4169921875, 8.7613525390625, 9.105712890625, 9.4500732421875, 9.79443359375, 10.1387939453125, 10.483154296875, 10.8275146484375, 11.171875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 7.0, 7.0, 10.0, 13.0, 23.0, 30.0, 33.0, 42.0, 62.0, 83.0, 114.0, 115.0, 107.0, 86.0, 52.0, 44.0, 33.0, 25.0, 22.0, 18.0, 14.0, 12.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024662017822265625, -0.0023854970932006836, -0.0023047924041748047, -0.0022240877151489258, -0.002143383026123047, -0.002062678337097168, -0.001981973648071289, -0.0019012689590454102, -0.0018205642700195312, -0.0017398595809936523, -0.0016591548919677734, -0.0015784502029418945, -0.0014977455139160156, -0.0014170408248901367, -0.0013363361358642578, -0.001255631446838379, -0.0011749267578125, -0.001094222068786621, -0.0010135173797607422, -0.0009328126907348633, -0.0008521080017089844, -0.0007714033126831055, -0.0006906986236572266, -0.0006099939346313477, -0.0005292892456054688, -0.00044858455657958984, -0.00036787986755371094, -0.00028717517852783203, -0.00020647048950195312, -0.00012576580047607422, -4.506111145019531e-05, 3.5643577575683594e-05, 0.0001163482666015625, 0.0001970529556274414, 0.0002777576446533203, 0.0003584623336791992, 0.0004391670227050781, 0.000519871711730957, 0.0006005764007568359, 0.0006812810897827148, 0.0007619857788085938, 0.0008426904678344727, 0.0009233951568603516, 0.0010040998458862305, 0.0010848045349121094, 0.0011655092239379883, 0.0012462139129638672, 0.001326918601989746, 0.001407623291015625, 0.001488327980041504, 0.0015690326690673828, 0.0016497373580932617, 0.0017304420471191406, 0.0018111467361450195, 0.0018918514251708984, 0.0019725561141967773, 0.0020532608032226562, 0.002133965492248535, 0.002214670181274414, 0.002295374870300293, 0.002376079559326172, 0.0024567842483520508, 0.0025374889373779297, 0.0026181936264038086, 0.0026988983154296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 16.0, 7.0, 19.0, 21.0, 52.0, 56.0, 86.0, 123.0, 186.0, 324.0, 606.0, 1116.0, 2644.0, 7055.0, 26874.0, 185225.0, 699991.0, 97829.0, 17038.0, 5039.0, 2023.0, 997.0, 470.0, 285.0, 154.0, 102.0, 56.0, 46.0, 32.0, 25.0, 16.0, 15.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.5078125, -12.1436767578125, -11.779541015625, -11.4154052734375, -11.05126953125, -10.6871337890625, -10.322998046875, -9.9588623046875, -9.5947265625, -9.2305908203125, -8.866455078125, -8.5023193359375, -8.13818359375, -7.7740478515625, -7.409912109375, -7.0457763671875, -6.681640625, -6.3175048828125, -5.953369140625, -5.5892333984375, -5.22509765625, -4.8609619140625, -4.496826171875, -4.1326904296875, -3.7685546875, -3.4044189453125, -3.040283203125, -2.6761474609375, -2.31201171875, -1.9478759765625, -1.583740234375, -1.2196044921875, -0.85546875, -0.4913330078125, -0.127197265625, 0.2369384765625, 0.60107421875, 0.9652099609375, 1.329345703125, 1.6934814453125, 2.0576171875, 2.4217529296875, 2.785888671875, 3.1500244140625, 3.51416015625, 3.8782958984375, 4.242431640625, 4.6065673828125, 4.970703125, 5.3348388671875, 5.698974609375, 6.0631103515625, 6.42724609375, 6.7913818359375, 7.155517578125, 7.5196533203125, 7.8837890625, 8.2479248046875, 8.612060546875, 8.9761962890625, 9.34033203125, 9.7044677734375, 10.068603515625, 10.4327392578125, 10.796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 7.0, 5.0, 10.0, 6.0, 12.0, 22.0, 25.0, 16.0, 29.0, 38.0, 31.0, 34.0, 48.0, 61.0, 55.0, 59.0, 64.0, 74.0, 62.0, 53.0, 51.0, 40.0, 30.0, 24.0, 18.0, 36.0, 13.0, 12.0, 10.0, 9.0, 6.0, 4.0, 0.0, 6.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-7.71484375, -7.46307373046875, -7.2113037109375, -6.95953369140625, -6.707763671875, -6.45599365234375, -6.2042236328125, -5.95245361328125, -5.70068359375, -5.44891357421875, -5.1971435546875, -4.94537353515625, -4.693603515625, -4.44183349609375, -4.1900634765625, -3.93829345703125, -3.6865234375, -3.43475341796875, -3.1829833984375, -2.93121337890625, -2.679443359375, -2.42767333984375, -2.1759033203125, -1.92413330078125, -1.67236328125, -1.42059326171875, -1.1688232421875, -0.91705322265625, -0.665283203125, -0.41351318359375, -0.1617431640625, 0.09002685546875, 0.341796875, 0.59356689453125, 0.8453369140625, 1.09710693359375, 1.348876953125, 1.60064697265625, 1.8524169921875, 2.10418701171875, 2.35595703125, 2.60772705078125, 2.8594970703125, 3.11126708984375, 3.363037109375, 3.61480712890625, 3.8665771484375, 4.11834716796875, 4.3701171875, 4.62188720703125, 4.8736572265625, 5.12542724609375, 5.377197265625, 5.62896728515625, 5.8807373046875, 6.13250732421875, 6.38427734375, 6.63604736328125, 6.8878173828125, 7.13958740234375, 7.391357421875, 7.64312744140625, 7.8948974609375, 8.14666748046875, 8.3984375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 10.0, 13.0, 44.0, 101.0, 230.0, 275.0, 142.0, 74.0, 38.0, 16.0, 12.0, 11.0, 12.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-234.6971435546875, -224.0459442138672, -213.39476013183594, -202.74356079101562, -192.09237670898438, -181.44117736816406, -170.78997802734375, -160.1387939453125, -149.4875946044922, -138.83639526367188, -128.18521118164062, -117.53401184082031, -106.88282012939453, -96.23162841796875, -85.58042907714844, -74.92923736572266, -64.27804565429688, -53.626853942871094, -42.97565841674805, -32.324462890625, -21.67327117919922, -11.022079467773438, -0.3708839416503906, 10.280311584472656, 20.931503295898438, 31.58269691467285, 42.233890533447266, 52.88508605957031, 63.536277770996094, 74.18746948242188, 84.83866882324219, 95.48986053466797, 106.14105224609375, 116.79224395751953, 127.44343566894531, 138.09463500976562, 148.74581909179688, 159.3970184326172, 170.0482177734375, 180.69940185546875, 191.35060119628906, 202.00180053710938, 212.65298461914062, 223.30418395996094, 233.95538330078125, 244.6065673828125, 255.2577667236328, 265.9089660644531, 276.5601501464844, 287.2113342285156, 297.862548828125, 308.51373291015625, 319.1649169921875, 329.81610107421875, 340.4673156738281, 351.1184997558594, 361.76971435546875, 372.4208984375, 383.0721130371094, 393.7232971191406, 404.3744812011719, 415.02569580078125, 425.6768798828125, 436.32806396484375, 446.979248046875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 10.0, 9.0, 20.0, 19.0, 13.0, 24.0, 20.0, 25.0, 24.0, 37.0, 32.0, 26.0, 39.0, 51.0, 58.0, 74.0, 76.0, 57.0, 47.0, 33.0, 33.0, 27.0, 27.0, 26.0, 28.0, 27.0, 20.0, 19.0, 11.0, 13.0, 13.0, 10.0, 7.0, 6.0, 3.0, 4.0, 7.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.01571655273438, -143.23721313476562, -138.45870971679688, -133.68019104003906, -128.9016876220703, -124.12318420410156, -119.34467315673828, -114.566162109375, -109.78765869140625, -105.0091552734375, -100.23064422607422, -95.45213317871094, -90.67362976074219, -85.89512634277344, -81.11661529541016, -76.33810424804688, -71.55960083007812, -66.78109741210938, -62.002586364746094, -57.22407913208008, -52.44557189941406, -47.66706466674805, -42.88855743408203, -38.110050201416016, -33.33154296875, -28.553035736083984, -23.77452850341797, -18.996021270751953, -14.217514038085938, -9.439006805419922, -4.660499572753906, 0.11800765991210938, 4.896514892578125, 9.67502212524414, 14.453529357910156, 19.232036590576172, 24.010543823242188, 28.789051055908203, 33.56755828857422, 38.346065521240234, 43.12457275390625, 47.903079986572266, 52.68158721923828, 57.4600944519043, 62.23860168457031, 67.01710510253906, 71.79561614990234, 76.57412719726562, 81.35263061523438, 86.13113403320312, 90.9096450805664, 95.68815612792969, 100.46665954589844, 105.24516296386719, 110.02367401123047, 114.80218505859375, 119.5806884765625, 124.35919189453125, 129.1376953125, 133.9162139892578, 138.69471740722656, 143.4732208251953, 148.25173950195312, 153.03024291992188, 157.80874633789062]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 7.0, 4.0, 7.0, 12.0, 25.0, 20.0, 40.0, 54.0, 107.0, 134.0, 306.0, 637.0, 1385.0, 3962.0, 14314.0, 96319.0, 2725873.0, 1278219.0, 56457.0, 10763.0, 3224.0, 1252.0, 509.0, 253.0, 155.0, 93.0, 54.0, 35.0, 26.0, 19.0, 9.0, 3.0, 4.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.734375, -30.00048828125, -29.2666015625, -28.53271484375, -27.798828125, -27.06494140625, -26.3310546875, -25.59716796875, -24.86328125, -24.12939453125, -23.3955078125, -22.66162109375, -21.927734375, -21.19384765625, -20.4599609375, -19.72607421875, -18.9921875, -18.25830078125, -17.5244140625, -16.79052734375, -16.056640625, -15.32275390625, -14.5888671875, -13.85498046875, -13.12109375, -12.38720703125, -11.6533203125, -10.91943359375, -10.185546875, -9.45166015625, -8.7177734375, -7.98388671875, -7.25, -6.51611328125, -5.7822265625, -5.04833984375, -4.314453125, -3.58056640625, -2.8466796875, -2.11279296875, -1.37890625, -0.64501953125, 0.0888671875, 0.82275390625, 1.556640625, 2.29052734375, 3.0244140625, 3.75830078125, 4.4921875, 5.22607421875, 5.9599609375, 6.69384765625, 7.427734375, 8.16162109375, 8.8955078125, 9.62939453125, 10.36328125, 11.09716796875, 11.8310546875, 12.56494140625, 13.298828125, 14.03271484375, 14.7666015625, 15.50048828125, 16.234375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 4.0, 7.0, 8.0, 10.0, 12.0, 12.0, 20.0, 16.0, 34.0, 37.0, 41.0, 33.0, 50.0, 52.0, 52.0, 42.0, 50.0, 49.0, 52.0, 42.0, 48.0, 42.0, 43.0, 27.0, 34.0, 32.0, 26.0, 29.0, 14.0, 22.0, 13.0, 11.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.7943115234375, -8.502685546875, -8.2110595703125, -7.91943359375, -7.6278076171875, -7.336181640625, -7.0445556640625, -6.7529296875, -6.4613037109375, -6.169677734375, -5.8780517578125, -5.58642578125, -5.2947998046875, -5.003173828125, -4.7115478515625, -4.419921875, -4.1282958984375, -3.836669921875, -3.5450439453125, -3.25341796875, -2.9617919921875, -2.670166015625, -2.3785400390625, -2.0869140625, -1.7952880859375, -1.503662109375, -1.2120361328125, -0.92041015625, -0.6287841796875, -0.337158203125, -0.0455322265625, 0.24609375, 0.5377197265625, 0.829345703125, 1.1209716796875, 1.41259765625, 1.7042236328125, 1.995849609375, 2.2874755859375, 2.5791015625, 2.8707275390625, 3.162353515625, 3.4539794921875, 3.74560546875, 4.0372314453125, 4.328857421875, 4.6204833984375, 4.912109375, 5.2037353515625, 5.495361328125, 5.7869873046875, 6.07861328125, 6.3702392578125, 6.661865234375, 6.9534912109375, 7.2451171875, 7.5367431640625, 7.828369140625, 8.1199951171875, 8.41162109375, 8.7032470703125, 8.994873046875, 9.2864990234375, 9.578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 7.0, 13.0, 23.0, 33.0, 61.0, 95.0, 196.0, 350.0, 896.0, 2348.0, 7607.0, 34347.0, 356585.0, 3612380.0, 150630.0, 20839.0, 4988.0, 1624.0, 630.0, 284.0, 153.0, 81.0, 41.0, 22.0, 10.0, 12.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.84375, -26.86181640625, -25.8798828125, -24.89794921875, -23.916015625, -22.93408203125, -21.9521484375, -20.97021484375, -19.98828125, -19.00634765625, -18.0244140625, -17.04248046875, -16.060546875, -15.07861328125, -14.0966796875, -13.11474609375, -12.1328125, -11.15087890625, -10.1689453125, -9.18701171875, -8.205078125, -7.22314453125, -6.2412109375, -5.25927734375, -4.27734375, -3.29541015625, -2.3134765625, -1.33154296875, -0.349609375, 0.63232421875, 1.6142578125, 2.59619140625, 3.578125, 4.56005859375, 5.5419921875, 6.52392578125, 7.505859375, 8.48779296875, 9.4697265625, 10.45166015625, 11.43359375, 12.41552734375, 13.3974609375, 14.37939453125, 15.361328125, 16.34326171875, 17.3251953125, 18.30712890625, 19.2890625, 20.27099609375, 21.2529296875, 22.23486328125, 23.216796875, 24.19873046875, 25.1806640625, 26.16259765625, 27.14453125, 28.12646484375, 29.1083984375, 30.09033203125, 31.072265625, 32.05419921875, 33.0361328125, 34.01806640625, 35.0]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 12.0, 16.0, 15.0, 23.0, 38.0, 43.0, 73.0, 101.0, 172.0, 407.0, 743.0, 1039.0, 586.0, 315.0, 172.0, 90.0, 62.0, 39.0, 26.0, 18.0, 17.0, 9.0, 10.0, 9.0, 7.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4375, -33.561279296875, -32.68505859375, -31.808837890625, -30.9326171875, -30.056396484375, -29.18017578125, -28.303955078125, -27.427734375, -26.551513671875, -25.67529296875, -24.799072265625, -23.9228515625, -23.046630859375, -22.17041015625, -21.294189453125, -20.41796875, -19.541748046875, -18.66552734375, -17.789306640625, -16.9130859375, -16.036865234375, -15.16064453125, -14.284423828125, -13.408203125, -12.531982421875, -11.65576171875, -10.779541015625, -9.9033203125, -9.027099609375, -8.15087890625, -7.274658203125, -6.3984375, -5.522216796875, -4.64599609375, -3.769775390625, -2.8935546875, -2.017333984375, -1.14111328125, -0.264892578125, 0.611328125, 1.487548828125, 2.36376953125, 3.239990234375, 4.1162109375, 4.992431640625, 5.86865234375, 6.744873046875, 7.62109375, 8.497314453125, 9.37353515625, 10.249755859375, 11.1259765625, 12.002197265625, 12.87841796875, 13.754638671875, 14.630859375, 15.507080078125, 16.38330078125, 17.259521484375, 18.1357421875, 19.011962890625, 19.88818359375, 20.764404296875, 21.640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 10.0, 24.0, 38.0, 97.0, 137.0, 216.0, 208.0, 119.0, 65.0, 24.0, 20.0, 9.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.76614379882812, -192.91183471679688, -185.05752563476562, -177.20321655273438, -169.34890747070312, -161.49459838867188, -153.64028930664062, -145.78598022460938, -137.93167114257812, -130.07736206054688, -122.22305297851562, -114.36874389648438, -106.51443481445312, -98.66012573242188, -90.80581665039062, -82.95150756835938, -75.0971908569336, -67.24288177490234, -59.388572692871094, -51.534263610839844, -43.679954528808594, -35.82564163208008, -27.971332550048828, -20.117023468017578, -12.262714385986328, -4.40840482711792, 3.4459047317504883, 11.300214767456055, 19.154523849487305, 27.008834838867188, 34.86314392089844, 42.71745300292969, 50.57176208496094, 58.42607116699219, 66.28038024902344, 74.13468933105469, 81.98899841308594, 89.84330749511719, 97.69761657714844, 105.55192565917969, 113.40623474121094, 121.26054382324219, 129.11485290527344, 136.9691619873047, 144.82347106933594, 152.6777801513672, 160.53208923339844, 168.3863983154297, 176.24072265625, 184.09503173828125, 191.9493408203125, 199.80364990234375, 207.657958984375, 215.51226806640625, 223.3665771484375, 231.22088623046875, 239.0751953125, 246.92950439453125, 254.7838134765625, 262.63812255859375, 270.492431640625, 278.34674072265625, 286.2010498046875, 294.05535888671875, 301.90966796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 9.0, 12.0, 9.0, 14.0, 16.0, 30.0, 24.0, 25.0, 27.0, 31.0, 47.0, 33.0, 34.0, 41.0, 57.0, 50.0, 51.0, 49.0, 39.0, 57.0, 38.0, 37.0, 36.0, 31.0, 25.0, 29.0, 30.0, 21.0, 19.0, 12.0, 16.0, 9.0, 13.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-100.6579818725586, -97.26591491699219, -93.87384796142578, -90.48177337646484, -87.08970642089844, -83.69763946533203, -80.30557250976562, -76.91349792480469, -73.52143096923828, -70.12936401367188, -66.73729705810547, -63.3452262878418, -59.953155517578125, -56.56108856201172, -53.16902160644531, -49.77695083618164, -46.384883880615234, -42.99281692504883, -39.600746154785156, -36.20867919921875, -32.81660842895508, -29.424541473388672, -26.032472610473633, -22.640403747558594, -19.248334884643555, -15.856266021728516, -12.464197158813477, -9.072129249572754, -5.680060386657715, -2.287992477416992, 1.1040763854980469, 4.496145248413086, 7.888214111328125, 11.280282974243164, 14.672351837158203, 18.06441879272461, 21.45648956298828, 24.848556518554688, 28.240625381469727, 31.632694244384766, 35.02476501464844, 38.416831970214844, 41.808902740478516, 45.20096969604492, 48.593040466308594, 51.985107421875, 55.377174377441406, 58.76924514770508, 62.161312103271484, 65.55338287353516, 68.94544982910156, 72.33751678466797, 75.72958374023438, 79.12165832519531, 82.51372528076172, 85.90579223632812, 89.29785919189453, 92.68992614746094, 96.08199310302734, 99.47406768798828, 102.86613464355469, 106.2582015991211, 109.6502685546875, 113.04234313964844, 116.43441009521484]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 7.0, 12.0, 15.0, 18.0, 31.0, 24.0, 52.0, 83.0, 143.0, 217.0, 317.0, 580.0, 979.0, 1618.0, 2837.0, 5830.0, 12094.0, 27085.0, 67018.0, 176462.0, 357438.0, 237696.0, 91195.0, 35716.0, 15275.0, 7217.0, 3673.0, 1999.0, 1107.0, 664.0, 423.0, 237.0, 149.0, 115.0, 78.0, 56.0, 25.0, 27.0, 21.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.375, -17.8870849609375, -17.399169921875, -16.9112548828125, -16.42333984375, -15.9354248046875, -15.447509765625, -14.9595947265625, -14.4716796875, -13.9837646484375, -13.495849609375, -13.0079345703125, -12.52001953125, -12.0321044921875, -11.544189453125, -11.0562744140625, -10.568359375, -10.0804443359375, -9.592529296875, -9.1046142578125, -8.61669921875, -8.1287841796875, -7.640869140625, -7.1529541015625, -6.6650390625, -6.1771240234375, -5.689208984375, -5.2012939453125, -4.71337890625, -4.2254638671875, -3.737548828125, -3.2496337890625, -2.76171875, -2.2738037109375, -1.785888671875, -1.2979736328125, -0.81005859375, -0.3221435546875, 0.165771484375, 0.6536865234375, 1.1416015625, 1.6295166015625, 2.117431640625, 2.6053466796875, 3.09326171875, 3.5811767578125, 4.069091796875, 4.5570068359375, 5.044921875, 5.5328369140625, 6.020751953125, 6.5086669921875, 6.99658203125, 7.4844970703125, 7.972412109375, 8.4603271484375, 8.9482421875, 9.4361572265625, 9.924072265625, 10.4119873046875, 10.89990234375, 11.3878173828125, 11.875732421875, 12.3636474609375, 12.8515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 4.0, 7.0, 5.0, 9.0, 14.0, 18.0, 15.0, 18.0, 19.0, 34.0, 28.0, 31.0, 43.0, 42.0, 38.0, 46.0, 45.0, 41.0, 43.0, 38.0, 40.0, 47.0, 35.0, 39.0, 39.0, 35.0, 26.0, 32.0, 26.0, 30.0, 15.0, 21.0, 14.0, 12.0, 10.0, 11.0, 7.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.453125, -8.168701171875, -7.88427734375, -7.599853515625, -7.3154296875, -7.031005859375, -6.74658203125, -6.462158203125, -6.177734375, -5.893310546875, -5.60888671875, -5.324462890625, -5.0400390625, -4.755615234375, -4.47119140625, -4.186767578125, -3.90234375, -3.617919921875, -3.33349609375, -3.049072265625, -2.7646484375, -2.480224609375, -2.19580078125, -1.911376953125, -1.626953125, -1.342529296875, -1.05810546875, -0.773681640625, -0.4892578125, -0.204833984375, 0.07958984375, 0.364013671875, 0.6484375, 0.932861328125, 1.21728515625, 1.501708984375, 1.7861328125, 2.070556640625, 2.35498046875, 2.639404296875, 2.923828125, 3.208251953125, 3.49267578125, 3.777099609375, 4.0615234375, 4.345947265625, 4.63037109375, 4.914794921875, 5.19921875, 5.483642578125, 5.76806640625, 6.052490234375, 6.3369140625, 6.621337890625, 6.90576171875, 7.190185546875, 7.474609375, 7.759033203125, 8.04345703125, 8.327880859375, 8.6123046875, 8.896728515625, 9.18115234375, 9.465576171875, 9.75]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 3.0, 11.0, 6.0, 14.0, 16.0, 16.0, 35.0, 43.0, 68.0, 101.0, 210.0, 305.0, 653.0, 1375.0, 3432.0, 9589.0, 34375.0, 162683.0, 651115.0, 139751.0, 30301.0, 8622.0, 3059.0, 1292.0, 610.0, 326.0, 177.0, 112.0, 71.0, 48.0, 34.0, 27.0, 16.0, 14.0, 8.0, 9.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.203125, -29.396728515625, -28.59033203125, -27.783935546875, -26.9775390625, -26.171142578125, -25.36474609375, -24.558349609375, -23.751953125, -22.945556640625, -22.13916015625, -21.332763671875, -20.5263671875, -19.719970703125, -18.91357421875, -18.107177734375, -17.30078125, -16.494384765625, -15.68798828125, -14.881591796875, -14.0751953125, -13.268798828125, -12.46240234375, -11.656005859375, -10.849609375, -10.043212890625, -9.23681640625, -8.430419921875, -7.6240234375, -6.817626953125, -6.01123046875, -5.204833984375, -4.3984375, -3.592041015625, -2.78564453125, -1.979248046875, -1.1728515625, -0.366455078125, 0.43994140625, 1.246337890625, 2.052734375, 2.859130859375, 3.66552734375, 4.471923828125, 5.2783203125, 6.084716796875, 6.89111328125, 7.697509765625, 8.50390625, 9.310302734375, 10.11669921875, 10.923095703125, 11.7294921875, 12.535888671875, 13.34228515625, 14.148681640625, 14.955078125, 15.761474609375, 16.56787109375, 17.374267578125, 18.1806640625, 18.987060546875, 19.79345703125, 20.599853515625, 21.40625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 8.0, 18.0, 13.0, 23.0, 29.0, 24.0, 27.0, 32.0, 46.0, 46.0, 62.0, 68.0, 46.0, 46.0, 63.0, 54.0, 44.0, 42.0, 50.0, 27.0, 43.0, 28.0, 22.0, 23.0, 21.0, 19.0, 12.0, 10.0, 13.0, 7.0, 4.0, 0.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.4375, -31.2275390625, -30.017578125, -28.8076171875, -27.59765625, -26.3876953125, -25.177734375, -23.9677734375, -22.7578125, -21.5478515625, -20.337890625, -19.1279296875, -17.91796875, -16.7080078125, -15.498046875, -14.2880859375, -13.078125, -11.8681640625, -10.658203125, -9.4482421875, -8.23828125, -7.0283203125, -5.818359375, -4.6083984375, -3.3984375, -2.1884765625, -0.978515625, 0.2314453125, 1.44140625, 2.6513671875, 3.861328125, 5.0712890625, 6.28125, 7.4912109375, 8.701171875, 9.9111328125, 11.12109375, 12.3310546875, 13.541015625, 14.7509765625, 15.9609375, 17.1708984375, 18.380859375, 19.5908203125, 20.80078125, 22.0107421875, 23.220703125, 24.4306640625, 25.640625, 26.8505859375, 28.060546875, 29.2705078125, 30.48046875, 31.6904296875, 32.900390625, 34.1103515625, 35.3203125, 36.5302734375, 37.740234375, 38.9501953125, 40.16015625, 41.3701171875, 42.580078125, 43.7900390625, 45.0]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 8.0, 13.0, 20.0, 39.0, 58.0, 110.0, 214.0, 454.0, 1084.0, 3144.0, 10603.0, 51428.0, 581417.0, 342958.0, 43097.0, 9180.0, 2776.0, 1071.0, 419.0, 185.0, 107.0, 57.0, 38.0, 20.0, 13.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.1640625, -11.8057861328125, -11.447509765625, -11.0892333984375, -10.73095703125, -10.3726806640625, -10.014404296875, -9.6561279296875, -9.2978515625, -8.9395751953125, -8.581298828125, -8.2230224609375, -7.86474609375, -7.5064697265625, -7.148193359375, -6.7899169921875, -6.431640625, -6.0733642578125, -5.715087890625, -5.3568115234375, -4.99853515625, -4.6402587890625, -4.281982421875, -3.9237060546875, -3.5654296875, -3.2071533203125, -2.848876953125, -2.4906005859375, -2.13232421875, -1.7740478515625, -1.415771484375, -1.0574951171875, -0.69921875, -0.3409423828125, 0.017333984375, 0.3756103515625, 0.73388671875, 1.0921630859375, 1.450439453125, 1.8087158203125, 2.1669921875, 2.5252685546875, 2.883544921875, 3.2418212890625, 3.60009765625, 3.9583740234375, 4.316650390625, 4.6749267578125, 5.033203125, 5.3914794921875, 5.749755859375, 6.1080322265625, 6.46630859375, 6.8245849609375, 7.182861328125, 7.5411376953125, 7.8994140625, 8.2576904296875, 8.615966796875, 8.9742431640625, 9.33251953125, 9.6907958984375, 10.049072265625, 10.4073486328125, 10.765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 8.0, 9.0, 7.0, 18.0, 18.0, 41.0, 53.0, 86.0, 135.0, 186.0, 152.0, 95.0, 76.0, 34.0, 28.0, 14.0, 10.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00200653076171875, -0.0019089579582214355, -0.001811385154724121, -0.0017138123512268066, -0.0016162395477294922, -0.0015186667442321777, -0.0014210939407348633, -0.0013235211372375488, -0.0012259483337402344, -0.00112837553024292, -0.0010308027267456055, -0.000933229923248291, -0.0008356571197509766, -0.0007380843162536621, -0.0006405115127563477, -0.0005429387092590332, -0.00044536590576171875, -0.0003477931022644043, -0.00025022029876708984, -0.0001526474952697754, -5.507469177246094e-05, 4.2498111724853516e-05, 0.00014007091522216797, 0.00023764371871948242, 0.0003352165222167969, 0.00043278932571411133, 0.0005303621292114258, 0.0006279349327087402, 0.0007255077362060547, 0.0008230805397033691, 0.0009206533432006836, 0.001018226146697998, 0.0011157989501953125, 0.001213371753692627, 0.0013109445571899414, 0.0014085173606872559, 0.0015060901641845703, 0.0016036629676818848, 0.0017012357711791992, 0.0017988085746765137, 0.0018963813781738281, 0.0019939541816711426, 0.002091526985168457, 0.0021890997886657715, 0.002286672592163086, 0.0023842453956604004, 0.002481818199157715, 0.0025793910026550293, 0.0026769638061523438, 0.002774536609649658, 0.0028721094131469727, 0.002969682216644287, 0.0030672550201416016, 0.003164827823638916, 0.0032624006271362305, 0.003359973430633545, 0.0034575462341308594, 0.003555119037628174, 0.0036526918411254883, 0.0037502646446228027, 0.003847837448120117, 0.003945410251617432, 0.004042983055114746, 0.0041405558586120605, 0.004238128662109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 2.0, 5.0, 9.0, 13.0, 16.0, 19.0, 35.0, 67.0, 109.0, 182.0, 298.0, 579.0, 1240.0, 3041.0, 8414.0, 31227.0, 160792.0, 665965.0, 136192.0, 27366.0, 7817.0, 2667.0, 1165.0, 551.0, 317.0, 183.0, 97.0, 62.0, 35.0, 26.0, 13.0, 14.0, 10.0, 7.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.3203125, -11.009765625, -10.69921875, -10.388671875, -10.078125, -9.767578125, -9.45703125, -9.146484375, -8.8359375, -8.525390625, -8.21484375, -7.904296875, -7.59375, -7.283203125, -6.97265625, -6.662109375, -6.3515625, -6.041015625, -5.73046875, -5.419921875, -5.109375, -4.798828125, -4.48828125, -4.177734375, -3.8671875, -3.556640625, -3.24609375, -2.935546875, -2.625, -2.314453125, -2.00390625, -1.693359375, -1.3828125, -1.072265625, -0.76171875, -0.451171875, -0.140625, 0.169921875, 0.48046875, 0.791015625, 1.1015625, 1.412109375, 1.72265625, 2.033203125, 2.34375, 2.654296875, 2.96484375, 3.275390625, 3.5859375, 3.896484375, 4.20703125, 4.517578125, 4.828125, 5.138671875, 5.44921875, 5.759765625, 6.0703125, 6.380859375, 6.69140625, 7.001953125, 7.3125, 7.623046875, 7.93359375, 8.244140625, 8.5546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 6.0, 9.0, 6.0, 7.0, 14.0, 28.0, 40.0, 65.0, 67.0, 88.0, 89.0, 105.0, 77.0, 73.0, 82.0, 68.0, 44.0, 27.0, 20.0, 17.0, 18.0, 9.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9254150390625, -9.569580078125, -9.2137451171875, -8.85791015625, -8.5020751953125, -8.146240234375, -7.7904052734375, -7.4345703125, -7.0787353515625, -6.722900390625, -6.3670654296875, -6.01123046875, -5.6553955078125, -5.299560546875, -4.9437255859375, -4.587890625, -4.2320556640625, -3.876220703125, -3.5203857421875, -3.16455078125, -2.8087158203125, -2.452880859375, -2.0970458984375, -1.7412109375, -1.3853759765625, -1.029541015625, -0.6737060546875, -0.31787109375, 0.0379638671875, 0.393798828125, 0.7496337890625, 1.10546875, 1.4613037109375, 1.817138671875, 2.1729736328125, 2.52880859375, 2.8846435546875, 3.240478515625, 3.5963134765625, 3.9521484375, 4.3079833984375, 4.663818359375, 5.0196533203125, 5.37548828125, 5.7313232421875, 6.087158203125, 6.4429931640625, 6.798828125, 7.1546630859375, 7.510498046875, 7.8663330078125, 8.22216796875, 8.5780029296875, 8.933837890625, 9.2896728515625, 9.6455078125, 10.0013427734375, 10.357177734375, 10.7130126953125, 11.06884765625, 11.4246826171875, 11.780517578125, 12.1363525390625, 12.4921875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 9.0, 6.0, 8.0, 6.0, 12.0, 40.0, 77.0, 138.0, 259.0, 217.0, 121.0, 50.0, 35.0, 13.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-329.45477294921875, -321.75799560546875, -314.0611877441406, -306.3643798828125, -298.6676025390625, -290.9708251953125, -283.2740173339844, -275.57720947265625, -267.88043212890625, -260.18365478515625, -252.48684692382812, -244.79005432128906, -237.09326171875, -229.39646911621094, -221.69967651367188, -214.0028839111328, -206.30609130859375, -198.6092987060547, -190.91250610351562, -183.21571350097656, -175.5189208984375, -167.82212829589844, -160.12533569335938, -152.4285430908203, -144.73175048828125, -137.0349578857422, -129.33816528320312, -121.64137268066406, -113.944580078125, -106.24778747558594, -98.55099487304688, -90.85420227050781, -83.15739440917969, -75.46060180664062, -67.76380920410156, -60.0670166015625, -52.37022399902344, -44.673431396484375, -36.97663879394531, -29.27984619140625, -21.583053588867188, -13.886260986328125, -6.1894683837890625, 1.50732421875, 9.204116821289062, 16.900909423828125, 24.597702026367188, 32.29449462890625, 39.99128723144531, 47.688079833984375, 55.38487243652344, 63.0816650390625, 70.77845764160156, 78.47525024414062, 86.17204284667969, 93.86883544921875, 101.56562805175781, 109.26242065429688, 116.95921325683594, 124.656005859375, 132.35279846191406, 140.04959106445312, 147.7463836669922, 155.44317626953125, 163.1399688720703]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 13.0, 9.0, 4.0, 16.0, 16.0, 20.0, 31.0, 27.0, 27.0, 24.0, 33.0, 33.0, 44.0, 37.0, 49.0, 63.0, 74.0, 82.0, 69.0, 36.0, 41.0, 37.0, 37.0, 25.0, 20.0, 20.0, 20.0, 16.0, 22.0, 7.0, 8.0, 9.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.47335815429688, -123.01971435546875, -118.5660629272461, -114.11241912841797, -109.65876770019531, -105.20512390136719, -100.75148010253906, -96.2978286743164, -91.84417724609375, -87.39053344726562, -82.93688201904297, -78.48323822021484, -74.02958679199219, -69.57594299316406, -65.12229919433594, -60.66864776611328, -56.215003967285156, -51.761356353759766, -47.307708740234375, -42.85406494140625, -38.400413513183594, -33.94676971435547, -29.493122100830078, -25.039474487304688, -20.585826873779297, -16.132179260253906, -11.678532600402832, -7.224885940551758, -2.771238327026367, 1.6824092864990234, 6.136054992675781, 10.589702606201172, 15.043350219726562, 19.496997833251953, 23.950645446777344, 28.4042911529541, 32.857940673828125, 37.31158447265625, 41.76523208618164, 46.21887969970703, 50.67252731323242, 55.12617492675781, 59.5798225402832, 64.0334701538086, 68.48711395263672, 72.94076538085938, 77.3944091796875, 81.84805297851562, 86.30170440673828, 90.7553482055664, 95.20899963378906, 99.66264343261719, 104.11629486083984, 108.56993865966797, 113.02359008789062, 117.47723388671875, 121.93087768554688, 126.384521484375, 130.83816528320312, 135.2918243408203, 139.74546813964844, 144.19911193847656, 148.6527557373047, 153.10641479492188, 157.56005859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 9.0, 6.0, 21.0, 22.0, 33.0, 44.0, 71.0, 132.0, 248.0, 480.0, 1048.0, 2385.0, 5974.0, 19236.0, 100120.0, 1787015.0, 2126836.0, 117726.0, 21716.0, 6622.0, 2442.0, 1017.0, 544.0, 224.0, 133.0, 73.0, 39.0, 30.0, 14.0, 10.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-24.5, -23.872314453125, -23.24462890625, -22.616943359375, -21.9892578125, -21.361572265625, -20.73388671875, -20.106201171875, -19.478515625, -18.850830078125, -18.22314453125, -17.595458984375, -16.9677734375, -16.340087890625, -15.71240234375, -15.084716796875, -14.45703125, -13.829345703125, -13.20166015625, -12.573974609375, -11.9462890625, -11.318603515625, -10.69091796875, -10.063232421875, -9.435546875, -8.807861328125, -8.18017578125, -7.552490234375, -6.9248046875, -6.297119140625, -5.66943359375, -5.041748046875, -4.4140625, -3.786376953125, -3.15869140625, -2.531005859375, -1.9033203125, -1.275634765625, -0.64794921875, -0.020263671875, 0.607421875, 1.235107421875, 1.86279296875, 2.490478515625, 3.1181640625, 3.745849609375, 4.37353515625, 5.001220703125, 5.62890625, 6.256591796875, 6.88427734375, 7.511962890625, 8.1396484375, 8.767333984375, 9.39501953125, 10.022705078125, 10.650390625, 11.278076171875, 11.90576171875, 12.533447265625, 13.1611328125, 13.788818359375, 14.41650390625, 15.044189453125, 15.671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 4.0, 5.0, 11.0, 12.0, 26.0, 19.0, 26.0, 35.0, 29.0, 37.0, 37.0, 40.0, 42.0, 56.0, 59.0, 42.0, 50.0, 47.0, 51.0, 52.0, 34.0, 55.0, 29.0, 38.0, 32.0, 18.0, 24.0, 16.0, 12.0, 11.0, 18.0, 8.0, 9.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.90625, -9.5894775390625, -9.272705078125, -8.9559326171875, -8.63916015625, -8.3223876953125, -8.005615234375, -7.6888427734375, -7.3720703125, -7.0552978515625, -6.738525390625, -6.4217529296875, -6.10498046875, -5.7882080078125, -5.471435546875, -5.1546630859375, -4.837890625, -4.5211181640625, -4.204345703125, -3.8875732421875, -3.57080078125, -3.2540283203125, -2.937255859375, -2.6204833984375, -2.3037109375, -1.9869384765625, -1.670166015625, -1.3533935546875, -1.03662109375, -0.7198486328125, -0.403076171875, -0.0863037109375, 0.23046875, 0.5472412109375, 0.864013671875, 1.1807861328125, 1.49755859375, 1.8143310546875, 2.131103515625, 2.4478759765625, 2.7646484375, 3.0814208984375, 3.398193359375, 3.7149658203125, 4.03173828125, 4.3485107421875, 4.665283203125, 4.9820556640625, 5.298828125, 5.6156005859375, 5.932373046875, 6.2491455078125, 6.56591796875, 6.8826904296875, 7.199462890625, 7.5162353515625, 7.8330078125, 8.1497802734375, 8.466552734375, 8.7833251953125, 9.10009765625, 9.4168701171875, 9.733642578125, 10.0504150390625, 10.3671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 6.0, 12.0, 15.0, 15.0, 27.0, 36.0, 51.0, 84.0, 226.0, 507.0, 1414.0, 5293.0, 30785.0, 505320.0, 3539546.0, 95400.0, 11735.0, 2465.0, 740.0, 283.0, 124.0, 56.0, 51.0, 25.0, 21.0, 12.0, 9.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.40625, -26.3623046875, -25.318359375, -24.2744140625, -23.23046875, -22.1865234375, -21.142578125, -20.0986328125, -19.0546875, -18.0107421875, -16.966796875, -15.9228515625, -14.87890625, -13.8349609375, -12.791015625, -11.7470703125, -10.703125, -9.6591796875, -8.615234375, -7.5712890625, -6.52734375, -5.4833984375, -4.439453125, -3.3955078125, -2.3515625, -1.3076171875, -0.263671875, 0.7802734375, 1.82421875, 2.8681640625, 3.912109375, 4.9560546875, 6.0, 7.0439453125, 8.087890625, 9.1318359375, 10.17578125, 11.2197265625, 12.263671875, 13.3076171875, 14.3515625, 15.3955078125, 16.439453125, 17.4833984375, 18.52734375, 19.5712890625, 20.615234375, 21.6591796875, 22.703125, 23.7470703125, 24.791015625, 25.8349609375, 26.87890625, 27.9228515625, 28.966796875, 30.0107421875, 31.0546875, 32.0986328125, 33.142578125, 34.1865234375, 35.23046875, 36.2744140625, 37.318359375, 38.3623046875, 39.40625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 6.0, 6.0, 5.0, 16.0, 26.0, 25.0, 24.0, 43.0, 39.0, 71.0, 91.0, 155.0, 296.0, 501.0, 723.0, 785.0, 472.0, 274.0, 160.0, 101.0, 60.0, 42.0, 28.0, 19.0, 22.0, 13.0, 20.0, 7.0, 3.0, 9.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-28.109375, -27.42236328125, -26.7353515625, -26.04833984375, -25.361328125, -24.67431640625, -23.9873046875, -23.30029296875, -22.61328125, -21.92626953125, -21.2392578125, -20.55224609375, -19.865234375, -19.17822265625, -18.4912109375, -17.80419921875, -17.1171875, -16.43017578125, -15.7431640625, -15.05615234375, -14.369140625, -13.68212890625, -12.9951171875, -12.30810546875, -11.62109375, -10.93408203125, -10.2470703125, -9.56005859375, -8.873046875, -8.18603515625, -7.4990234375, -6.81201171875, -6.125, -5.43798828125, -4.7509765625, -4.06396484375, -3.376953125, -2.68994140625, -2.0029296875, -1.31591796875, -0.62890625, 0.05810546875, 0.7451171875, 1.43212890625, 2.119140625, 2.80615234375, 3.4931640625, 4.18017578125, 4.8671875, 5.55419921875, 6.2412109375, 6.92822265625, 7.615234375, 8.30224609375, 8.9892578125, 9.67626953125, 10.36328125, 11.05029296875, 11.7373046875, 12.42431640625, 13.111328125, 13.79833984375, 14.4853515625, 15.17236328125, 15.859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 20.0, 76.0, 392.0, 395.0, 108.0, 9.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-507.98516845703125, -489.189453125, -470.39373779296875, -451.5979919433594, -432.8022766113281, -414.0065612792969, -395.2108154296875, -376.41510009765625, -357.619384765625, -338.82366943359375, -320.0279541015625, -301.2322082519531, -282.4364929199219, -263.6407775878906, -244.8450469970703, -226.04931640625, -207.25360107421875, -188.4578857421875, -169.6621551513672, -150.86642456054688, -132.07070922851562, -113.27498626708984, -94.47926330566406, -75.68353271484375, -56.8878173828125, -38.09209442138672, -19.296371459960938, -0.5006484985351562, 18.295074462890625, 37.090797424316406, 55.88652038574219, 74.6822509765625, 93.4779052734375, 112.27362823486328, 131.06935119628906, 149.86508178710938, 168.66079711914062, 187.45651245117188, 206.2522430419922, 225.0479736328125, 243.84368896484375, 262.639404296875, 281.43511962890625, 300.2308654785156, 319.0265808105469, 337.8222961425781, 356.6180419921875, 375.41375732421875, 394.20947265625, 413.00518798828125, 431.8009033203125, 450.5966491699219, 469.3923645019531, 488.1880798339844, 506.98382568359375, 525.779541015625, 544.5752563476562, 563.3709716796875, 582.1666870117188, 600.96240234375, 619.7581787109375, 638.5538940429688, 657.349609375, 676.1453247070312, 694.9410400390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 8.0, 8.0, 7.0, 12.0, 9.0, 11.0, 18.0, 27.0, 26.0, 23.0, 44.0, 36.0, 43.0, 54.0, 55.0, 60.0, 57.0, 64.0, 53.0, 40.0, 55.0, 38.0, 46.0, 35.0, 33.0, 21.0, 25.0, 18.0, 8.0, 13.0, 15.0, 14.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-123.46343994140625, -119.88617706298828, -116.30891418457031, -112.73165130615234, -109.15438842773438, -105.5771255493164, -101.99986267089844, -98.42259979248047, -94.8453369140625, -91.26807403564453, -87.69081115722656, -84.1135482788086, -80.53628540039062, -76.95902252197266, -73.38175964355469, -69.80449676513672, -66.22723388671875, -62.64997100830078, -59.07270812988281, -55.495445251464844, -51.918182373046875, -48.340919494628906, -44.76365661621094, -41.18639373779297, -37.60913848876953, -34.03187561035156, -30.454612731933594, -26.877349853515625, -23.300086975097656, -19.72282600402832, -16.14556312561035, -12.568300247192383, -8.991035461425781, -5.4137725830078125, -1.836510181427002, 1.7407522201538086, 5.318015098571777, 8.89527702331543, 12.472539901733398, 16.049802780151367, 19.627065658569336, 23.204328536987305, 26.781591415405273, 30.35885238647461, 33.93611526489258, 37.51337814331055, 41.090641021728516, 44.667903900146484, 48.24516677856445, 51.82242965698242, 55.39969253540039, 58.97695541381836, 62.55421829223633, 66.13147735595703, 69.708740234375, 73.28600311279297, 76.86326599121094, 80.4405288696289, 84.01779174804688, 87.59505462646484, 91.17231750488281, 94.74958038330078, 98.32684326171875, 101.90410614013672, 105.48136901855469]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 15.0, 21.0, 33.0, 56.0, 86.0, 139.0, 276.0, 627.0, 1625.0, 5355.0, 20654.0, 106191.0, 597331.0, 259420.0, 42442.0, 9656.0, 2765.0, 982.0, 397.0, 191.0, 117.0, 60.0, 46.0, 23.0, 14.0, 11.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-35.28125, -34.4150390625, -33.548828125, -32.6826171875, -31.81640625, -30.9501953125, -30.083984375, -29.2177734375, -28.3515625, -27.4853515625, -26.619140625, -25.7529296875, -24.88671875, -24.0205078125, -23.154296875, -22.2880859375, -21.421875, -20.5556640625, -19.689453125, -18.8232421875, -17.95703125, -17.0908203125, -16.224609375, -15.3583984375, -14.4921875, -13.6259765625, -12.759765625, -11.8935546875, -11.02734375, -10.1611328125, -9.294921875, -8.4287109375, -7.5625, -6.6962890625, -5.830078125, -4.9638671875, -4.09765625, -3.2314453125, -2.365234375, -1.4990234375, -0.6328125, 0.2333984375, 1.099609375, 1.9658203125, 2.83203125, 3.6982421875, 4.564453125, 5.4306640625, 6.296875, 7.1630859375, 8.029296875, 8.8955078125, 9.76171875, 10.6279296875, 11.494140625, 12.3603515625, 13.2265625, 14.0927734375, 14.958984375, 15.8251953125, 16.69140625, 17.5576171875, 18.423828125, 19.2900390625, 20.15625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 8.0, 7.0, 6.0, 8.0, 16.0, 20.0, 22.0, 19.0, 25.0, 40.0, 34.0, 38.0, 36.0, 38.0, 44.0, 42.0, 48.0, 45.0, 32.0, 44.0, 50.0, 39.0, 40.0, 50.0, 43.0, 38.0, 28.0, 18.0, 23.0, 16.0, 9.0, 18.0, 12.0, 6.0, 8.0, 5.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.7257080078125, -8.435791015625, -8.1458740234375, -7.85595703125, -7.5660400390625, -7.276123046875, -6.9862060546875, -6.6962890625, -6.4063720703125, -6.116455078125, -5.8265380859375, -5.53662109375, -5.2467041015625, -4.956787109375, -4.6668701171875, -4.376953125, -4.0870361328125, -3.797119140625, -3.5072021484375, -3.21728515625, -2.9273681640625, -2.637451171875, -2.3475341796875, -2.0576171875, -1.7677001953125, -1.477783203125, -1.1878662109375, -0.89794921875, -0.6080322265625, -0.318115234375, -0.0281982421875, 0.26171875, 0.5516357421875, 0.841552734375, 1.1314697265625, 1.42138671875, 1.7113037109375, 2.001220703125, 2.2911376953125, 2.5810546875, 2.8709716796875, 3.160888671875, 3.4508056640625, 3.74072265625, 4.0306396484375, 4.320556640625, 4.6104736328125, 4.900390625, 5.1903076171875, 5.480224609375, 5.7701416015625, 6.06005859375, 6.3499755859375, 6.639892578125, 6.9298095703125, 7.2197265625, 7.5096435546875, 7.799560546875, 8.0894775390625, 8.37939453125, 8.6693115234375, 8.959228515625, 9.2491455078125, 9.5390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 8.0, 15.0, 17.0, 18.0, 26.0, 35.0, 35.0, 75.0, 104.0, 139.0, 252.0, 325.0, 655.0, 1237.0, 3092.0, 9722.0, 42246.0, 301088.0, 614662.0, 55760.0, 12079.0, 3570.0, 1418.0, 730.0, 390.0, 262.0, 165.0, 124.0, 90.0, 52.0, 53.0, 29.0, 15.0, 18.0, 13.0, 7.0, 11.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.515625, -25.714111328125, -24.91259765625, -24.111083984375, -23.3095703125, -22.508056640625, -21.70654296875, -20.905029296875, -20.103515625, -19.302001953125, -18.50048828125, -17.698974609375, -16.8974609375, -16.095947265625, -15.29443359375, -14.492919921875, -13.69140625, -12.889892578125, -12.08837890625, -11.286865234375, -10.4853515625, -9.683837890625, -8.88232421875, -8.080810546875, -7.279296875, -6.477783203125, -5.67626953125, -4.874755859375, -4.0732421875, -3.271728515625, -2.47021484375, -1.668701171875, -0.8671875, -0.065673828125, 0.73583984375, 1.537353515625, 2.3388671875, 3.140380859375, 3.94189453125, 4.743408203125, 5.544921875, 6.346435546875, 7.14794921875, 7.949462890625, 8.7509765625, 9.552490234375, 10.35400390625, 11.155517578125, 11.95703125, 12.758544921875, 13.56005859375, 14.361572265625, 15.1630859375, 15.964599609375, 16.76611328125, 17.567626953125, 18.369140625, 19.170654296875, 19.97216796875, 20.773681640625, 21.5751953125, 22.376708984375, 23.17822265625, 23.979736328125, 24.78125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 4.0, 10.0, 11.0, 13.0, 10.0, 18.0, 19.0, 30.0, 37.0, 24.0, 41.0, 62.0, 67.0, 50.0, 57.0, 56.0, 67.0, 62.0, 52.0, 57.0, 39.0, 38.0, 33.0, 30.0, 15.0, 19.0, 17.0, 15.0, 12.0, 5.0, 10.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.34375, -37.12841796875, -35.9130859375, -34.69775390625, -33.482421875, -32.26708984375, -31.0517578125, -29.83642578125, -28.62109375, -27.40576171875, -26.1904296875, -24.97509765625, -23.759765625, -22.54443359375, -21.3291015625, -20.11376953125, -18.8984375, -17.68310546875, -16.4677734375, -15.25244140625, -14.037109375, -12.82177734375, -11.6064453125, -10.39111328125, -9.17578125, -7.96044921875, -6.7451171875, -5.52978515625, -4.314453125, -3.09912109375, -1.8837890625, -0.66845703125, 0.546875, 1.76220703125, 2.9775390625, 4.19287109375, 5.408203125, 6.62353515625, 7.8388671875, 9.05419921875, 10.26953125, 11.48486328125, 12.7001953125, 13.91552734375, 15.130859375, 16.34619140625, 17.5615234375, 18.77685546875, 19.9921875, 21.20751953125, 22.4228515625, 23.63818359375, 24.853515625, 26.06884765625, 27.2841796875, 28.49951171875, 29.71484375, 30.93017578125, 32.1455078125, 33.36083984375, 34.576171875, 35.79150390625, 37.0068359375, 38.22216796875, 39.4375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 9.0, 9.0, 6.0, 12.0, 23.0, 20.0, 29.0, 43.0, 62.0, 103.0, 168.0, 248.0, 417.0, 721.0, 1397.0, 3159.0, 6994.0, 17975.0, 55376.0, 249731.0, 598142.0, 74484.0, 23013.0, 8752.0, 3680.0, 1731.0, 915.0, 465.0, 297.0, 186.0, 99.0, 76.0, 51.0, 42.0, 32.0, 20.0, 18.0, 15.0, 8.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.7890625, -5.59686279296875, -5.4046630859375, -5.21246337890625, -5.020263671875, -4.82806396484375, -4.6358642578125, -4.44366455078125, -4.25146484375, -4.05926513671875, -3.8670654296875, -3.67486572265625, -3.482666015625, -3.29046630859375, -3.0982666015625, -2.90606689453125, -2.7138671875, -2.52166748046875, -2.3294677734375, -2.13726806640625, -1.945068359375, -1.75286865234375, -1.5606689453125, -1.36846923828125, -1.17626953125, -0.98406982421875, -0.7918701171875, -0.59967041015625, -0.407470703125, -0.21527099609375, -0.0230712890625, 0.16912841796875, 0.361328125, 0.55352783203125, 0.7457275390625, 0.93792724609375, 1.130126953125, 1.32232666015625, 1.5145263671875, 1.70672607421875, 1.89892578125, 2.09112548828125, 2.2833251953125, 2.47552490234375, 2.667724609375, 2.85992431640625, 3.0521240234375, 3.24432373046875, 3.4365234375, 3.62872314453125, 3.8209228515625, 4.01312255859375, 4.205322265625, 4.39752197265625, 4.5897216796875, 4.78192138671875, 4.97412109375, 5.16632080078125, 5.3585205078125, 5.55072021484375, 5.742919921875, 5.93511962890625, 6.1273193359375, 6.31951904296875, 6.51171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 4.0, 5.0, 12.0, 9.0, 16.0, 25.0, 28.0, 37.0, 62.0, 85.0, 145.0, 176.0, 111.0, 92.0, 44.0, 28.0, 29.0, 17.0, 15.0, 17.0, 10.0, 4.0, 5.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001674652099609375, -0.0016109943389892578, -0.0015473365783691406, -0.0014836788177490234, -0.0014200210571289062, -0.001356363296508789, -0.0012927055358886719, -0.0012290477752685547, -0.0011653900146484375, -0.0011017322540283203, -0.0010380744934082031, -0.0009744167327880859, -0.0009107589721679688, -0.0008471012115478516, -0.0007834434509277344, -0.0007197856903076172, -0.0006561279296875, -0.0005924701690673828, -0.0005288124084472656, -0.00046515464782714844, -0.00040149688720703125, -0.00033783912658691406, -0.0002741813659667969, -0.0002105236053466797, -0.0001468658447265625, -8.320808410644531e-05, -1.9550323486328125e-05, 4.410743713378906e-05, 0.00010776519775390625, 0.00017142295837402344, 0.00023508071899414062, 0.0002987384796142578, 0.000362396240234375, 0.0004260540008544922, 0.0004897117614746094, 0.0005533695220947266, 0.0006170272827148438, 0.0006806850433349609, 0.0007443428039550781, 0.0008080005645751953, 0.0008716583251953125, 0.0009353160858154297, 0.0009989738464355469, 0.001062631607055664, 0.0011262893676757812, 0.0011899471282958984, 0.0012536048889160156, 0.0013172626495361328, 0.00138092041015625, 0.0014445781707763672, 0.0015082359313964844, 0.0015718936920166016, 0.0016355514526367188, 0.001699209213256836, 0.0017628669738769531, 0.0018265247344970703, 0.0018901824951171875, 0.0019538402557373047, 0.002017498016357422, 0.002081155776977539, 0.0021448135375976562, 0.0022084712982177734, 0.0022721290588378906, 0.002335786819458008, 0.002399444580078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 12.0, 4.0, 13.0, 17.0, 21.0, 37.0, 58.0, 99.0, 123.0, 255.0, 387.0, 781.0, 1738.0, 3840.0, 10755.0, 38631.0, 195412.0, 685512.0, 80107.0, 19405.0, 6254.0, 2452.0, 1130.0, 640.0, 349.0, 180.0, 109.0, 78.0, 52.0, 26.0, 23.0, 18.0, 9.0, 5.0, 7.0, 1.0, 4.0, 1.0, 1.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265625, -7.0172119140625, -6.768798828125, -6.5203857421875, -6.27197265625, -6.0235595703125, -5.775146484375, -5.5267333984375, -5.2783203125, -5.0299072265625, -4.781494140625, -4.5330810546875, -4.28466796875, -4.0362548828125, -3.787841796875, -3.5394287109375, -3.291015625, -3.0426025390625, -2.794189453125, -2.5457763671875, -2.29736328125, -2.0489501953125, -1.800537109375, -1.5521240234375, -1.3037109375, -1.0552978515625, -0.806884765625, -0.5584716796875, -0.31005859375, -0.0616455078125, 0.186767578125, 0.4351806640625, 0.68359375, 0.9320068359375, 1.180419921875, 1.4288330078125, 1.67724609375, 1.9256591796875, 2.174072265625, 2.4224853515625, 2.6708984375, 2.9193115234375, 3.167724609375, 3.4161376953125, 3.66455078125, 3.9129638671875, 4.161376953125, 4.4097900390625, 4.658203125, 4.9066162109375, 5.155029296875, 5.4034423828125, 5.65185546875, 5.9002685546875, 6.148681640625, 6.3970947265625, 6.6455078125, 6.8939208984375, 7.142333984375, 7.3907470703125, 7.63916015625, 7.8875732421875, 8.135986328125, 8.3843994140625, 8.6328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 3.0, 15.0, 8.0, 15.0, 17.0, 25.0, 31.0, 34.0, 59.0, 104.0, 122.0, 147.0, 108.0, 77.0, 55.0, 44.0, 27.0, 26.0, 21.0, 21.0, 6.0, 14.0, 4.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.3428955078125, -9.045166015625, -8.7474365234375, -8.44970703125, -8.1519775390625, -7.854248046875, -7.5565185546875, -7.2587890625, -6.9610595703125, -6.663330078125, -6.3656005859375, -6.06787109375, -5.7701416015625, -5.472412109375, -5.1746826171875, -4.876953125, -4.5792236328125, -4.281494140625, -3.9837646484375, -3.68603515625, -3.3883056640625, -3.090576171875, -2.7928466796875, -2.4951171875, -2.1973876953125, -1.899658203125, -1.6019287109375, -1.30419921875, -1.0064697265625, -0.708740234375, -0.4110107421875, -0.11328125, 0.1844482421875, 0.482177734375, 0.7799072265625, 1.07763671875, 1.3753662109375, 1.673095703125, 1.9708251953125, 2.2685546875, 2.5662841796875, 2.864013671875, 3.1617431640625, 3.45947265625, 3.7572021484375, 4.054931640625, 4.3526611328125, 4.650390625, 4.9481201171875, 5.245849609375, 5.5435791015625, 5.84130859375, 6.1390380859375, 6.436767578125, 6.7344970703125, 7.0322265625, 7.3299560546875, 7.627685546875, 7.9254150390625, 8.22314453125, 8.5208740234375, 8.818603515625, 9.1163330078125, 9.4140625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 15.0, 12.0, 47.0, 78.0, 125.0, 318.0, 194.0, 109.0, 44.0, 21.0, 11.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-311.8720703125, -305.0699768066406, -298.26788330078125, -291.46575927734375, -284.6636657714844, -277.861572265625, -271.0594787597656, -264.25738525390625, -257.45526123046875, -250.65316772460938, -243.85105895996094, -237.04896545410156, -230.24685668945312, -223.44476318359375, -216.64266967773438, -209.84056091308594, -203.03846740722656, -196.2363739013672, -189.43426513671875, -182.63217163085938, -175.83006286621094, -169.02796936035156, -162.22586059570312, -155.42376708984375, -148.62167358398438, -141.819580078125, -135.01747131347656, -128.2153778076172, -121.41326904296875, -114.61117553710938, -107.80907440185547, -101.00697326660156, -94.20487976074219, -87.40277862548828, -80.60067749023438, -73.798583984375, -66.99647521972656, -60.19437789916992, -53.39228057861328, -46.590179443359375, -39.78807830810547, -32.98597717285156, -26.18387794494629, -19.381778717041016, -12.57967758178711, -5.777576446533203, 1.0245208740234375, 7.826622009277344, 14.62872314453125, 21.430824279785156, 28.23292350769043, 35.0350227355957, 41.83712387084961, 48.639225006103516, 55.441322326660156, 62.24342346191406, 69.04552459716797, 75.84762573242188, 82.64972686767578, 89.45182800292969, 96.25392150878906, 103.0560302734375, 109.85812377929688, 116.66022491455078, 123.46232604980469]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 6.0, 9.0, 8.0, 20.0, 15.0, 14.0, 12.0, 24.0, 23.0, 23.0, 24.0, 25.0, 34.0, 43.0, 55.0, 81.0, 104.0, 70.0, 44.0, 39.0, 34.0, 36.0, 25.0, 35.0, 24.0, 24.0, 16.0, 17.0, 15.0, 13.0, 6.0, 9.0, 9.0, 6.0, 6.0, 12.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-107.42549133300781, -103.50971984863281, -99.59395599365234, -95.67818450927734, -91.76242065429688, -87.84664916992188, -83.93087768554688, -80.0151138305664, -76.0993423461914, -72.1835708618164, -68.26780700683594, -64.35203552246094, -60.4362678527832, -56.52050018310547, -52.604732513427734, -48.68896484375, -44.773197174072266, -40.85742950439453, -36.9416618347168, -33.02589416503906, -29.110122680664062, -25.194355010986328, -21.278587341308594, -17.362817764282227, -13.447050094604492, -9.531281471252441, -5.615513324737549, -1.6997451782226562, 2.2160234451293945, 6.131792068481445, 10.04755973815918, 13.963329315185547, 17.87909698486328, 21.794864654541016, 25.710634231567383, 29.626401901245117, 33.542171478271484, 37.45793914794922, 41.37370681762695, 45.28947448730469, 49.20524597167969, 53.12101364135742, 57.036781311035156, 60.952552795410156, 64.86831665039062, 68.78408813476562, 72.69985961914062, 76.6156234741211, 80.53138732910156, 84.44715881347656, 88.36292266845703, 92.27869415283203, 96.1944580078125, 100.1102294921875, 104.0260009765625, 107.94176483154297, 111.85753631591797, 115.77330780029297, 119.68907165527344, 123.60484313964844, 127.5206069946289, 131.43637084960938, 135.35214233398438, 139.26791381835938, 143.18368530273438]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 8.0, 12.0, 8.0, 30.0, 43.0, 48.0, 99.0, 150.0, 237.0, 403.0, 730.0, 1485.0, 3162.0, 6545.0, 16211.0, 52995.0, 296976.0, 2167530.0, 1403666.0, 182748.0, 37317.0, 13038.0, 5537.0, 2592.0, 1225.0, 634.0, 345.0, 197.0, 118.0, 67.0, 42.0, 25.0, 19.0, 9.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.6953125, -13.265625, -12.8359375, -12.40625, -11.9765625, -11.546875, -11.1171875, -10.6875, -10.2578125, -9.828125, -9.3984375, -8.96875, -8.5390625, -8.109375, -7.6796875, -7.25, -6.8203125, -6.390625, -5.9609375, -5.53125, -5.1015625, -4.671875, -4.2421875, -3.8125, -3.3828125, -2.953125, -2.5234375, -2.09375, -1.6640625, -1.234375, -0.8046875, -0.375, 0.0546875, 0.484375, 0.9140625, 1.34375, 1.7734375, 2.203125, 2.6328125, 3.0625, 3.4921875, 3.921875, 4.3515625, 4.78125, 5.2109375, 5.640625, 6.0703125, 6.5, 6.9296875, 7.359375, 7.7890625, 8.21875, 8.6484375, 9.078125, 9.5078125, 9.9375, 10.3671875, 10.796875, 11.2265625, 11.65625, 12.0859375, 12.515625, 12.9453125, 13.375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 3.0, 6.0, 12.0, 4.0, 12.0, 25.0, 24.0, 26.0, 26.0, 36.0, 27.0, 42.0, 33.0, 33.0, 47.0, 65.0, 36.0, 37.0, 43.0, 55.0, 54.0, 44.0, 43.0, 44.0, 34.0, 31.0, 24.0, 19.0, 17.0, 22.0, 16.0, 15.0, 7.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.5711669921875, -8.290771484375, -8.0103759765625, -7.72998046875, -7.4495849609375, -7.169189453125, -6.8887939453125, -6.6083984375, -6.3280029296875, -6.047607421875, -5.7672119140625, -5.48681640625, -5.2064208984375, -4.926025390625, -4.6456298828125, -4.365234375, -4.0848388671875, -3.804443359375, -3.5240478515625, -3.24365234375, -2.9632568359375, -2.682861328125, -2.4024658203125, -2.1220703125, -1.8416748046875, -1.561279296875, -1.2808837890625, -1.00048828125, -0.7200927734375, -0.439697265625, -0.1593017578125, 0.12109375, 0.4014892578125, 0.681884765625, 0.9622802734375, 1.24267578125, 1.5230712890625, 1.803466796875, 2.0838623046875, 2.3642578125, 2.6446533203125, 2.925048828125, 3.2054443359375, 3.48583984375, 3.7662353515625, 4.046630859375, 4.3270263671875, 4.607421875, 4.8878173828125, 5.168212890625, 5.4486083984375, 5.72900390625, 6.0093994140625, 6.289794921875, 6.5701904296875, 6.8505859375, 7.1309814453125, 7.411376953125, 7.6917724609375, 7.97216796875, 8.2525634765625, 8.532958984375, 8.8133544921875, 9.09375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 3.0, 9.0, 8.0, 9.0, 20.0, 19.0, 17.0, 39.0, 40.0, 104.0, 144.0, 341.0, 961.0, 3538.0, 17873.0, 147635.0, 3470304.0, 506716.0, 37555.0, 6429.0, 1500.0, 487.0, 205.0, 121.0, 64.0, 44.0, 27.0, 15.0, 12.0, 12.0, 12.0, 4.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.375, -28.574462890625, -27.77392578125, -26.973388671875, -26.1728515625, -25.372314453125, -24.57177734375, -23.771240234375, -22.970703125, -22.170166015625, -21.36962890625, -20.569091796875, -19.7685546875, -18.968017578125, -18.16748046875, -17.366943359375, -16.56640625, -15.765869140625, -14.96533203125, -14.164794921875, -13.3642578125, -12.563720703125, -11.76318359375, -10.962646484375, -10.162109375, -9.361572265625, -8.56103515625, -7.760498046875, -6.9599609375, -6.159423828125, -5.35888671875, -4.558349609375, -3.7578125, -2.957275390625, -2.15673828125, -1.356201171875, -0.5556640625, 0.244873046875, 1.04541015625, 1.845947265625, 2.646484375, 3.447021484375, 4.24755859375, 5.048095703125, 5.8486328125, 6.649169921875, 7.44970703125, 8.250244140625, 9.05078125, 9.851318359375, 10.65185546875, 11.452392578125, 12.2529296875, 13.053466796875, 13.85400390625, 14.654541015625, 15.455078125, 16.255615234375, 17.05615234375, 17.856689453125, 18.6572265625, 19.457763671875, 20.25830078125, 21.058837890625, 21.859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 11.0, 9.0, 10.0, 13.0, 24.0, 19.0, 26.0, 32.0, 34.0, 58.0, 79.0, 105.0, 131.0, 163.0, 285.0, 448.0, 521.0, 574.0, 424.0, 312.0, 218.0, 151.0, 85.0, 65.0, 59.0, 35.0, 28.0, 36.0, 20.0, 16.0, 12.0, 9.0, 13.0, 5.0, 11.0, 2.0, 2.0, 7.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.796875, -16.3035888671875, -15.810302734375, -15.3170166015625, -14.82373046875, -14.3304443359375, -13.837158203125, -13.3438720703125, -12.8505859375, -12.3572998046875, -11.864013671875, -11.3707275390625, -10.87744140625, -10.3841552734375, -9.890869140625, -9.3975830078125, -8.904296875, -8.4110107421875, -7.917724609375, -7.4244384765625, -6.93115234375, -6.4378662109375, -5.944580078125, -5.4512939453125, -4.9580078125, -4.4647216796875, -3.971435546875, -3.4781494140625, -2.98486328125, -2.4915771484375, -1.998291015625, -1.5050048828125, -1.01171875, -0.5184326171875, -0.025146484375, 0.4681396484375, 0.96142578125, 1.4547119140625, 1.947998046875, 2.4412841796875, 2.9345703125, 3.4278564453125, 3.921142578125, 4.4144287109375, 4.90771484375, 5.4010009765625, 5.894287109375, 6.3875732421875, 6.880859375, 7.3741455078125, 7.867431640625, 8.3607177734375, 8.85400390625, 9.3472900390625, 9.840576171875, 10.3338623046875, 10.8271484375, 11.3204345703125, 11.813720703125, 12.3070068359375, 12.80029296875, 13.2935791015625, 13.786865234375, 14.2801513671875, 14.7734375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 4.0, 14.0, 32.0, 85.0, 138.0, 237.0, 235.0, 122.0, 68.0, 25.0, 15.0, 8.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-273.0617370605469, -265.6741027832031, -258.2864990234375, -250.8988800048828, -243.51126098632812, -236.12364196777344, -228.73602294921875, -221.34840393066406, -213.96078491210938, -206.5731658935547, -199.185546875, -191.7979278564453, -184.41030883789062, -177.02268981933594, -169.63507080078125, -162.24745178222656, -154.85983276367188, -147.4722137451172, -140.0845947265625, -132.6969757080078, -125.30935668945312, -117.92173767089844, -110.53411865234375, -103.14649963378906, -95.75886535644531, -88.37124633789062, -80.98362731933594, -73.59600830078125, -66.20838928222656, -58.82076644897461, -51.43314743041992, -44.045528411865234, -36.65791320800781, -29.270294189453125, -21.882675170898438, -14.495054244995117, -7.10743522644043, 0.2801856994628906, 7.667804718017578, 15.055423736572266, 22.443042755126953, 29.83066177368164, 37.21828079223633, 44.60590362548828, 51.99352264404297, 59.381141662597656, 66.76876068115234, 74.15637969970703, 81.54399871826172, 88.9316177368164, 96.3192367553711, 103.70685577392578, 111.09447479248047, 118.48210144042969, 125.86972045898438, 133.25733947753906, 140.64495849609375, 148.03257751464844, 155.42019653320312, 162.8078155517578, 170.1954345703125, 177.5830535888672, 184.97067260742188, 192.35829162597656, 199.74591064453125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 4.0, 3.0, 12.0, 8.0, 11.0, 11.0, 14.0, 20.0, 24.0, 29.0, 26.0, 16.0, 35.0, 34.0, 36.0, 34.0, 40.0, 52.0, 66.0, 68.0, 54.0, 44.0, 30.0, 33.0, 37.0, 28.0, 30.0, 32.0, 31.0, 22.0, 15.0, 14.0, 13.0, 20.0, 10.0, 8.0, 9.0, 3.0, 3.0, 3.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-87.25569152832031, -84.55699920654297, -81.85830688476562, -79.15961456298828, -76.46092224121094, -73.76222229003906, -71.06353759765625, -68.36483764648438, -65.66614532470703, -62.96745300292969, -60.268760681152344, -57.570068359375, -54.87137222290039, -52.17267990112305, -49.4739875793457, -46.775291442871094, -44.076602935791016, -41.37791061401367, -38.67921829223633, -35.98052215576172, -33.281829833984375, -30.58313751220703, -27.884445190429688, -25.18575096130371, -22.487058639526367, -19.788366317749023, -17.089672088623047, -14.390979766845703, -11.692286491394043, -8.993593215942383, -6.294900894165039, -3.5962066650390625, -0.8975143432617188, 1.8011786937713623, 4.499871730804443, 7.198564529418945, 9.897257804870605, 12.595951080322266, 15.29464340209961, 17.993337631225586, 20.69202995300293, 23.390722274780273, 26.08941650390625, 28.788108825683594, 31.486801147460938, 34.18549346923828, 36.884185791015625, 39.582881927490234, 42.28157424926758, 44.98026657104492, 47.678958892822266, 50.377655029296875, 53.07634735107422, 55.77503967285156, 58.473731994628906, 61.17242431640625, 63.871116638183594, 66.56980895996094, 69.26850128173828, 71.96719360351562, 74.66588592529297, 77.36457824707031, 80.06327819824219, 82.76197052001953, 85.46066284179688]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 10.0, 4.0, 11.0, 10.0, 18.0, 17.0, 27.0, 32.0, 65.0, 61.0, 116.0, 166.0, 282.0, 389.0, 689.0, 1170.0, 2002.0, 3733.0, 7228.0, 15161.0, 35719.0, 103575.0, 379610.0, 343332.0, 93270.0, 32684.0, 13844.0, 6791.0, 3637.0, 1904.0, 1095.0, 671.0, 408.0, 277.0, 168.0, 110.0, 78.0, 45.0, 41.0, 27.0, 14.0, 23.0, 15.0, 7.0, 3.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.140625, -15.601806640625, -15.06298828125, -14.524169921875, -13.9853515625, -13.446533203125, -12.90771484375, -12.368896484375, -11.830078125, -11.291259765625, -10.75244140625, -10.213623046875, -9.6748046875, -9.135986328125, -8.59716796875, -8.058349609375, -7.51953125, -6.980712890625, -6.44189453125, -5.903076171875, -5.3642578125, -4.825439453125, -4.28662109375, -3.747802734375, -3.208984375, -2.670166015625, -2.13134765625, -1.592529296875, -1.0537109375, -0.514892578125, 0.02392578125, 0.562744140625, 1.1015625, 1.640380859375, 2.17919921875, 2.718017578125, 3.2568359375, 3.795654296875, 4.33447265625, 4.873291015625, 5.412109375, 5.950927734375, 6.48974609375, 7.028564453125, 7.5673828125, 8.106201171875, 8.64501953125, 9.183837890625, 9.72265625, 10.261474609375, 10.80029296875, 11.339111328125, 11.8779296875, 12.416748046875, 12.95556640625, 13.494384765625, 14.033203125, 14.572021484375, 15.11083984375, 15.649658203125, 16.1884765625, 16.727294921875, 17.26611328125, 17.804931640625, 18.34375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 8.0, 6.0, 12.0, 13.0, 13.0, 19.0, 21.0, 26.0, 24.0, 36.0, 35.0, 47.0, 40.0, 46.0, 62.0, 57.0, 54.0, 38.0, 55.0, 63.0, 46.0, 32.0, 43.0, 43.0, 31.0, 24.0, 22.0, 21.0, 12.0, 11.0, 9.0, 11.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.9453125, -11.619140625, -11.29296875, -10.966796875, -10.640625, -10.314453125, -9.98828125, -9.662109375, -9.3359375, -9.009765625, -8.68359375, -8.357421875, -8.03125, -7.705078125, -7.37890625, -7.052734375, -6.7265625, -6.400390625, -6.07421875, -5.748046875, -5.421875, -5.095703125, -4.76953125, -4.443359375, -4.1171875, -3.791015625, -3.46484375, -3.138671875, -2.8125, -2.486328125, -2.16015625, -1.833984375, -1.5078125, -1.181640625, -0.85546875, -0.529296875, -0.203125, 0.123046875, 0.44921875, 0.775390625, 1.1015625, 1.427734375, 1.75390625, 2.080078125, 2.40625, 2.732421875, 3.05859375, 3.384765625, 3.7109375, 4.037109375, 4.36328125, 4.689453125, 5.015625, 5.341796875, 5.66796875, 5.994140625, 6.3203125, 6.646484375, 6.97265625, 7.298828125, 7.625, 7.951171875, 8.27734375, 8.603515625, 8.9296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 3.0, 7.0, 9.0, 15.0, 24.0, 21.0, 28.0, 44.0, 71.0, 91.0, 133.0, 218.0, 310.0, 504.0, 945.0, 1951.0, 6214.0, 38998.0, 811442.0, 165806.0, 15156.0, 3424.0, 1301.0, 622.0, 416.0, 264.0, 176.0, 95.0, 81.0, 44.0, 41.0, 24.0, 21.0, 13.0, 13.0, 12.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -29.074951171875, -27.94677734375, -26.818603515625, -25.6904296875, -24.562255859375, -23.43408203125, -22.305908203125, -21.177734375, -20.049560546875, -18.92138671875, -17.793212890625, -16.6650390625, -15.536865234375, -14.40869140625, -13.280517578125, -12.15234375, -11.024169921875, -9.89599609375, -8.767822265625, -7.6396484375, -6.511474609375, -5.38330078125, -4.255126953125, -3.126953125, -1.998779296875, -0.87060546875, 0.257568359375, 1.3857421875, 2.513916015625, 3.64208984375, 4.770263671875, 5.8984375, 7.026611328125, 8.15478515625, 9.282958984375, 10.4111328125, 11.539306640625, 12.66748046875, 13.795654296875, 14.923828125, 16.052001953125, 17.18017578125, 18.308349609375, 19.4365234375, 20.564697265625, 21.69287109375, 22.821044921875, 23.94921875, 25.077392578125, 26.20556640625, 27.333740234375, 28.4619140625, 29.590087890625, 30.71826171875, 31.846435546875, 32.974609375, 34.102783203125, 35.23095703125, 36.359130859375, 37.4873046875, 38.615478515625, 39.74365234375, 40.871826171875, 42.0]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 10.0, 5.0, 7.0, 7.0, 32.0, 17.0, 24.0, 30.0, 34.0, 41.0, 39.0, 55.0, 63.0, 51.0, 59.0, 64.0, 59.0, 60.0, 53.0, 56.0, 55.0, 32.0, 20.0, 25.0, 22.0, 15.0, 16.0, 10.0, 11.0, 11.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-46.25, -44.978515625, -43.70703125, -42.435546875, -41.1640625, -39.892578125, -38.62109375, -37.349609375, -36.078125, -34.806640625, -33.53515625, -32.263671875, -30.9921875, -29.720703125, -28.44921875, -27.177734375, -25.90625, -24.634765625, -23.36328125, -22.091796875, -20.8203125, -19.548828125, -18.27734375, -17.005859375, -15.734375, -14.462890625, -13.19140625, -11.919921875, -10.6484375, -9.376953125, -8.10546875, -6.833984375, -5.5625, -4.291015625, -3.01953125, -1.748046875, -0.4765625, 0.794921875, 2.06640625, 3.337890625, 4.609375, 5.880859375, 7.15234375, 8.423828125, 9.6953125, 10.966796875, 12.23828125, 13.509765625, 14.78125, 16.052734375, 17.32421875, 18.595703125, 19.8671875, 21.138671875, 22.41015625, 23.681640625, 24.953125, 26.224609375, 27.49609375, 28.767578125, 30.0390625, 31.310546875, 32.58203125, 33.853515625, 35.125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 2.0, 10.0, 4.0, 12.0, 16.0, 13.0, 21.0, 29.0, 47.0, 49.0, 85.0, 149.0, 237.0, 476.0, 985.0, 2206.0, 6652.0, 28686.0, 230701.0, 717279.0, 45802.0, 9637.0, 2951.0, 1195.0, 537.0, 288.0, 146.0, 100.0, 68.0, 41.0, 23.0, 24.0, 20.0, 15.0, 6.0, 8.0, 9.0, 7.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.65234375, -7.40655517578125, -7.1607666015625, -6.91497802734375, -6.669189453125, -6.42340087890625, -6.1776123046875, -5.93182373046875, -5.68603515625, -5.44024658203125, -5.1944580078125, -4.94866943359375, -4.702880859375, -4.45709228515625, -4.2113037109375, -3.96551513671875, -3.7197265625, -3.47393798828125, -3.2281494140625, -2.98236083984375, -2.736572265625, -2.49078369140625, -2.2449951171875, -1.99920654296875, -1.75341796875, -1.50762939453125, -1.2618408203125, -1.01605224609375, -0.770263671875, -0.52447509765625, -0.2786865234375, -0.03289794921875, 0.212890625, 0.45867919921875, 0.7044677734375, 0.95025634765625, 1.196044921875, 1.44183349609375, 1.6876220703125, 1.93341064453125, 2.17919921875, 2.42498779296875, 2.6707763671875, 2.91656494140625, 3.162353515625, 3.40814208984375, 3.6539306640625, 3.89971923828125, 4.1455078125, 4.39129638671875, 4.6370849609375, 4.88287353515625, 5.128662109375, 5.37445068359375, 5.6202392578125, 5.86602783203125, 6.11181640625, 6.35760498046875, 6.6033935546875, 6.84918212890625, 7.094970703125, 7.34075927734375, 7.5865478515625, 7.83233642578125, 8.078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 2.0, 2.0, 6.0, 5.0, 5.0, 11.0, 14.0, 9.0, 19.0, 22.0, 35.0, 51.0, 70.0, 145.0, 192.0, 143.0, 69.0, 57.0, 39.0, 25.0, 19.0, 15.0, 11.0, 12.0, 4.0, 2.0, 4.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0018253326416015625, -0.0017631947994232178, -0.001701056957244873, -0.0016389191150665283, -0.0015767812728881836, -0.0015146434307098389, -0.0014525055885314941, -0.0013903677463531494, -0.0013282299041748047, -0.00126609206199646, -0.0012039542198181152, -0.0011418163776397705, -0.0010796785354614258, -0.001017540693283081, -0.0009554028511047363, -0.0008932650089263916, -0.0008311271667480469, -0.0007689893245697021, -0.0007068514823913574, -0.0006447136402130127, -0.000582575798034668, -0.0005204379558563232, -0.0004583001136779785, -0.0003961622714996338, -0.00033402442932128906, -0.00027188658714294434, -0.0002097487449645996, -0.00014761090278625488, -8.547306060791016e-05, -2.333521842956543e-05, 3.88026237487793e-05, 0.00010094046592712402, 0.00016307830810546875, 0.00022521615028381348, 0.0002873539924621582, 0.00034949183464050293, 0.00041162967681884766, 0.0004737675189971924, 0.0005359053611755371, 0.0005980432033538818, 0.0006601810455322266, 0.0007223188877105713, 0.000784456729888916, 0.0008465945720672607, 0.0009087324142456055, 0.0009708702564239502, 0.001033008098602295, 0.0010951459407806396, 0.0011572837829589844, 0.001219421625137329, 0.0012815594673156738, 0.0013436973094940186, 0.0014058351516723633, 0.001467972993850708, 0.0015301108360290527, 0.0015922486782073975, 0.0016543865203857422, 0.001716524362564087, 0.0017786622047424316, 0.0018408000469207764, 0.001902937889099121, 0.001965075731277466, 0.0020272135734558105, 0.0020893514156341553, 0.0021514892578125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 12.0, 11.0, 22.0, 30.0, 36.0, 65.0, 73.0, 140.0, 246.0, 478.0, 1020.0, 2713.0, 9057.0, 50448.0, 789965.0, 166298.0, 20048.0, 4684.0, 1721.0, 674.0, 337.0, 161.0, 115.0, 59.0, 45.0, 18.0, 20.0, 20.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.3125, -11.02056884765625, -10.7286376953125, -10.43670654296875, -10.144775390625, -9.85284423828125, -9.5609130859375, -9.26898193359375, -8.97705078125, -8.68511962890625, -8.3931884765625, -8.10125732421875, -7.809326171875, -7.51739501953125, -7.2254638671875, -6.93353271484375, -6.6416015625, -6.34967041015625, -6.0577392578125, -5.76580810546875, -5.473876953125, -5.18194580078125, -4.8900146484375, -4.59808349609375, -4.30615234375, -4.01422119140625, -3.7222900390625, -3.43035888671875, -3.138427734375, -2.84649658203125, -2.5545654296875, -2.26263427734375, -1.970703125, -1.67877197265625, -1.3868408203125, -1.09490966796875, -0.802978515625, -0.51104736328125, -0.2191162109375, 0.07281494140625, 0.36474609375, 0.65667724609375, 0.9486083984375, 1.24053955078125, 1.532470703125, 1.82440185546875, 2.1163330078125, 2.40826416015625, 2.7001953125, 2.99212646484375, 3.2840576171875, 3.57598876953125, 3.867919921875, 4.15985107421875, 4.4517822265625, 4.74371337890625, 5.03564453125, 5.32757568359375, 5.6195068359375, 5.91143798828125, 6.203369140625, 6.49530029296875, 6.7872314453125, 7.07916259765625, 7.37109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 15.0, 23.0, 31.0, 35.0, 35.0, 44.0, 84.0, 96.0, 119.0, 98.0, 87.0, 71.0, 60.0, 47.0, 24.0, 33.0, 19.0, 8.0, 15.0, 9.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.49609375, -7.2744140625, -7.052734375, -6.8310546875, -6.609375, -6.3876953125, -6.166015625, -5.9443359375, -5.72265625, -5.5009765625, -5.279296875, -5.0576171875, -4.8359375, -4.6142578125, -4.392578125, -4.1708984375, -3.94921875, -3.7275390625, -3.505859375, -3.2841796875, -3.0625, -2.8408203125, -2.619140625, -2.3974609375, -2.17578125, -1.9541015625, -1.732421875, -1.5107421875, -1.2890625, -1.0673828125, -0.845703125, -0.6240234375, -0.40234375, -0.1806640625, 0.041015625, 0.2626953125, 0.484375, 0.7060546875, 0.927734375, 1.1494140625, 1.37109375, 1.5927734375, 1.814453125, 2.0361328125, 2.2578125, 2.4794921875, 2.701171875, 2.9228515625, 3.14453125, 3.3662109375, 3.587890625, 3.8095703125, 4.03125, 4.2529296875, 4.474609375, 4.6962890625, 4.91796875, 5.1396484375, 5.361328125, 5.5830078125, 5.8046875, 6.0263671875, 6.248046875, 6.4697265625, 6.69140625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 7.0, 10.0, 20.0, 28.0, 67.0, 132.0, 369.0, 151.0, 83.0, 58.0, 23.0, 15.0, 10.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-258.5085144042969, -252.2935791015625, -246.07864379882812, -239.8636932373047, -233.6487579345703, -227.43382263183594, -221.2188720703125, -215.00393676757812, -208.78900146484375, -202.57406616210938, -196.359130859375, -190.14418029785156, -183.9292449951172, -177.7143096923828, -171.49935913085938, -165.284423828125, -159.06948852539062, -152.85455322265625, -146.63961791992188, -140.42466735839844, -134.20973205566406, -127.99479675292969, -121.77985382080078, -115.56491088867188, -109.3499755859375, -103.13504028320312, -96.92009735107422, -90.70515441894531, -84.49021911621094, -78.27528381347656, -72.06034088134766, -65.84539794921875, -59.63044738769531, -53.41550827026367, -47.20056915283203, -40.98563003540039, -34.77069091796875, -28.55575180053711, -22.34081268310547, -16.125873565673828, -9.910934448242188, -3.695995330810547, 2.5189437866210938, 8.733882904052734, 14.948822021484375, 21.163761138916016, 27.378700256347656, 33.5936393737793, 39.80857849121094, 46.02351760864258, 52.23845672607422, 58.45339584350586, 64.6683349609375, 70.88327026367188, 77.09821319580078, 83.31315612792969, 89.52809143066406, 95.74302673339844, 101.95796966552734, 108.17291259765625, 114.38784790039062, 120.602783203125, 126.8177261352539, 133.0326690673828, 139.2476043701172]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 10.0, 3.0, 18.0, 12.0, 14.0, 22.0, 21.0, 19.0, 24.0, 24.0, 24.0, 42.0, 46.0, 65.0, 142.0, 143.0, 78.0, 38.0, 36.0, 32.0, 33.0, 30.0, 24.0, 11.0, 18.0, 10.0, 10.0, 16.0, 7.0, 4.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.66050720214844, -119.08990478515625, -114.51929473876953, -109.94868469238281, -105.37808227539062, -100.80747985839844, -96.23686981201172, -91.666259765625, -87.09565734863281, -82.52505493164062, -77.9544448852539, -73.38383483886719, -68.813232421875, -64.24263000488281, -59.672019958496094, -55.10141372680664, -50.53080749511719, -45.960201263427734, -41.38959503173828, -36.81898880004883, -32.248382568359375, -27.677776336669922, -23.10717010498047, -18.536563873291016, -13.965957641601562, -9.39535140991211, -4.824745178222656, -0.2541389465332031, 4.31646728515625, 8.887073516845703, 13.457679748535156, 18.02828598022461, 22.598907470703125, 27.169513702392578, 31.74011993408203, 36.310726165771484, 40.88133239746094, 45.45193862915039, 50.022544860839844, 54.5931510925293, 59.16375732421875, 63.7343635559082, 68.30496978759766, 72.87557983398438, 77.44618225097656, 82.01678466796875, 86.58739471435547, 91.15800476074219, 95.72860717773438, 100.29920959472656, 104.86981964111328, 109.4404296875, 114.01103210449219, 118.58163452148438, 123.1522445678711, 127.72285461425781, 132.29345703125, 136.8640594482422, 141.43466186523438, 146.00527954101562, 150.5758819580078, 155.146484375, 159.71710205078125, 164.28770446777344, 168.85830688476562]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 13.0, 21.0, 39.0, 74.0, 145.0, 352.0, 639.0, 1501.0, 3563.0, 10010.0, 38426.0, 262930.0, 2154525.0, 1514291.0, 166774.0, 27896.0, 7952.0, 2863.0, 1153.0, 575.0, 267.0, 122.0, 78.0, 38.0, 19.0, 16.0, 5.0, 3.0, 3.0], "bins": [-31.0, -30.352783203125, -29.70556640625, -29.058349609375, -28.4111328125, -27.763916015625, -27.11669921875, -26.469482421875, -25.822265625, -25.175048828125, -24.52783203125, -23.880615234375, -23.2333984375, -22.586181640625, -21.93896484375, -21.291748046875, -20.64453125, -19.997314453125, -19.35009765625, -18.702880859375, -18.0556640625, -17.408447265625, -16.76123046875, -16.114013671875, -15.466796875, -14.819580078125, -14.17236328125, -13.525146484375, -12.8779296875, -12.230712890625, -11.58349609375, -10.936279296875, -10.2890625, -9.641845703125, -8.99462890625, -8.347412109375, -7.7001953125, -7.052978515625, -6.40576171875, -5.758544921875, -5.111328125, -4.464111328125, -3.81689453125, -3.169677734375, -2.5224609375, -1.875244140625, -1.22802734375, -0.580810546875, 0.06640625, 0.713623046875, 1.36083984375, 2.008056640625, 2.6552734375, 3.302490234375, 3.94970703125, 4.596923828125, 5.244140625, 5.891357421875, 6.53857421875, 7.185791015625, 7.8330078125, 8.480224609375, 9.12744140625, 9.774658203125, 10.421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 9.0, 7.0, 12.0, 13.0, 21.0, 16.0, 17.0, 17.0, 24.0, 22.0, 25.0, 41.0, 41.0, 30.0, 34.0, 42.0, 42.0, 48.0, 37.0, 58.0, 40.0, 38.0, 38.0, 37.0, 26.0, 33.0, 31.0, 37.0, 24.0, 24.0, 24.0, 18.0, 15.0, 13.0, 6.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7890625, -6.5433349609375, -6.297607421875, -6.0518798828125, -5.80615234375, -5.5604248046875, -5.314697265625, -5.0689697265625, -4.8232421875, -4.5775146484375, -4.331787109375, -4.0860595703125, -3.84033203125, -3.5946044921875, -3.348876953125, -3.1031494140625, -2.857421875, -2.6116943359375, -2.365966796875, -2.1202392578125, -1.87451171875, -1.6287841796875, -1.383056640625, -1.1373291015625, -0.8916015625, -0.6458740234375, -0.400146484375, -0.1544189453125, 0.09130859375, 0.3370361328125, 0.582763671875, 0.8284912109375, 1.07421875, 1.3199462890625, 1.565673828125, 1.8114013671875, 2.05712890625, 2.3028564453125, 2.548583984375, 2.7943115234375, 3.0400390625, 3.2857666015625, 3.531494140625, 3.7772216796875, 4.02294921875, 4.2686767578125, 4.514404296875, 4.7601318359375, 5.005859375, 5.2515869140625, 5.497314453125, 5.7430419921875, 5.98876953125, 6.2344970703125, 6.480224609375, 6.7259521484375, 6.9716796875, 7.2174072265625, 7.463134765625, 7.7088623046875, 7.95458984375, 8.2003173828125, 8.446044921875, 8.6917724609375, 8.9375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 8.0, 16.0, 22.0, 19.0, 37.0, 46.0, 69.0, 100.0, 127.0, 204.0, 338.0, 562.0, 1026.0, 2095.0, 5665.0, 23861.0, 288743.0, 3676634.0, 168450.0, 17538.0, 4594.0, 1790.0, 919.0, 483.0, 304.0, 185.0, 134.0, 98.0, 56.0, 38.0, 27.0, 21.0, 15.0, 10.0, 13.0, 7.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.6875, -34.650634765625, -33.61376953125, -32.576904296875, -31.5400390625, -30.503173828125, -29.46630859375, -28.429443359375, -27.392578125, -26.355712890625, -25.31884765625, -24.281982421875, -23.2451171875, -22.208251953125, -21.17138671875, -20.134521484375, -19.09765625, -18.060791015625, -17.02392578125, -15.987060546875, -14.9501953125, -13.913330078125, -12.87646484375, -11.839599609375, -10.802734375, -9.765869140625, -8.72900390625, -7.692138671875, -6.6552734375, -5.618408203125, -4.58154296875, -3.544677734375, -2.5078125, -1.470947265625, -0.43408203125, 0.602783203125, 1.6396484375, 2.676513671875, 3.71337890625, 4.750244140625, 5.787109375, 6.823974609375, 7.86083984375, 8.897705078125, 9.9345703125, 10.971435546875, 12.00830078125, 13.045166015625, 14.08203125, 15.118896484375, 16.15576171875, 17.192626953125, 18.2294921875, 19.266357421875, 20.30322265625, 21.340087890625, 22.376953125, 23.413818359375, 24.45068359375, 25.487548828125, 26.5244140625, 27.561279296875, 28.59814453125, 29.635009765625, 30.671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 3.0, 11.0, 16.0, 23.0, 23.0, 33.0, 41.0, 64.0, 84.0, 142.0, 204.0, 265.0, 356.0, 537.0, 659.0, 478.0, 330.0, 203.0, 181.0, 103.0, 83.0, 65.0, 50.0, 36.0, 23.0, 16.0, 11.0, 8.0, 1.0, 4.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.671875, -23.80322265625, -22.9345703125, -22.06591796875, -21.197265625, -20.32861328125, -19.4599609375, -18.59130859375, -17.72265625, -16.85400390625, -15.9853515625, -15.11669921875, -14.248046875, -13.37939453125, -12.5107421875, -11.64208984375, -10.7734375, -9.90478515625, -9.0361328125, -8.16748046875, -7.298828125, -6.43017578125, -5.5615234375, -4.69287109375, -3.82421875, -2.95556640625, -2.0869140625, -1.21826171875, -0.349609375, 0.51904296875, 1.3876953125, 2.25634765625, 3.125, 3.99365234375, 4.8623046875, 5.73095703125, 6.599609375, 7.46826171875, 8.3369140625, 9.20556640625, 10.07421875, 10.94287109375, 11.8115234375, 12.68017578125, 13.548828125, 14.41748046875, 15.2861328125, 16.15478515625, 17.0234375, 17.89208984375, 18.7607421875, 19.62939453125, 20.498046875, 21.36669921875, 22.2353515625, 23.10400390625, 23.97265625, 24.84130859375, 25.7099609375, 26.57861328125, 27.447265625, 28.31591796875, 29.1845703125, 30.05322265625, 30.921875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 13.0, 14.0, 28.0, 49.0, 80.0, 165.0, 236.0, 183.0, 86.0, 55.0, 27.0, 24.0, 12.0, 5.0, 6.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-474.1300964355469, -462.73638916015625, -451.34271240234375, -439.94903564453125, -428.5553283691406, -417.16162109375, -405.7679443359375, -394.374267578125, -382.9805603027344, -371.58685302734375, -360.19317626953125, -348.79949951171875, -337.4057922363281, -326.0120849609375, -314.618408203125, -303.2247314453125, -291.8310241699219, -280.43731689453125, -269.04364013671875, -257.64996337890625, -246.25625610351562, -234.86256408691406, -223.4688720703125, -212.07518005371094, -200.68148803710938, -189.2877960205078, -177.89410400390625, -166.5004119873047, -155.10671997070312, -143.71302795410156, -132.3193359375, -120.92564392089844, -109.53195190429688, -98.13825988769531, -86.74456787109375, -75.35087585449219, -63.957183837890625, -52.56349182128906, -41.1697998046875, -29.776107788085938, -18.382415771484375, -6.9887237548828125, 4.40496826171875, 15.798660278320312, 27.192352294921875, 38.58604431152344, 49.979736328125, 61.37342834472656, 72.76712036132812, 84.16081237792969, 95.55450439453125, 106.94819641113281, 118.34188842773438, 129.73558044433594, 141.1292724609375, 152.52296447753906, 163.91665649414062, 175.3103485107422, 186.70404052734375, 198.0977325439453, 209.49142456054688, 220.88511657714844, 232.27880859375, 243.67250061035156, 255.06619262695312]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 4.0, 6.0, 5.0, 11.0, 15.0, 16.0, 22.0, 24.0, 34.0, 25.0, 44.0, 37.0, 33.0, 47.0, 59.0, 76.0, 69.0, 64.0, 47.0, 45.0, 50.0, 48.0, 40.0, 35.0, 28.0, 30.0, 23.0, 18.0, 9.0, 8.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.65472412109375, -145.49755859375, -140.34039306640625, -135.18321228027344, -130.0260467529297, -124.86888122558594, -119.71171569824219, -114.55455017089844, -109.39737701416016, -104.2402114868164, -99.08303833007812, -93.92587280273438, -88.76870727539062, -83.61153411865234, -78.4543685913086, -73.29719543457031, -68.14002990722656, -62.98286056518555, -57.82569122314453, -52.66852569580078, -47.511356353759766, -42.35418701171875, -37.197021484375, -32.039852142333984, -26.88268280029297, -21.725513458251953, -16.56834602355957, -11.411177635192871, -6.254009246826172, -1.0968399047851562, 4.060327529907227, 9.21749496459961, 14.374664306640625, 19.53183364868164, 24.689001083374023, 29.846168518066406, 35.00333786010742, 40.16050720214844, 45.31767272949219, 50.4748420715332, 55.63201141357422, 60.789180755615234, 65.94635009765625, 71.103515625, 76.26068115234375, 81.41785430908203, 86.57501983642578, 91.73219299316406, 96.88935852050781, 102.04652404785156, 107.20369720458984, 112.3608627319336, 117.51803588867188, 122.67520141601562, 127.83236694335938, 132.98953247070312, 138.14669799804688, 143.30386352539062, 148.46102905273438, 153.6182098388672, 158.77537536621094, 163.9325408935547, 169.08970642089844, 174.2468719482422, 179.404052734375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 11.0, 12.0, 15.0, 39.0, 45.0, 88.0, 126.0, 211.0, 350.0, 593.0, 995.0, 1798.0, 3788.0, 8079.0, 22348.0, 87130.0, 671554.0, 191377.0, 37424.0, 11995.0, 5014.0, 2429.0, 1298.0, 722.0, 433.0, 259.0, 157.0, 83.0, 64.0, 33.0, 23.0, 18.0, 9.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-17.671875, -17.131591796875, -16.59130859375, -16.051025390625, -15.5107421875, -14.970458984375, -14.43017578125, -13.889892578125, -13.349609375, -12.809326171875, -12.26904296875, -11.728759765625, -11.1884765625, -10.648193359375, -10.10791015625, -9.567626953125, -9.02734375, -8.487060546875, -7.94677734375, -7.406494140625, -6.8662109375, -6.325927734375, -5.78564453125, -5.245361328125, -4.705078125, -4.164794921875, -3.62451171875, -3.084228515625, -2.5439453125, -2.003662109375, -1.46337890625, -0.923095703125, -0.3828125, 0.157470703125, 0.69775390625, 1.238037109375, 1.7783203125, 2.318603515625, 2.85888671875, 3.399169921875, 3.939453125, 4.479736328125, 5.02001953125, 5.560302734375, 6.1005859375, 6.640869140625, 7.18115234375, 7.721435546875, 8.26171875, 8.802001953125, 9.34228515625, 9.882568359375, 10.4228515625, 10.963134765625, 11.50341796875, 12.043701171875, 12.583984375, 13.124267578125, 13.66455078125, 14.204833984375, 14.7451171875, 15.285400390625, 15.82568359375, 16.365966796875, 16.90625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 13.0, 15.0, 12.0, 25.0, 32.0, 40.0, 52.0, 46.0, 55.0, 72.0, 71.0, 71.0, 73.0, 71.0, 62.0, 60.0, 49.0, 44.0, 33.0, 27.0, 23.0, 18.0, 8.0, 5.0, 10.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6953125, -12.2222900390625, -11.749267578125, -11.2762451171875, -10.80322265625, -10.3302001953125, -9.857177734375, -9.3841552734375, -8.9111328125, -8.4381103515625, -7.965087890625, -7.4920654296875, -7.01904296875, -6.5460205078125, -6.072998046875, -5.5999755859375, -5.126953125, -4.6539306640625, -4.180908203125, -3.7078857421875, -3.23486328125, -2.7618408203125, -2.288818359375, -1.8157958984375, -1.3427734375, -0.8697509765625, -0.396728515625, 0.0762939453125, 0.54931640625, 1.0223388671875, 1.495361328125, 1.9683837890625, 2.44140625, 2.9144287109375, 3.387451171875, 3.8604736328125, 4.33349609375, 4.8065185546875, 5.279541015625, 5.7525634765625, 6.2255859375, 6.6986083984375, 7.171630859375, 7.6446533203125, 8.11767578125, 8.5906982421875, 9.063720703125, 9.5367431640625, 10.009765625, 10.4827880859375, 10.955810546875, 11.4288330078125, 11.90185546875, 12.3748779296875, 12.847900390625, 13.3209228515625, 13.7939453125, 14.2669677734375, 14.739990234375, 15.2130126953125, 15.68603515625, 16.1590576171875, 16.632080078125, 17.1051025390625, 17.578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 6.0, 7.0, 2.0, 15.0, 10.0, 21.0, 25.0, 31.0, 56.0, 68.0, 79.0, 105.0, 136.0, 218.0, 394.0, 655.0, 1433.0, 3983.0, 16326.0, 136597.0, 847708.0, 30188.0, 6272.0, 2021.0, 876.0, 463.0, 249.0, 166.0, 125.0, 72.0, 44.0, 39.0, 50.0, 30.0, 21.0, 15.0, 9.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-18.53125, -17.955322265625, -17.37939453125, -16.803466796875, -16.2275390625, -15.651611328125, -15.07568359375, -14.499755859375, -13.923828125, -13.347900390625, -12.77197265625, -12.196044921875, -11.6201171875, -11.044189453125, -10.46826171875, -9.892333984375, -9.31640625, -8.740478515625, -8.16455078125, -7.588623046875, -7.0126953125, -6.436767578125, -5.86083984375, -5.284912109375, -4.708984375, -4.133056640625, -3.55712890625, -2.981201171875, -2.4052734375, -1.829345703125, -1.25341796875, -0.677490234375, -0.1015625, 0.474365234375, 1.05029296875, 1.626220703125, 2.2021484375, 2.778076171875, 3.35400390625, 3.929931640625, 4.505859375, 5.081787109375, 5.65771484375, 6.233642578125, 6.8095703125, 7.385498046875, 7.96142578125, 8.537353515625, 9.11328125, 9.689208984375, 10.26513671875, 10.841064453125, 11.4169921875, 11.992919921875, 12.56884765625, 13.144775390625, 13.720703125, 14.296630859375, 14.87255859375, 15.448486328125, 16.0244140625, 16.600341796875, 17.17626953125, 17.752197265625, 18.328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 5.0, 7.0, 11.0, 6.0, 12.0, 16.0, 13.0, 16.0, 10.0, 17.0, 18.0, 24.0, 30.0, 40.0, 57.0, 60.0, 58.0, 70.0, 76.0, 52.0, 82.0, 57.0, 31.0, 27.0, 27.0, 30.0, 22.0, 22.0, 7.0, 17.0, 13.0, 14.0, 6.0, 9.0, 10.0, 5.0, 5.0, 5.0, 0.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-36.375, -35.29052734375, -34.2060546875, -33.12158203125, -32.037109375, -30.95263671875, -29.8681640625, -28.78369140625, -27.69921875, -26.61474609375, -25.5302734375, -24.44580078125, -23.361328125, -22.27685546875, -21.1923828125, -20.10791015625, -19.0234375, -17.93896484375, -16.8544921875, -15.77001953125, -14.685546875, -13.60107421875, -12.5166015625, -11.43212890625, -10.34765625, -9.26318359375, -8.1787109375, -7.09423828125, -6.009765625, -4.92529296875, -3.8408203125, -2.75634765625, -1.671875, -0.58740234375, 0.4970703125, 1.58154296875, 2.666015625, 3.75048828125, 4.8349609375, 5.91943359375, 7.00390625, 8.08837890625, 9.1728515625, 10.25732421875, 11.341796875, 12.42626953125, 13.5107421875, 14.59521484375, 15.6796875, 16.76416015625, 17.8486328125, 18.93310546875, 20.017578125, 21.10205078125, 22.1865234375, 23.27099609375, 24.35546875, 25.43994140625, 26.5244140625, 27.60888671875, 28.693359375, 29.77783203125, 30.8623046875, 31.94677734375, 33.03125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 6.0, 5.0, 11.0, 21.0, 22.0, 19.0, 33.0, 53.0, 82.0, 101.0, 153.0, 264.0, 478.0, 880.0, 1905.0, 4061.0, 10970.0, 38237.0, 744950.0, 201056.0, 29259.0, 9028.0, 3398.0, 1600.0, 806.0, 371.0, 255.0, 158.0, 105.0, 61.0, 51.0, 38.0, 27.0, 22.0, 13.0, 13.0, 7.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.347869873046875, -2.27191162109375, -2.195953369140625, -2.1199951171875, -2.044036865234375, -1.96807861328125, -1.892120361328125, -1.816162109375, -1.740203857421875, -1.66424560546875, -1.588287353515625, -1.5123291015625, -1.436370849609375, -1.36041259765625, -1.284454345703125, -1.20849609375, -1.132537841796875, -1.05657958984375, -0.980621337890625, -0.9046630859375, -0.828704833984375, -0.75274658203125, -0.676788330078125, -0.600830078125, -0.524871826171875, -0.44891357421875, -0.372955322265625, -0.2969970703125, -0.221038818359375, -0.14508056640625, -0.069122314453125, 0.0068359375, 0.082794189453125, 0.15875244140625, 0.234710693359375, 0.3106689453125, 0.386627197265625, 0.46258544921875, 0.538543701171875, 0.614501953125, 0.690460205078125, 0.76641845703125, 0.842376708984375, 0.9183349609375, 0.994293212890625, 1.07025146484375, 1.146209716796875, 1.22216796875, 1.298126220703125, 1.37408447265625, 1.450042724609375, 1.5260009765625, 1.601959228515625, 1.67791748046875, 1.753875732421875, 1.829833984375, 1.905792236328125, 1.98175048828125, 2.057708740234375, 2.1336669921875, 2.209625244140625, 2.28558349609375, 2.361541748046875, 2.4375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 9.0, 7.0, 12.0, 16.0, 18.0, 20.0, 25.0, 28.0, 35.0, 46.0, 78.0, 87.0, 103.0, 110.0, 87.0, 51.0, 55.0, 41.0, 26.0, 17.0, 17.0, 19.0, 16.0, 7.0, 6.0, 9.0, 2.0, 5.0, 9.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005288124084472656, -0.0005111023783683777, -0.0004933923482894897, -0.0004756823182106018, -0.00045797228813171387, -0.00044026225805282593, -0.000422552227973938, -0.00040484219789505005, -0.0003871321678161621, -0.00036942213773727417, -0.00035171210765838623, -0.0003340020775794983, -0.00031629204750061035, -0.0002985820174217224, -0.00028087198734283447, -0.00026316195726394653, -0.0002454519271850586, -0.00022774189710617065, -0.00021003186702728271, -0.00019232183694839478, -0.00017461180686950684, -0.0001569017767906189, -0.00013919174671173096, -0.00012148171663284302, -0.00010377168655395508, -8.606165647506714e-05, -6.83516263961792e-05, -5.064159631729126e-05, -3.293156623840332e-05, -1.5221536159515381e-05, 2.4884939193725586e-06, 2.0198523998260498e-05, 3.790855407714844e-05, 5.561858415603638e-05, 7.332861423492432e-05, 9.103864431381226e-05, 0.0001087486743927002, 0.00012645870447158813, 0.00014416873455047607, 0.00016187876462936401, 0.00017958879470825195, 0.0001972988247871399, 0.00021500885486602783, 0.00023271888494491577, 0.0002504289150238037, 0.00026813894510269165, 0.0002858489751815796, 0.00030355900526046753, 0.00032126903533935547, 0.0003389790654182434, 0.00035668909549713135, 0.0003743991255760193, 0.0003921091556549072, 0.00040981918573379517, 0.0004275292158126831, 0.00044523924589157104, 0.000462949275970459, 0.0004806593060493469, 0.0004983693361282349, 0.0005160793662071228, 0.0005337893962860107, 0.0005514994263648987, 0.0005692094564437866, 0.0005869194865226746, 0.0006046295166015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 7.0, 16.0, 19.0, 36.0, 65.0, 120.0, 187.0, 384.0, 851.0, 1836.0, 5030.0, 16679.0, 86057.0, 862054.0, 55776.0, 12522.0, 3988.0, 1486.0, 676.0, 327.0, 175.0, 93.0, 63.0, 29.0, 20.0, 16.0, 12.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.158203125, -3.046966552734375, -2.93572998046875, -2.824493408203125, -2.7132568359375, -2.602020263671875, -2.49078369140625, -2.379547119140625, -2.268310546875, -2.157073974609375, -2.04583740234375, -1.934600830078125, -1.8233642578125, -1.712127685546875, -1.60089111328125, -1.489654541015625, -1.37841796875, -1.267181396484375, -1.15594482421875, -1.044708251953125, -0.9334716796875, -0.822235107421875, -0.71099853515625, -0.599761962890625, -0.488525390625, -0.377288818359375, -0.26605224609375, -0.154815673828125, -0.0435791015625, 0.067657470703125, 0.17889404296875, 0.290130615234375, 0.4013671875, 0.512603759765625, 0.62384033203125, 0.735076904296875, 0.8463134765625, 0.957550048828125, 1.06878662109375, 1.180023193359375, 1.291259765625, 1.402496337890625, 1.51373291015625, 1.624969482421875, 1.7362060546875, 1.847442626953125, 1.95867919921875, 2.069915771484375, 2.18115234375, 2.292388916015625, 2.40362548828125, 2.514862060546875, 2.6260986328125, 2.737335205078125, 2.84857177734375, 2.959808349609375, 3.071044921875, 3.182281494140625, 3.29351806640625, 3.404754638671875, 3.5159912109375, 3.627227783203125, 3.73846435546875, 3.849700927734375, 3.9609375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 4.0, 7.0, 10.0, 14.0, 21.0, 22.0, 31.0, 58.0, 63.0, 96.0, 142.0, 165.0, 107.0, 64.0, 53.0, 24.0, 34.0, 20.0, 13.0, 11.0, 4.0, 3.0, 2.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.953125, -3.83734130859375, -3.7215576171875, -3.60577392578125, -3.489990234375, -3.37420654296875, -3.2584228515625, -3.14263916015625, -3.02685546875, -2.91107177734375, -2.7952880859375, -2.67950439453125, -2.563720703125, -2.44793701171875, -2.3321533203125, -2.21636962890625, -2.1005859375, -1.98480224609375, -1.8690185546875, -1.75323486328125, -1.637451171875, -1.52166748046875, -1.4058837890625, -1.29010009765625, -1.17431640625, -1.05853271484375, -0.9427490234375, -0.82696533203125, -0.711181640625, -0.59539794921875, -0.4796142578125, -0.36383056640625, -0.248046875, -0.13226318359375, -0.0164794921875, 0.09930419921875, 0.215087890625, 0.33087158203125, 0.4466552734375, 0.56243896484375, 0.67822265625, 0.79400634765625, 0.9097900390625, 1.02557373046875, 1.141357421875, 1.25714111328125, 1.3729248046875, 1.48870849609375, 1.6044921875, 1.72027587890625, 1.8360595703125, 1.95184326171875, 2.067626953125, 2.18341064453125, 2.2991943359375, 2.41497802734375, 2.53076171875, 2.64654541015625, 2.7623291015625, 2.87811279296875, 2.993896484375, 3.10968017578125, 3.2254638671875, 3.34124755859375, 3.45703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 10.0, 18.0, 22.0, 49.0, 95.0, 518.0, 128.0, 78.0, 35.0, 20.0, 11.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.0834732055664, -79.3087387084961, -74.53401184082031, -69.75927734375, -64.98455047607422, -60.209815979003906, -55.43508529663086, -50.66035461425781, -45.885623931884766, -41.11089324951172, -36.33616256713867, -31.561429977416992, -26.786699295043945, -22.0119686126709, -17.23723602294922, -12.462505340576172, -7.687774658203125, -2.91304349899292, 1.8616876602172852, 6.636419296264648, 11.411149978637695, 16.185880661010742, 20.960613250732422, 25.73534393310547, 30.510074615478516, 35.28480529785156, 40.05953598022461, 44.834266662597656, 49.60900115966797, 54.38372802734375, 59.15846252441406, 63.93319320678711, 68.70793151855469, 73.482666015625, 78.25739288330078, 83.0321273803711, 87.80685424804688, 92.58158874511719, 97.3563232421875, 102.13105010986328, 106.90577697753906, 111.68051147460938, 116.45523834228516, 121.22997283935547, 126.00469970703125, 130.77943420410156, 135.55416870117188, 140.32888793945312, 145.1036376953125, 149.8783721923828, 154.65310668945312, 159.42782592773438, 164.2025604248047, 168.977294921875, 173.7520294189453, 178.52676391601562, 183.30148315429688, 188.0762176513672, 192.8509521484375, 197.62567138671875, 202.40040588378906, 207.17514038085938, 211.9498748779297, 216.724609375, 221.49932861328125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 3.0, 4.0, 10.0, 9.0, 13.0, 14.0, 14.0, 24.0, 20.0, 17.0, 20.0, 30.0, 28.0, 30.0, 75.0, 271.0, 152.0, 38.0, 26.0, 22.0, 22.0, 16.0, 17.0, 13.0, 15.0, 15.0, 8.0, 14.0, 11.0, 7.0, 7.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-91.51122283935547, -88.42182922363281, -85.33242797851562, -82.24303436279297, -79.15364074707031, -76.06424713134766, -72.974853515625, -69.88545227050781, -66.79605865478516, -63.7066650390625, -60.61726760864258, -57.527870178222656, -54.4384765625, -51.349082946777344, -48.25968551635742, -45.1702880859375, -42.080894470214844, -38.99150085449219, -35.902103424072266, -32.812705993652344, -29.723312377929688, -26.6339168548584, -23.54452133178711, -20.45512580871582, -17.36573028564453, -14.276334762573242, -11.186939239501953, -8.097543716430664, -5.008148193359375, -1.918752670288086, 1.1706428527832031, 4.260038375854492, 7.3494415283203125, 10.438837051391602, 13.52823257446289, 16.61762809753418, 19.70702362060547, 22.796419143676758, 25.885814666748047, 28.975210189819336, 32.064605712890625, 35.15399932861328, 38.2433967590332, 41.332794189453125, 44.42218780517578, 47.51158142089844, 50.60097885131836, 53.69037628173828, 56.77976989746094, 59.869163513183594, 62.958560943603516, 66.04795837402344, 69.1373519897461, 72.22674560546875, 75.31614685058594, 78.4055404663086, 81.49493408203125, 84.5843276977539, 87.67372131347656, 90.76312255859375, 93.8525161743164, 96.94190979003906, 100.03131103515625, 103.1207046508789, 106.21009826660156]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 9.0, 10.0, 11.0, 18.0, 15.0, 26.0, 22.0, 25.0, 34.0, 43.0, 44.0, 95.0, 278.0, 96.0, 42.0, 32.0, 30.0, 32.0, 28.0, 25.0, 22.0, 19.0, 13.0, 11.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-16.0625, -15.683837890625, -15.30517578125, -14.926513671875, -14.5478515625, -14.169189453125, -13.79052734375, -13.411865234375, -13.033203125, -12.654541015625, -12.27587890625, -11.897216796875, -11.5185546875, -11.139892578125, -10.76123046875, -10.382568359375, -10.00390625, -9.625244140625, -9.24658203125, -8.867919921875, -8.4892578125, -8.110595703125, -7.73193359375, -7.353271484375, -6.974609375, -6.595947265625, -6.21728515625, -5.838623046875, -5.4599609375, -5.081298828125, -4.70263671875, -4.323974609375, -3.9453125, -3.566650390625, -3.18798828125, -2.809326171875, -2.4306640625, -2.052001953125, -1.67333984375, -1.294677734375, -0.916015625, -0.537353515625, -0.15869140625, 0.219970703125, 0.5986328125, 0.977294921875, 1.35595703125, 1.734619140625, 2.11328125, 2.491943359375, 2.87060546875, 3.249267578125, 3.6279296875, 4.006591796875, 4.38525390625, 4.763916015625, 5.142578125, 5.521240234375, 5.89990234375, 6.278564453125, 6.6572265625, 7.035888671875, 7.41455078125, 7.793212890625, 8.171875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 11.0, 11.0, 18.0, 28.0, 48.0, 254.0, 1389.0, 68009.0, 8316406.0, 1992.0, 264.0, 92.0, 20.0, 23.0, 8.0, 2.0, 5.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-206.9556884765625, -199.58267211914062, -192.20965576171875, -184.83663940429688, -177.46360778808594, -170.09059143066406, -162.7175750732422, -155.3445587158203, -147.97152709960938, -140.5985107421875, -133.22549438476562, -125.85247039794922, -118.47944641113281, -111.10643005371094, -103.73341369628906, -96.36039733886719, -88.98738098144531, -81.61436462402344, -74.24134063720703, -66.86832427978516, -59.495304107666016, -52.122283935546875, -44.749267578125, -37.37624740600586, -30.00322723388672, -22.630207061767578, -15.25718879699707, -7.8841705322265625, -0.5111503601074219, 6.861869812011719, 14.234886169433594, 21.607906341552734, 28.980926513671875, 36.353946685791016, 43.726966857910156, 51.09998321533203, 58.47300338745117, 65.84602355957031, 73.21903991699219, 80.59205627441406, 87.96508026123047, 95.33809661865234, 102.71112060546875, 110.08413696289062, 117.4571533203125, 124.8301773071289, 132.20318603515625, 139.5762176513672, 146.94923400878906, 154.32225036621094, 161.6952667236328, 169.06829833984375, 176.44131469726562, 183.8143310546875, 191.18734741210938, 198.56036376953125, 205.93338012695312, 213.306396484375, 220.67941284179688, 228.05242919921875, 235.4254608154297, 242.79847717285156, 250.17149353027344, 257.5445251464844, 264.91754150390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 9.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 3.0, 9.0, 2.0, 3.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-117.1073226928711, -113.87486267089844, -110.64240264892578, -107.40994262695312, -104.177490234375, -100.94502258300781, -97.71257019042969, -94.48011016845703, -91.24765014648438, -88.01519012451172, -84.78273010253906, -81.5502700805664, -78.31781005859375, -75.08535766601562, -71.85289764404297, -68.62043762207031, -65.38797760009766, -62.155517578125, -58.923057556152344, -55.69060134887695, -52.4581413269043, -49.22568130493164, -45.99322509765625, -42.760765075683594, -39.52830505371094, -36.29584503173828, -33.063385009765625, -29.830928802490234, -26.598468780517578, -23.366008758544922, -20.1335506439209, -16.901092529296875, -13.668624877929688, -10.436165809631348, -7.203706741333008, -3.971247673034668, -0.7387886047363281, 2.493671417236328, 5.726129531860352, 8.958587646484375, 12.191047668457031, 15.423506736755371, 18.65596580505371, 21.888423919677734, 25.12088394165039, 28.353343963623047, 31.58580207824707, 34.818260192871094, 38.05072021484375, 41.283180236816406, 44.51564025878906, 47.74809646606445, 50.98055648803711, 54.213016510009766, 57.445472717285156, 60.67793273925781, 63.91039276123047, 67.14285278320312, 70.37531280517578, 73.60777282714844, 76.84022521972656, 80.07269287109375, 83.30514526367188, 86.53760528564453, 89.77006530761719]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 6.0, 6.0, 11.0, 17.0, 26.0, 34.0, 51.0, 49.0, 83.0, 116.0, 164.0, 313.0, 512.0, 975.0, 1878.0, 4154.0, 9291.0, 24172.0, 67859.0, 172170.0, 151046.0, 55741.0, 20094.0, 8048.0, 3597.0, 1635.0, 859.0, 451.0, 274.0, 184.0, 101.0, 74.0, 67.0, 54.0, 32.0, 33.0, 17.0, 14.0, 7.0, 11.0, 8.0, 8.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.3125, -63.12890625, -60.9453125, -58.76171875, -56.578125, -54.39453125, -52.2109375, -50.02734375, -47.84375, -45.66015625, -43.4765625, -41.29296875, -39.109375, -36.92578125, -34.7421875, -32.55859375, -30.375, -28.19140625, -26.0078125, -23.82421875, -21.640625, -19.45703125, -17.2734375, -15.08984375, -12.90625, -10.72265625, -8.5390625, -6.35546875, -4.171875, -1.98828125, 0.1953125, 2.37890625, 4.5625, 6.74609375, 8.9296875, 11.11328125, 13.296875, 15.48046875, 17.6640625, 19.84765625, 22.03125, 24.21484375, 26.3984375, 28.58203125, 30.765625, 32.94921875, 35.1328125, 37.31640625, 39.5, 41.68359375, 43.8671875, 46.05078125, 48.234375, 50.41796875, 52.6015625, 54.78515625, 56.96875, 59.15234375, 61.3359375, 63.51953125, 65.703125, 67.88671875, 70.0703125, 72.25390625, 74.4375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 27.0, 33.0, 42.0, 44.0, 58.0, 57.0, 77.0, 98.0, 84.0, 102.0, 78.0, 59.0, 53.0, 46.0, 23.0, 36.0, 9.0, 16.0, 8.0, 10.0, 7.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3828125, -10.8995361328125, -10.416259765625, -9.9329833984375, -9.44970703125, -8.9664306640625, -8.483154296875, -7.9998779296875, -7.5166015625, -7.0333251953125, -6.550048828125, -6.0667724609375, -5.58349609375, -5.1002197265625, -4.616943359375, -4.1336669921875, -3.650390625, -3.1671142578125, -2.683837890625, -2.2005615234375, -1.71728515625, -1.2340087890625, -0.750732421875, -0.2674560546875, 0.2158203125, 0.6990966796875, 1.182373046875, 1.6656494140625, 2.14892578125, 2.6322021484375, 3.115478515625, 3.5987548828125, 4.08203125, 4.5653076171875, 5.048583984375, 5.5318603515625, 6.01513671875, 6.4984130859375, 6.981689453125, 7.4649658203125, 7.9482421875, 8.4315185546875, 8.914794921875, 9.3980712890625, 9.88134765625, 10.3646240234375, 10.847900390625, 11.3311767578125, 11.814453125, 12.2977294921875, 12.781005859375, 13.2642822265625, 13.74755859375, 14.2308349609375, 14.714111328125, 15.1973876953125, 15.6806640625, 16.1639404296875, 16.647216796875, 17.1304931640625, 17.61376953125, 18.0970458984375, 18.580322265625, 19.0635986328125, 19.546875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 9.0, 16.0, 21.0, 40.0, 85.0, 121.0, 94.0, 37.0, 17.0, 12.0, 6.0, 6.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.69462585449219, -97.95364379882812, -94.21266174316406, -90.4716796875, -86.73069763183594, -82.98971557617188, -79.24874114990234, -75.50775909423828, -71.76677703857422, -68.02579498291016, -64.2848129272461, -60.5438346862793, -56.802852630615234, -53.06187057495117, -49.320892333984375, -45.57991027832031, -41.83892822265625, -38.09794616699219, -34.356964111328125, -30.615985870361328, -26.875003814697266, -23.134021759033203, -19.393041610717773, -15.652061462402344, -11.911079406738281, -8.170098304748535, -4.429117202758789, -0.688136100769043, 3.052845001220703, 6.793827056884766, 10.534807205200195, 14.275787353515625, 18.016769409179688, 21.75775146484375, 25.49873161315918, 29.23971176147461, 32.98069381713867, 36.721675872802734, 40.46265411376953, 44.203636169433594, 47.944618225097656, 51.68560028076172, 55.42658233642578, 59.16756057739258, 62.90854263305664, 66.64952087402344, 70.3905029296875, 74.13148498535156, 77.87246704101562, 81.61344909667969, 85.35443115234375, 89.09541320800781, 92.83639526367188, 96.57737731933594, 100.31835174560547, 104.05933380126953, 107.8003158569336, 111.54129791259766, 115.28227996826172, 119.02326202392578, 122.76423645019531, 126.50521850585938, 130.24620056152344, 133.9871826171875, 137.72816467285156]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 5.0, 8.0, 14.0, 20.0, 50.0, 65.0, 119.0, 86.0, 44.0, 19.0, 12.0, 6.0, 0.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-80.49037170410156, -78.2115707397461, -75.93276977539062, -73.65397644042969, -71.37517547607422, -69.09637451171875, -66.81758117675781, -64.53878021240234, -62.259979248046875, -59.981178283691406, -57.7023811340332, -55.423583984375, -53.14478302001953, -50.86598205566406, -48.58718490600586, -46.308387756347656, -44.02958679199219, -41.75078582763672, -39.471988677978516, -37.19319152832031, -34.914390563964844, -32.635589599609375, -30.356792449951172, -28.077993392944336, -25.7991943359375, -23.520395278930664, -21.241596221923828, -18.962797164916992, -16.683998107910156, -14.40519905090332, -12.126399993896484, -9.847600936889648, -7.568809509277344, -5.290010452270508, -3.011211395263672, -0.7324123382568359, 1.54638671875, 3.825185775756836, 6.103984832763672, 8.382783889770508, 10.661582946777344, 12.94038200378418, 15.219181060791016, 17.49798011779785, 19.776779174804688, 22.055578231811523, 24.33437728881836, 26.613176345825195, 28.89197540283203, 31.170774459838867, 33.4495735168457, 35.728370666503906, 38.007171630859375, 40.285972595214844, 42.56476974487305, 44.84356689453125, 47.12236785888672, 49.40116882324219, 51.67996597290039, 53.958763122558594, 56.23756408691406, 58.51636505126953, 60.795162200927734, 63.07395935058594, 65.3527603149414]}, "eval/loss": 6.072827339172363, "eval/wer": 1.0588923943885549, "eval/runtime": 715.4795, "eval/samples_per_second": 3.693, "eval/steps_per_second": 0.463} \ No newline at end of file