diff --git "a/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" "b/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" --- "a/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" +++ "b/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 5.6103, "train/learning_rate": 1.2676300578034681e-05, "train/epoch": 3.36, "train/global_step": 3000, "_runtime": 19632, "_timestamp": 1646247315, "_step": 3001, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 115.0, 20.0, 8.0, 4.0, 12.0, 3.0, 29578.0, 621.0, 60.0, 29.0, 15.0, 11.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.6875, -105.2666015625, -101.845703125, -98.4248046875, -95.00390625, -91.5830078125, -88.162109375, -84.7412109375, -81.3203125, -77.8994140625, -74.478515625, -71.0576171875, -67.63671875, -64.2158203125, -60.794921875, -57.3740234375, -53.953125, -50.5322265625, -47.111328125, -43.6904296875, -40.26953125, -36.8486328125, -33.427734375, -30.0068359375, -26.5859375, -23.1650390625, -19.744140625, -16.3232421875, -12.90234375, -9.4814453125, -6.060546875, -2.6396484375, 0.78125, 4.2021484375, 7.623046875, 11.0439453125, 14.46484375, 17.8857421875, 21.306640625, 24.7275390625, 28.1484375, 31.5693359375, 34.990234375, 38.4111328125, 41.83203125, 45.2529296875, 48.673828125, 52.0947265625, 55.515625, 58.9365234375, 62.357421875, 65.7783203125, 69.19921875, 72.6201171875, 76.041015625, 79.4619140625, 82.8828125, 86.3037109375, 89.724609375, 93.1455078125, 96.56640625, 99.9873046875, 103.408203125, 106.8291015625, 110.25]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 10.0, 6.0, 8.0, 14.0, 16.0, 18.0, 16.0, 20.0, 33.0, 33.0, 32.0, 23.0, 39.0, 38.0, 48.0, 45.0, 46.0, 44.0, 37.0, 53.0, 43.0, 51.0, 48.0, 28.0, 32.0, 30.0, 21.0, 25.0, 25.0, 22.0, 17.0, 9.0, 12.0, 10.0, 10.0, 8.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-32.042842864990234, -31.10605812072754, -30.169273376464844, -29.23248863220215, -28.295703887939453, -27.35892105102539, -26.422136306762695, -25.4853515625, -24.548566818237305, -23.61178207397461, -22.674997329711914, -21.73821258544922, -20.801429748535156, -19.864643096923828, -18.927860260009766, -17.99107551574707, -17.054290771484375, -16.11750602722168, -15.180721282958984, -14.243937492370605, -13.30715274810791, -12.370368003845215, -11.433584213256836, -10.49679946899414, -9.560014724731445, -8.62322998046875, -7.686445713043213, -6.749661445617676, -5.8128767013549805, -4.876091957092285, -3.939307689666748, -3.002523422241211, -2.0657386779785156, -1.1289541721343994, -0.1921696662902832, 0.744614839553833, 1.6813993453979492, 2.6181840896606445, 3.5549683570861816, 4.491752624511719, 5.428537368774414, 6.365322113037109, 7.3021063804626465, 8.238890647888184, 9.175675392150879, 10.112460136413574, 11.049243927001953, 11.986028671264648, 12.922813415527344, 13.859598159790039, 14.796382904052734, 15.733166694641113, 16.669952392578125, 17.606735229492188, 18.543519973754883, 19.480304718017578, 20.417089462280273, 21.35387420654297, 22.290658950805664, 23.22744369506836, 24.164226531982422, 25.10101318359375, 26.037796020507812, 26.974580764770508, 27.911365509033203]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 7.0, 6.0, 8.0, 15.0, 8.0, 11.0, 19.0, 15.0, 20.0, 20.0, 25.0, 33.0, 30.0, 30.0, 40.0, 29.0, 44.0, 41.0, 42.0, 43.0, 49.0, 32.0, 42.0, 46.0, 44.0, 28.0, 37.0, 29.0, 26.0, 20.0, 25.0, 23.0, 18.0, 22.0, 14.0, 10.0, 9.0, 5.0, 5.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-30.515663146972656, -29.6275634765625, -28.73946189880371, -27.851362228393555, -26.963260650634766, -26.07516098022461, -25.187061309814453, -24.298961639404297, -23.410860061645508, -22.52276039123535, -21.634658813476562, -20.746559143066406, -19.85845947265625, -18.97035789489746, -18.082258224487305, -17.194156646728516, -16.30605697631836, -15.417956352233887, -14.529855728149414, -13.641756057739258, -12.753655433654785, -11.865554809570312, -10.977455139160156, -10.089354515075684, -9.201253890991211, -8.313153266906738, -7.425053119659424, -6.536952972412109, -5.648852348327637, -4.760751724243164, -3.8726515769958496, -2.984551429748535, -2.0964488983154297, -1.2083485126495361, -0.3202481269836426, 0.567852258682251, 1.4559526443481445, 2.344053268432617, 3.2321534156799316, 4.120253562927246, 5.008354187011719, 5.896454811096191, 6.784554958343506, 7.67265510559082, 8.560755729675293, 9.448856353759766, 10.336956024169922, 11.225056648254395, 12.113157272338867, 13.00125789642334, 13.889358520507812, 14.777458190917969, 15.665558815002441, 16.553659439086914, 17.44175910949707, 18.32986068725586, 19.217960357666016, 20.106060028076172, 20.99416160583496, 21.882261276245117, 22.770362854003906, 23.658462524414062, 24.54656219482422, 25.434661865234375, 26.322763442993164]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 7.0, 7.0, 10.0, 14.0, 29.0, 43.0, 55.0, 80.0, 162.0, 232.0, 354.0, 553.0, 861.0, 1233.0, 1948.0, 2906.0, 4434.0, 6466.0, 10079.0, 14822.0, 21662.0, 30904.0, 43877.0, 61372.0, 82614.0, 111358.0, 162492.0, 140596.0, 99106.0, 73780.0, 54136.0, 38591.0, 27356.0, 18575.0, 12531.0, 8540.0, 5723.0, 3749.0, 2486.0, 1682.0, 1080.0, 679.0, 500.0, 307.0, 202.0, 124.0, 77.0, 57.0, 38.0, 26.0, 19.0, 10.0, 4.0, 8.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-74.4375, -72.021484375, -69.60546875, -67.189453125, -64.7734375, -62.357421875, -59.94140625, -57.525390625, -55.109375, -52.693359375, -50.27734375, -47.861328125, -45.4453125, -43.029296875, -40.61328125, -38.197265625, -35.78125, -33.365234375, -30.94921875, -28.533203125, -26.1171875, -23.701171875, -21.28515625, -18.869140625, -16.453125, -14.037109375, -11.62109375, -9.205078125, -6.7890625, -4.373046875, -1.95703125, 0.458984375, 2.875, 5.291015625, 7.70703125, 10.123046875, 12.5390625, 14.955078125, 17.37109375, 19.787109375, 22.203125, 24.619140625, 27.03515625, 29.451171875, 31.8671875, 34.283203125, 36.69921875, 39.115234375, 41.53125, 43.947265625, 46.36328125, 48.779296875, 51.1953125, 53.611328125, 56.02734375, 58.443359375, 60.859375, 63.275390625, 65.69140625, 68.107421875, 70.5234375, 72.939453125, 75.35546875, 77.771484375, 80.1875]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 6.0, 6.0, 6.0, 10.0, 7.0, 18.0, 9.0, 15.0, 24.0, 20.0, 37.0, 24.0, 47.0, 35.0, 43.0, 53.0, 71.0, 76.0, 63.0, 53.0, 49.0, 49.0, 34.0, 28.0, 33.0, 24.0, 24.0, 19.0, 14.0, 22.0, 14.0, 10.0, 6.0, 5.0, 9.0, 6.0, 7.0, 3.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-36.78125, -35.6630859375, -34.544921875, -33.4267578125, -32.30859375, -31.1904296875, -30.072265625, -28.9541015625, -27.8359375, -26.7177734375, -25.599609375, -24.4814453125, -23.36328125, -22.2451171875, -21.126953125, -20.0087890625, -18.890625, -17.7724609375, -16.654296875, -15.5361328125, -14.41796875, -13.2998046875, -12.181640625, -11.0634765625, -9.9453125, -8.8271484375, -7.708984375, -6.5908203125, -5.47265625, -4.3544921875, -3.236328125, -2.1181640625, -1.0, 0.1181640625, 1.236328125, 2.3544921875, 3.47265625, 4.5908203125, 5.708984375, 6.8271484375, 7.9453125, 9.0634765625, 10.181640625, 11.2998046875, 12.41796875, 13.5361328125, 14.654296875, 15.7724609375, 16.890625, 18.0087890625, 19.126953125, 20.2451171875, 21.36328125, 22.4814453125, 23.599609375, 24.7177734375, 25.8359375, 26.9541015625, 28.072265625, 29.1904296875, 30.30859375, 31.4267578125, 32.544921875, 33.6630859375, 34.78125]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 11.0, 13.0, 14.0, 20.0, 13.0, 14.0, 27.0, 30.0, 28.0, 36.0, 36.0, 38.0, 49.0, 51.0, 49.0, 55.0, 47.0, 51.0, 42.0, 34.0, 44.0, 47.0, 36.0, 30.0, 26.0, 17.0, 23.0, 20.0, 13.0, 22.0, 9.0, 12.0, 9.0, 10.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.344266891479492, -18.66748046875, -17.99069595336914, -17.31390953063965, -16.63712501525879, -15.960338592529297, -15.283553123474121, -14.606767654418945, -13.92998218536377, -13.253196716308594, -12.576411247253418, -11.899625778198242, -11.22283935546875, -10.54605484008789, -9.869268417358398, -9.192482948303223, -8.515697479248047, -7.838912010192871, -7.162126541137695, -6.485340595245361, -5.8085551261901855, -5.13176965713501, -4.454983711242676, -3.7781982421875, -3.101412773132324, -2.4246273040771484, -1.7478415966033936, -1.0710558891296387, -0.3942704200744629, 0.2825150489807129, 0.9593009948730469, 1.6360864639282227, 2.3128719329833984, 2.989657402038574, 3.666443109512329, 4.343228816986084, 5.02001428604126, 5.6967997550964355, 6.3735857009887695, 7.050371170043945, 7.727156639099121, 8.403942108154297, 9.080727577209473, 9.757513046264648, 10.43429946899414, 11.111083984375, 11.787870407104492, 12.464655876159668, 13.141441345214844, 13.81822681427002, 14.495012283325195, 15.171798706054688, 15.848583221435547, 16.52536964416504, 17.20215606689453, 17.87894058227539, 18.55572509765625, 19.232511520385742, 19.9092960357666, 20.586082458496094, 21.262866973876953, 21.939653396606445, 22.616439819335938, 23.293224334716797, 23.97001075744629]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 9.0, 15.0, 4.0, 10.0, 15.0, 7.0, 41.0, 23.0, 21.0, 28.0, 32.0, 35.0, 32.0, 46.0, 27.0, 34.0, 48.0, 49.0, 52.0, 42.0, 44.0, 44.0, 38.0, 36.0, 36.0, 28.0, 30.0, 16.0, 22.0, 19.0, 23.0, 15.0, 14.0, 9.0, 7.0, 10.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-22.075908660888672, -21.42017936706543, -20.764450073242188, -20.108722686767578, -19.452993392944336, -18.797264099121094, -18.14153480529785, -17.48580551147461, -16.830078125, -16.174348831176758, -15.518620491027832, -14.86289119720459, -14.207162857055664, -13.551433563232422, -12.89570426940918, -12.239975929260254, -11.584246635437012, -10.92851734161377, -10.272789001464844, -9.617059707641602, -8.961331367492676, -8.305602073669434, -7.64987325668335, -6.994144439697266, -6.338415622711182, -5.682686805725098, -5.026957988739014, -4.37122917175293, -3.7155001163482666, -3.0597712993621826, -2.4040422439575195, -1.7483134269714355, -1.0925846099853516, -0.4368557333946228, 0.21887314319610596, 0.8746020793914795, 1.5303308963775635, 2.1860597133636475, 2.8417887687683105, 3.4975175857543945, 4.1532464027404785, 4.8089752197265625, 5.4647040367126465, 6.1204328536987305, 6.776162147521973, 7.431890487670898, 8.08761978149414, 8.743349075317383, 9.399077415466309, 10.05480670928955, 10.710535049438477, 11.366264343261719, 12.021992683410645, 12.677721977233887, 13.333450317382812, 13.989179611206055, 14.644908905029297, 15.300638198852539, 15.956366539001465, 16.61209487915039, 17.267824172973633, 17.923553466796875, 18.579282760620117, 19.23501205444336, 19.89073944091797]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 6.0, 14.0, 31.0, 37.0, 59.0, 105.0, 192.0, 282.0, 495.0, 861.0, 1357.0, 2423.0, 4212.0, 7189.0, 12933.0, 23175.0, 42650.0, 79517.0, 152827.0, 293808.0, 537165.0, 807886.0, 855209.0, 621945.0, 350339.0, 185060.0, 96197.0, 51706.0, 28350.0, 15984.0, 9232.0, 5308.0, 3089.0, 1853.0, 1120.0, 647.0, 395.0, 247.0, 148.0, 88.0, 56.0, 30.0, 23.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.03125, -20.396728515625, -19.76220703125, -19.127685546875, -18.4931640625, -17.858642578125, -17.22412109375, -16.589599609375, -15.955078125, -15.320556640625, -14.68603515625, -14.051513671875, -13.4169921875, -12.782470703125, -12.14794921875, -11.513427734375, -10.87890625, -10.244384765625, -9.60986328125, -8.975341796875, -8.3408203125, -7.706298828125, -7.07177734375, -6.437255859375, -5.802734375, -5.168212890625, -4.53369140625, -3.899169921875, -3.2646484375, -2.630126953125, -1.99560546875, -1.361083984375, -0.7265625, -0.092041015625, 0.54248046875, 1.177001953125, 1.8115234375, 2.446044921875, 3.08056640625, 3.715087890625, 4.349609375, 4.984130859375, 5.61865234375, 6.253173828125, 6.8876953125, 7.522216796875, 8.15673828125, 8.791259765625, 9.42578125, 10.060302734375, 10.69482421875, 11.329345703125, 11.9638671875, 12.598388671875, 13.23291015625, 13.867431640625, 14.501953125, 15.136474609375, 15.77099609375, 16.405517578125, 17.0400390625, 17.674560546875, 18.30908203125, 18.943603515625, 19.578125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 11.0, 17.0, 13.0, 15.0, 23.0, 32.0, 31.0, 26.0, 32.0, 32.0, 36.0, 37.0, 39.0, 56.0, 46.0, 38.0, 46.0, 54.0, 38.0, 42.0, 53.0, 41.0, 40.0, 34.0, 25.0, 12.0, 17.0, 18.0, 14.0, 14.0, 17.0, 9.0, 5.0, 3.0, 3.0, 3.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-18.640625, -18.103271484375, -17.56591796875, -17.028564453125, -16.4912109375, -15.953857421875, -15.41650390625, -14.879150390625, -14.341796875, -13.804443359375, -13.26708984375, -12.729736328125, -12.1923828125, -11.655029296875, -11.11767578125, -10.580322265625, -10.04296875, -9.505615234375, -8.96826171875, -8.430908203125, -7.8935546875, -7.356201171875, -6.81884765625, -6.281494140625, -5.744140625, -5.206787109375, -4.66943359375, -4.132080078125, -3.5947265625, -3.057373046875, -2.52001953125, -1.982666015625, -1.4453125, -0.907958984375, -0.37060546875, 0.166748046875, 0.7041015625, 1.241455078125, 1.77880859375, 2.316162109375, 2.853515625, 3.390869140625, 3.92822265625, 4.465576171875, 5.0029296875, 5.540283203125, 6.07763671875, 6.614990234375, 7.15234375, 7.689697265625, 8.22705078125, 8.764404296875, 9.3017578125, 9.839111328125, 10.37646484375, 10.913818359375, 11.451171875, 11.988525390625, 12.52587890625, 13.063232421875, 13.6005859375, 14.137939453125, 14.67529296875, 15.212646484375, 15.75]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 15.0, 22.0, 39.0, 75.0, 125.0, 159.0, 270.0, 378.0, 647.0, 1048.0, 1570.0, 2430.0, 3906.0, 6174.0, 9456.0, 15329.0, 23765.0, 37307.0, 58889.0, 90935.0, 140572.0, 210006.0, 303380.0, 418462.0, 532376.0, 581784.0, 515354.0, 396383.0, 284679.0, 195733.0, 129250.0, 85166.0, 54117.0, 34766.0, 22035.0, 13678.0, 8777.0, 5524.0, 3483.0, 2226.0, 1429.0, 872.0, 647.0, 393.0, 226.0, 170.0, 90.0, 56.0, 40.0, 28.0, 21.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-14.546875, -14.0980224609375, -13.649169921875, -13.2003173828125, -12.75146484375, -12.3026123046875, -11.853759765625, -11.4049072265625, -10.9560546875, -10.5072021484375, -10.058349609375, -9.6094970703125, -9.16064453125, -8.7117919921875, -8.262939453125, -7.8140869140625, -7.365234375, -6.9163818359375, -6.467529296875, -6.0186767578125, -5.56982421875, -5.1209716796875, -4.672119140625, -4.2232666015625, -3.7744140625, -3.3255615234375, -2.876708984375, -2.4278564453125, -1.97900390625, -1.5301513671875, -1.081298828125, -0.6324462890625, -0.18359375, 0.2652587890625, 0.714111328125, 1.1629638671875, 1.61181640625, 2.0606689453125, 2.509521484375, 2.9583740234375, 3.4072265625, 3.8560791015625, 4.304931640625, 4.7537841796875, 5.20263671875, 5.6514892578125, 6.100341796875, 6.5491943359375, 6.998046875, 7.4468994140625, 7.895751953125, 8.3446044921875, 8.79345703125, 9.2423095703125, 9.691162109375, 10.1400146484375, 10.5888671875, 11.0377197265625, 11.486572265625, 11.9354248046875, 12.38427734375, 12.8331298828125, 13.281982421875, 13.7308349609375, 14.1796875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 1.0, 6.0, 14.0, 11.0, 12.0, 17.0, 22.0, 27.0, 36.0, 41.0, 67.0, 68.0, 88.0, 112.0, 117.0, 157.0, 170.0, 195.0, 226.0, 232.0, 259.0, 227.0, 222.0, 238.0, 208.0, 174.0, 149.0, 177.0, 111.0, 102.0, 96.0, 65.0, 75.0, 67.0, 55.0, 37.0, 41.0, 36.0, 23.0, 12.0, 13.0, 13.0, 9.0, 13.0, 10.0, 5.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-6.9140625, -6.70245361328125, -6.4908447265625, -6.27923583984375, -6.067626953125, -5.85601806640625, -5.6444091796875, -5.43280029296875, -5.22119140625, -5.00958251953125, -4.7979736328125, -4.58636474609375, -4.374755859375, -4.16314697265625, -3.9515380859375, -3.73992919921875, -3.5283203125, -3.31671142578125, -3.1051025390625, -2.89349365234375, -2.681884765625, -2.47027587890625, -2.2586669921875, -2.04705810546875, -1.83544921875, -1.62384033203125, -1.4122314453125, -1.20062255859375, -0.989013671875, -0.77740478515625, -0.5657958984375, -0.35418701171875, -0.142578125, 0.06903076171875, 0.2806396484375, 0.49224853515625, 0.703857421875, 0.91546630859375, 1.1270751953125, 1.33868408203125, 1.55029296875, 1.76190185546875, 1.9735107421875, 2.18511962890625, 2.396728515625, 2.60833740234375, 2.8199462890625, 3.03155517578125, 3.2431640625, 3.45477294921875, 3.6663818359375, 3.87799072265625, 4.089599609375, 4.30120849609375, 4.5128173828125, 4.72442626953125, 4.93603515625, 5.14764404296875, 5.3592529296875, 5.57086181640625, 5.782470703125, 5.99407958984375, 6.2056884765625, 6.41729736328125, 6.62890625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 7.0, 9.0, 7.0, 10.0, 11.0, 17.0, 7.0, 27.0, 18.0, 30.0, 29.0, 43.0, 27.0, 41.0, 39.0, 52.0, 48.0, 30.0, 46.0, 50.0, 43.0, 47.0, 34.0, 32.0, 44.0, 34.0, 28.0, 35.0, 21.0, 21.0, 16.0, 19.0, 20.0, 11.0, 7.0, 8.0, 7.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.748933792114258, -15.223359107971191, -14.697783470153809, -14.172208786010742, -13.64663314819336, -13.121058464050293, -12.595483779907227, -12.069908142089844, -11.544332504272461, -11.018757820129395, -10.493182182312012, -9.967607498168945, -9.442031860351562, -8.916457176208496, -8.39088249206543, -7.865306854248047, -7.3397321701049805, -6.814157009124756, -6.288581848144531, -5.763007164001465, -5.237431526184082, -4.711856842041016, -4.186281681060791, -3.6607065200805664, -3.135131359100342, -2.609556198120117, -2.0839810371398926, -1.558406114578247, -1.0328309535980225, -0.5072557926177979, 0.018319129943847656, 0.5438942909240723, 1.0694694519042969, 1.5950446128845215, 2.120619773864746, 2.6461946964263916, 3.171769857406616, 3.697345018386841, 4.222919940948486, 4.748495101928711, 5.2740702629089355, 5.79964542388916, 6.325220584869385, 6.850795745849609, 7.376370429992676, 7.901946067810059, 8.427520751953125, 8.953096389770508, 9.478671073913574, 10.00424575805664, 10.529821395874023, 11.05539608001709, 11.580971717834473, 12.106546401977539, 12.632122039794922, 13.157696723937988, 13.683271408081055, 14.208846092224121, 14.734421730041504, 15.25999641418457, 15.785572052001953, 16.311147689819336, 16.836721420288086, 17.36229705810547, 17.88787269592285]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 6.0, 13.0, 13.0, 16.0, 9.0, 13.0, 19.0, 27.0, 17.0, 30.0, 28.0, 37.0, 37.0, 47.0, 52.0, 57.0, 47.0, 50.0, 54.0, 54.0, 45.0, 49.0, 34.0, 35.0, 30.0, 19.0, 34.0, 23.0, 14.0, 15.0, 14.0, 9.0, 17.0, 13.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-21.823001861572266, -21.205474853515625, -20.58794593811035, -19.97041893005371, -19.352890014648438, -18.735363006591797, -18.117835998535156, -17.500308990478516, -16.882780075073242, -16.2652530670166, -15.647724151611328, -15.030197143554688, -14.41266918182373, -13.795141220092773, -13.177614212036133, -12.560086250305176, -11.942558288574219, -11.325030326843262, -10.707502365112305, -10.089975357055664, -9.472447395324707, -8.85491943359375, -8.23739242553711, -7.619864463806152, -7.002336502075195, -6.384808540344238, -5.7672810554504395, -5.149753570556641, -4.532225608825684, -3.9146978855133057, -3.2971701622009277, -2.679642677307129, -2.062114715576172, -1.444586992263794, -0.827059268951416, -0.20953154563903809, 0.40799617767333984, 1.0255239009857178, 1.6430516242980957, 2.2605791091918945, 2.8781070709228516, 3.4956347942352295, 4.113162517547607, 4.730690002441406, 5.348217964172363, 5.96574592590332, 6.583273410797119, 7.200800895690918, 7.818328857421875, 8.435856819152832, 9.053384780883789, 9.67091178894043, 10.288439750671387, 10.905967712402344, 11.523494720458984, 12.141022682189941, 12.758550643920898, 13.376078605651855, 13.993606567382812, 14.611133575439453, 15.22866153717041, 15.846189498901367, 16.463716506958008, 17.08124542236328, 17.698772430419922]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 9.0, 11.0, 11.0, 23.0, 29.0, 33.0, 41.0, 67.0, 87.0, 133.0, 195.0, 302.0, 433.0, 624.0, 895.0, 1298.0, 1892.0, 3101.0, 4777.0, 7865.0, 13244.0, 24214.0, 46140.0, 93741.0, 190326.0, 284290.0, 183217.0, 89874.0, 44264.0, 23399.0, 12948.0, 7438.0, 4583.0, 3015.0, 1940.0, 1384.0, 809.0, 562.0, 421.0, 287.0, 187.0, 140.0, 80.0, 78.0, 47.0, 26.0, 28.0, 19.0, 13.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.5703125, -14.12158203125, -13.6728515625, -13.22412109375, -12.775390625, -12.32666015625, -11.8779296875, -11.42919921875, -10.98046875, -10.53173828125, -10.0830078125, -9.63427734375, -9.185546875, -8.73681640625, -8.2880859375, -7.83935546875, -7.390625, -6.94189453125, -6.4931640625, -6.04443359375, -5.595703125, -5.14697265625, -4.6982421875, -4.24951171875, -3.80078125, -3.35205078125, -2.9033203125, -2.45458984375, -2.005859375, -1.55712890625, -1.1083984375, -0.65966796875, -0.2109375, 0.23779296875, 0.6865234375, 1.13525390625, 1.583984375, 2.03271484375, 2.4814453125, 2.93017578125, 3.37890625, 3.82763671875, 4.2763671875, 4.72509765625, 5.173828125, 5.62255859375, 6.0712890625, 6.52001953125, 6.96875, 7.41748046875, 7.8662109375, 8.31494140625, 8.763671875, 9.21240234375, 9.6611328125, 10.10986328125, 10.55859375, 11.00732421875, 11.4560546875, 11.90478515625, 12.353515625, 12.80224609375, 13.2509765625, 13.69970703125, 14.1484375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 13.0, 12.0, 16.0, 13.0, 20.0, 15.0, 20.0, 28.0, 26.0, 30.0, 33.0, 40.0, 48.0, 40.0, 49.0, 51.0, 48.0, 55.0, 49.0, 34.0, 47.0, 41.0, 27.0, 35.0, 32.0, 20.0, 25.0, 23.0, 12.0, 18.0, 15.0, 9.0, 6.0, 9.0, 4.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-20.453125, -19.878173828125, -19.30322265625, -18.728271484375, -18.1533203125, -17.578369140625, -17.00341796875, -16.428466796875, -15.853515625, -15.278564453125, -14.70361328125, -14.128662109375, -13.5537109375, -12.978759765625, -12.40380859375, -11.828857421875, -11.25390625, -10.678955078125, -10.10400390625, -9.529052734375, -8.9541015625, -8.379150390625, -7.80419921875, -7.229248046875, -6.654296875, -6.079345703125, -5.50439453125, -4.929443359375, -4.3544921875, -3.779541015625, -3.20458984375, -2.629638671875, -2.0546875, -1.479736328125, -0.90478515625, -0.329833984375, 0.2451171875, 0.820068359375, 1.39501953125, 1.969970703125, 2.544921875, 3.119873046875, 3.69482421875, 4.269775390625, 4.8447265625, 5.419677734375, 5.99462890625, 6.569580078125, 7.14453125, 7.719482421875, 8.29443359375, 8.869384765625, 9.4443359375, 10.019287109375, 10.59423828125, 11.169189453125, 11.744140625, 12.319091796875, 12.89404296875, 13.468994140625, 14.0439453125, 14.618896484375, 15.19384765625, 15.768798828125, 16.34375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 2.0, 11.0, 11.0, 9.0, 13.0, 17.0, 27.0, 29.0, 37.0, 58.0, 77.0, 96.0, 120.0, 183.0, 232.0, 347.0, 519.0, 732.0, 1149.0, 1873.0, 3287.0, 5970.0, 12040.0, 27855.0, 76869.0, 241048.0, 408303.0, 169295.0, 54903.0, 21424.0, 9448.0, 4906.0, 2763.0, 1637.0, 1051.0, 674.0, 425.0, 290.0, 197.0, 153.0, 140.0, 77.0, 77.0, 46.0, 37.0, 24.0, 21.0, 20.0, 12.0, 9.0, 5.0, 4.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.9609375, -11.5667724609375, -11.172607421875, -10.7784423828125, -10.38427734375, -9.9901123046875, -9.595947265625, -9.2017822265625, -8.8076171875, -8.4134521484375, -8.019287109375, -7.6251220703125, -7.23095703125, -6.8367919921875, -6.442626953125, -6.0484619140625, -5.654296875, -5.2601318359375, -4.865966796875, -4.4718017578125, -4.07763671875, -3.6834716796875, -3.289306640625, -2.8951416015625, -2.5009765625, -2.1068115234375, -1.712646484375, -1.3184814453125, -0.92431640625, -0.5301513671875, -0.135986328125, 0.2581787109375, 0.65234375, 1.0465087890625, 1.440673828125, 1.8348388671875, 2.22900390625, 2.6231689453125, 3.017333984375, 3.4114990234375, 3.8056640625, 4.1998291015625, 4.593994140625, 4.9881591796875, 5.38232421875, 5.7764892578125, 6.170654296875, 6.5648193359375, 6.958984375, 7.3531494140625, 7.747314453125, 8.1414794921875, 8.53564453125, 8.9298095703125, 9.323974609375, 9.7181396484375, 10.1123046875, 10.5064697265625, 10.900634765625, 11.2947998046875, 11.68896484375, 12.0831298828125, 12.477294921875, 12.8714599609375, 13.265625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 10.0, 6.0, 11.0, 8.0, 13.0, 9.0, 19.0, 20.0, 12.0, 16.0, 23.0, 22.0, 26.0, 35.0, 27.0, 35.0, 43.0, 35.0, 41.0, 26.0, 40.0, 32.0, 32.0, 36.0, 40.0, 39.0, 43.0, 28.0, 35.0, 27.0, 25.0, 26.0, 29.0, 14.0, 24.0, 19.0, 12.0, 14.0, 14.0, 8.0, 10.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.40625, -11.0323486328125, -10.658447265625, -10.2845458984375, -9.91064453125, -9.5367431640625, -9.162841796875, -8.7889404296875, -8.4150390625, -8.0411376953125, -7.667236328125, -7.2933349609375, -6.91943359375, -6.5455322265625, -6.171630859375, -5.7977294921875, -5.423828125, -5.0499267578125, -4.676025390625, -4.3021240234375, -3.92822265625, -3.5543212890625, -3.180419921875, -2.8065185546875, -2.4326171875, -2.0587158203125, -1.684814453125, -1.3109130859375, -0.93701171875, -0.5631103515625, -0.189208984375, 0.1846923828125, 0.55859375, 0.9324951171875, 1.306396484375, 1.6802978515625, 2.05419921875, 2.4281005859375, 2.802001953125, 3.1759033203125, 3.5498046875, 3.9237060546875, 4.297607421875, 4.6715087890625, 5.04541015625, 5.4193115234375, 5.793212890625, 6.1671142578125, 6.541015625, 6.9149169921875, 7.288818359375, 7.6627197265625, 8.03662109375, 8.4105224609375, 8.784423828125, 9.1583251953125, 9.5322265625, 9.9061279296875, 10.280029296875, 10.6539306640625, 11.02783203125, 11.4017333984375, 11.775634765625, 12.1495361328125, 12.5234375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 8.0, 18.0, 21.0, 27.0, 49.0, 66.0, 107.0, 141.0, 215.0, 359.0, 632.0, 1006.0, 2022.0, 4896.0, 18259.0, 766718.0, 233787.0, 12285.0, 3867.0, 1686.0, 885.0, 527.0, 290.0, 203.0, 134.0, 116.0, 55.0, 47.0, 26.0, 22.0, 16.0, 11.0, 14.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.03125, -29.99267578125, -28.9541015625, -27.91552734375, -26.876953125, -25.83837890625, -24.7998046875, -23.76123046875, -22.72265625, -21.68408203125, -20.6455078125, -19.60693359375, -18.568359375, -17.52978515625, -16.4912109375, -15.45263671875, -14.4140625, -13.37548828125, -12.3369140625, -11.29833984375, -10.259765625, -9.22119140625, -8.1826171875, -7.14404296875, -6.10546875, -5.06689453125, -4.0283203125, -2.98974609375, -1.951171875, -0.91259765625, 0.1259765625, 1.16455078125, 2.203125, 3.24169921875, 4.2802734375, 5.31884765625, 6.357421875, 7.39599609375, 8.4345703125, 9.47314453125, 10.51171875, 11.55029296875, 12.5888671875, 13.62744140625, 14.666015625, 15.70458984375, 16.7431640625, 17.78173828125, 18.8203125, 19.85888671875, 20.8974609375, 21.93603515625, 22.974609375, 24.01318359375, 25.0517578125, 26.09033203125, 27.12890625, 28.16748046875, 29.2060546875, 30.24462890625, 31.283203125, 32.32177734375, 33.3603515625, 34.39892578125, 35.4375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 3.0, 24.0, 131.0, 678.0, 102.0, 23.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027446746826171875, -0.0026104748249053955, -0.0024762749671936035, -0.0023420751094818115, -0.0022078752517700195, -0.0020736753940582275, -0.0019394755363464355, -0.0018052756786346436, -0.0016710758209228516, -0.0015368759632110596, -0.0014026761054992676, -0.0012684762477874756, -0.0011342763900756836, -0.0010000765323638916, -0.0008658766746520996, -0.0007316768169403076, -0.0005974769592285156, -0.00046327710151672363, -0.00032907724380493164, -0.00019487738609313965, -6.0677528381347656e-05, 7.352232933044434e-05, 0.00020772218704223633, 0.0003419220447540283, 0.0004761219024658203, 0.0006103217601776123, 0.0007445216178894043, 0.0008787214756011963, 0.0010129213333129883, 0.0011471211910247803, 0.0012813210487365723, 0.0014155209064483643, 0.0015497207641601562, 0.0016839206218719482, 0.0018181204795837402, 0.0019523203372955322, 0.0020865201950073242, 0.002220720052719116, 0.002354919910430908, 0.0024891197681427, 0.002623319625854492, 0.002757519483566284, 0.002891719341278076, 0.003025919198989868, 0.00316011905670166, 0.003294318914413452, 0.003428518772125244, 0.003562718629837036, 0.003696918487548828, 0.00383111834526062, 0.003965318202972412, 0.004099518060684204, 0.004233717918395996, 0.004367917776107788, 0.00450211763381958, 0.004636317491531372, 0.004770517349243164, 0.004904717206954956, 0.005038917064666748, 0.00517311692237854, 0.005307316780090332, 0.005441516637802124, 0.005575716495513916, 0.005709916353225708, 0.0058441162109375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 9.0, 11.0, 9.0, 19.0, 17.0, 34.0, 38.0, 56.0, 75.0, 100.0, 149.0, 209.0, 256.0, 350.0, 490.0, 719.0, 1042.0, 1459.0, 2110.0, 3047.0, 4633.0, 7486.0, 13898.0, 33250.0, 144098.0, 595652.0, 165366.0, 36258.0, 14599.0, 7842.0, 4872.0, 3095.0, 2165.0, 1451.0, 1009.0, 718.0, 561.0, 406.0, 260.0, 204.0, 148.0, 100.0, 84.0, 65.0, 42.0, 32.0, 20.0, 11.0, 19.0, 8.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5390625, -13.0806884765625, -12.622314453125, -12.1639404296875, -11.70556640625, -11.2471923828125, -10.788818359375, -10.3304443359375, -9.8720703125, -9.4136962890625, -8.955322265625, -8.4969482421875, -8.03857421875, -7.5802001953125, -7.121826171875, -6.6634521484375, -6.205078125, -5.7467041015625, -5.288330078125, -4.8299560546875, -4.37158203125, -3.9132080078125, -3.454833984375, -2.9964599609375, -2.5380859375, -2.0797119140625, -1.621337890625, -1.1629638671875, -0.70458984375, -0.2462158203125, 0.212158203125, 0.6705322265625, 1.12890625, 1.5872802734375, 2.045654296875, 2.5040283203125, 2.96240234375, 3.4207763671875, 3.879150390625, 4.3375244140625, 4.7958984375, 5.2542724609375, 5.712646484375, 6.1710205078125, 6.62939453125, 7.0877685546875, 7.546142578125, 8.0045166015625, 8.462890625, 8.9212646484375, 9.379638671875, 9.8380126953125, 10.29638671875, 10.7547607421875, 11.213134765625, 11.6715087890625, 12.1298828125, 12.5882568359375, 13.046630859375, 13.5050048828125, 13.96337890625, 14.4217529296875, 14.880126953125, 15.3385009765625, 15.796875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 2.0, 13.0, 15.0, 31.0, 50.0, 77.0, 168.0, 287.0, 155.0, 68.0, 35.0, 25.0, 13.0, 13.0, 10.0, 3.0, 6.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.8541259765625, -5.661376953125, -5.4686279296875, -5.27587890625, -5.0831298828125, -4.890380859375, -4.6976318359375, -4.5048828125, -4.3121337890625, -4.119384765625, -3.9266357421875, -3.73388671875, -3.5411376953125, -3.348388671875, -3.1556396484375, -2.962890625, -2.7701416015625, -2.577392578125, -2.3846435546875, -2.19189453125, -1.9991455078125, -1.806396484375, -1.6136474609375, -1.4208984375, -1.2281494140625, -1.035400390625, -0.8426513671875, -0.64990234375, -0.4571533203125, -0.264404296875, -0.0716552734375, 0.12109375, 0.3138427734375, 0.506591796875, 0.6993408203125, 0.89208984375, 1.0848388671875, 1.277587890625, 1.4703369140625, 1.6630859375, 1.8558349609375, 2.048583984375, 2.2413330078125, 2.43408203125, 2.6268310546875, 2.819580078125, 3.0123291015625, 3.205078125, 3.3978271484375, 3.590576171875, 3.7833251953125, 3.97607421875, 4.1688232421875, 4.361572265625, 4.5543212890625, 4.7470703125, 4.9398193359375, 5.132568359375, 5.3253173828125, 5.51806640625, 5.7108154296875, 5.903564453125, 6.0963134765625, 6.2890625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 4.0, 5.0, 8.0, 11.0, 7.0, 18.0, 20.0, 12.0, 16.0, 30.0, 27.0, 35.0, 37.0, 33.0, 48.0, 54.0, 54.0, 37.0, 36.0, 55.0, 42.0, 36.0, 44.0, 41.0, 35.0, 34.0, 34.0, 37.0, 28.0, 18.0, 21.0, 17.0, 14.0, 11.0, 9.0, 8.0, 2.0, 5.0, 2.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.02023696899414, -16.50851821899414, -15.996797561645508, -15.485077857971191, -14.973358154296875, -14.461638450622559, -13.949918746948242, -13.438199043273926, -12.92647933959961, -12.414759635925293, -11.903039932250977, -11.39132022857666, -10.879600524902344, -10.367880821228027, -9.856161117553711, -9.344441413879395, -8.832721710205078, -8.321002006530762, -7.809282302856445, -7.297562599182129, -6.7858428955078125, -6.274123191833496, -5.76240348815918, -5.250683784484863, -4.738964080810547, -4.2272443771362305, -3.715524673461914, -3.2038049697875977, -2.6920852661132812, -2.180365562438965, -1.6686458587646484, -1.156926155090332, -0.645207405090332, -0.13348770141601562, 0.3782320022583008, 0.8899517059326172, 1.4016714096069336, 1.91339111328125, 2.4251108169555664, 2.936830520629883, 3.448550224304199, 3.9602699279785156, 4.471989631652832, 4.983709335327148, 5.495429039001465, 6.007148742675781, 6.518868446350098, 7.030588150024414, 7.5423078536987305, 8.054027557373047, 8.565747261047363, 9.07746696472168, 9.589186668395996, 10.100906372070312, 10.612626075744629, 11.124345779418945, 11.636065483093262, 12.147785186767578, 12.659504890441895, 13.171224594116211, 13.682944297790527, 14.194664001464844, 14.70638370513916, 15.218103408813477, 15.729823112487793]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 6.0, 12.0, 12.0, 12.0, 14.0, 16.0, 20.0, 23.0, 22.0, 34.0, 36.0, 41.0, 47.0, 47.0, 53.0, 58.0, 59.0, 47.0, 60.0, 53.0, 39.0, 36.0, 29.0, 33.0, 27.0, 27.0, 25.0, 23.0, 15.0, 14.0, 12.0, 7.0, 8.0, 8.0, 2.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.799354553222656, -20.199270248413086, -19.599185943603516, -18.999099731445312, -18.399015426635742, -17.798931121826172, -17.1988468170166, -16.59876251220703, -15.998678207397461, -15.39859390258789, -14.798508644104004, -14.198424339294434, -13.598340034484863, -12.998254776000977, -12.398170471191406, -11.798086166381836, -11.19800090789795, -10.597916603088379, -9.997831344604492, -9.397747039794922, -8.797662734985352, -8.197578430175781, -7.5974931716918945, -6.997408866882324, -6.397324085235596, -5.797239303588867, -5.197154998779297, -4.597070217132568, -3.996985673904419, -3.3969011306762695, -2.796816349029541, -2.1967320442199707, -1.5966472625732422, -0.996562659740448, -0.3964780569076538, 0.20360660552978516, 0.8036911487579346, 1.403775691986084, 2.0038604736328125, 2.603944778442383, 3.2040295600891113, 3.8041141033172607, 4.40419864654541, 5.004283428192139, 5.604368209838867, 6.2044525146484375, 6.804537296295166, 7.404621601104736, 8.004706382751465, 8.604790687561035, 9.204875946044922, 9.804960250854492, 10.405044555664062, 11.005128860473633, 11.60521411895752, 12.20529842376709, 12.805383682250977, 13.405467987060547, 14.005553245544434, 14.605637550354004, 15.205721855163574, 15.805807113647461, 16.40589141845703, 17.0059757232666, 17.606060028076172]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 11.0, 9.0, 15.0, 17.0, 30.0, 38.0, 67.0, 77.0, 134.0, 185.0, 267.0, 418.0, 658.0, 958.0, 1531.0, 2269.0, 3741.0, 5901.0, 9594.0, 15843.0, 25250.0, 39920.0, 61277.0, 87046.0, 114544.0, 133484.0, 136631.0, 121699.0, 95426.0, 68536.0, 45566.0, 28998.0, 18314.0, 11227.0, 6857.0, 4379.0, 2715.0, 1741.0, 1045.0, 720.0, 421.0, 332.0, 224.0, 147.0, 87.0, 70.0, 41.0, 40.0, 19.0, 17.0, 11.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-18.65625, -18.093505859375, -17.53076171875, -16.968017578125, -16.4052734375, -15.842529296875, -15.27978515625, -14.717041015625, -14.154296875, -13.591552734375, -13.02880859375, -12.466064453125, -11.9033203125, -11.340576171875, -10.77783203125, -10.215087890625, -9.65234375, -9.089599609375, -8.52685546875, -7.964111328125, -7.4013671875, -6.838623046875, -6.27587890625, -5.713134765625, -5.150390625, -4.587646484375, -4.02490234375, -3.462158203125, -2.8994140625, -2.336669921875, -1.77392578125, -1.211181640625, -0.6484375, -0.085693359375, 0.47705078125, 1.039794921875, 1.6025390625, 2.165283203125, 2.72802734375, 3.290771484375, 3.853515625, 4.416259765625, 4.97900390625, 5.541748046875, 6.1044921875, 6.667236328125, 7.22998046875, 7.792724609375, 8.35546875, 8.918212890625, 9.48095703125, 10.043701171875, 10.6064453125, 11.169189453125, 11.73193359375, 12.294677734375, 12.857421875, 13.420166015625, 13.98291015625, 14.545654296875, 15.1083984375, 15.671142578125, 16.23388671875, 16.796630859375, 17.359375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 11.0, 10.0, 11.0, 20.0, 18.0, 18.0, 16.0, 27.0, 29.0, 36.0, 46.0, 51.0, 54.0, 62.0, 51.0, 53.0, 72.0, 41.0, 48.0, 33.0, 44.0, 40.0, 30.0, 34.0, 24.0, 23.0, 19.0, 16.0, 9.0, 12.0, 9.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.890625, -18.306884765625, -17.72314453125, -17.139404296875, -16.5556640625, -15.971923828125, -15.38818359375, -14.804443359375, -14.220703125, -13.636962890625, -13.05322265625, -12.469482421875, -11.8857421875, -11.302001953125, -10.71826171875, -10.134521484375, -9.55078125, -8.967041015625, -8.38330078125, -7.799560546875, -7.2158203125, -6.632080078125, -6.04833984375, -5.464599609375, -4.880859375, -4.297119140625, -3.71337890625, -3.129638671875, -2.5458984375, -1.962158203125, -1.37841796875, -0.794677734375, -0.2109375, 0.372802734375, 0.95654296875, 1.540283203125, 2.1240234375, 2.707763671875, 3.29150390625, 3.875244140625, 4.458984375, 5.042724609375, 5.62646484375, 6.210205078125, 6.7939453125, 7.377685546875, 7.96142578125, 8.545166015625, 9.12890625, 9.712646484375, 10.29638671875, 10.880126953125, 11.4638671875, 12.047607421875, 12.63134765625, 13.215087890625, 13.798828125, 14.382568359375, 14.96630859375, 15.550048828125, 16.1337890625, 16.717529296875, 17.30126953125, 17.885009765625, 18.46875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 9.0, 18.0, 17.0, 25.0, 39.0, 64.0, 101.0, 158.0, 209.0, 375.0, 602.0, 892.0, 1379.0, 2059.0, 3372.0, 5103.0, 7877.0, 12179.0, 18392.0, 27797.0, 40672.0, 58086.0, 77385.0, 98659.0, 114270.0, 120240.0, 113675.0, 96559.0, 75655.0, 55680.0, 39396.0, 26501.0, 17760.0, 11742.0, 7677.0, 4975.0, 3196.0, 2037.0, 1357.0, 831.0, 559.0, 344.0, 234.0, 142.0, 90.0, 65.0, 44.0, 23.0, 13.0, 11.0, 7.0, 3.0, 2.0, 3.0], "bins": [-17.65625, -17.158203125, -16.66015625, -16.162109375, -15.6640625, -15.166015625, -14.66796875, -14.169921875, -13.671875, -13.173828125, -12.67578125, -12.177734375, -11.6796875, -11.181640625, -10.68359375, -10.185546875, -9.6875, -9.189453125, -8.69140625, -8.193359375, -7.6953125, -7.197265625, -6.69921875, -6.201171875, -5.703125, -5.205078125, -4.70703125, -4.208984375, -3.7109375, -3.212890625, -2.71484375, -2.216796875, -1.71875, -1.220703125, -0.72265625, -0.224609375, 0.2734375, 0.771484375, 1.26953125, 1.767578125, 2.265625, 2.763671875, 3.26171875, 3.759765625, 4.2578125, 4.755859375, 5.25390625, 5.751953125, 6.25, 6.748046875, 7.24609375, 7.744140625, 8.2421875, 8.740234375, 9.23828125, 9.736328125, 10.234375, 10.732421875, 11.23046875, 11.728515625, 12.2265625, 12.724609375, 13.22265625, 13.720703125, 14.21875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 6.0, 5.0, 12.0, 3.0, 12.0, 8.0, 11.0, 13.0, 24.0, 20.0, 17.0, 22.0, 25.0, 27.0, 26.0, 35.0, 19.0, 28.0, 44.0, 26.0, 40.0, 35.0, 39.0, 41.0, 31.0, 33.0, 32.0, 34.0, 31.0, 31.0, 31.0, 30.0, 36.0, 27.0, 18.0, 19.0, 14.0, 13.0, 14.0, 5.0, 9.0, 9.0, 5.0, 10.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1875, -7.9085693359375, -7.629638671875, -7.3507080078125, -7.07177734375, -6.7928466796875, -6.513916015625, -6.2349853515625, -5.9560546875, -5.6771240234375, -5.398193359375, -5.1192626953125, -4.84033203125, -4.5614013671875, -4.282470703125, -4.0035400390625, -3.724609375, -3.4456787109375, -3.166748046875, -2.8878173828125, -2.60888671875, -2.3299560546875, -2.051025390625, -1.7720947265625, -1.4931640625, -1.2142333984375, -0.935302734375, -0.6563720703125, -0.37744140625, -0.0985107421875, 0.180419921875, 0.4593505859375, 0.73828125, 1.0172119140625, 1.296142578125, 1.5750732421875, 1.85400390625, 2.1329345703125, 2.411865234375, 2.6907958984375, 2.9697265625, 3.2486572265625, 3.527587890625, 3.8065185546875, 4.08544921875, 4.3643798828125, 4.643310546875, 4.9222412109375, 5.201171875, 5.4801025390625, 5.759033203125, 6.0379638671875, 6.31689453125, 6.5958251953125, 6.874755859375, 7.1536865234375, 7.4326171875, 7.7115478515625, 7.990478515625, 8.2694091796875, 8.54833984375, 8.8272705078125, 9.106201171875, 9.3851318359375, 9.6640625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 14.0, 8.0, 23.0, 33.0, 38.0, 51.0, 81.0, 128.0, 198.0, 309.0, 478.0, 787.0, 1191.0, 2200.0, 3762.0, 7241.0, 14055.0, 27844.0, 55226.0, 104056.0, 167104.0, 207927.0, 187634.0, 124762.0, 70264.0, 35192.0, 17508.0, 8897.0, 4766.0, 2621.0, 1579.0, 969.0, 572.0, 343.0, 217.0, 148.0, 99.0, 65.0, 54.0, 37.0, 26.0, 15.0, 11.0, 10.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.109375, -6.89178466796875, -6.6741943359375, -6.45660400390625, -6.239013671875, -6.02142333984375, -5.8038330078125, -5.58624267578125, -5.36865234375, -5.15106201171875, -4.9334716796875, -4.71588134765625, -4.498291015625, -4.28070068359375, -4.0631103515625, -3.84552001953125, -3.6279296875, -3.41033935546875, -3.1927490234375, -2.97515869140625, -2.757568359375, -2.53997802734375, -2.3223876953125, -2.10479736328125, -1.88720703125, -1.66961669921875, -1.4520263671875, -1.23443603515625, -1.016845703125, -0.79925537109375, -0.5816650390625, -0.36407470703125, -0.146484375, 0.07110595703125, 0.2886962890625, 0.50628662109375, 0.723876953125, 0.94146728515625, 1.1590576171875, 1.37664794921875, 1.59423828125, 1.81182861328125, 2.0294189453125, 2.24700927734375, 2.464599609375, 2.68218994140625, 2.8997802734375, 3.11737060546875, 3.3349609375, 3.55255126953125, 3.7701416015625, 3.98773193359375, 4.205322265625, 4.42291259765625, 4.6405029296875, 4.85809326171875, 5.07568359375, 5.29327392578125, 5.5108642578125, 5.72845458984375, 5.946044921875, 6.16363525390625, 6.3812255859375, 6.59881591796875, 6.81640625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 11.0, 12.0, 19.0, 18.0, 28.0, 37.0, 39.0, 62.0, 62.0, 65.0, 78.0, 56.0, 62.0, 74.0, 44.0, 56.0, 42.0, 32.0, 38.0, 27.0, 25.0, 21.0, 12.0, 14.0, 12.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006737709045410156, -0.0006525218486785889, -0.0006312727928161621, -0.0006100237369537354, -0.0005887746810913086, -0.0005675256252288818, -0.0005462765693664551, -0.0005250275135040283, -0.0005037784576416016, -0.0004825294017791748, -0.00046128034591674805, -0.0004400312900543213, -0.00041878223419189453, -0.0003975331783294678, -0.000376284122467041, -0.00035503506660461426, -0.0003337860107421875, -0.00031253695487976074, -0.000291287899017334, -0.0002700388431549072, -0.00024878978729248047, -0.0002275407314300537, -0.00020629167556762695, -0.0001850426197052002, -0.00016379356384277344, -0.00014254450798034668, -0.00012129545211791992, -0.00010004639625549316, -7.87973403930664e-05, -5.754828453063965e-05, -3.629922866821289e-05, -1.5050172805786133e-05, 6.198883056640625e-06, 2.7447938919067383e-05, 4.869699478149414e-05, 6.99460506439209e-05, 9.119510650634766e-05, 0.00011244416236877441, 0.00013369321823120117, 0.00015494227409362793, 0.0001761913299560547, 0.00019744038581848145, 0.0002186894416809082, 0.00023993849754333496, 0.0002611875534057617, 0.0002824366092681885, 0.00030368566513061523, 0.000324934720993042, 0.00034618377685546875, 0.0003674328327178955, 0.00038868188858032227, 0.000409930944442749, 0.0004311800003051758, 0.00045242905616760254, 0.0004736781120300293, 0.0004949271678924561, 0.0005161762237548828, 0.0005374252796173096, 0.0005586743354797363, 0.0005799233913421631, 0.0006011724472045898, 0.0006224215030670166, 0.0006436705589294434, 0.0006649196147918701, 0.0006861686706542969]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 18.0, 29.0, 27.0, 37.0, 71.0, 90.0, 145.0, 179.0, 279.0, 534.0, 803.0, 1359.0, 2214.0, 3509.0, 6041.0, 10106.0, 16622.0, 26758.0, 42480.0, 65035.0, 91459.0, 118986.0, 135882.0, 136224.0, 118794.0, 91879.0, 65804.0, 43446.0, 27236.0, 16736.0, 10137.0, 6173.0, 3715.0, 2169.0, 1323.0, 819.0, 520.0, 328.0, 206.0, 138.0, 84.0, 57.0, 27.0, 25.0, 14.0, 7.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.35546875, -4.21502685546875, -4.0745849609375, -3.93414306640625, -3.793701171875, -3.65325927734375, -3.5128173828125, -3.37237548828125, -3.23193359375, -3.09149169921875, -2.9510498046875, -2.81060791015625, -2.670166015625, -2.52972412109375, -2.3892822265625, -2.24884033203125, -2.1083984375, -1.96795654296875, -1.8275146484375, -1.68707275390625, -1.546630859375, -1.40618896484375, -1.2657470703125, -1.12530517578125, -0.98486328125, -0.84442138671875, -0.7039794921875, -0.56353759765625, -0.423095703125, -0.28265380859375, -0.1422119140625, -0.00177001953125, 0.138671875, 0.27911376953125, 0.4195556640625, 0.55999755859375, 0.700439453125, 0.84088134765625, 0.9813232421875, 1.12176513671875, 1.26220703125, 1.40264892578125, 1.5430908203125, 1.68353271484375, 1.823974609375, 1.96441650390625, 2.1048583984375, 2.24530029296875, 2.3857421875, 2.52618408203125, 2.6666259765625, 2.80706787109375, 2.947509765625, 3.08795166015625, 3.2283935546875, 3.36883544921875, 3.50927734375, 3.64971923828125, 3.7901611328125, 3.93060302734375, 4.071044921875, 4.21148681640625, 4.3519287109375, 4.49237060546875, 4.6328125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 9.0, 13.0, 15.0, 20.0, 19.0, 25.0, 25.0, 24.0, 30.0, 38.0, 55.0, 44.0, 47.0, 44.0, 51.0, 54.0, 55.0, 56.0, 49.0, 44.0, 44.0, 33.0, 25.0, 26.0, 29.0, 20.0, 20.0, 10.0, 15.0, 8.0, 9.0, 9.0, 4.0, 3.0, 7.0, 3.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.8203125, -1.7631072998046875, -1.705902099609375, -1.6486968994140625, -1.59149169921875, -1.5342864990234375, -1.477081298828125, -1.4198760986328125, -1.3626708984375, -1.3054656982421875, -1.248260498046875, -1.1910552978515625, -1.13385009765625, -1.0766448974609375, -1.019439697265625, -0.9622344970703125, -0.905029296875, -0.8478240966796875, -0.790618896484375, -0.7334136962890625, -0.67620849609375, -0.6190032958984375, -0.561798095703125, -0.5045928955078125, -0.4473876953125, -0.3901824951171875, -0.332977294921875, -0.2757720947265625, -0.21856689453125, -0.1613616943359375, -0.104156494140625, -0.0469512939453125, 0.01025390625, 0.0674591064453125, 0.124664306640625, 0.1818695068359375, 0.23907470703125, 0.2962799072265625, 0.353485107421875, 0.4106903076171875, 0.4678955078125, 0.5251007080078125, 0.582305908203125, 0.6395111083984375, 0.69671630859375, 0.7539215087890625, 0.811126708984375, 0.8683319091796875, 0.925537109375, 0.9827423095703125, 1.039947509765625, 1.0971527099609375, 1.15435791015625, 1.2115631103515625, 1.268768310546875, 1.3259735107421875, 1.3831787109375, 1.4403839111328125, 1.497589111328125, 1.5547943115234375, 1.61199951171875, 1.6692047119140625, 1.726409912109375, 1.7836151123046875, 1.8408203125]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 12.0, 21.0, 17.0, 16.0, 12.0, 28.0, 28.0, 36.0, 34.0, 21.0, 36.0, 38.0, 44.0, 42.0, 44.0, 41.0, 36.0, 41.0, 30.0, 40.0, 39.0, 44.0, 40.0, 32.0, 34.0, 23.0, 24.0, 25.0, 19.0, 14.0, 12.0, 13.0, 7.0, 7.0, 4.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.889809608459473, -14.443861961364746, -13.99791431427002, -13.551966667175293, -13.106019020080566, -12.66007137298584, -12.21412467956543, -11.768177032470703, -11.322229385375977, -10.87628173828125, -10.430334091186523, -9.984386444091797, -9.53843879699707, -9.092491149902344, -8.646543502807617, -8.20059585571289, -7.754648208618164, -7.3087005615234375, -6.862752914428711, -6.416805267333984, -5.970857620239258, -5.524909973144531, -5.078962802886963, -4.633015155792236, -4.18706750869751, -3.741119861602783, -3.2951722145080566, -2.849224805831909, -2.4032771587371826, -1.957329511642456, -1.5113821029663086, -1.065434455871582, -0.6194877624511719, -0.1735401749610901, 0.2724074125289917, 0.7183549404144287, 1.1643025875091553, 1.6102502346038818, 2.0561976432800293, 2.502145290374756, 2.9480929374694824, 3.394040584564209, 3.8399882316589355, 4.285935401916504, 4.7318830490112305, 5.177830696105957, 5.623778343200684, 6.06972599029541, 6.515673637390137, 6.961621284484863, 7.40756893157959, 7.853516578674316, 8.299464225769043, 8.74541187286377, 9.19135856628418, 9.637306213378906, 10.083253860473633, 10.52920150756836, 10.975149154663086, 11.421096801757812, 11.867044448852539, 12.312992095947266, 12.758939743041992, 13.204887390136719, 13.650835037231445]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 8.0, 11.0, 11.0, 20.0, 20.0, 18.0, 25.0, 40.0, 28.0, 30.0, 34.0, 39.0, 43.0, 47.0, 37.0, 64.0, 54.0, 45.0, 46.0, 41.0, 49.0, 33.0, 38.0, 34.0, 25.0, 27.0, 28.0, 21.0, 15.0, 10.0, 8.0, 12.0, 6.0, 7.0, 1.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.127422332763672, -20.53099250793457, -19.93456268310547, -19.338132858276367, -18.741703033447266, -18.145273208618164, -17.548843383789062, -16.95241355895996, -16.35598373413086, -15.759553909301758, -15.163124084472656, -14.566694259643555, -13.970264434814453, -13.373834609985352, -12.77740478515625, -12.180974960327148, -11.584545135498047, -10.988115310668945, -10.391685485839844, -9.795255661010742, -9.19882583618164, -8.602396011352539, -8.005966186523438, -7.409536361694336, -6.813106536865234, -6.216676712036133, -5.620246887207031, -5.02381706237793, -4.427387237548828, -3.8309574127197266, -3.234527587890625, -2.6380977630615234, -2.041666030883789, -1.4452362060546875, -0.8488063812255859, -0.2523765563964844, 0.3440532684326172, 0.9404830932617188, 1.5369129180908203, 2.133342742919922, 2.7297725677490234, 3.326202392578125, 3.9226322174072266, 4.519062042236328, 5.11549186706543, 5.711921691894531, 6.308351516723633, 6.904781341552734, 7.501211166381836, 8.097640991210938, 8.694070816040039, 9.29050064086914, 9.886930465698242, 10.483360290527344, 11.079790115356445, 11.676219940185547, 12.272649765014648, 12.86907958984375, 13.465509414672852, 14.061939239501953, 14.658369064331055, 15.254798889160156, 15.851228713989258, 16.44765853881836, 17.04408836364746]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 14.0, 19.0, 35.0, 53.0, 80.0, 131.0, 240.0, 391.0, 607.0, 1004.0, 1637.0, 2506.0, 4329.0, 6930.0, 11178.0, 18774.0, 30753.0, 50651.0, 82819.0, 134466.0, 209781.0, 318596.0, 445751.0, 553626.0, 590985.0, 532430.0, 413621.0, 287514.0, 187742.0, 118582.0, 72915.0, 45054.0, 27392.0, 16893.0, 10170.0, 6219.0, 3941.0, 2445.0, 1464.0, 948.0, 575.0, 419.0, 224.0, 144.0, 91.0, 55.0, 38.0, 21.0, 12.0, 10.0, 4.0, 4.0, 3.0], "bins": [-13.265625, -12.8907470703125, -12.515869140625, -12.1409912109375, -11.76611328125, -11.3912353515625, -11.016357421875, -10.6414794921875, -10.2666015625, -9.8917236328125, -9.516845703125, -9.1419677734375, -8.76708984375, -8.3922119140625, -8.017333984375, -7.6424560546875, -7.267578125, -6.8927001953125, -6.517822265625, -6.1429443359375, -5.76806640625, -5.3931884765625, -5.018310546875, -4.6434326171875, -4.2685546875, -3.8936767578125, -3.518798828125, -3.1439208984375, -2.76904296875, -2.3941650390625, -2.019287109375, -1.6444091796875, -1.26953125, -0.8946533203125, -0.519775390625, -0.1448974609375, 0.22998046875, 0.6048583984375, 0.979736328125, 1.3546142578125, 1.7294921875, 2.1043701171875, 2.479248046875, 2.8541259765625, 3.22900390625, 3.6038818359375, 3.978759765625, 4.3536376953125, 4.728515625, 5.1033935546875, 5.478271484375, 5.8531494140625, 6.22802734375, 6.6029052734375, 6.977783203125, 7.3526611328125, 7.7275390625, 8.1024169921875, 8.477294921875, 8.8521728515625, 9.22705078125, 9.6019287109375, 9.976806640625, 10.3516845703125, 10.7265625]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 10.0, 8.0, 19.0, 25.0, 22.0, 13.0, 24.0, 40.0, 32.0, 33.0, 31.0, 41.0, 56.0, 49.0, 48.0, 60.0, 42.0, 43.0, 45.0, 43.0, 55.0, 40.0, 30.0, 32.0, 26.0, 19.0, 17.0, 20.0, 11.0, 15.0, 8.0, 10.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.984375, -14.5416259765625, -14.098876953125, -13.6561279296875, -13.21337890625, -12.7706298828125, -12.327880859375, -11.8851318359375, -11.4423828125, -10.9996337890625, -10.556884765625, -10.1141357421875, -9.67138671875, -9.2286376953125, -8.785888671875, -8.3431396484375, -7.900390625, -7.4576416015625, -7.014892578125, -6.5721435546875, -6.12939453125, -5.6866455078125, -5.243896484375, -4.8011474609375, -4.3583984375, -3.9156494140625, -3.472900390625, -3.0301513671875, -2.58740234375, -2.1446533203125, -1.701904296875, -1.2591552734375, -0.81640625, -0.3736572265625, 0.069091796875, 0.5118408203125, 0.95458984375, 1.3973388671875, 1.840087890625, 2.2828369140625, 2.7255859375, 3.1683349609375, 3.611083984375, 4.0538330078125, 4.49658203125, 4.9393310546875, 5.382080078125, 5.8248291015625, 6.267578125, 6.7103271484375, 7.153076171875, 7.5958251953125, 8.03857421875, 8.4813232421875, 8.924072265625, 9.3668212890625, 9.8095703125, 10.2523193359375, 10.695068359375, 11.1378173828125, 11.58056640625, 12.0233154296875, 12.466064453125, 12.9088134765625, 13.3515625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 8.0, 5.0, 23.0, 38.0, 45.0, 73.0, 138.0, 201.0, 328.0, 558.0, 878.0, 1616.0, 2604.0, 4301.0, 7329.0, 12016.0, 19943.0, 32449.0, 52773.0, 83084.0, 129202.0, 192535.0, 273582.0, 364797.0, 450880.0, 503107.0, 498907.0, 439299.0, 353504.0, 260875.0, 182402.0, 121573.0, 79104.0, 49192.0, 30989.0, 18414.0, 11061.0, 6540.0, 3957.0, 2340.0, 1446.0, 855.0, 515.0, 324.0, 181.0, 120.0, 56.0, 44.0, 23.0, 19.0, 8.0, 9.0, 8.0, 2.0, 5.0, 2.0], "bins": [-11.328125, -10.9942626953125, -10.660400390625, -10.3265380859375, -9.99267578125, -9.6588134765625, -9.324951171875, -8.9910888671875, -8.6572265625, -8.3233642578125, -7.989501953125, -7.6556396484375, -7.32177734375, -6.9879150390625, -6.654052734375, -6.3201904296875, -5.986328125, -5.6524658203125, -5.318603515625, -4.9847412109375, -4.65087890625, -4.3170166015625, -3.983154296875, -3.6492919921875, -3.3154296875, -2.9815673828125, -2.647705078125, -2.3138427734375, -1.97998046875, -1.6461181640625, -1.312255859375, -0.9783935546875, -0.64453125, -0.3106689453125, 0.023193359375, 0.3570556640625, 0.69091796875, 1.0247802734375, 1.358642578125, 1.6925048828125, 2.0263671875, 2.3602294921875, 2.694091796875, 3.0279541015625, 3.36181640625, 3.6956787109375, 4.029541015625, 4.3634033203125, 4.697265625, 5.0311279296875, 5.364990234375, 5.6988525390625, 6.03271484375, 6.3665771484375, 6.700439453125, 7.0343017578125, 7.3681640625, 7.7020263671875, 8.035888671875, 8.3697509765625, 8.70361328125, 9.0374755859375, 9.371337890625, 9.7052001953125, 10.0390625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 6.0, 9.0, 21.0, 26.0, 39.0, 37.0, 54.0, 70.0, 82.0, 96.0, 115.0, 134.0, 141.0, 192.0, 196.0, 225.0, 232.0, 255.0, 228.0, 241.0, 224.0, 221.0, 209.0, 151.0, 139.0, 130.0, 111.0, 111.0, 76.0, 53.0, 58.0, 40.0, 38.0, 28.0, 22.0, 13.0, 7.0, 7.0, 6.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.88671875, -4.7044677734375, -4.522216796875, -4.3399658203125, -4.15771484375, -3.9754638671875, -3.793212890625, -3.6109619140625, -3.4287109375, -3.2464599609375, -3.064208984375, -2.8819580078125, -2.69970703125, -2.5174560546875, -2.335205078125, -2.1529541015625, -1.970703125, -1.7884521484375, -1.606201171875, -1.4239501953125, -1.24169921875, -1.0594482421875, -0.877197265625, -0.6949462890625, -0.5126953125, -0.3304443359375, -0.148193359375, 0.0340576171875, 0.21630859375, 0.3985595703125, 0.580810546875, 0.7630615234375, 0.9453125, 1.1275634765625, 1.309814453125, 1.4920654296875, 1.67431640625, 1.8565673828125, 2.038818359375, 2.2210693359375, 2.4033203125, 2.5855712890625, 2.767822265625, 2.9500732421875, 3.13232421875, 3.3145751953125, 3.496826171875, 3.6790771484375, 3.861328125, 4.0435791015625, 4.225830078125, 4.4080810546875, 4.59033203125, 4.7725830078125, 4.954833984375, 5.1370849609375, 5.3193359375, 5.5015869140625, 5.683837890625, 5.8660888671875, 6.04833984375, 6.2305908203125, 6.412841796875, 6.5950927734375, 6.77734375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 14.0, 9.0, 11.0, 14.0, 20.0, 31.0, 20.0, 27.0, 21.0, 30.0, 32.0, 29.0, 40.0, 40.0, 55.0, 42.0, 34.0, 46.0, 44.0, 56.0, 39.0, 45.0, 41.0, 29.0, 26.0, 28.0, 22.0, 24.0, 14.0, 17.0, 18.0, 11.0, 8.0, 13.0, 10.0, 6.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.307266235351562, -12.910691261291504, -12.514116287231445, -12.117541313171387, -11.720966339111328, -11.324392318725586, -10.927816390991211, -10.531242370605469, -10.13466739654541, -9.738092422485352, -9.341517448425293, -8.944942474365234, -8.548367500305176, -8.151792526245117, -7.755218029022217, -7.358643531799316, -6.9620680809021, -6.565493106842041, -6.168918132781982, -5.772343635559082, -5.375768661499023, -4.979193687438965, -4.582618713378906, -4.186043739318848, -3.789469003677368, -3.3928940296173096, -2.99631929397583, -2.5997443199157715, -2.203169345855713, -1.8065946102142334, -1.4100196361541748, -1.0134449005126953, -0.6168699264526367, -0.2202950417995453, 0.17627984285354614, 0.57285475730896, 0.969429612159729, 1.366004467010498, 1.7625794410705566, 2.159154176712036, 2.5557291507720947, 2.9523041248321533, 3.348878860473633, 3.7454538345336914, 4.14202880859375, 4.538603782653809, 4.935178756713867, 5.331753253936768, 5.728328227996826, 6.124903202056885, 6.521478176116943, 6.918052673339844, 7.314627647399902, 7.711202621459961, 8.10777759552002, 8.504352569580078, 8.900927543640137, 9.297502517700195, 9.694077491760254, 10.090652465820312, 10.487227439880371, 10.88380241394043, 11.280376434326172, 11.67695140838623, 12.073526382446289]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 3.0, 4.0, 2.0, 10.0, 13.0, 11.0, 19.0, 17.0, 18.0, 25.0, 36.0, 24.0, 28.0, 27.0, 31.0, 45.0, 45.0, 47.0, 55.0, 54.0, 46.0, 40.0, 53.0, 42.0, 38.0, 29.0, 40.0, 25.0, 28.0, 29.0, 19.0, 22.0, 16.0, 15.0, 10.0, 6.0, 4.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.20598316192627, -14.741365432739258, -14.276748657226562, -13.812131881713867, -13.347514152526855, -12.882896423339844, -12.418279647827148, -11.953662872314453, -11.489045143127441, -11.02442741394043, -10.559810638427734, -10.095193862915039, -9.630576133728027, -9.165958404541016, -8.70134162902832, -8.236724853515625, -7.772107124328613, -7.30748987197876, -6.842872619628906, -6.378255367279053, -5.913638114929199, -5.449020862579346, -4.984403610229492, -4.519786357879639, -4.055169105529785, -3.5905518531799316, -3.125934600830078, -2.6613173484802246, -2.196700096130371, -1.7320828437805176, -1.267465591430664, -0.8028483390808105, -0.33823108673095703, 0.12638616561889648, 0.59100341796875, 1.0556206703186035, 1.520237922668457, 1.9848551750183105, 2.449472427368164, 2.9140896797180176, 3.378706932067871, 3.8433241844177246, 4.307941436767578, 4.772558689117432, 5.237175941467285, 5.701793193817139, 6.166410446166992, 6.631027698516846, 7.095644950866699, 7.560262203216553, 8.024879455566406, 8.489496231079102, 8.954113960266113, 9.418731689453125, 9.88334846496582, 10.347965240478516, 10.812582969665527, 11.277200698852539, 11.741817474365234, 12.20643424987793, 12.671051979064941, 13.135669708251953, 13.600286483764648, 14.064903259277344, 14.529520988464355]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 11.0, 8.0, 19.0, 19.0, 25.0, 47.0, 69.0, 93.0, 133.0, 180.0, 281.0, 422.0, 696.0, 1038.0, 1717.0, 2718.0, 4874.0, 9962.0, 21857.0, 52042.0, 134601.0, 309362.0, 294365.0, 123965.0, 48544.0, 20289.0, 9402.0, 4701.0, 2610.0, 1581.0, 956.0, 643.0, 409.0, 303.0, 185.0, 113.0, 89.0, 57.0, 44.0, 27.0, 21.0, 21.0, 13.0, 6.0, 7.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.65625, -14.1976318359375, -13.739013671875, -13.2803955078125, -12.82177734375, -12.3631591796875, -11.904541015625, -11.4459228515625, -10.9873046875, -10.5286865234375, -10.070068359375, -9.6114501953125, -9.15283203125, -8.6942138671875, -8.235595703125, -7.7769775390625, -7.318359375, -6.8597412109375, -6.401123046875, -5.9425048828125, -5.48388671875, -5.0252685546875, -4.566650390625, -4.1080322265625, -3.6494140625, -3.1907958984375, -2.732177734375, -2.2735595703125, -1.81494140625, -1.3563232421875, -0.897705078125, -0.4390869140625, 0.01953125, 0.4781494140625, 0.936767578125, 1.3953857421875, 1.85400390625, 2.3126220703125, 2.771240234375, 3.2298583984375, 3.6884765625, 4.1470947265625, 4.605712890625, 5.0643310546875, 5.52294921875, 5.9815673828125, 6.440185546875, 6.8988037109375, 7.357421875, 7.8160400390625, 8.274658203125, 8.7332763671875, 9.19189453125, 9.6505126953125, 10.109130859375, 10.5677490234375, 11.0263671875, 11.4849853515625, 11.943603515625, 12.4022216796875, 12.86083984375, 13.3194580078125, 13.778076171875, 14.2366943359375, 14.6953125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 10.0, 5.0, 10.0, 18.0, 15.0, 23.0, 19.0, 22.0, 34.0, 29.0, 32.0, 40.0, 50.0, 38.0, 35.0, 52.0, 56.0, 61.0, 46.0, 49.0, 34.0, 45.0, 33.0, 42.0, 23.0, 27.0, 28.0, 23.0, 20.0, 13.0, 13.0, 9.0, 7.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-16.484375, -16.009033203125, -15.53369140625, -15.058349609375, -14.5830078125, -14.107666015625, -13.63232421875, -13.156982421875, -12.681640625, -12.206298828125, -11.73095703125, -11.255615234375, -10.7802734375, -10.304931640625, -9.82958984375, -9.354248046875, -8.87890625, -8.403564453125, -7.92822265625, -7.452880859375, -6.9775390625, -6.502197265625, -6.02685546875, -5.551513671875, -5.076171875, -4.600830078125, -4.12548828125, -3.650146484375, -3.1748046875, -2.699462890625, -2.22412109375, -1.748779296875, -1.2734375, -0.798095703125, -0.32275390625, 0.152587890625, 0.6279296875, 1.103271484375, 1.57861328125, 2.053955078125, 2.529296875, 3.004638671875, 3.47998046875, 3.955322265625, 4.4306640625, 4.906005859375, 5.38134765625, 5.856689453125, 6.33203125, 6.807373046875, 7.28271484375, 7.758056640625, 8.2333984375, 8.708740234375, 9.18408203125, 9.659423828125, 10.134765625, 10.610107421875, 11.08544921875, 11.560791015625, 12.0361328125, 12.511474609375, 12.98681640625, 13.462158203125, 13.9375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 12.0, 15.0, 23.0, 31.0, 39.0, 59.0, 63.0, 92.0, 131.0, 157.0, 231.0, 361.0, 558.0, 818.0, 1218.0, 2113.0, 3568.0, 6373.0, 12771.0, 27552.0, 70038.0, 197946.0, 377960.0, 212721.0, 74743.0, 29470.0, 13219.0, 6677.0, 3544.0, 2080.0, 1277.0, 841.0, 550.0, 377.0, 256.0, 175.0, 147.0, 89.0, 63.0, 62.0, 28.0, 30.0, 17.0, 17.0, 14.0, 11.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-10.34375, -10.0157470703125, -9.687744140625, -9.3597412109375, -9.03173828125, -8.7037353515625, -8.375732421875, -8.0477294921875, -7.7197265625, -7.3917236328125, -7.063720703125, -6.7357177734375, -6.40771484375, -6.0797119140625, -5.751708984375, -5.4237060546875, -5.095703125, -4.7677001953125, -4.439697265625, -4.1116943359375, -3.78369140625, -3.4556884765625, -3.127685546875, -2.7996826171875, -2.4716796875, -2.1436767578125, -1.815673828125, -1.4876708984375, -1.15966796875, -0.8316650390625, -0.503662109375, -0.1756591796875, 0.15234375, 0.4803466796875, 0.808349609375, 1.1363525390625, 1.46435546875, 1.7923583984375, 2.120361328125, 2.4483642578125, 2.7763671875, 3.1043701171875, 3.432373046875, 3.7603759765625, 4.08837890625, 4.4163818359375, 4.744384765625, 5.0723876953125, 5.400390625, 5.7283935546875, 6.056396484375, 6.3843994140625, 6.71240234375, 7.0404052734375, 7.368408203125, 7.6964111328125, 8.0244140625, 8.3524169921875, 8.680419921875, 9.0084228515625, 9.33642578125, 9.6644287109375, 9.992431640625, 10.3204345703125, 10.6484375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 9.0, 9.0, 8.0, 15.0, 15.0, 15.0, 17.0, 15.0, 19.0, 28.0, 23.0, 26.0, 27.0, 33.0, 45.0, 39.0, 46.0, 54.0, 44.0, 40.0, 31.0, 45.0, 34.0, 35.0, 31.0, 35.0, 36.0, 31.0, 24.0, 24.0, 15.0, 25.0, 10.0, 23.0, 14.0, 10.0, 11.0, 5.0, 7.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5625, -9.237060546875, -8.91162109375, -8.586181640625, -8.2607421875, -7.935302734375, -7.60986328125, -7.284423828125, -6.958984375, -6.633544921875, -6.30810546875, -5.982666015625, -5.6572265625, -5.331787109375, -5.00634765625, -4.680908203125, -4.35546875, -4.030029296875, -3.70458984375, -3.379150390625, -3.0537109375, -2.728271484375, -2.40283203125, -2.077392578125, -1.751953125, -1.426513671875, -1.10107421875, -0.775634765625, -0.4501953125, -0.124755859375, 0.20068359375, 0.526123046875, 0.8515625, 1.177001953125, 1.50244140625, 1.827880859375, 2.1533203125, 2.478759765625, 2.80419921875, 3.129638671875, 3.455078125, 3.780517578125, 4.10595703125, 4.431396484375, 4.7568359375, 5.082275390625, 5.40771484375, 5.733154296875, 6.05859375, 6.384033203125, 6.70947265625, 7.034912109375, 7.3603515625, 7.685791015625, 8.01123046875, 8.336669921875, 8.662109375, 8.987548828125, 9.31298828125, 9.638427734375, 9.9638671875, 10.289306640625, 10.61474609375, 10.940185546875, 11.265625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 9.0, 17.0, 14.0, 28.0, 40.0, 45.0, 56.0, 73.0, 117.0, 164.0, 247.0, 445.0, 674.0, 1137.0, 2285.0, 5311.0, 15582.0, 87733.0, 785862.0, 118405.0, 18605.0, 5946.0, 2493.0, 1269.0, 691.0, 417.0, 261.0, 180.0, 135.0, 91.0, 63.0, 54.0, 22.0, 16.0, 15.0, 12.0, 11.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.78125, -14.3408203125, -13.900390625, -13.4599609375, -13.01953125, -12.5791015625, -12.138671875, -11.6982421875, -11.2578125, -10.8173828125, -10.376953125, -9.9365234375, -9.49609375, -9.0556640625, -8.615234375, -8.1748046875, -7.734375, -7.2939453125, -6.853515625, -6.4130859375, -5.97265625, -5.5322265625, -5.091796875, -4.6513671875, -4.2109375, -3.7705078125, -3.330078125, -2.8896484375, -2.44921875, -2.0087890625, -1.568359375, -1.1279296875, -0.6875, -0.2470703125, 0.193359375, 0.6337890625, 1.07421875, 1.5146484375, 1.955078125, 2.3955078125, 2.8359375, 3.2763671875, 3.716796875, 4.1572265625, 4.59765625, 5.0380859375, 5.478515625, 5.9189453125, 6.359375, 6.7998046875, 7.240234375, 7.6806640625, 8.12109375, 8.5615234375, 9.001953125, 9.4423828125, 9.8828125, 10.3232421875, 10.763671875, 11.2041015625, 11.64453125, 12.0849609375, 12.525390625, 12.9658203125, 13.40625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 13.0, 23.0, 32.0, 40.0, 69.0, 126.0, 155.0, 191.0, 112.0, 67.0, 52.0, 34.0, 16.0, 15.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008001327514648438, -0.0007715821266174316, -0.0007430315017700195, -0.0007144808769226074, -0.0006859302520751953, -0.0006573796272277832, -0.0006288290023803711, -0.000600278377532959, -0.0005717277526855469, -0.0005431771278381348, -0.0005146265029907227, -0.00048607587814331055, -0.00045752525329589844, -0.00042897462844848633, -0.0004004240036010742, -0.0003718733787536621, -0.00034332275390625, -0.0003147721290588379, -0.0002862215042114258, -0.00025767087936401367, -0.00022912025451660156, -0.00020056962966918945, -0.00017201900482177734, -0.00014346837997436523, -0.00011491775512695312, -8.636713027954102e-05, -5.7816505432128906e-05, -2.9265880584716797e-05, -7.152557373046875e-07, 2.7835369110107422e-05, 5.638599395751953e-05, 8.493661880493164e-05, 0.00011348724365234375, 0.00014203786849975586, 0.00017058849334716797, 0.00019913911819458008, 0.0002276897430419922, 0.0002562403678894043, 0.0002847909927368164, 0.0003133416175842285, 0.0003418922424316406, 0.00037044286727905273, 0.00039899349212646484, 0.00042754411697387695, 0.00045609474182128906, 0.00048464536666870117, 0.0005131959915161133, 0.0005417466163635254, 0.0005702972412109375, 0.0005988478660583496, 0.0006273984909057617, 0.0006559491157531738, 0.0006844997406005859, 0.000713050365447998, 0.0007416009902954102, 0.0007701516151428223, 0.0007987022399902344, 0.0008272528648376465, 0.0008558034896850586, 0.0008843541145324707, 0.0009129047393798828, 0.0009414553642272949, 0.000970005989074707, 0.0009985566139221191, 0.0010271072387695312]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 12.0, 29.0, 34.0, 36.0, 79.0, 132.0, 153.0, 301.0, 462.0, 719.0, 1232.0, 1926.0, 3353.0, 5913.0, 10990.0, 22801.0, 58060.0, 185172.0, 453739.0, 193955.0, 59947.0, 23592.0, 11215.0, 6027.0, 3471.0, 1971.0, 1209.0, 736.0, 450.0, 288.0, 178.0, 103.0, 83.0, 38.0, 34.0, 31.0, 21.0, 11.0, 6.0, 9.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.52587890625, -9.2236328125, -8.92138671875, -8.619140625, -8.31689453125, -8.0146484375, -7.71240234375, -7.41015625, -7.10791015625, -6.8056640625, -6.50341796875, -6.201171875, -5.89892578125, -5.5966796875, -5.29443359375, -4.9921875, -4.68994140625, -4.3876953125, -4.08544921875, -3.783203125, -3.48095703125, -3.1787109375, -2.87646484375, -2.57421875, -2.27197265625, -1.9697265625, -1.66748046875, -1.365234375, -1.06298828125, -0.7607421875, -0.45849609375, -0.15625, 0.14599609375, 0.4482421875, 0.75048828125, 1.052734375, 1.35498046875, 1.6572265625, 1.95947265625, 2.26171875, 2.56396484375, 2.8662109375, 3.16845703125, 3.470703125, 3.77294921875, 4.0751953125, 4.37744140625, 4.6796875, 4.98193359375, 5.2841796875, 5.58642578125, 5.888671875, 6.19091796875, 6.4931640625, 6.79541015625, 7.09765625, 7.39990234375, 7.7021484375, 8.00439453125, 8.306640625, 8.60888671875, 8.9111328125, 9.21337890625, 9.515625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 3.0, 7.0, 6.0, 18.0, 11.0, 17.0, 30.0, 31.0, 46.0, 41.0, 65.0, 89.0, 123.0, 121.0, 92.0, 47.0, 48.0, 37.0, 35.0, 28.0, 19.0, 15.0, 14.0, 15.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.828125, -2.742706298828125, -2.65728759765625, -2.571868896484375, -2.4864501953125, -2.401031494140625, -2.31561279296875, -2.230194091796875, -2.144775390625, -2.059356689453125, -1.97393798828125, -1.888519287109375, -1.8031005859375, -1.717681884765625, -1.63226318359375, -1.546844482421875, -1.46142578125, -1.376007080078125, -1.29058837890625, -1.205169677734375, -1.1197509765625, -1.034332275390625, -0.94891357421875, -0.863494873046875, -0.778076171875, -0.692657470703125, -0.60723876953125, -0.521820068359375, -0.4364013671875, -0.350982666015625, -0.26556396484375, -0.180145263671875, -0.0947265625, -0.009307861328125, 0.07611083984375, 0.161529541015625, 0.2469482421875, 0.332366943359375, 0.41778564453125, 0.503204345703125, 0.588623046875, 0.674041748046875, 0.75946044921875, 0.844879150390625, 0.9302978515625, 1.015716552734375, 1.10113525390625, 1.186553955078125, 1.27197265625, 1.357391357421875, 1.44281005859375, 1.528228759765625, 1.6136474609375, 1.699066162109375, 1.78448486328125, 1.869903564453125, 1.955322265625, 2.040740966796875, 2.12615966796875, 2.211578369140625, 2.2969970703125, 2.382415771484375, 2.46783447265625, 2.553253173828125, 2.638671875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 8.0, 6.0, 8.0, 7.0, 12.0, 17.0, 16.0, 15.0, 15.0, 22.0, 21.0, 14.0, 21.0, 22.0, 27.0, 33.0, 39.0, 28.0, 53.0, 39.0, 32.0, 37.0, 32.0, 37.0, 58.0, 36.0, 39.0, 35.0, 24.0, 26.0, 24.0, 24.0, 26.0, 12.0, 25.0, 21.0, 9.0, 12.0, 11.0, 11.0, 11.0, 4.0, 2.0, 7.0, 5.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-11.563433647155762, -11.225764274597168, -10.888093948364258, -10.550424575805664, -10.21275520324707, -9.87508487701416, -9.537415504455566, -9.199745178222656, -8.862075805664062, -8.524406433105469, -8.186736106872559, -7.849066734313965, -7.511396884918213, -7.173727035522461, -6.836057662963867, -6.498387813568115, -6.160717964172363, -5.823048114776611, -5.485378265380859, -5.147708892822266, -4.810039043426514, -4.472369194030762, -4.134699821472168, -3.797029972076416, -3.459360122680664, -3.121690273284912, -2.7840206623077393, -2.4463510513305664, -2.1086812019348145, -1.771011471748352, -1.4333417415618896, -1.0956721305847168, -0.7580013275146484, -0.42033159732818604, -0.08266186714172363, 0.25500786304473877, 0.5926775932312012, 0.9303473234176636, 1.268017053604126, 1.6056866645812988, 1.9433565139770508, 2.2810263633728027, 2.6186959743499756, 2.9563655853271484, 3.2940354347229004, 3.6317052841186523, 3.969374895095825, 4.307044506072998, 4.64471435546875, 4.982384204864502, 5.320054054260254, 5.657723426818848, 5.9953932762146, 6.333063125610352, 6.670732498168945, 7.008402347564697, 7.346072196960449, 7.683742046356201, 8.021411895751953, 8.359081268310547, 8.69675064086914, 9.03442096710205, 9.372090339660645, 9.709760665893555, 10.047430038452148]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 4.0, 8.0, 13.0, 14.0, 16.0, 14.0, 21.0, 21.0, 30.0, 30.0, 27.0, 42.0, 45.0, 39.0, 39.0, 40.0, 49.0, 55.0, 63.0, 46.0, 29.0, 47.0, 37.0, 40.0, 30.0, 24.0, 34.0, 19.0, 25.0, 18.0, 13.0, 12.0, 10.0, 6.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.084700584411621, -14.633359909057617, -14.18202018737793, -13.730679512023926, -13.279338836669922, -12.827998161315918, -12.376657485961914, -11.925317764282227, -11.473977088928223, -11.022636413574219, -10.571296691894531, -10.119956016540527, -9.668615341186523, -9.21727466583252, -8.765933990478516, -8.314594268798828, -7.863253593444824, -7.41191291809082, -6.960572719573975, -6.509232521057129, -6.057891845703125, -5.606551170349121, -5.155210971832275, -4.70387077331543, -4.252530097961426, -3.801189661026001, -3.349849224090576, -2.8985087871551514, -2.4471683502197266, -1.9958279132843018, -1.544487476348877, -1.0931470394134521, -0.6418075561523438, -0.19046711921691895, 0.26087331771850586, 0.7122137546539307, 1.1635541915893555, 1.6148946285247803, 2.066235065460205, 2.51757550239563, 2.9689159393310547, 3.4202563762664795, 3.8715968132019043, 4.32293701171875, 4.774277687072754, 5.225618362426758, 5.6769585609436035, 6.128298759460449, 6.579639434814453, 7.030980110168457, 7.482320308685303, 7.933660507202148, 8.385001182556152, 8.836341857910156, 9.287681579589844, 9.739022254943848, 10.190362930297852, 10.641703605651855, 11.09304428100586, 11.544384002685547, 11.99572467803955, 12.447065353393555, 12.898405075073242, 13.349745750427246, 13.80108642578125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 10.0, 5.0, 14.0, 13.0, 33.0, 51.0, 85.0, 143.0, 259.0, 398.0, 729.0, 1288.0, 2304.0, 4144.0, 7584.0, 13815.0, 25290.0, 44446.0, 73377.0, 111958.0, 149783.0, 165904.0, 151587.0, 115221.0, 76111.0, 45620.0, 26020.0, 14660.0, 7953.0, 4285.0, 2319.0, 1313.0, 786.0, 434.0, 253.0, 143.0, 96.0, 47.0, 27.0, 14.0, 9.0, 11.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.41943359375, -17.8701171875, -17.32080078125, -16.771484375, -16.22216796875, -15.6728515625, -15.12353515625, -14.57421875, -14.02490234375, -13.4755859375, -12.92626953125, -12.376953125, -11.82763671875, -11.2783203125, -10.72900390625, -10.1796875, -9.63037109375, -9.0810546875, -8.53173828125, -7.982421875, -7.43310546875, -6.8837890625, -6.33447265625, -5.78515625, -5.23583984375, -4.6865234375, -4.13720703125, -3.587890625, -3.03857421875, -2.4892578125, -1.93994140625, -1.390625, -0.84130859375, -0.2919921875, 0.25732421875, 0.806640625, 1.35595703125, 1.9052734375, 2.45458984375, 3.00390625, 3.55322265625, 4.1025390625, 4.65185546875, 5.201171875, 5.75048828125, 6.2998046875, 6.84912109375, 7.3984375, 7.94775390625, 8.4970703125, 9.04638671875, 9.595703125, 10.14501953125, 10.6943359375, 11.24365234375, 11.79296875, 12.34228515625, 12.8916015625, 13.44091796875, 13.990234375, 14.53955078125, 15.0888671875, 15.63818359375, 16.1875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 8.0, 12.0, 9.0, 14.0, 16.0, 20.0, 18.0, 28.0, 28.0, 40.0, 42.0, 40.0, 36.0, 41.0, 42.0, 47.0, 54.0, 43.0, 52.0, 55.0, 35.0, 43.0, 38.0, 33.0, 22.0, 32.0, 23.0, 19.0, 25.0, 16.0, 9.0, 5.0, 13.0, 6.0, 7.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.21875, -13.78125, -13.34375, -12.90625, -12.46875, -12.03125, -11.59375, -11.15625, -10.71875, -10.28125, -9.84375, -9.40625, -8.96875, -8.53125, -8.09375, -7.65625, -7.21875, -6.78125, -6.34375, -5.90625, -5.46875, -5.03125, -4.59375, -4.15625, -3.71875, -3.28125, -2.84375, -2.40625, -1.96875, -1.53125, -1.09375, -0.65625, -0.21875, 0.21875, 0.65625, 1.09375, 1.53125, 1.96875, 2.40625, 2.84375, 3.28125, 3.71875, 4.15625, 4.59375, 5.03125, 5.46875, 5.90625, 6.34375, 6.78125, 7.21875, 7.65625, 8.09375, 8.53125, 8.96875, 9.40625, 9.84375, 10.28125, 10.71875, 11.15625, 11.59375, 12.03125, 12.46875, 12.90625, 13.34375, 13.78125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [7.0, 2.0, 4.0, 3.0, 19.0, 18.0, 23.0, 44.0, 77.0, 124.0, 191.0, 308.0, 447.0, 730.0, 1239.0, 2047.0, 3204.0, 5175.0, 8391.0, 13087.0, 20719.0, 31319.0, 46150.0, 64839.0, 86965.0, 106838.0, 120321.0, 122057.0, 110355.0, 90691.0, 68797.0, 49365.0, 33883.0, 22440.0, 14528.0, 9090.0, 5787.0, 3490.0, 2254.0, 1333.0, 872.0, 498.0, 303.0, 199.0, 137.0, 80.0, 39.0, 32.0, 16.0, 12.0, 12.0, 5.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5546875, -10.1651611328125, -9.775634765625, -9.3861083984375, -8.99658203125, -8.6070556640625, -8.217529296875, -7.8280029296875, -7.4384765625, -7.0489501953125, -6.659423828125, -6.2698974609375, -5.88037109375, -5.4908447265625, -5.101318359375, -4.7117919921875, -4.322265625, -3.9327392578125, -3.543212890625, -3.1536865234375, -2.76416015625, -2.3746337890625, -1.985107421875, -1.5955810546875, -1.2060546875, -0.8165283203125, -0.427001953125, -0.0374755859375, 0.35205078125, 0.7415771484375, 1.131103515625, 1.5206298828125, 1.91015625, 2.2996826171875, 2.689208984375, 3.0787353515625, 3.46826171875, 3.8577880859375, 4.247314453125, 4.6368408203125, 5.0263671875, 5.4158935546875, 5.805419921875, 6.1949462890625, 6.58447265625, 6.9739990234375, 7.363525390625, 7.7530517578125, 8.142578125, 8.5321044921875, 8.921630859375, 9.3111572265625, 9.70068359375, 10.0902099609375, 10.479736328125, 10.8692626953125, 11.2587890625, 11.6483154296875, 12.037841796875, 12.4273681640625, 12.81689453125, 13.2064208984375, 13.595947265625, 13.9854736328125, 14.375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 9.0, 5.0, 10.0, 8.0, 18.0, 10.0, 20.0, 19.0, 21.0, 16.0, 24.0, 29.0, 28.0, 33.0, 41.0, 25.0, 26.0, 30.0, 43.0, 30.0, 38.0, 36.0, 36.0, 46.0, 41.0, 37.0, 27.0, 29.0, 31.0, 38.0, 23.0, 30.0, 18.0, 19.0, 17.0, 18.0, 13.0, 16.0, 10.0, 10.0, 7.0, 2.0, 5.0, 3.0, 2.0, 7.0, 0.0, 3.0, 1.0, 1.0], "bins": [-8.5546875, -8.3154296875, -8.076171875, -7.8369140625, -7.59765625, -7.3583984375, -7.119140625, -6.8798828125, -6.640625, -6.4013671875, -6.162109375, -5.9228515625, -5.68359375, -5.4443359375, -5.205078125, -4.9658203125, -4.7265625, -4.4873046875, -4.248046875, -4.0087890625, -3.76953125, -3.5302734375, -3.291015625, -3.0517578125, -2.8125, -2.5732421875, -2.333984375, -2.0947265625, -1.85546875, -1.6162109375, -1.376953125, -1.1376953125, -0.8984375, -0.6591796875, -0.419921875, -0.1806640625, 0.05859375, 0.2978515625, 0.537109375, 0.7763671875, 1.015625, 1.2548828125, 1.494140625, 1.7333984375, 1.97265625, 2.2119140625, 2.451171875, 2.6904296875, 2.9296875, 3.1689453125, 3.408203125, 3.6474609375, 3.88671875, 4.1259765625, 4.365234375, 4.6044921875, 4.84375, 5.0830078125, 5.322265625, 5.5615234375, 5.80078125, 6.0400390625, 6.279296875, 6.5185546875, 6.7578125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 6.0, 7.0, 10.0, 20.0, 24.0, 29.0, 41.0, 94.0, 104.0, 159.0, 258.0, 383.0, 600.0, 1002.0, 1784.0, 3153.0, 5790.0, 12184.0, 25681.0, 57309.0, 120894.0, 212413.0, 249383.0, 179854.0, 94062.0, 43332.0, 19742.0, 9338.0, 4661.0, 2536.0, 1400.0, 846.0, 496.0, 334.0, 201.0, 139.0, 79.0, 67.0, 42.0, 30.0, 29.0, 17.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3984375, -9.098388671875, -8.79833984375, -8.498291015625, -8.1982421875, -7.898193359375, -7.59814453125, -7.298095703125, -6.998046875, -6.697998046875, -6.39794921875, -6.097900390625, -5.7978515625, -5.497802734375, -5.19775390625, -4.897705078125, -4.59765625, -4.297607421875, -3.99755859375, -3.697509765625, -3.3974609375, -3.097412109375, -2.79736328125, -2.497314453125, -2.197265625, -1.897216796875, -1.59716796875, -1.297119140625, -0.9970703125, -0.697021484375, -0.39697265625, -0.096923828125, 0.203125, 0.503173828125, 0.80322265625, 1.103271484375, 1.4033203125, 1.703369140625, 2.00341796875, 2.303466796875, 2.603515625, 2.903564453125, 3.20361328125, 3.503662109375, 3.8037109375, 4.103759765625, 4.40380859375, 4.703857421875, 5.00390625, 5.303955078125, 5.60400390625, 5.904052734375, 6.2041015625, 6.504150390625, 6.80419921875, 7.104248046875, 7.404296875, 7.704345703125, 8.00439453125, 8.304443359375, 8.6044921875, 8.904541015625, 9.20458984375, 9.504638671875, 9.8046875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 4.0, 8.0, 10.0, 17.0, 28.0, 28.0, 37.0, 41.0, 46.0, 57.0, 62.0, 62.0, 84.0, 83.0, 63.0, 68.0, 55.0, 52.0, 44.0, 31.0, 26.0, 26.0, 18.0, 10.0, 10.0, 4.0, 7.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0010585784912109375, -0.0010329410433769226, -0.0010073035955429077, -0.0009816661477088928, -0.0009560286998748779, -0.000930391252040863, -0.0009047538042068481, -0.0008791163563728333, -0.0008534789085388184, -0.0008278414607048035, -0.0008022040128707886, -0.0007765665650367737, -0.0007509291172027588, -0.0007252916693687439, -0.000699654221534729, -0.0006740167737007141, -0.0006483793258666992, -0.0006227418780326843, -0.0005971044301986694, -0.0005714669823646545, -0.0005458295345306396, -0.0005201920866966248, -0.0004945546388626099, -0.00046891719102859497, -0.0004432797431945801, -0.0004176422953605652, -0.0003920048475265503, -0.0003663673996925354, -0.0003407299518585205, -0.0003150925040245056, -0.0002894550561904907, -0.00026381760835647583, -0.00023818016052246094, -0.00021254271268844604, -0.00018690526485443115, -0.00016126781702041626, -0.00013563036918640137, -0.00010999292135238647, -8.435547351837158e-05, -5.871802568435669e-05, -3.30805778503418e-05, -7.443130016326904e-06, 1.8194317817687988e-05, 4.383176565170288e-05, 6.946921348571777e-05, 9.510666131973267e-05, 0.00012074410915374756, 0.00014638155698776245, 0.00017201900482177734, 0.00019765645265579224, 0.00022329390048980713, 0.000248931348323822, 0.0002745687961578369, 0.0003002062439918518, 0.0003258436918258667, 0.0003514811396598816, 0.0003771185874938965, 0.0004027560353279114, 0.00042839348316192627, 0.00045403093099594116, 0.00047966837882995605, 0.000505305826663971, 0.0005309432744979858, 0.0005565807223320007, 0.0005822181701660156]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 12.0, 11.0, 17.0, 28.0, 49.0, 80.0, 125.0, 214.0, 348.0, 565.0, 982.0, 1721.0, 3078.0, 5263.0, 9207.0, 15836.0, 26999.0, 45150.0, 73685.0, 110182.0, 146054.0, 162946.0, 147397.0, 111437.0, 75051.0, 46234.0, 27658.0, 16162.0, 9242.0, 5344.0, 2993.0, 1784.0, 1139.0, 658.0, 367.0, 203.0, 130.0, 83.0, 55.0, 30.0, 19.0, 8.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.41571044921875, -6.2298583984375, -6.04400634765625, -5.858154296875, -5.67230224609375, -5.4864501953125, -5.30059814453125, -5.11474609375, -4.92889404296875, -4.7430419921875, -4.55718994140625, -4.371337890625, -4.18548583984375, -3.9996337890625, -3.81378173828125, -3.6279296875, -3.44207763671875, -3.2562255859375, -3.07037353515625, -2.884521484375, -2.69866943359375, -2.5128173828125, -2.32696533203125, -2.14111328125, -1.95526123046875, -1.7694091796875, -1.58355712890625, -1.397705078125, -1.21185302734375, -1.0260009765625, -0.84014892578125, -0.654296875, -0.46844482421875, -0.2825927734375, -0.09674072265625, 0.089111328125, 0.27496337890625, 0.4608154296875, 0.64666748046875, 0.83251953125, 1.01837158203125, 1.2042236328125, 1.39007568359375, 1.575927734375, 1.76177978515625, 1.9476318359375, 2.13348388671875, 2.3193359375, 2.50518798828125, 2.6910400390625, 2.87689208984375, 3.062744140625, 3.24859619140625, 3.4344482421875, 3.62030029296875, 3.80615234375, 3.99200439453125, 4.1778564453125, 4.36370849609375, 4.549560546875, 4.73541259765625, 4.9212646484375, 5.10711669921875, 5.29296875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 3.0, 7.0, 10.0, 7.0, 10.0, 14.0, 16.0, 16.0, 18.0, 32.0, 22.0, 33.0, 24.0, 36.0, 38.0, 40.0, 52.0, 43.0, 50.0, 55.0, 50.0, 48.0, 46.0, 39.0, 29.0, 27.0, 35.0, 27.0, 24.0, 20.0, 16.0, 12.0, 19.0, 14.0, 8.0, 12.0, 4.0, 8.0, 8.0, 1.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7587890625, -1.6927032470703125, -1.626617431640625, -1.5605316162109375, -1.49444580078125, -1.4283599853515625, -1.362274169921875, -1.2961883544921875, -1.2301025390625, -1.1640167236328125, -1.097930908203125, -1.0318450927734375, -0.96575927734375, -0.8996734619140625, -0.833587646484375, -0.7675018310546875, -0.701416015625, -0.6353302001953125, -0.569244384765625, -0.5031585693359375, -0.43707275390625, -0.3709869384765625, -0.304901123046875, -0.2388153076171875, -0.1727294921875, -0.1066436767578125, -0.040557861328125, 0.0255279541015625, 0.09161376953125, 0.1576995849609375, 0.223785400390625, 0.2898712158203125, 0.35595703125, 0.4220428466796875, 0.488128662109375, 0.5542144775390625, 0.62030029296875, 0.6863861083984375, 0.752471923828125, 0.8185577392578125, 0.8846435546875, 0.9507293701171875, 1.016815185546875, 1.0829010009765625, 1.14898681640625, 1.2150726318359375, 1.281158447265625, 1.3472442626953125, 1.413330078125, 1.4794158935546875, 1.545501708984375, 1.6115875244140625, 1.67767333984375, 1.7437591552734375, 1.809844970703125, 1.8759307861328125, 1.9420166015625, 2.0081024169921875, 2.074188232421875, 2.1402740478515625, 2.20635986328125, 2.2724456787109375, 2.338531494140625, 2.4046173095703125, 2.470703125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 9.0, 11.0, 14.0, 26.0, 14.0, 18.0, 23.0, 24.0, 14.0, 24.0, 40.0, 31.0, 34.0, 40.0, 28.0, 45.0, 44.0, 39.0, 43.0, 35.0, 44.0, 42.0, 40.0, 42.0, 26.0, 28.0, 25.0, 28.0, 23.0, 21.0, 16.0, 10.0, 14.0, 11.0, 15.0, 10.0, 6.0, 11.0, 5.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.298860549926758, -9.949592590332031, -9.600324630737305, -9.251056671142578, -8.901788711547852, -8.552520751953125, -8.203252792358398, -7.853984355926514, -7.504716396331787, -7.1554484367370605, -6.806180477142334, -6.456912040710449, -6.107644081115723, -5.758376121520996, -5.4091081619262695, -5.059840202331543, -4.710572242736816, -4.36130428314209, -4.012036323547363, -3.6627681255340576, -3.313500165939331, -2.9642322063446045, -2.614964008331299, -2.2656960487365723, -1.9164280891418457, -1.5671601295471191, -1.217892050743103, -0.8686239719390869, -0.5193560123443604, -0.1700880527496338, 0.17918014526367188, 0.5284481048583984, 0.8777151107788086, 1.2269830703735352, 1.5762511491775513, 1.9255192279815674, 2.274787187576294, 2.6240551471710205, 2.973323345184326, 3.3225913047790527, 3.6718592643737793, 4.021127223968506, 4.370395183563232, 4.719663619995117, 5.068931579589844, 5.41819953918457, 5.767467498779297, 6.116735458374023, 6.46600341796875, 6.815271377563477, 7.164539337158203, 7.51380729675293, 7.863075256347656, 8.212343215942383, 8.56161117553711, 8.910879135131836, 9.260147094726562, 9.609415054321289, 9.958683013916016, 10.307950973510742, 10.657218933105469, 11.006486892700195, 11.355754852294922, 11.705022811889648, 12.054291725158691]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 2.0, 14.0, 10.0, 7.0, 18.0, 23.0, 17.0, 25.0, 31.0, 30.0, 27.0, 35.0, 29.0, 47.0, 39.0, 33.0, 48.0, 49.0, 36.0, 64.0, 41.0, 38.0, 30.0, 43.0, 29.0, 32.0, 28.0, 24.0, 27.0, 29.0, 14.0, 17.0, 9.0, 5.0, 13.0, 6.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.076319694519043, -13.638952255249023, -13.201584815979004, -12.764217376708984, -12.326849937438965, -11.889482498168945, -11.45211410522461, -11.014747619628906, -10.57737922668457, -10.14001178741455, -9.702644348144531, -9.265276908874512, -8.827909469604492, -8.390542030334473, -7.953174114227295, -7.515806674957275, -7.078439712524414, -6.6410722732543945, -6.203704833984375, -5.7663373947143555, -5.328969955444336, -4.891602516174316, -4.454234600067139, -4.016867160797119, -3.5794997215270996, -3.14213228225708, -2.7047648429870605, -2.267397165298462, -1.8300297260284424, -1.3926622867584229, -0.9552946090698242, -0.5179271697998047, -0.08055877685546875, 0.35680872201919556, 0.7941762208938599, 1.231543779373169, 1.6689112186431885, 2.106278657913208, 2.5436463356018066, 2.981013774871826, 3.4183812141418457, 3.8557486534118652, 4.293116092681885, 4.7304840087890625, 5.167851448059082, 5.605218887329102, 6.042586326599121, 6.479953765869141, 6.91732120513916, 7.35468864440918, 7.792056083679199, 8.229423522949219, 8.666790962219238, 9.104158401489258, 9.541526794433594, 9.978893280029297, 10.416261672973633, 10.853629112243652, 11.290996551513672, 11.728363990783691, 12.165731430053711, 12.60309886932373, 13.04046630859375, 13.477834701538086, 13.915201187133789]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 6.0, 10.0, 22.0, 39.0, 48.0, 59.0, 142.0, 211.0, 367.0, 580.0, 1014.0, 1681.0, 2759.0, 4737.0, 8054.0, 13129.0, 22407.0, 37645.0, 61724.0, 99830.0, 158055.0, 240922.0, 345468.0, 455812.0, 539007.0, 553477.0, 491682.0, 387653.0, 275745.0, 185316.0, 118732.0, 74124.0, 45346.0, 27604.0, 16630.0, 9867.0, 5871.0, 3552.0, 2031.0, 1212.0, 738.0, 416.0, 248.0, 134.0, 84.0, 42.0, 27.0, 13.0, 11.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.276611328125, -7.98291015625, -7.689208984375, -7.3955078125, -7.101806640625, -6.80810546875, -6.514404296875, -6.220703125, -5.927001953125, -5.63330078125, -5.339599609375, -5.0458984375, -4.752197265625, -4.45849609375, -4.164794921875, -3.87109375, -3.577392578125, -3.28369140625, -2.989990234375, -2.6962890625, -2.402587890625, -2.10888671875, -1.815185546875, -1.521484375, -1.227783203125, -0.93408203125, -0.640380859375, -0.3466796875, -0.052978515625, 0.24072265625, 0.534423828125, 0.828125, 1.121826171875, 1.41552734375, 1.709228515625, 2.0029296875, 2.296630859375, 2.59033203125, 2.884033203125, 3.177734375, 3.471435546875, 3.76513671875, 4.058837890625, 4.3525390625, 4.646240234375, 4.93994140625, 5.233642578125, 5.52734375, 5.821044921875, 6.11474609375, 6.408447265625, 6.7021484375, 6.995849609375, 7.28955078125, 7.583251953125, 7.876953125, 8.170654296875, 8.46435546875, 8.758056640625, 9.0517578125, 9.345458984375, 9.63916015625, 9.932861328125, 10.2265625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 4.0, 5.0, 7.0, 9.0, 12.0, 18.0, 22.0, 23.0, 13.0, 22.0, 31.0, 33.0, 37.0, 33.0, 31.0, 37.0, 53.0, 38.0, 39.0, 53.0, 45.0, 47.0, 47.0, 38.0, 31.0, 41.0, 38.0, 24.0, 26.0, 28.0, 23.0, 24.0, 13.0, 13.0, 9.0, 5.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-11.03125, -10.709228515625, -10.38720703125, -10.065185546875, -9.7431640625, -9.421142578125, -9.09912109375, -8.777099609375, -8.455078125, -8.133056640625, -7.81103515625, -7.489013671875, -7.1669921875, -6.844970703125, -6.52294921875, -6.200927734375, -5.87890625, -5.556884765625, -5.23486328125, -4.912841796875, -4.5908203125, -4.268798828125, -3.94677734375, -3.624755859375, -3.302734375, -2.980712890625, -2.65869140625, -2.336669921875, -2.0146484375, -1.692626953125, -1.37060546875, -1.048583984375, -0.7265625, -0.404541015625, -0.08251953125, 0.239501953125, 0.5615234375, 0.883544921875, 1.20556640625, 1.527587890625, 1.849609375, 2.171630859375, 2.49365234375, 2.815673828125, 3.1376953125, 3.459716796875, 3.78173828125, 4.103759765625, 4.42578125, 4.747802734375, 5.06982421875, 5.391845703125, 5.7138671875, 6.035888671875, 6.35791015625, 6.679931640625, 7.001953125, 7.323974609375, 7.64599609375, 7.968017578125, 8.2900390625, 8.612060546875, 8.93408203125, 9.256103515625, 9.578125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 14.0, 14.0, 23.0, 37.0, 59.0, 135.0, 236.0, 348.0, 578.0, 959.0, 1889.0, 3178.0, 5538.0, 9387.0, 15832.0, 26815.0, 44021.0, 70960.0, 112410.0, 168365.0, 243909.0, 331222.0, 417421.0, 479678.0, 497679.0, 461094.0, 389850.0, 301469.0, 215709.0, 147284.0, 95826.0, 60750.0, 37229.0, 22204.0, 13310.0, 7846.0, 4517.0, 2633.0, 1596.0, 903.0, 559.0, 295.0, 213.0, 100.0, 80.0, 41.0, 30.0, 11.0, 8.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8203125, -8.5474853515625, -8.274658203125, -8.0018310546875, -7.72900390625, -7.4561767578125, -7.183349609375, -6.9105224609375, -6.6376953125, -6.3648681640625, -6.092041015625, -5.8192138671875, -5.54638671875, -5.2735595703125, -5.000732421875, -4.7279052734375, -4.455078125, -4.1822509765625, -3.909423828125, -3.6365966796875, -3.36376953125, -3.0909423828125, -2.818115234375, -2.5452880859375, -2.2724609375, -1.9996337890625, -1.726806640625, -1.4539794921875, -1.18115234375, -0.9083251953125, -0.635498046875, -0.3626708984375, -0.08984375, 0.1829833984375, 0.455810546875, 0.7286376953125, 1.00146484375, 1.2742919921875, 1.547119140625, 1.8199462890625, 2.0927734375, 2.3656005859375, 2.638427734375, 2.9112548828125, 3.18408203125, 3.4569091796875, 3.729736328125, 4.0025634765625, 4.275390625, 4.5482177734375, 4.821044921875, 5.0938720703125, 5.36669921875, 5.6395263671875, 5.912353515625, 6.1851806640625, 6.4580078125, 6.7308349609375, 7.003662109375, 7.2764892578125, 7.54931640625, 7.8221435546875, 8.094970703125, 8.3677978515625, 8.640625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 4.0, 10.0, 5.0, 17.0, 20.0, 23.0, 27.0, 49.0, 52.0, 47.0, 52.0, 90.0, 96.0, 125.0, 165.0, 158.0, 167.0, 200.0, 201.0, 206.0, 184.0, 246.0, 206.0, 198.0, 187.0, 201.0, 176.0, 190.0, 122.0, 106.0, 101.0, 80.0, 64.0, 73.0, 53.0, 39.0, 31.0, 23.0, 14.0, 21.0, 16.0, 8.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.46484375, -4.32598876953125, -4.1871337890625, -4.04827880859375, -3.909423828125, -3.77056884765625, -3.6317138671875, -3.49285888671875, -3.35400390625, -3.21514892578125, -3.0762939453125, -2.93743896484375, -2.798583984375, -2.65972900390625, -2.5208740234375, -2.38201904296875, -2.2431640625, -2.10430908203125, -1.9654541015625, -1.82659912109375, -1.687744140625, -1.54888916015625, -1.4100341796875, -1.27117919921875, -1.13232421875, -0.99346923828125, -0.8546142578125, -0.71575927734375, -0.576904296875, -0.43804931640625, -0.2991943359375, -0.16033935546875, -0.021484375, 0.11737060546875, 0.2562255859375, 0.39508056640625, 0.533935546875, 0.67279052734375, 0.8116455078125, 0.95050048828125, 1.08935546875, 1.22821044921875, 1.3670654296875, 1.50592041015625, 1.644775390625, 1.78363037109375, 1.9224853515625, 2.06134033203125, 2.2001953125, 2.33905029296875, 2.4779052734375, 2.61676025390625, 2.755615234375, 2.89447021484375, 3.0333251953125, 3.17218017578125, 3.31103515625, 3.44989013671875, 3.5887451171875, 3.72760009765625, 3.866455078125, 4.00531005859375, 4.1441650390625, 4.28302001953125, 4.421875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 7.0, 7.0, 8.0, 11.0, 18.0, 11.0, 15.0, 18.0, 20.0, 21.0, 20.0, 29.0, 32.0, 37.0, 47.0, 27.0, 29.0, 28.0, 48.0, 40.0, 44.0, 36.0, 45.0, 42.0, 57.0, 41.0, 39.0, 31.0, 27.0, 24.0, 17.0, 31.0, 16.0, 13.0, 15.0, 13.0, 9.0, 4.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.314350128173828, -9.002786636352539, -8.691222190856934, -8.379658699035645, -8.068095207214355, -7.756531238555908, -7.444967269897461, -7.133403778076172, -6.821839809417725, -6.510275840759277, -6.198712348937988, -5.887148380279541, -5.575584411621094, -5.264020919799805, -4.952456951141357, -4.64089298248291, -4.329329490661621, -4.017765522003174, -3.7062020301818848, -3.3946380615234375, -3.0830743312835693, -2.771510601043701, -2.459946632385254, -2.1483829021453857, -1.8368191719055176, -1.5252554416656494, -1.2136915922164917, -0.9021278023719788, -0.5905640125274658, -0.27900028228759766, 0.03256356716156006, 0.3441274166107178, 0.6556921005249023, 0.9672558903694153, 1.2788196802139282, 1.590383529663086, 1.901947259902954, 2.2135109901428223, 2.5250749588012695, 2.8366386890411377, 3.148202419281006, 3.459766149520874, 3.771329879760742, 4.0828938484191895, 4.394457817077637, 4.706021308898926, 5.017585277557373, 5.32914924621582, 5.640712738037109, 5.952276706695557, 6.263840198516846, 6.575404167175293, 6.886967658996582, 7.198531627655029, 7.510095596313477, 7.821659088134766, 8.133222579956055, 8.444786071777344, 8.75635051727295, 9.067914009094238, 9.379477500915527, 9.691041946411133, 10.002605438232422, 10.314168930053711, 10.625733375549316]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 12.0, 5.0, 12.0, 19.0, 21.0, 25.0, 38.0, 31.0, 35.0, 58.0, 45.0, 31.0, 62.0, 64.0, 63.0, 60.0, 41.0, 52.0, 39.0, 41.0, 45.0, 38.0, 36.0, 32.0, 14.0, 16.0, 9.0, 14.0, 10.0, 6.0, 6.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.942888259887695, -11.49248218536377, -11.042076110839844, -10.591670989990234, -10.141264915466309, -9.690858840942383, -9.240452766418457, -8.790046691894531, -8.339641571044922, -7.889235496520996, -7.4388298988342285, -6.988423824310303, -6.538018226623535, -6.087612152099609, -5.637206077575684, -5.186800479888916, -4.73639440536499, -4.2859883308410645, -3.835582733154297, -3.385176658630371, -2.9347710609436035, -2.4843649864196777, -2.033959150314331, -1.5835533142089844, -1.1331474781036377, -0.682741641998291, -0.23233574628829956, 0.2180701494216919, 0.6684759855270386, 1.1188819408416748, 1.5692877769470215, 2.019693613052368, 2.470099449157715, 2.9205052852630615, 3.370911121368408, 3.821317195892334, 4.271722793579102, 4.722128868103027, 5.172534942626953, 5.622940540313721, 6.073346138000488, 6.523752212524414, 6.974157810211182, 7.424563884735107, 7.874969482421875, 8.3253755569458, 8.775781631469727, 9.226186752319336, 9.676593780517578, 10.126999855041504, 10.57740592956543, 11.027811050415039, 11.478217124938965, 11.92862319946289, 12.379029273986816, 12.829435348510742, 13.279840469360352, 13.730246543884277, 14.180652618408203, 14.631057739257812, 15.081463813781738, 15.531869888305664, 15.98227596282959, 16.432682037353516, 16.883087158203125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 11.0, 16.0, 17.0, 26.0, 49.0, 70.0, 136.0, 155.0, 249.0, 386.0, 544.0, 869.0, 1334.0, 2027.0, 3304.0, 5549.0, 9227.0, 17327.0, 32031.0, 64196.0, 124708.0, 224236.0, 246854.0, 149972.0, 77398.0, 39527.0, 20336.0, 11166.0, 6342.0, 3824.0, 2365.0, 1460.0, 900.0, 647.0, 438.0, 274.0, 174.0, 126.0, 82.0, 57.0, 46.0, 27.0, 17.0, 11.0, 7.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-8.7265625, -8.4632568359375, -8.199951171875, -7.9366455078125, -7.67333984375, -7.4100341796875, -7.146728515625, -6.8834228515625, -6.6201171875, -6.3568115234375, -6.093505859375, -5.8302001953125, -5.56689453125, -5.3035888671875, -5.040283203125, -4.7769775390625, -4.513671875, -4.2503662109375, -3.987060546875, -3.7237548828125, -3.46044921875, -3.1971435546875, -2.933837890625, -2.6705322265625, -2.4072265625, -2.1439208984375, -1.880615234375, -1.6173095703125, -1.35400390625, -1.0906982421875, -0.827392578125, -0.5640869140625, -0.30078125, -0.0374755859375, 0.225830078125, 0.4891357421875, 0.75244140625, 1.0157470703125, 1.279052734375, 1.5423583984375, 1.8056640625, 2.0689697265625, 2.332275390625, 2.5955810546875, 2.85888671875, 3.1221923828125, 3.385498046875, 3.6488037109375, 3.912109375, 4.1754150390625, 4.438720703125, 4.7020263671875, 4.96533203125, 5.2286376953125, 5.491943359375, 5.7552490234375, 6.0185546875, 6.2818603515625, 6.545166015625, 6.8084716796875, 7.07177734375, 7.3350830078125, 7.598388671875, 7.8616943359375, 8.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 6.0, 11.0, 12.0, 21.0, 22.0, 17.0, 24.0, 22.0, 39.0, 48.0, 46.0, 40.0, 50.0, 51.0, 57.0, 48.0, 60.0, 43.0, 54.0, 49.0, 39.0, 39.0, 35.0, 37.0, 24.0, 18.0, 17.0, 15.0, 9.0, 13.0, 10.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.2962646484375, -10.850341796875, -10.4044189453125, -9.95849609375, -9.5125732421875, -9.066650390625, -8.6207275390625, -8.1748046875, -7.7288818359375, -7.282958984375, -6.8370361328125, -6.39111328125, -5.9451904296875, -5.499267578125, -5.0533447265625, -4.607421875, -4.1614990234375, -3.715576171875, -3.2696533203125, -2.82373046875, -2.3778076171875, -1.931884765625, -1.4859619140625, -1.0400390625, -0.5941162109375, -0.148193359375, 0.2977294921875, 0.74365234375, 1.1895751953125, 1.635498046875, 2.0814208984375, 2.52734375, 2.9732666015625, 3.419189453125, 3.8651123046875, 4.31103515625, 4.7569580078125, 5.202880859375, 5.6488037109375, 6.0947265625, 6.5406494140625, 6.986572265625, 7.4324951171875, 7.87841796875, 8.3243408203125, 8.770263671875, 9.2161865234375, 9.662109375, 10.1080322265625, 10.553955078125, 10.9998779296875, 11.44580078125, 11.8917236328125, 12.337646484375, 12.7835693359375, 13.2294921875, 13.6754150390625, 14.121337890625, 14.5672607421875, 15.01318359375, 15.4591064453125, 15.905029296875, 16.3509521484375, 16.796875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 8.0, 7.0, 13.0, 15.0, 31.0, 34.0, 60.0, 90.0, 168.0, 213.0, 321.0, 427.0, 723.0, 1102.0, 1811.0, 2905.0, 4975.0, 9132.0, 17480.0, 36313.0, 80081.0, 183300.0, 313870.0, 213548.0, 94720.0, 42127.0, 20283.0, 10358.0, 5557.0, 3293.0, 1971.0, 1255.0, 829.0, 502.0, 340.0, 226.0, 157.0, 106.0, 62.0, 41.0, 37.0, 25.0, 17.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.71484375, -7.4852294921875, -7.255615234375, -7.0260009765625, -6.79638671875, -6.5667724609375, -6.337158203125, -6.1075439453125, -5.8779296875, -5.6483154296875, -5.418701171875, -5.1890869140625, -4.95947265625, -4.7298583984375, -4.500244140625, -4.2706298828125, -4.041015625, -3.8114013671875, -3.581787109375, -3.3521728515625, -3.12255859375, -2.8929443359375, -2.663330078125, -2.4337158203125, -2.2041015625, -1.9744873046875, -1.744873046875, -1.5152587890625, -1.28564453125, -1.0560302734375, -0.826416015625, -0.5968017578125, -0.3671875, -0.1375732421875, 0.092041015625, 0.3216552734375, 0.55126953125, 0.7808837890625, 1.010498046875, 1.2401123046875, 1.4697265625, 1.6993408203125, 1.928955078125, 2.1585693359375, 2.38818359375, 2.6177978515625, 2.847412109375, 3.0770263671875, 3.306640625, 3.5362548828125, 3.765869140625, 3.9954833984375, 4.22509765625, 4.4547119140625, 4.684326171875, 4.9139404296875, 5.1435546875, 5.3731689453125, 5.602783203125, 5.8323974609375, 6.06201171875, 6.2916259765625, 6.521240234375, 6.7508544921875, 6.98046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 11.0, 10.0, 22.0, 21.0, 29.0, 19.0, 27.0, 32.0, 38.0, 40.0, 37.0, 48.0, 42.0, 42.0, 44.0, 47.0, 51.0, 49.0, 37.0, 50.0, 39.0, 34.0, 43.0, 40.0, 25.0, 27.0, 20.0, 22.0, 11.0, 13.0, 10.0, 6.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.3984375, -12.066162109375, -11.73388671875, -11.401611328125, -11.0693359375, -10.737060546875, -10.40478515625, -10.072509765625, -9.740234375, -9.407958984375, -9.07568359375, -8.743408203125, -8.4111328125, -8.078857421875, -7.74658203125, -7.414306640625, -7.08203125, -6.749755859375, -6.41748046875, -6.085205078125, -5.7529296875, -5.420654296875, -5.08837890625, -4.756103515625, -4.423828125, -4.091552734375, -3.75927734375, -3.427001953125, -3.0947265625, -2.762451171875, -2.43017578125, -2.097900390625, -1.765625, -1.433349609375, -1.10107421875, -0.768798828125, -0.4365234375, -0.104248046875, 0.22802734375, 0.560302734375, 0.892578125, 1.224853515625, 1.55712890625, 1.889404296875, 2.2216796875, 2.553955078125, 2.88623046875, 3.218505859375, 3.55078125, 3.883056640625, 4.21533203125, 4.547607421875, 4.8798828125, 5.212158203125, 5.54443359375, 5.876708984375, 6.208984375, 6.541259765625, 6.87353515625, 7.205810546875, 7.5380859375, 7.870361328125, 8.20263671875, 8.534912109375, 8.8671875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 8.0, 6.0, 7.0, 12.0, 21.0, 33.0, 46.0, 47.0, 78.0, 109.0, 160.0, 211.0, 292.0, 428.0, 665.0, 962.0, 1564.0, 2654.0, 4403.0, 8660.0, 19475.0, 67465.0, 649742.0, 227485.0, 35304.0, 12963.0, 6321.0, 3409.0, 2078.0, 1283.0, 808.0, 584.0, 376.0, 241.0, 162.0, 136.0, 94.0, 65.0, 59.0, 43.0, 27.0, 27.0, 17.0, 10.0, 8.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.78125, -9.4827880859375, -9.184326171875, -8.8858642578125, -8.58740234375, -8.2889404296875, -7.990478515625, -7.6920166015625, -7.3935546875, -7.0950927734375, -6.796630859375, -6.4981689453125, -6.19970703125, -5.9012451171875, -5.602783203125, -5.3043212890625, -5.005859375, -4.7073974609375, -4.408935546875, -4.1104736328125, -3.81201171875, -3.5135498046875, -3.215087890625, -2.9166259765625, -2.6181640625, -2.3197021484375, -2.021240234375, -1.7227783203125, -1.42431640625, -1.1258544921875, -0.827392578125, -0.5289306640625, -0.23046875, 0.0679931640625, 0.366455078125, 0.6649169921875, 0.96337890625, 1.2618408203125, 1.560302734375, 1.8587646484375, 2.1572265625, 2.4556884765625, 2.754150390625, 3.0526123046875, 3.35107421875, 3.6495361328125, 3.947998046875, 4.2464599609375, 4.544921875, 4.8433837890625, 5.141845703125, 5.4403076171875, 5.73876953125, 6.0372314453125, 6.335693359375, 6.6341552734375, 6.9326171875, 7.2310791015625, 7.529541015625, 7.8280029296875, 8.12646484375, 8.4249267578125, 8.723388671875, 9.0218505859375, 9.3203125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 8.0, 9.0, 5.0, 17.0, 14.0, 24.0, 36.0, 82.0, 148.0, 209.0, 189.0, 87.0, 48.0, 24.0, 17.0, 12.0, 11.0, 9.0, 7.0, 4.0, 3.0, 6.0, 0.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008530616760253906, -0.0008233413100242615, -0.0007936209440231323, -0.0007639005780220032, -0.000734180212020874, -0.0007044598460197449, -0.0006747394800186157, -0.0006450191140174866, -0.0006152987480163574, -0.0005855783820152283, -0.0005558580160140991, -0.00052613765001297, -0.0004964172840118408, -0.00046669691801071167, -0.0004369765520095825, -0.00040725618600845337, -0.0003775358200073242, -0.00034781545400619507, -0.0003180950880050659, -0.00028837472200393677, -0.0002586543560028076, -0.00022893399000167847, -0.00019921362400054932, -0.00016949325799942017, -0.00013977289199829102, -0.00011005252599716187, -8.033215999603271e-05, -5.0611793994903564e-05, -2.0891427993774414e-05, 8.828938007354736e-06, 3.854930400848389e-05, 6.826967000961304e-05, 9.799003601074219e-05, 0.00012771040201187134, 0.0001574307680130005, 0.00018715113401412964, 0.0002168715000152588, 0.00024659186601638794, 0.0002763122320175171, 0.00030603259801864624, 0.0003357529640197754, 0.00036547333002090454, 0.0003951936960220337, 0.00042491406202316284, 0.000454634428024292, 0.00048435479402542114, 0.0005140751600265503, 0.0005437955260276794, 0.0005735158920288086, 0.0006032362580299377, 0.0006329566240310669, 0.000662676990032196, 0.0006923973560333252, 0.0007221177220344543, 0.0007518380880355835, 0.0007815584540367126, 0.0008112788200378418, 0.000840999186038971, 0.0008707195520401001, 0.0009004399180412292, 0.0009301602840423584, 0.0009598806500434875, 0.0009896010160446167, 0.0010193213820457458, 0.001049041748046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 6.0, 13.0, 13.0, 28.0, 40.0, 45.0, 83.0, 159.0, 259.0, 435.0, 740.0, 1303.0, 2298.0, 4158.0, 7597.0, 13878.0, 27736.0, 80763.0, 455180.0, 338835.0, 62966.0, 24307.0, 12294.0, 6730.0, 3742.0, 2058.0, 1215.0, 669.0, 383.0, 247.0, 152.0, 80.0, 51.0, 26.0, 16.0, 13.0, 11.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2265625, -10.8511962890625, -10.475830078125, -10.1004638671875, -9.72509765625, -9.3497314453125, -8.974365234375, -8.5989990234375, -8.2236328125, -7.8482666015625, -7.472900390625, -7.0975341796875, -6.72216796875, -6.3468017578125, -5.971435546875, -5.5960693359375, -5.220703125, -4.8453369140625, -4.469970703125, -4.0946044921875, -3.71923828125, -3.3438720703125, -2.968505859375, -2.5931396484375, -2.2177734375, -1.8424072265625, -1.467041015625, -1.0916748046875, -0.71630859375, -0.3409423828125, 0.034423828125, 0.4097900390625, 0.78515625, 1.1605224609375, 1.535888671875, 1.9112548828125, 2.28662109375, 2.6619873046875, 3.037353515625, 3.4127197265625, 3.7880859375, 4.1634521484375, 4.538818359375, 4.9141845703125, 5.28955078125, 5.6649169921875, 6.040283203125, 6.4156494140625, 6.791015625, 7.1663818359375, 7.541748046875, 7.9171142578125, 8.29248046875, 8.6678466796875, 9.043212890625, 9.4185791015625, 9.7939453125, 10.1693115234375, 10.544677734375, 10.9200439453125, 11.29541015625, 11.6707763671875, 12.046142578125, 12.4215087890625, 12.796875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 15.0, 22.0, 32.0, 64.0, 94.0, 185.0, 215.0, 142.0, 71.0, 29.0, 22.0, 15.0, 15.0, 19.0, 12.0, 3.0, 9.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.4296875, -6.27398681640625, -6.1182861328125, -5.96258544921875, -5.806884765625, -5.65118408203125, -5.4954833984375, -5.33978271484375, -5.18408203125, -5.02838134765625, -4.8726806640625, -4.71697998046875, -4.561279296875, -4.40557861328125, -4.2498779296875, -4.09417724609375, -3.9384765625, -3.78277587890625, -3.6270751953125, -3.47137451171875, -3.315673828125, -3.15997314453125, -3.0042724609375, -2.84857177734375, -2.69287109375, -2.53717041015625, -2.3814697265625, -2.22576904296875, -2.070068359375, -1.91436767578125, -1.7586669921875, -1.60296630859375, -1.447265625, -1.29156494140625, -1.1358642578125, -0.98016357421875, -0.824462890625, -0.66876220703125, -0.5130615234375, -0.35736083984375, -0.20166015625, -0.04595947265625, 0.1097412109375, 0.26544189453125, 0.421142578125, 0.57684326171875, 0.7325439453125, 0.88824462890625, 1.0439453125, 1.19964599609375, 1.3553466796875, 1.51104736328125, 1.666748046875, 1.82244873046875, 1.9781494140625, 2.13385009765625, 2.28955078125, 2.44525146484375, 2.6009521484375, 2.75665283203125, 2.912353515625, 3.06805419921875, 3.2237548828125, 3.37945556640625, 3.53515625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 9.0, 4.0, 3.0, 6.0, 4.0, 10.0, 10.0, 14.0, 6.0, 12.0, 18.0, 14.0, 25.0, 28.0, 31.0, 21.0, 32.0, 33.0, 31.0, 36.0, 31.0, 47.0, 39.0, 30.0, 31.0, 53.0, 38.0, 52.0, 43.0, 43.0, 40.0, 23.0, 28.0, 19.0, 20.0, 19.0, 19.0, 11.0, 14.0, 10.0, 8.0, 13.0, 10.0, 7.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.625786781311035, -9.325700759887695, -9.025615692138672, -8.725530624389648, -8.425444602966309, -8.125358581542969, -7.825273513793945, -7.525187969207764, -7.225102424621582, -6.9250168800354, -6.624931335449219, -6.324845790863037, -6.0247602462768555, -5.724674701690674, -5.424589157104492, -5.1245036125183105, -4.824418067932129, -4.524332523345947, -4.224246978759766, -3.924161434173584, -3.6240758895874023, -3.3239903450012207, -3.023904800415039, -2.7238192558288574, -2.423733711242676, -2.123648166656494, -1.8235626220703125, -1.5234770774841309, -1.2233915328979492, -0.9233059883117676, -0.6232204437255859, -0.3231348991394043, -0.02304840087890625, 0.2770371437072754, 0.577122688293457, 0.8772082328796387, 1.1772937774658203, 1.477379322052002, 1.7774648666381836, 2.0775504112243652, 2.377635955810547, 2.6777215003967285, 2.97780704498291, 3.277892589569092, 3.5779781341552734, 3.878063678741455, 4.178149223327637, 4.478234767913818, 4.7783203125, 5.078405857086182, 5.378491401672363, 5.678576946258545, 5.978662490844727, 6.278748035430908, 6.57883358001709, 6.8789191246032715, 7.179004669189453, 7.479090213775635, 7.779175758361816, 8.079261779785156, 8.37934684753418, 8.679431915283203, 8.979517936706543, 9.279603958129883, 9.579689025878906]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 5.0, 12.0, 9.0, 15.0, 8.0, 19.0, 17.0, 27.0, 25.0, 42.0, 41.0, 44.0, 48.0, 46.0, 51.0, 61.0, 65.0, 61.0, 50.0, 40.0, 43.0, 45.0, 32.0, 35.0, 35.0, 22.0, 24.0, 12.0, 16.0, 8.0, 8.0, 9.0, 7.0, 4.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.239293098449707, -11.792688369750977, -11.346083641052246, -10.899478912353516, -10.452874183654785, -10.006269454956055, -9.55966567993164, -9.113059997558594, -8.66645622253418, -8.21985149383545, -7.773246765136719, -7.326642036437988, -6.880037307739258, -6.433432579040527, -5.986828327178955, -5.540223598480225, -5.093618392944336, -4.6470136642456055, -4.200408935546875, -3.7538044452667236, -3.307199716567993, -2.8605949878692627, -2.4139904975891113, -1.9673857688903809, -1.5207810401916504, -1.07417631149292, -0.627571702003479, -0.18096709251403809, 0.2656376361846924, 0.7122423648834229, 1.1588468551635742, 1.6054515838623047, 2.0520572662353516, 2.498661994934082, 2.9452667236328125, 3.391871213912964, 3.8384759426116943, 4.285080909729004, 4.731685161590576, 5.178289890289307, 5.624894618988037, 6.071499347686768, 6.518104076385498, 6.96470832824707, 7.411313056945801, 7.857917785644531, 8.304522514343262, 8.751127243041992, 9.197731971740723, 9.644336700439453, 10.090941429138184, 10.537546157836914, 10.984150886535645, 11.430755615234375, 11.877359390258789, 12.323965072631836, 12.77056884765625, 13.21717357635498, 13.663778305053711, 14.110383033752441, 14.556987762451172, 15.003592491149902, 15.450197219848633, 15.896800994873047, 16.343406677246094]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 12.0, 13.0, 33.0, 43.0, 66.0, 117.0, 146.0, 254.0, 364.0, 577.0, 923.0, 1468.0, 2334.0, 3707.0, 5933.0, 9193.0, 14555.0, 21856.0, 32466.0, 46700.0, 63598.0, 83384.0, 100550.0, 113351.0, 114511.0, 106211.0, 90584.0, 71216.0, 53297.0, 37811.0, 25759.0, 17051.0, 11035.0, 7054.0, 4560.0, 2854.0, 1817.0, 1192.0, 666.0, 449.0, 297.0, 194.0, 108.0, 87.0, 59.0, 45.0, 21.0, 16.0, 9.0, 10.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.6171875, -10.2874755859375, -9.957763671875, -9.6280517578125, -9.29833984375, -8.9686279296875, -8.638916015625, -8.3092041015625, -7.9794921875, -7.6497802734375, -7.320068359375, -6.9903564453125, -6.66064453125, -6.3309326171875, -6.001220703125, -5.6715087890625, -5.341796875, -5.0120849609375, -4.682373046875, -4.3526611328125, -4.02294921875, -3.6932373046875, -3.363525390625, -3.0338134765625, -2.7041015625, -2.3743896484375, -2.044677734375, -1.7149658203125, -1.38525390625, -1.0555419921875, -0.725830078125, -0.3961181640625, -0.06640625, 0.2633056640625, 0.593017578125, 0.9227294921875, 1.25244140625, 1.5821533203125, 1.911865234375, 2.2415771484375, 2.5712890625, 2.9010009765625, 3.230712890625, 3.5604248046875, 3.89013671875, 4.2198486328125, 4.549560546875, 4.8792724609375, 5.208984375, 5.5386962890625, 5.868408203125, 6.1981201171875, 6.52783203125, 6.8575439453125, 7.187255859375, 7.5169677734375, 7.8466796875, 8.1763916015625, 8.506103515625, 8.8358154296875, 9.16552734375, 9.4952392578125, 9.824951171875, 10.1546630859375, 10.484375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 6.0, 11.0, 10.0, 11.0, 10.0, 18.0, 19.0, 35.0, 34.0, 37.0, 43.0, 28.0, 68.0, 47.0, 62.0, 43.0, 71.0, 58.0, 52.0, 42.0, 33.0, 41.0, 34.0, 39.0, 27.0, 21.0, 20.0, 18.0, 9.0, 13.0, 4.0, 10.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.21875, -11.7952880859375, -11.371826171875, -10.9483642578125, -10.52490234375, -10.1014404296875, -9.677978515625, -9.2545166015625, -8.8310546875, -8.4075927734375, -7.984130859375, -7.5606689453125, -7.13720703125, -6.7137451171875, -6.290283203125, -5.8668212890625, -5.443359375, -5.0198974609375, -4.596435546875, -4.1729736328125, -3.74951171875, -3.3260498046875, -2.902587890625, -2.4791259765625, -2.0556640625, -1.6322021484375, -1.208740234375, -0.7852783203125, -0.36181640625, 0.0616455078125, 0.485107421875, 0.9085693359375, 1.33203125, 1.7554931640625, 2.178955078125, 2.6024169921875, 3.02587890625, 3.4493408203125, 3.872802734375, 4.2962646484375, 4.7197265625, 5.1431884765625, 5.566650390625, 5.9901123046875, 6.41357421875, 6.8370361328125, 7.260498046875, 7.6839599609375, 8.107421875, 8.5308837890625, 8.954345703125, 9.3778076171875, 9.80126953125, 10.2247314453125, 10.648193359375, 11.0716552734375, 11.4951171875, 11.9185791015625, 12.342041015625, 12.7655029296875, 13.18896484375, 13.6124267578125, 14.035888671875, 14.4593505859375, 14.8828125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 17.0, 24.0, 39.0, 42.0, 84.0, 131.0, 257.0, 405.0, 776.0, 1326.0, 2387.0, 4094.0, 7342.0, 12591.0, 21417.0, 35554.0, 56157.0, 82893.0, 111637.0, 133767.0, 141613.0, 128767.0, 104700.0, 75377.0, 50290.0, 31741.0, 19077.0, 11232.0, 6415.0, 3597.0, 2018.0, 1193.0, 655.0, 410.0, 215.0, 128.0, 80.0, 40.0, 28.0, 12.0, 10.0, 10.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.318359375, -11.92578125, -11.533203125, -11.140625, -10.748046875, -10.35546875, -9.962890625, -9.5703125, -9.177734375, -8.78515625, -8.392578125, -8.0, -7.607421875, -7.21484375, -6.822265625, -6.4296875, -6.037109375, -5.64453125, -5.251953125, -4.859375, -4.466796875, -4.07421875, -3.681640625, -3.2890625, -2.896484375, -2.50390625, -2.111328125, -1.71875, -1.326171875, -0.93359375, -0.541015625, -0.1484375, 0.244140625, 0.63671875, 1.029296875, 1.421875, 1.814453125, 2.20703125, 2.599609375, 2.9921875, 3.384765625, 3.77734375, 4.169921875, 4.5625, 4.955078125, 5.34765625, 5.740234375, 6.1328125, 6.525390625, 6.91796875, 7.310546875, 7.703125, 8.095703125, 8.48828125, 8.880859375, 9.2734375, 9.666015625, 10.05859375, 10.451171875, 10.84375, 11.236328125, 11.62890625, 12.021484375, 12.4140625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 2.0, 3.0, 7.0, 8.0, 11.0, 7.0, 10.0, 16.0, 25.0, 17.0, 24.0, 22.0, 29.0, 16.0, 38.0, 28.0, 27.0, 45.0, 44.0, 53.0, 49.0, 48.0, 48.0, 45.0, 41.0, 38.0, 39.0, 29.0, 31.0, 27.0, 30.0, 26.0, 23.0, 24.0, 13.0, 17.0, 11.0, 11.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7734375, -7.53350830078125, -7.2935791015625, -7.05364990234375, -6.813720703125, -6.57379150390625, -6.3338623046875, -6.09393310546875, -5.85400390625, -5.61407470703125, -5.3741455078125, -5.13421630859375, -4.894287109375, -4.65435791015625, -4.4144287109375, -4.17449951171875, -3.9345703125, -3.69464111328125, -3.4547119140625, -3.21478271484375, -2.974853515625, -2.73492431640625, -2.4949951171875, -2.25506591796875, -2.01513671875, -1.77520751953125, -1.5352783203125, -1.29534912109375, -1.055419921875, -0.81549072265625, -0.5755615234375, -0.33563232421875, -0.095703125, 0.14422607421875, 0.3841552734375, 0.62408447265625, 0.864013671875, 1.10394287109375, 1.3438720703125, 1.58380126953125, 1.82373046875, 2.06365966796875, 2.3035888671875, 2.54351806640625, 2.783447265625, 3.02337646484375, 3.2633056640625, 3.50323486328125, 3.7431640625, 3.98309326171875, 4.2230224609375, 4.46295166015625, 4.702880859375, 4.94281005859375, 5.1827392578125, 5.42266845703125, 5.66259765625, 5.90252685546875, 6.1424560546875, 6.38238525390625, 6.622314453125, 6.86224365234375, 7.1021728515625, 7.34210205078125, 7.58203125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 9.0, 6.0, 12.0, 20.0, 24.0, 42.0, 54.0, 108.0, 123.0, 183.0, 304.0, 422.0, 649.0, 957.0, 1444.0, 2200.0, 3252.0, 5262.0, 8238.0, 13234.0, 21664.0, 35509.0, 58999.0, 93196.0, 134752.0, 164233.0, 160220.0, 124302.0, 83701.0, 52074.0, 31637.0, 18998.0, 11756.0, 7397.0, 4685.0, 3044.0, 1982.0, 1233.0, 827.0, 581.0, 401.0, 238.0, 209.0, 118.0, 87.0, 62.0, 37.0, 24.0, 17.0, 10.0, 8.0, 9.0, 6.0, 4.0, 1.0, 3.0], "bins": [-7.40234375, -7.183837890625, -6.96533203125, -6.746826171875, -6.5283203125, -6.309814453125, -6.09130859375, -5.872802734375, -5.654296875, -5.435791015625, -5.21728515625, -4.998779296875, -4.7802734375, -4.561767578125, -4.34326171875, -4.124755859375, -3.90625, -3.687744140625, -3.46923828125, -3.250732421875, -3.0322265625, -2.813720703125, -2.59521484375, -2.376708984375, -2.158203125, -1.939697265625, -1.72119140625, -1.502685546875, -1.2841796875, -1.065673828125, -0.84716796875, -0.628662109375, -0.41015625, -0.191650390625, 0.02685546875, 0.245361328125, 0.4638671875, 0.682373046875, 0.90087890625, 1.119384765625, 1.337890625, 1.556396484375, 1.77490234375, 1.993408203125, 2.2119140625, 2.430419921875, 2.64892578125, 2.867431640625, 3.0859375, 3.304443359375, 3.52294921875, 3.741455078125, 3.9599609375, 4.178466796875, 4.39697265625, 4.615478515625, 4.833984375, 5.052490234375, 5.27099609375, 5.489501953125, 5.7080078125, 5.926513671875, 6.14501953125, 6.363525390625, 6.58203125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 8.0, 4.0, 9.0, 7.0, 7.0, 10.0, 17.0, 23.0, 21.0, 31.0, 28.0, 56.0, 57.0, 61.0, 61.0, 65.0, 76.0, 59.0, 58.0, 50.0, 50.0, 57.0, 37.0, 33.0, 25.0, 22.0, 13.0, 16.0, 8.0, 3.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0009527206420898438, -0.0009271800518035889, -0.000901639461517334, -0.0008760988712310791, -0.0008505582809448242, -0.0008250176906585693, -0.0007994771003723145, -0.0007739365100860596, -0.0007483959197998047, -0.0007228553295135498, -0.0006973147392272949, -0.00067177414894104, -0.0006462335586547852, -0.0006206929683685303, -0.0005951523780822754, -0.0005696117877960205, -0.0005440711975097656, -0.0005185306072235107, -0.0004929900169372559, -0.000467449426651001, -0.0004419088363647461, -0.0004163682460784912, -0.00039082765579223633, -0.00036528706550598145, -0.00033974647521972656, -0.0003142058849334717, -0.0002886652946472168, -0.0002631247043609619, -0.00023758411407470703, -0.00021204352378845215, -0.00018650293350219727, -0.00016096234321594238, -0.0001354217529296875, -0.00010988116264343262, -8.434057235717773e-05, -5.879998207092285e-05, -3.325939178466797e-05, -7.718801498413086e-06, 1.7821788787841797e-05, 4.336237907409668e-05, 6.890296936035156e-05, 9.444355964660645e-05, 0.00011998414993286133, 0.0001455247402191162, 0.0001710653305053711, 0.00019660592079162598, 0.00022214651107788086, 0.00024768710136413574, 0.0002732276916503906, 0.0002987682819366455, 0.0003243088722229004, 0.0003498494625091553, 0.00037539005279541016, 0.00040093064308166504, 0.0004264712333679199, 0.0004520118236541748, 0.0004775524139404297, 0.0005030930042266846, 0.0005286335945129395, 0.0005541741847991943, 0.0005797147750854492, 0.0006052553653717041, 0.000630795955657959, 0.0006563365459442139, 0.0006818771362304688]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 13.0, 20.0, 23.0, 33.0, 50.0, 81.0, 95.0, 173.0, 257.0, 412.0, 621.0, 1059.0, 1638.0, 2709.0, 4548.0, 7824.0, 13177.0, 22621.0, 38396.0, 64438.0, 99829.0, 138546.0, 162105.0, 155726.0, 122639.0, 83854.0, 52359.0, 30986.0, 18023.0, 10500.0, 6252.0, 3687.0, 2229.0, 1317.0, 820.0, 499.0, 315.0, 227.0, 149.0, 89.0, 67.0, 39.0, 26.0, 25.0, 20.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.23828125, -6.04205322265625, -5.8458251953125, -5.64959716796875, -5.453369140625, -5.25714111328125, -5.0609130859375, -4.86468505859375, -4.66845703125, -4.47222900390625, -4.2760009765625, -4.07977294921875, -3.883544921875, -3.68731689453125, -3.4910888671875, -3.29486083984375, -3.0986328125, -2.90240478515625, -2.7061767578125, -2.50994873046875, -2.313720703125, -2.11749267578125, -1.9212646484375, -1.72503662109375, -1.52880859375, -1.33258056640625, -1.1363525390625, -0.94012451171875, -0.743896484375, -0.54766845703125, -0.3514404296875, -0.15521240234375, 0.041015625, 0.23724365234375, 0.4334716796875, 0.62969970703125, 0.825927734375, 1.02215576171875, 1.2183837890625, 1.41461181640625, 1.61083984375, 1.80706787109375, 2.0032958984375, 2.19952392578125, 2.395751953125, 2.59197998046875, 2.7882080078125, 2.98443603515625, 3.1806640625, 3.37689208984375, 3.5731201171875, 3.76934814453125, 3.965576171875, 4.16180419921875, 4.3580322265625, 4.55426025390625, 4.75048828125, 4.94671630859375, 5.1429443359375, 5.33917236328125, 5.535400390625, 5.73162841796875, 5.9278564453125, 6.12408447265625, 6.3203125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 6.0, 4.0, 12.0, 13.0, 18.0, 11.0, 14.0, 18.0, 25.0, 35.0, 49.0, 49.0, 56.0, 65.0, 74.0, 74.0, 62.0, 74.0, 48.0, 57.0, 47.0, 37.0, 39.0, 29.0, 20.0, 14.0, 17.0, 13.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.677734375, -3.568572998046875, -3.45941162109375, -3.350250244140625, -3.2410888671875, -3.131927490234375, -3.02276611328125, -2.913604736328125, -2.804443359375, -2.695281982421875, -2.58612060546875, -2.476959228515625, -2.3677978515625, -2.258636474609375, -2.14947509765625, -2.040313720703125, -1.93115234375, -1.821990966796875, -1.71282958984375, -1.603668212890625, -1.4945068359375, -1.385345458984375, -1.27618408203125, -1.167022705078125, -1.057861328125, -0.948699951171875, -0.83953857421875, -0.730377197265625, -0.6212158203125, -0.512054443359375, -0.40289306640625, -0.293731689453125, -0.1845703125, -0.075408935546875, 0.03375244140625, 0.142913818359375, 0.2520751953125, 0.361236572265625, 0.47039794921875, 0.579559326171875, 0.688720703125, 0.797882080078125, 0.90704345703125, 1.016204833984375, 1.1253662109375, 1.234527587890625, 1.34368896484375, 1.452850341796875, 1.56201171875, 1.671173095703125, 1.78033447265625, 1.889495849609375, 1.9986572265625, 2.107818603515625, 2.21697998046875, 2.326141357421875, 2.435302734375, 2.544464111328125, 2.65362548828125, 2.762786865234375, 2.8719482421875, 2.981109619140625, 3.09027099609375, 3.199432373046875, 3.30859375]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 8.0, 3.0, 7.0, 5.0, 13.0, 7.0, 23.0, 16.0, 18.0, 22.0, 27.0, 33.0, 34.0, 43.0, 31.0, 44.0, 64.0, 55.0, 44.0, 48.0, 53.0, 37.0, 48.0, 47.0, 35.0, 35.0, 28.0, 28.0, 21.0, 15.0, 28.0, 14.0, 9.0, 9.0, 8.0, 11.0, 7.0, 8.0, 6.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.38177490234375, -10.044561386108398, -9.707348823547363, -9.370135307312012, -9.032922744750977, -8.695709228515625, -8.358495712280273, -8.021282196044922, -7.684069633483887, -7.346856594085693, -7.0096435546875, -6.672430038452148, -6.335216999053955, -5.998003959655762, -5.66079044342041, -5.323577404022217, -4.986364364624023, -4.64915132522583, -4.311938285827637, -3.974724769592285, -3.637511730194092, -3.3002986907958984, -2.963085412979126, -2.6258721351623535, -2.28865909576416, -1.9514459371566772, -1.6142327785491943, -1.2770196199417114, -0.9398064613342285, -0.6025933027267456, -0.2653801441192627, 0.07183313369750977, 0.4090461730957031, 0.746259331703186, 1.083472490310669, 1.4206856489181519, 1.7578988075256348, 2.095111846923828, 2.4323251247406006, 2.769538402557373, 3.1067514419555664, 3.4439644813537598, 3.7811777591705322, 4.118391036987305, 4.455604076385498, 4.792817115783691, 5.130030632019043, 5.467243671417236, 5.80445671081543, 6.141669750213623, 6.478882789611816, 6.816096305847168, 7.153309345245361, 7.490522384643555, 7.827735900878906, 8.164949417114258, 8.502161979675293, 8.839375495910645, 9.17658805847168, 9.513801574707031, 9.851015090942383, 10.188227653503418, 10.52544116973877, 10.862653732299805, 11.199867248535156]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 14.0, 7.0, 10.0, 13.0, 24.0, 21.0, 30.0, 44.0, 39.0, 46.0, 37.0, 46.0, 48.0, 57.0, 63.0, 55.0, 46.0, 61.0, 41.0, 43.0, 37.0, 39.0, 41.0, 26.0, 22.0, 13.0, 18.0, 17.0, 8.0, 9.0, 4.0, 6.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.638209342956543, -11.172743797302246, -10.70727825164795, -10.241812705993652, -9.776348114013672, -9.310882568359375, -8.845417022705078, -8.379951477050781, -7.914485931396484, -7.4490203857421875, -6.983554840087891, -6.518089771270752, -6.052624225616455, -5.587158679962158, -5.1216936111450195, -4.656228065490723, -4.190762519836426, -3.725296974182129, -3.259831666946411, -2.7943663597106934, -2.3289008140563965, -1.8634352684020996, -1.3979699611663818, -0.9325046539306641, -0.4670391082763672, -0.0015736818313598633, 0.46389174461364746, 0.9293571710586548, 1.394822597503662, 1.860288143157959, 2.3257534503936768, 2.7912187576293945, 3.256685256958008, 3.7221508026123047, 4.187616348266602, 4.65308141708374, 5.118546962738037, 5.584012508392334, 6.049477577209473, 6.5149431228637695, 6.980408668518066, 7.445874214172363, 7.91133975982666, 8.376805305480957, 8.842269897460938, 9.307735443115234, 9.773200988769531, 10.238666534423828, 10.704132080078125, 11.169597625732422, 11.635063171386719, 12.100528717041016, 12.565994262695312, 13.03145980834961, 13.49692440032959, 13.962389945983887, 14.427855491638184, 14.89332103729248, 15.358786582946777, 15.824252128601074, 16.289716720581055, 16.75518226623535, 17.22064781188965, 17.686113357543945, 18.151578903198242]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 4.0, 8.0, 13.0, 17.0, 46.0, 49.0, 97.0, 157.0, 282.0, 440.0, 687.0, 1232.0, 2035.0, 3203.0, 5384.0, 8626.0, 14399.0, 23600.0, 38636.0, 62647.0, 99303.0, 155246.0, 234261.0, 333423.0, 441277.0, 524464.0, 544713.0, 492475.0, 392679.0, 286472.0, 194572.0, 126271.0, 80062.0, 49701.0, 30162.0, 18511.0, 11363.0, 6852.0, 4296.0, 2624.0, 1505.0, 974.0, 561.0, 380.0, 223.0, 152.0, 71.0, 50.0, 36.0, 25.0, 6.0, 7.0, 10.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.31640625, -7.06646728515625, -6.8165283203125, -6.56658935546875, -6.316650390625, -6.06671142578125, -5.8167724609375, -5.56683349609375, -5.31689453125, -5.06695556640625, -4.8170166015625, -4.56707763671875, -4.317138671875, -4.06719970703125, -3.8172607421875, -3.56732177734375, -3.3173828125, -3.06744384765625, -2.8175048828125, -2.56756591796875, -2.317626953125, -2.06768798828125, -1.8177490234375, -1.56781005859375, -1.31787109375, -1.06793212890625, -0.8179931640625, -0.56805419921875, -0.318115234375, -0.06817626953125, 0.1817626953125, 0.43170166015625, 0.681640625, 0.93157958984375, 1.1815185546875, 1.43145751953125, 1.681396484375, 1.93133544921875, 2.1812744140625, 2.43121337890625, 2.68115234375, 2.93109130859375, 3.1810302734375, 3.43096923828125, 3.680908203125, 3.93084716796875, 4.1807861328125, 4.43072509765625, 4.6806640625, 4.93060302734375, 5.1805419921875, 5.43048095703125, 5.680419921875, 5.93035888671875, 6.1802978515625, 6.43023681640625, 6.68017578125, 6.93011474609375, 7.1800537109375, 7.42999267578125, 7.679931640625, 7.92987060546875, 8.1798095703125, 8.42974853515625, 8.6796875]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 7.0, 10.0, 15.0, 14.0, 18.0, 18.0, 26.0, 34.0, 32.0, 37.0, 43.0, 40.0, 47.0, 50.0, 45.0, 62.0, 51.0, 47.0, 44.0, 50.0, 53.0, 33.0, 44.0, 37.0, 40.0, 16.0, 15.0, 14.0, 14.0, 4.0, 16.0, 13.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.816162109375, -7.49169921875, -7.167236328125, -6.8427734375, -6.518310546875, -6.19384765625, -5.869384765625, -5.544921875, -5.220458984375, -4.89599609375, -4.571533203125, -4.2470703125, -3.922607421875, -3.59814453125, -3.273681640625, -2.94921875, -2.624755859375, -2.30029296875, -1.975830078125, -1.6513671875, -1.326904296875, -1.00244140625, -0.677978515625, -0.353515625, -0.029052734375, 0.29541015625, 0.619873046875, 0.9443359375, 1.268798828125, 1.59326171875, 1.917724609375, 2.2421875, 2.566650390625, 2.89111328125, 3.215576171875, 3.5400390625, 3.864501953125, 4.18896484375, 4.513427734375, 4.837890625, 5.162353515625, 5.48681640625, 5.811279296875, 6.1357421875, 6.460205078125, 6.78466796875, 7.109130859375, 7.43359375, 7.758056640625, 8.08251953125, 8.406982421875, 8.7314453125, 9.055908203125, 9.38037109375, 9.704833984375, 10.029296875, 10.353759765625, 10.67822265625, 11.002685546875, 11.3271484375, 11.651611328125, 11.97607421875, 12.300537109375, 12.625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 25.0, 21.0, 34.0, 40.0, 78.0, 141.0, 211.0, 321.0, 564.0, 898.0, 1480.0, 2468.0, 4041.0, 6596.0, 10704.0, 17870.0, 28455.0, 45479.0, 70730.0, 108339.0, 159678.0, 224211.0, 300867.0, 377162.0, 436527.0, 464267.0, 449175.0, 396749.0, 324058.0, 246118.0, 176251.0, 122704.0, 80635.0, 52060.0, 33076.0, 20376.0, 12415.0, 7673.0, 4697.0, 2758.0, 1694.0, 1028.0, 643.0, 354.0, 230.0, 143.0, 86.0, 58.0, 42.0, 16.0, 15.0, 7.0, 9.0, 3.0, 4.0, 3.0, 4.0], "bins": [-7.1875, -6.96734619140625, -6.7471923828125, -6.52703857421875, -6.306884765625, -6.08673095703125, -5.8665771484375, -5.64642333984375, -5.42626953125, -5.20611572265625, -4.9859619140625, -4.76580810546875, -4.545654296875, -4.32550048828125, -4.1053466796875, -3.88519287109375, -3.6650390625, -3.44488525390625, -3.2247314453125, -3.00457763671875, -2.784423828125, -2.56427001953125, -2.3441162109375, -2.12396240234375, -1.90380859375, -1.68365478515625, -1.4635009765625, -1.24334716796875, -1.023193359375, -0.80303955078125, -0.5828857421875, -0.36273193359375, -0.142578125, 0.07757568359375, 0.2977294921875, 0.51788330078125, 0.738037109375, 0.95819091796875, 1.1783447265625, 1.39849853515625, 1.61865234375, 1.83880615234375, 2.0589599609375, 2.27911376953125, 2.499267578125, 2.71942138671875, 2.9395751953125, 3.15972900390625, 3.3798828125, 3.60003662109375, 3.8201904296875, 4.04034423828125, 4.260498046875, 4.48065185546875, 4.7008056640625, 4.92095947265625, 5.14111328125, 5.36126708984375, 5.5814208984375, 5.80157470703125, 6.021728515625, 6.24188232421875, 6.4620361328125, 6.68218994140625, 6.90234375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 20.0, 15.0, 26.0, 30.0, 31.0, 48.0, 66.0, 77.0, 71.0, 109.0, 130.0, 114.0, 149.0, 151.0, 197.0, 182.0, 205.0, 205.0, 193.0, 217.0, 217.0, 199.0, 193.0, 167.0, 165.0, 129.0, 121.0, 104.0, 99.0, 69.0, 83.0, 50.0, 47.0, 33.0, 30.0, 27.0, 24.0, 26.0, 14.0, 9.0, 8.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.77734375, -3.657989501953125, -3.53863525390625, -3.419281005859375, -3.2999267578125, -3.180572509765625, -3.06121826171875, -2.941864013671875, -2.822509765625, -2.703155517578125, -2.58380126953125, -2.464447021484375, -2.3450927734375, -2.225738525390625, -2.10638427734375, -1.987030029296875, -1.86767578125, -1.748321533203125, -1.62896728515625, -1.509613037109375, -1.3902587890625, -1.270904541015625, -1.15155029296875, -1.032196044921875, -0.912841796875, -0.793487548828125, -0.67413330078125, -0.554779052734375, -0.4354248046875, -0.316070556640625, -0.19671630859375, -0.077362060546875, 0.0419921875, 0.161346435546875, 0.28070068359375, 0.400054931640625, 0.5194091796875, 0.638763427734375, 0.75811767578125, 0.877471923828125, 0.996826171875, 1.116180419921875, 1.23553466796875, 1.354888916015625, 1.4742431640625, 1.593597412109375, 1.71295166015625, 1.832305908203125, 1.95166015625, 2.071014404296875, 2.19036865234375, 2.309722900390625, 2.4290771484375, 2.548431396484375, 2.66778564453125, 2.787139892578125, 2.906494140625, 3.025848388671875, 3.14520263671875, 3.264556884765625, 3.3839111328125, 3.503265380859375, 3.62261962890625, 3.741973876953125, 3.861328125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 6.0, 9.0, 9.0, 11.0, 13.0, 17.0, 15.0, 24.0, 23.0, 34.0, 30.0, 35.0, 45.0, 57.0, 43.0, 43.0, 45.0, 69.0, 53.0, 49.0, 48.0, 47.0, 37.0, 42.0, 27.0, 18.0, 21.0, 24.0, 24.0, 17.0, 12.0, 11.0, 8.0, 5.0, 7.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.858404159545898, -8.545279502868652, -8.23215389251709, -7.919029235839844, -7.6059041023254395, -7.292778968811035, -6.979654312133789, -6.666529178619385, -6.3534040451049805, -6.040278911590576, -5.72715425491333, -5.414029121398926, -5.1009039878845215, -4.787778854370117, -4.474654197692871, -4.161529064178467, -3.8484044075012207, -3.5352795124053955, -3.222154378890991, -2.909029483795166, -2.5959043502807617, -2.2827794551849365, -1.9696545600891113, -1.656529426574707, -1.3434045314788818, -1.030279517173767, -0.7171545624732971, -0.40402960777282715, -0.0909045934677124, 0.22222042083740234, 0.5353453159332275, 0.8484704494476318, 1.161595344543457, 1.4747203588485718, 1.7878453731536865, 2.1009702682495117, 2.414095401763916, 2.727220296859741, 3.0403451919555664, 3.3534703254699707, 3.666595220565796, 3.979720115661621, 4.292845249176025, 4.60597038269043, 4.919095039367676, 5.23222017288208, 5.545345306396484, 5.8584699630737305, 6.171595096588135, 6.484720230102539, 6.797844886779785, 7.1109700202941895, 7.424095153808594, 7.73721981048584, 8.050344467163086, 8.363470077514648, 8.676594734191895, 8.98971939086914, 9.302845001220703, 9.61596965789795, 9.929094314575195, 10.242219924926758, 10.555344581604004, 10.86846923828125, 11.181594848632812]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 10.0, 9.0, 8.0, 10.0, 17.0, 14.0, 19.0, 22.0, 26.0, 28.0, 30.0, 41.0, 44.0, 42.0, 47.0, 46.0, 42.0, 38.0, 58.0, 46.0, 41.0, 53.0, 40.0, 39.0, 25.0, 41.0, 23.0, 30.0, 16.0, 13.0, 21.0, 19.0, 11.0, 14.0, 5.0, 3.0, 5.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.961770057678223, -8.617195129394531, -8.272619247436523, -7.928044319152832, -7.583468914031982, -7.238893508911133, -6.894318580627441, -6.549743175506592, -6.205167770385742, -5.860592365264893, -5.516016960144043, -5.171442031860352, -4.826866626739502, -4.482291221618652, -4.137716293334961, -3.7931408882141113, -3.4485654830932617, -3.103990077972412, -2.7594149112701416, -2.414839744567871, -2.0702643394470215, -1.7256890535354614, -1.3811137676239014, -1.0365386009216309, -0.6919631958007812, -0.3473879098892212, -0.002812623977661133, 0.3417626619338989, 0.686337947845459, 1.030913233757019, 1.375488519668579, 1.7200636863708496, 2.064639091491699, 2.409214496612549, 2.7537896633148193, 3.09836483001709, 3.4429402351379395, 3.787515640258789, 4.1320905685424805, 4.47666597366333, 4.82124137878418, 5.165816783905029, 5.510392189025879, 5.85496711730957, 6.19954252243042, 6.5441179275512695, 6.888692855834961, 7.2332682609558105, 7.57784366607666, 7.92241907119751, 8.26699447631836, 8.61156940460205, 8.956144332885742, 9.30072021484375, 9.645295143127441, 9.989870071411133, 10.33444595336914, 10.679020881652832, 11.02359676361084, 11.368171691894531, 11.712747573852539, 12.05732250213623, 12.401897430419922, 12.74647331237793, 13.091048240661621]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 2.0, 6.0, 10.0, 12.0, 22.0, 22.0, 32.0, 51.0, 61.0, 81.0, 130.0, 178.0, 290.0, 403.0, 585.0, 883.0, 1390.0, 2418.0, 4335.0, 8807.0, 21285.0, 56844.0, 161041.0, 384397.0, 255194.0, 90352.0, 32662.0, 12998.0, 5823.0, 3185.0, 1786.0, 1035.0, 688.0, 428.0, 332.0, 244.0, 142.0, 121.0, 83.0, 57.0, 42.0, 30.0, 24.0, 21.0, 8.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.8515625, -11.4658203125, -11.080078125, -10.6943359375, -10.30859375, -9.9228515625, -9.537109375, -9.1513671875, -8.765625, -8.3798828125, -7.994140625, -7.6083984375, -7.22265625, -6.8369140625, -6.451171875, -6.0654296875, -5.6796875, -5.2939453125, -4.908203125, -4.5224609375, -4.13671875, -3.7509765625, -3.365234375, -2.9794921875, -2.59375, -2.2080078125, -1.822265625, -1.4365234375, -1.05078125, -0.6650390625, -0.279296875, 0.1064453125, 0.4921875, 0.8779296875, 1.263671875, 1.6494140625, 2.03515625, 2.4208984375, 2.806640625, 3.1923828125, 3.578125, 3.9638671875, 4.349609375, 4.7353515625, 5.12109375, 5.5068359375, 5.892578125, 6.2783203125, 6.6640625, 7.0498046875, 7.435546875, 7.8212890625, 8.20703125, 8.5927734375, 8.978515625, 9.3642578125, 9.75, 10.1357421875, 10.521484375, 10.9072265625, 11.29296875, 11.6787109375, 12.064453125, 12.4501953125, 12.8359375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 4.0, 18.0, 12.0, 14.0, 25.0, 24.0, 24.0, 28.0, 34.0, 28.0, 36.0, 41.0, 40.0, 46.0, 50.0, 44.0, 47.0, 39.0, 49.0, 49.0, 45.0, 37.0, 30.0, 42.0, 25.0, 24.0, 25.0, 18.0, 12.0, 17.0, 11.0, 13.0, 5.0, 11.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.984375, -8.6396484375, -8.294921875, -7.9501953125, -7.60546875, -7.2607421875, -6.916015625, -6.5712890625, -6.2265625, -5.8818359375, -5.537109375, -5.1923828125, -4.84765625, -4.5029296875, -4.158203125, -3.8134765625, -3.46875, -3.1240234375, -2.779296875, -2.4345703125, -2.08984375, -1.7451171875, -1.400390625, -1.0556640625, -0.7109375, -0.3662109375, -0.021484375, 0.3232421875, 0.66796875, 1.0126953125, 1.357421875, 1.7021484375, 2.046875, 2.3916015625, 2.736328125, 3.0810546875, 3.42578125, 3.7705078125, 4.115234375, 4.4599609375, 4.8046875, 5.1494140625, 5.494140625, 5.8388671875, 6.18359375, 6.5283203125, 6.873046875, 7.2177734375, 7.5625, 7.9072265625, 8.251953125, 8.5966796875, 8.94140625, 9.2861328125, 9.630859375, 9.9755859375, 10.3203125, 10.6650390625, 11.009765625, 11.3544921875, 11.69921875, 12.0439453125, 12.388671875, 12.7333984375, 13.078125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 8.0, 12.0, 11.0, 19.0, 24.0, 29.0, 38.0, 66.0, 85.0, 130.0, 228.0, 338.0, 468.0, 780.0, 1280.0, 2254.0, 4042.0, 7730.0, 16264.0, 37605.0, 98257.0, 264041.0, 358920.0, 152637.0, 56732.0, 23219.0, 10576.0, 5400.0, 2954.0, 1638.0, 936.0, 603.0, 389.0, 266.0, 170.0, 109.0, 76.0, 50.0, 42.0, 48.0, 23.0, 16.0, 13.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6015625, -8.3345947265625, -8.067626953125, -7.8006591796875, -7.53369140625, -7.2667236328125, -6.999755859375, -6.7327880859375, -6.4658203125, -6.1988525390625, -5.931884765625, -5.6649169921875, -5.39794921875, -5.1309814453125, -4.864013671875, -4.5970458984375, -4.330078125, -4.0631103515625, -3.796142578125, -3.5291748046875, -3.26220703125, -2.9952392578125, -2.728271484375, -2.4613037109375, -2.1943359375, -1.9273681640625, -1.660400390625, -1.3934326171875, -1.12646484375, -0.8594970703125, -0.592529296875, -0.3255615234375, -0.05859375, 0.2083740234375, 0.475341796875, 0.7423095703125, 1.00927734375, 1.2762451171875, 1.543212890625, 1.8101806640625, 2.0771484375, 2.3441162109375, 2.611083984375, 2.8780517578125, 3.14501953125, 3.4119873046875, 3.678955078125, 3.9459228515625, 4.212890625, 4.4798583984375, 4.746826171875, 5.0137939453125, 5.28076171875, 5.5477294921875, 5.814697265625, 6.0816650390625, 6.3486328125, 6.6156005859375, 6.882568359375, 7.1495361328125, 7.41650390625, 7.6834716796875, 7.950439453125, 8.2174072265625, 8.484375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 14.0, 5.0, 11.0, 19.0, 25.0, 16.0, 24.0, 21.0, 27.0, 32.0, 32.0, 30.0, 30.0, 45.0, 29.0, 39.0, 37.0, 53.0, 41.0, 36.0, 33.0, 32.0, 39.0, 41.0, 28.0, 37.0, 25.0, 26.0, 20.0, 22.0, 18.0, 17.0, 14.0, 12.0, 10.0, 7.0, 10.0, 10.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.12890625, -6.906005859375, -6.68310546875, -6.460205078125, -6.2373046875, -6.014404296875, -5.79150390625, -5.568603515625, -5.345703125, -5.122802734375, -4.89990234375, -4.677001953125, -4.4541015625, -4.231201171875, -4.00830078125, -3.785400390625, -3.5625, -3.339599609375, -3.11669921875, -2.893798828125, -2.6708984375, -2.447998046875, -2.22509765625, -2.002197265625, -1.779296875, -1.556396484375, -1.33349609375, -1.110595703125, -0.8876953125, -0.664794921875, -0.44189453125, -0.218994140625, 0.00390625, 0.226806640625, 0.44970703125, 0.672607421875, 0.8955078125, 1.118408203125, 1.34130859375, 1.564208984375, 1.787109375, 2.010009765625, 2.23291015625, 2.455810546875, 2.6787109375, 2.901611328125, 3.12451171875, 3.347412109375, 3.5703125, 3.793212890625, 4.01611328125, 4.239013671875, 4.4619140625, 4.684814453125, 4.90771484375, 5.130615234375, 5.353515625, 5.576416015625, 5.79931640625, 6.022216796875, 6.2451171875, 6.468017578125, 6.69091796875, 6.913818359375, 7.13671875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 5.0, 15.0, 24.0, 23.0, 42.0, 54.0, 79.0, 131.0, 196.0, 311.0, 556.0, 832.0, 1541.0, 3095.0, 6617.0, 18889.0, 115308.0, 810942.0, 63935.0, 14355.0, 5603.0, 2555.0, 1333.0, 821.0, 445.0, 258.0, 190.0, 131.0, 89.0, 44.0, 39.0, 29.0, 18.0, 10.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.828125, -10.51318359375, -10.1982421875, -9.88330078125, -9.568359375, -9.25341796875, -8.9384765625, -8.62353515625, -8.30859375, -7.99365234375, -7.6787109375, -7.36376953125, -7.048828125, -6.73388671875, -6.4189453125, -6.10400390625, -5.7890625, -5.47412109375, -5.1591796875, -4.84423828125, -4.529296875, -4.21435546875, -3.8994140625, -3.58447265625, -3.26953125, -2.95458984375, -2.6396484375, -2.32470703125, -2.009765625, -1.69482421875, -1.3798828125, -1.06494140625, -0.75, -0.43505859375, -0.1201171875, 0.19482421875, 0.509765625, 0.82470703125, 1.1396484375, 1.45458984375, 1.76953125, 2.08447265625, 2.3994140625, 2.71435546875, 3.029296875, 3.34423828125, 3.6591796875, 3.97412109375, 4.2890625, 4.60400390625, 4.9189453125, 5.23388671875, 5.548828125, 5.86376953125, 6.1787109375, 6.49365234375, 6.80859375, 7.12353515625, 7.4384765625, 7.75341796875, 8.068359375, 8.38330078125, 8.6982421875, 9.01318359375, 9.328125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 4.0, 8.0, 12.0, 20.0, 17.0, 26.0, 39.0, 58.0, 89.0, 156.0, 183.0, 144.0, 72.0, 58.0, 28.0, 19.0, 10.0, 12.0, 7.0, 8.0, 9.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006003379821777344, -0.000581204891204834, -0.0005620718002319336, -0.0005429387092590332, -0.0005238056182861328, -0.0005046725273132324, -0.00048553943634033203, -0.00046640634536743164, -0.00044727325439453125, -0.00042814016342163086, -0.00040900707244873047, -0.0003898739814758301, -0.0003707408905029297, -0.0003516077995300293, -0.0003324747085571289, -0.0003133416175842285, -0.0002942085266113281, -0.00027507543563842773, -0.00025594234466552734, -0.00023680925369262695, -0.00021767616271972656, -0.00019854307174682617, -0.00017940998077392578, -0.0001602768898010254, -0.000141143798828125, -0.00012201070785522461, -0.00010287761688232422, -8.374452590942383e-05, -6.461143493652344e-05, -4.547834396362305e-05, -2.6345252990722656e-05, -7.212162017822266e-06, 1.1920928955078125e-05, 3.1054019927978516e-05, 5.0187110900878906e-05, 6.93202018737793e-05, 8.845329284667969e-05, 0.00010758638381958008, 0.00012671947479248047, 0.00014585256576538086, 0.00016498565673828125, 0.00018411874771118164, 0.00020325183868408203, 0.00022238492965698242, 0.0002415180206298828, 0.0002606511116027832, 0.0002797842025756836, 0.000298917293548584, 0.0003180503845214844, 0.00033718347549438477, 0.00035631656646728516, 0.00037544965744018555, 0.00039458274841308594, 0.00041371583938598633, 0.0004328489303588867, 0.0004519820213317871, 0.0004711151123046875, 0.0004902482032775879, 0.0005093812942504883, 0.0005285143852233887, 0.0005476474761962891, 0.0005667805671691895, 0.0005859136581420898, 0.0006050467491149902, 0.0006241798400878906]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 21.0, 15.0, 26.0, 51.0, 53.0, 88.0, 116.0, 194.0, 308.0, 451.0, 690.0, 1051.0, 1693.0, 2837.0, 4944.0, 9323.0, 22372.0, 84488.0, 450347.0, 362685.0, 67697.0, 19090.0, 8424.0, 4470.0, 2555.0, 1589.0, 994.0, 671.0, 432.0, 297.0, 193.0, 113.0, 92.0, 57.0, 48.0, 23.0, 16.0, 10.0, 7.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.59375, -8.3245849609375, -8.055419921875, -7.7862548828125, -7.51708984375, -7.2479248046875, -6.978759765625, -6.7095947265625, -6.4404296875, -6.1712646484375, -5.902099609375, -5.6329345703125, -5.36376953125, -5.0946044921875, -4.825439453125, -4.5562744140625, -4.287109375, -4.0179443359375, -3.748779296875, -3.4796142578125, -3.21044921875, -2.9412841796875, -2.672119140625, -2.4029541015625, -2.1337890625, -1.8646240234375, -1.595458984375, -1.3262939453125, -1.05712890625, -0.7879638671875, -0.518798828125, -0.2496337890625, 0.01953125, 0.2886962890625, 0.557861328125, 0.8270263671875, 1.09619140625, 1.3653564453125, 1.634521484375, 1.9036865234375, 2.1728515625, 2.4420166015625, 2.711181640625, 2.9803466796875, 3.24951171875, 3.5186767578125, 3.787841796875, 4.0570068359375, 4.326171875, 4.5953369140625, 4.864501953125, 5.1336669921875, 5.40283203125, 5.6719970703125, 5.941162109375, 6.2103271484375, 6.4794921875, 6.7486572265625, 7.017822265625, 7.2869873046875, 7.55615234375, 7.8253173828125, 8.094482421875, 8.3636474609375, 8.6328125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 7.0, 4.0, 9.0, 7.0, 8.0, 10.0, 11.0, 12.0, 13.0, 13.0, 35.0, 30.0, 46.0, 48.0, 65.0, 87.0, 93.0, 113.0, 72.0, 63.0, 45.0, 40.0, 30.0, 21.0, 23.0, 13.0, 14.0, 10.0, 11.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.4814453125, -1.4377288818359375, -1.394012451171875, -1.3502960205078125, -1.30657958984375, -1.2628631591796875, -1.219146728515625, -1.1754302978515625, -1.1317138671875, -1.0879974365234375, -1.044281005859375, -1.0005645751953125, -0.95684814453125, -0.9131317138671875, -0.869415283203125, -0.8256988525390625, -0.781982421875, -0.7382659912109375, -0.694549560546875, -0.6508331298828125, -0.60711669921875, -0.5634002685546875, -0.519683837890625, -0.4759674072265625, -0.4322509765625, -0.3885345458984375, -0.344818115234375, -0.3011016845703125, -0.25738525390625, -0.2136688232421875, -0.169952392578125, -0.1262359619140625, -0.08251953125, -0.0388031005859375, 0.004913330078125, 0.0486297607421875, 0.09234619140625, 0.1360626220703125, 0.179779052734375, 0.2234954833984375, 0.2672119140625, 0.3109283447265625, 0.354644775390625, 0.3983612060546875, 0.44207763671875, 0.4857940673828125, 0.529510498046875, 0.5732269287109375, 0.616943359375, 0.6606597900390625, 0.704376220703125, 0.7480926513671875, 0.79180908203125, 0.8355255126953125, 0.879241943359375, 0.9229583740234375, 0.9666748046875, 1.0103912353515625, 1.054107666015625, 1.0978240966796875, 1.14154052734375, 1.1852569580078125, 1.228973388671875, 1.2726898193359375, 1.31640625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 11.0, 10.0, 6.0, 5.0, 16.0, 16.0, 22.0, 21.0, 31.0, 27.0, 32.0, 31.0, 34.0, 35.0, 57.0, 47.0, 45.0, 40.0, 49.0, 44.0, 41.0, 50.0, 40.0, 38.0, 41.0, 30.0, 19.0, 22.0, 25.0, 18.0, 18.0, 19.0, 8.0, 10.0, 4.0, 11.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-9.701379776000977, -9.41422176361084, -9.127063751220703, -8.839905738830566, -8.55274772644043, -8.265588760375977, -7.97843074798584, -7.691272735595703, -7.404114723205566, -7.11695671081543, -6.829798698425293, -6.542640209197998, -6.255482196807861, -5.968324184417725, -5.68116569519043, -5.394007682800293, -5.106849670410156, -4.8196916580200195, -4.532533645629883, -4.245375156402588, -3.958217144012451, -3.6710591316223145, -3.3839008808135986, -3.096742630004883, -2.809584617614746, -2.5224266052246094, -2.2352683544158936, -1.9481102228164673, -1.660952091217041, -1.3737939596176147, -1.0866358280181885, -0.7994775772094727, -0.5123205184936523, -0.22516238689422607, 0.061995744705200195, 0.34915387630462646, 0.6363120079040527, 0.923470139503479, 1.2106282711029053, 1.497786521911621, 1.7849445343017578, 2.0721025466918945, 2.3592607975006104, 2.646419048309326, 2.933577060699463, 3.2207350730895996, 3.5078933238983154, 3.7950515747070312, 4.082209587097168, 4.369367599487305, 4.656525611877441, 4.943684101104736, 5.230842113494873, 5.51800012588501, 5.805158615112305, 6.092316627502441, 6.379474639892578, 6.666632652282715, 6.953790664672852, 7.2409491539001465, 7.528107166290283, 7.81526517868042, 8.102423667907715, 8.389581680297852, 8.676739692687988]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 14.0, 5.0, 9.0, 11.0, 20.0, 14.0, 23.0, 33.0, 26.0, 27.0, 40.0, 33.0, 32.0, 39.0, 55.0, 42.0, 47.0, 40.0, 46.0, 37.0, 53.0, 39.0, 45.0, 32.0, 32.0, 29.0, 34.0, 20.0, 19.0, 19.0, 13.0, 20.0, 10.0, 8.0, 12.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.495927810668945, -8.164344787597656, -7.832762241363525, -7.5011796951293945, -7.1695966720581055, -6.838013648986816, -6.5064311027526855, -6.174848556518555, -5.843265533447266, -5.511682510375977, -5.180099964141846, -4.848517417907715, -4.516934394836426, -4.185351371765137, -3.853768825531006, -3.522186040878296, -3.190603256225586, -2.859020471572876, -2.527437686920166, -2.195854902267456, -1.864272117614746, -1.5326893329620361, -1.2011065483093262, -0.8695237636566162, -0.5379409790039062, -0.2063581943511963, 0.12522459030151367, 0.45680737495422363, 0.7883901596069336, 1.1199729442596436, 1.4515557289123535, 1.7831385135650635, 2.1147212982177734, 2.4463040828704834, 2.7778868675231934, 3.1094696521759033, 3.4410524368286133, 3.7726352214813232, 4.104218006134033, 4.435800552368164, 4.767383575439453, 5.098966598510742, 5.430549144744873, 5.762131690979004, 6.093714714050293, 6.425297737121582, 6.756880283355713, 7.088462829589844, 7.420045852661133, 7.751628875732422, 8.083211898803711, 8.414793968200684, 8.746376991271973, 9.077960014343262, 9.409542083740234, 9.741125106811523, 10.072708129882812, 10.404291152954102, 10.73587417602539, 11.067456245422363, 11.399039268493652, 11.730622291564941, 12.062204360961914, 12.393787384033203, 12.725370407104492]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 8.0, 4.0, 10.0, 16.0, 19.0, 28.0, 45.0, 51.0, 94.0, 155.0, 186.0, 328.0, 603.0, 910.0, 1389.0, 2283.0, 3726.0, 6290.0, 10278.0, 16972.0, 27046.0, 42172.0, 62173.0, 86441.0, 110316.0, 127765.0, 130519.0, 119022.0, 95964.0, 71142.0, 48442.0, 31897.0, 20206.0, 12350.0, 7654.0, 4582.0, 2783.0, 1731.0, 1085.0, 709.0, 415.0, 274.0, 169.0, 103.0, 68.0, 58.0, 30.0, 15.0, 13.0, 12.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-11.3671875, -11.024658203125, -10.68212890625, -10.339599609375, -9.9970703125, -9.654541015625, -9.31201171875, -8.969482421875, -8.626953125, -8.284423828125, -7.94189453125, -7.599365234375, -7.2568359375, -6.914306640625, -6.57177734375, -6.229248046875, -5.88671875, -5.544189453125, -5.20166015625, -4.859130859375, -4.5166015625, -4.174072265625, -3.83154296875, -3.489013671875, -3.146484375, -2.803955078125, -2.46142578125, -2.118896484375, -1.7763671875, -1.433837890625, -1.09130859375, -0.748779296875, -0.40625, -0.063720703125, 0.27880859375, 0.621337890625, 0.9638671875, 1.306396484375, 1.64892578125, 1.991455078125, 2.333984375, 2.676513671875, 3.01904296875, 3.361572265625, 3.7041015625, 4.046630859375, 4.38916015625, 4.731689453125, 5.07421875, 5.416748046875, 5.75927734375, 6.101806640625, 6.4443359375, 6.786865234375, 7.12939453125, 7.471923828125, 7.814453125, 8.156982421875, 8.49951171875, 8.842041015625, 9.1845703125, 9.527099609375, 9.86962890625, 10.212158203125, 10.5546875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 2.0, 6.0, 5.0, 8.0, 5.0, 19.0, 17.0, 21.0, 19.0, 25.0, 32.0, 25.0, 29.0, 37.0, 46.0, 42.0, 36.0, 53.0, 53.0, 54.0, 35.0, 47.0, 49.0, 36.0, 41.0, 46.0, 33.0, 33.0, 19.0, 22.0, 19.0, 22.0, 18.0, 11.0, 5.0, 7.0, 9.0, 3.0, 5.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.283447265625, -7.95751953125, -7.631591796875, -7.3056640625, -6.979736328125, -6.65380859375, -6.327880859375, -6.001953125, -5.676025390625, -5.35009765625, -5.024169921875, -4.6982421875, -4.372314453125, -4.04638671875, -3.720458984375, -3.39453125, -3.068603515625, -2.74267578125, -2.416748046875, -2.0908203125, -1.764892578125, -1.43896484375, -1.113037109375, -0.787109375, -0.461181640625, -0.13525390625, 0.190673828125, 0.5166015625, 0.842529296875, 1.16845703125, 1.494384765625, 1.8203125, 2.146240234375, 2.47216796875, 2.798095703125, 3.1240234375, 3.449951171875, 3.77587890625, 4.101806640625, 4.427734375, 4.753662109375, 5.07958984375, 5.405517578125, 5.7314453125, 6.057373046875, 6.38330078125, 6.709228515625, 7.03515625, 7.361083984375, 7.68701171875, 8.012939453125, 8.3388671875, 8.664794921875, 8.99072265625, 9.316650390625, 9.642578125, 9.968505859375, 10.29443359375, 10.620361328125, 10.9462890625, 11.272216796875, 11.59814453125, 11.924072265625, 12.25]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 2.0, 13.0, 19.0, 31.0, 32.0, 58.0, 107.0, 145.0, 258.0, 401.0, 629.0, 983.0, 1510.0, 2393.0, 3785.0, 5933.0, 9192.0, 13990.0, 21164.0, 30590.0, 43234.0, 59096.0, 77223.0, 93853.0, 107476.0, 112119.0, 107228.0, 92801.0, 76271.0, 57835.0, 42534.0, 29378.0, 20206.0, 13521.0, 8757.0, 5711.0, 3726.0, 2296.0, 1467.0, 917.0, 605.0, 386.0, 228.0, 165.0, 85.0, 59.0, 48.0, 38.0, 16.0, 14.0, 9.0, 5.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.4296875, -8.1617431640625, -7.893798828125, -7.6258544921875, -7.35791015625, -7.0899658203125, -6.822021484375, -6.5540771484375, -6.2861328125, -6.0181884765625, -5.750244140625, -5.4822998046875, -5.21435546875, -4.9464111328125, -4.678466796875, -4.4105224609375, -4.142578125, -3.8746337890625, -3.606689453125, -3.3387451171875, -3.07080078125, -2.8028564453125, -2.534912109375, -2.2669677734375, -1.9990234375, -1.7310791015625, -1.463134765625, -1.1951904296875, -0.92724609375, -0.6593017578125, -0.391357421875, -0.1234130859375, 0.14453125, 0.4124755859375, 0.680419921875, 0.9483642578125, 1.21630859375, 1.4842529296875, 1.752197265625, 2.0201416015625, 2.2880859375, 2.5560302734375, 2.823974609375, 3.0919189453125, 3.35986328125, 3.6278076171875, 3.895751953125, 4.1636962890625, 4.431640625, 4.6995849609375, 4.967529296875, 5.2354736328125, 5.50341796875, 5.7713623046875, 6.039306640625, 6.3072509765625, 6.5751953125, 6.8431396484375, 7.111083984375, 7.3790283203125, 7.64697265625, 7.9149169921875, 8.182861328125, 8.4508056640625, 8.71875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 9.0, 8.0, 12.0, 5.0, 7.0, 17.0, 15.0, 20.0, 30.0, 35.0, 37.0, 31.0, 37.0, 38.0, 45.0, 55.0, 36.0, 38.0, 45.0, 47.0, 44.0, 35.0, 32.0, 31.0, 39.0, 31.0, 33.0, 21.0, 28.0, 21.0, 19.0, 22.0, 12.0, 18.0, 13.0, 13.0, 5.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.24822998046875, -6.0394287109375, -5.83062744140625, -5.621826171875, -5.41302490234375, -5.2042236328125, -4.99542236328125, -4.78662109375, -4.57781982421875, -4.3690185546875, -4.16021728515625, -3.951416015625, -3.74261474609375, -3.5338134765625, -3.32501220703125, -3.1162109375, -2.90740966796875, -2.6986083984375, -2.48980712890625, -2.281005859375, -2.07220458984375, -1.8634033203125, -1.65460205078125, -1.44580078125, -1.23699951171875, -1.0281982421875, -0.81939697265625, -0.610595703125, -0.40179443359375, -0.1929931640625, 0.01580810546875, 0.224609375, 0.43341064453125, 0.6422119140625, 0.85101318359375, 1.059814453125, 1.26861572265625, 1.4774169921875, 1.68621826171875, 1.89501953125, 2.10382080078125, 2.3126220703125, 2.52142333984375, 2.730224609375, 2.93902587890625, 3.1478271484375, 3.35662841796875, 3.5654296875, 3.77423095703125, 3.9830322265625, 4.19183349609375, 4.400634765625, 4.60943603515625, 4.8182373046875, 5.02703857421875, 5.23583984375, 5.44464111328125, 5.6534423828125, 5.86224365234375, 6.071044921875, 6.27984619140625, 6.4886474609375, 6.69744873046875, 6.90625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 9.0, 23.0, 17.0, 24.0, 25.0, 51.0, 59.0, 105.0, 156.0, 223.0, 324.0, 469.0, 776.0, 1097.0, 1925.0, 2943.0, 4640.0, 8086.0, 14038.0, 25027.0, 45142.0, 80563.0, 135012.0, 188181.0, 193099.0, 143458.0, 88275.0, 49579.0, 27325.0, 15376.0, 8716.0, 5144.0, 3193.0, 1894.0, 1176.0, 764.0, 485.0, 337.0, 257.0, 182.0, 121.0, 77.0, 42.0, 52.0, 29.0, 17.0, 11.0, 5.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0], "bins": [-8.6875, -8.43255615234375, -8.1776123046875, -7.92266845703125, -7.667724609375, -7.41278076171875, -7.1578369140625, -6.90289306640625, -6.64794921875, -6.39300537109375, -6.1380615234375, -5.88311767578125, -5.628173828125, -5.37322998046875, -5.1182861328125, -4.86334228515625, -4.6083984375, -4.35345458984375, -4.0985107421875, -3.84356689453125, -3.588623046875, -3.33367919921875, -3.0787353515625, -2.82379150390625, -2.56884765625, -2.31390380859375, -2.0589599609375, -1.80401611328125, -1.549072265625, -1.29412841796875, -1.0391845703125, -0.78424072265625, -0.529296875, -0.27435302734375, -0.0194091796875, 0.23553466796875, 0.490478515625, 0.74542236328125, 1.0003662109375, 1.25531005859375, 1.51025390625, 1.76519775390625, 2.0201416015625, 2.27508544921875, 2.530029296875, 2.78497314453125, 3.0399169921875, 3.29486083984375, 3.5498046875, 3.80474853515625, 4.0596923828125, 4.31463623046875, 4.569580078125, 4.82452392578125, 5.0794677734375, 5.33441162109375, 5.58935546875, 5.84429931640625, 6.0992431640625, 6.35418701171875, 6.609130859375, 6.86407470703125, 7.1190185546875, 7.37396240234375, 7.62890625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 4.0, 10.0, 17.0, 13.0, 20.0, 36.0, 47.0, 48.0, 51.0, 76.0, 75.0, 80.0, 89.0, 81.0, 69.0, 58.0, 45.0, 42.0, 28.0, 25.0, 17.0, 11.0, 10.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011587142944335938, -0.001127198338508606, -0.0010956823825836182, -0.0010641664266586304, -0.0010326504707336426, -0.0010011345148086548, -0.000969618558883667, -0.0009381026029586792, -0.0009065866470336914, -0.0008750706911087036, -0.0008435547351837158, -0.000812038779258728, -0.0007805228233337402, -0.0007490068674087524, -0.0007174909114837646, -0.0006859749555587769, -0.0006544589996337891, -0.0006229430437088013, -0.0005914270877838135, -0.0005599111318588257, -0.0005283951759338379, -0.0004968792200088501, -0.0004653632640838623, -0.0004338473081588745, -0.0004023313522338867, -0.0003708153963088989, -0.00033929944038391113, -0.00030778348445892334, -0.00027626752853393555, -0.00024475157260894775, -0.00021323561668395996, -0.00018171966075897217, -0.00015020370483398438, -0.00011868774890899658, -8.717179298400879e-05, -5.5655837059020996e-05, -2.4139881134033203e-05, 7.37607479095459e-06, 3.889203071594238e-05, 7.040798664093018e-05, 0.00010192394256591797, 0.00013343989849090576, 0.00016495585441589355, 0.00019647181034088135, 0.00022798776626586914, 0.00025950372219085693, 0.0002910196781158447, 0.0003225356340408325, 0.0003540515899658203, 0.0003855675458908081, 0.0004170835018157959, 0.0004485994577407837, 0.0004801154136657715, 0.0005116313695907593, 0.0005431473255157471, 0.0005746632814407349, 0.0006061792373657227, 0.0006376951932907104, 0.0006692111492156982, 0.000700727105140686, 0.0007322430610656738, 0.0007637590169906616, 0.0007952749729156494, 0.0008267909288406372, 0.000858306884765625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 9.0, 9.0, 14.0, 29.0, 31.0, 54.0, 89.0, 119.0, 211.0, 288.0, 516.0, 734.0, 1401.0, 2111.0, 3578.0, 6051.0, 10185.0, 17533.0, 31027.0, 54904.0, 93430.0, 145371.0, 183947.0, 175878.0, 130090.0, 81238.0, 46826.0, 26179.0, 14799.0, 8827.0, 5165.0, 3068.0, 1827.0, 1140.0, 656.0, 455.0, 260.0, 208.0, 116.0, 65.0, 50.0, 28.0, 23.0, 9.0, 4.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33984375, -7.10943603515625, -6.8790283203125, -6.64862060546875, -6.418212890625, -6.18780517578125, -5.9573974609375, -5.72698974609375, -5.49658203125, -5.26617431640625, -5.0357666015625, -4.80535888671875, -4.574951171875, -4.34454345703125, -4.1141357421875, -3.88372802734375, -3.6533203125, -3.42291259765625, -3.1925048828125, -2.96209716796875, -2.731689453125, -2.50128173828125, -2.2708740234375, -2.04046630859375, -1.81005859375, -1.57965087890625, -1.3492431640625, -1.11883544921875, -0.888427734375, -0.65802001953125, -0.4276123046875, -0.19720458984375, 0.033203125, 0.26361083984375, 0.4940185546875, 0.72442626953125, 0.954833984375, 1.18524169921875, 1.4156494140625, 1.64605712890625, 1.87646484375, 2.10687255859375, 2.3372802734375, 2.56768798828125, 2.798095703125, 3.02850341796875, 3.2589111328125, 3.48931884765625, 3.7197265625, 3.95013427734375, 4.1805419921875, 4.41094970703125, 4.641357421875, 4.87176513671875, 5.1021728515625, 5.33258056640625, 5.56298828125, 5.79339599609375, 6.0238037109375, 6.25421142578125, 6.484619140625, 6.71502685546875, 6.9454345703125, 7.17584228515625, 7.40625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 6.0, 10.0, 2.0, 9.0, 11.0, 10.0, 12.0, 12.0, 11.0, 18.0, 17.0, 15.0, 26.0, 25.0, 33.0, 42.0, 44.0, 38.0, 50.0, 50.0, 58.0, 50.0, 41.0, 53.0, 39.0, 50.0, 39.0, 42.0, 33.0, 21.0, 18.0, 13.0, 20.0, 15.0, 18.0, 19.0, 11.0, 4.0, 4.0, 6.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.68359375, -2.607269287109375, -2.53094482421875, -2.454620361328125, -2.3782958984375, -2.301971435546875, -2.22564697265625, -2.149322509765625, -2.072998046875, -1.996673583984375, -1.92034912109375, -1.844024658203125, -1.7677001953125, -1.691375732421875, -1.61505126953125, -1.538726806640625, -1.46240234375, -1.386077880859375, -1.30975341796875, -1.233428955078125, -1.1571044921875, -1.080780029296875, -1.00445556640625, -0.928131103515625, -0.851806640625, -0.775482177734375, -0.69915771484375, -0.622833251953125, -0.5465087890625, -0.470184326171875, -0.39385986328125, -0.317535400390625, -0.2412109375, -0.164886474609375, -0.08856201171875, -0.012237548828125, 0.0640869140625, 0.140411376953125, 0.21673583984375, 0.293060302734375, 0.369384765625, 0.445709228515625, 0.52203369140625, 0.598358154296875, 0.6746826171875, 0.751007080078125, 0.82733154296875, 0.903656005859375, 0.97998046875, 1.056304931640625, 1.13262939453125, 1.208953857421875, 1.2852783203125, 1.361602783203125, 1.43792724609375, 1.514251708984375, 1.590576171875, 1.666900634765625, 1.74322509765625, 1.819549560546875, 1.8958740234375, 1.972198486328125, 2.04852294921875, 2.124847412109375, 2.201171875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 12.0, 9.0, 16.0, 11.0, 9.0, 19.0, 21.0, 23.0, 20.0, 40.0, 28.0, 27.0, 46.0, 47.0, 45.0, 47.0, 50.0, 42.0, 42.0, 47.0, 40.0, 41.0, 40.0, 42.0, 31.0, 31.0, 26.0, 24.0, 16.0, 21.0, 20.0, 9.0, 13.0, 8.0, 10.0, 5.0, 6.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.95775842666626, -7.672265529632568, -7.386772632598877, -7.1012797355651855, -6.815786838531494, -6.530293941497803, -6.2448015213012695, -5.959308624267578, -5.673815727233887, -5.388322830200195, -5.102829933166504, -4.8173370361328125, -4.531844139099121, -4.24635124206543, -3.9608585834503174, -3.675365686416626, -3.3898725509643555, -3.104379653930664, -2.8188867568969727, -2.5333938598632812, -2.24790096282959, -1.962408185005188, -1.6769154071807861, -1.3914225101470947, -1.1059296131134033, -0.8204367160797119, -0.5349438786506653, -0.24945104122161865, 0.036041855812072754, 0.32153475284576416, 0.607027530670166, 0.8925204277038574, 1.178013801574707, 1.4635066986083984, 1.7489995956420898, 2.0344924926757812, 2.3199853897094727, 2.605478286743164, 2.8909709453582764, 3.1764638423919678, 3.461956739425659, 3.7474496364593506, 4.032942295074463, 4.318435192108154, 4.603928089141846, 4.889420986175537, 5.1749138832092285, 5.46040678024292, 5.745899677276611, 6.031392574310303, 6.316885471343994, 6.6023783683776855, 6.887871265411377, 7.173364162445068, 7.458856582641602, 7.744349479675293, 8.029842376708984, 8.315335273742676, 8.600828170776367, 8.886321067810059, 9.17181396484375, 9.457306861877441, 9.742799758911133, 10.028292655944824, 10.313785552978516]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 4.0, 7.0, 4.0, 6.0, 4.0, 11.0, 3.0, 13.0, 12.0, 17.0, 23.0, 22.0, 37.0, 21.0, 26.0, 29.0, 31.0, 38.0, 36.0, 47.0, 36.0, 53.0, 49.0, 45.0, 36.0, 27.0, 32.0, 35.0, 29.0, 33.0, 36.0, 31.0, 28.0, 22.0, 22.0, 16.0, 18.0, 13.0, 12.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.487324714660645, -8.173551559448242, -7.85977840423584, -7.5460052490234375, -7.232231616973877, -6.918458461761475, -6.604685306549072, -6.290911674499512, -5.977138519287109, -5.663365364074707, -5.349592208862305, -5.035819053649902, -4.722045421600342, -4.4082722663879395, -4.094499111175537, -3.7807257175445557, -3.4669528007507324, -3.15317964553833, -2.8394062519073486, -2.5256330966949463, -2.211859703063965, -1.8980865478515625, -1.5843133926391602, -1.2705399990081787, -0.9567668437957764, -0.6429935693740845, -0.32922035455703735, -0.015447139739990234, 0.29832613468170166, 0.6120994091033936, 0.9258725643157959, 1.2396459579467773, 1.5534191131591797, 1.8671923875808716, 2.1809656620025635, 2.494738817214966, 2.8085122108459473, 3.1222853660583496, 3.436058521270752, 3.7498319149017334, 4.063605308532715, 4.377378463745117, 4.6911516189575195, 5.004924774169922, 5.318698406219482, 5.632471561431885, 5.946244716644287, 6.260018348693848, 6.573791027069092, 6.887564182281494, 7.2013373374938965, 7.515110969543457, 7.828884124755859, 8.142657279968262, 8.456430435180664, 8.770203590393066, 9.083976745605469, 9.397749900817871, 9.711523056030273, 10.025296211242676, 10.339069366455078, 10.652843475341797, 10.966615676879883, 11.280389785766602, 11.594162940979004]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 18.0, 21.0, 37.0, 56.0, 72.0, 156.0, 257.0, 442.0, 682.0, 1069.0, 1753.0, 2980.0, 4998.0, 8409.0, 13469.0, 23041.0, 38128.0, 61645.0, 100829.0, 157165.0, 239686.0, 343199.0, 453803.0, 535017.0, 552064.0, 493554.0, 387724.0, 278702.0, 186472.0, 120107.0, 74799.0, 45340.0, 27064.0, 16492.0, 10058.0, 5956.0, 3506.0, 2191.0, 1229.0, 823.0, 493.0, 322.0, 180.0, 103.0, 75.0, 38.0, 23.0, 15.0, 16.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.14453125, -6.92266845703125, -6.7008056640625, -6.47894287109375, -6.257080078125, -6.03521728515625, -5.8133544921875, -5.59149169921875, -5.36962890625, -5.14776611328125, -4.9259033203125, -4.70404052734375, -4.482177734375, -4.26031494140625, -4.0384521484375, -3.81658935546875, -3.5947265625, -3.37286376953125, -3.1510009765625, -2.92913818359375, -2.707275390625, -2.48541259765625, -2.2635498046875, -2.04168701171875, -1.81982421875, -1.59796142578125, -1.3760986328125, -1.15423583984375, -0.932373046875, -0.71051025390625, -0.4886474609375, -0.26678466796875, -0.044921875, 0.17694091796875, 0.3988037109375, 0.62066650390625, 0.842529296875, 1.06439208984375, 1.2862548828125, 1.50811767578125, 1.72998046875, 1.95184326171875, 2.1737060546875, 2.39556884765625, 2.617431640625, 2.83929443359375, 3.0611572265625, 3.28302001953125, 3.5048828125, 3.72674560546875, 3.9486083984375, 4.17047119140625, 4.392333984375, 4.61419677734375, 4.8360595703125, 5.05792236328125, 5.27978515625, 5.50164794921875, 5.7235107421875, 5.94537353515625, 6.167236328125, 6.38909912109375, 6.6109619140625, 6.83282470703125, 7.0546875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 0.0, 0.0, 5.0, 6.0, 4.0, 3.0, 4.0, 9.0, 12.0, 6.0, 13.0, 13.0, 19.0, 23.0, 19.0, 22.0, 31.0, 33.0, 27.0, 30.0, 41.0, 31.0, 34.0, 45.0, 47.0, 39.0, 31.0, 35.0, 39.0, 42.0, 34.0, 38.0, 33.0, 26.0, 25.0, 26.0, 30.0, 20.0, 18.0, 18.0, 19.0, 7.0, 8.0, 6.0, 9.0, 5.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-6.125, -5.914794921875, -5.70458984375, -5.494384765625, -5.2841796875, -5.073974609375, -4.86376953125, -4.653564453125, -4.443359375, -4.233154296875, -4.02294921875, -3.812744140625, -3.6025390625, -3.392333984375, -3.18212890625, -2.971923828125, -2.76171875, -2.551513671875, -2.34130859375, -2.131103515625, -1.9208984375, -1.710693359375, -1.50048828125, -1.290283203125, -1.080078125, -0.869873046875, -0.65966796875, -0.449462890625, -0.2392578125, -0.029052734375, 0.18115234375, 0.391357421875, 0.6015625, 0.811767578125, 1.02197265625, 1.232177734375, 1.4423828125, 1.652587890625, 1.86279296875, 2.072998046875, 2.283203125, 2.493408203125, 2.70361328125, 2.913818359375, 3.1240234375, 3.334228515625, 3.54443359375, 3.754638671875, 3.96484375, 4.175048828125, 4.38525390625, 4.595458984375, 4.8056640625, 5.015869140625, 5.22607421875, 5.436279296875, 5.646484375, 5.856689453125, 6.06689453125, 6.277099609375, 6.4873046875, 6.697509765625, 6.90771484375, 7.117919921875, 7.328125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 5.0, 3.0, 5.0, 9.0, 13.0, 15.0, 28.0, 56.0, 79.0, 103.0, 226.0, 367.0, 629.0, 980.0, 1706.0, 2774.0, 4737.0, 7817.0, 12708.0, 21077.0, 33930.0, 53579.0, 83904.0, 127224.0, 186015.0, 259159.0, 338979.0, 413743.0, 463534.0, 471796.0, 435618.0, 367697.0, 287393.0, 209202.0, 145554.0, 97391.0, 63117.0, 39686.0, 24852.0, 15510.0, 9073.0, 5617.0, 3365.0, 2039.0, 1177.0, 708.0, 415.0, 263.0, 166.0, 111.0, 58.0, 38.0, 22.0, 10.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.875, -5.6802978515625, -5.485595703125, -5.2908935546875, -5.09619140625, -4.9014892578125, -4.706787109375, -4.5120849609375, -4.3173828125, -4.1226806640625, -3.927978515625, -3.7332763671875, -3.53857421875, -3.3438720703125, -3.149169921875, -2.9544677734375, -2.759765625, -2.5650634765625, -2.370361328125, -2.1756591796875, -1.98095703125, -1.7862548828125, -1.591552734375, -1.3968505859375, -1.2021484375, -1.0074462890625, -0.812744140625, -0.6180419921875, -0.42333984375, -0.2286376953125, -0.033935546875, 0.1607666015625, 0.35546875, 0.5501708984375, 0.744873046875, 0.9395751953125, 1.13427734375, 1.3289794921875, 1.523681640625, 1.7183837890625, 1.9130859375, 2.1077880859375, 2.302490234375, 2.4971923828125, 2.69189453125, 2.8865966796875, 3.081298828125, 3.2760009765625, 3.470703125, 3.6654052734375, 3.860107421875, 4.0548095703125, 4.24951171875, 4.4442138671875, 4.638916015625, 4.8336181640625, 5.0283203125, 5.2230224609375, 5.417724609375, 5.6124267578125, 5.80712890625, 6.0018310546875, 6.196533203125, 6.3912353515625, 6.5859375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 8.0, 11.0, 11.0, 22.0, 23.0, 33.0, 33.0, 45.0, 59.0, 64.0, 90.0, 97.0, 105.0, 116.0, 133.0, 161.0, 164.0, 192.0, 217.0, 188.0, 210.0, 221.0, 197.0, 232.0, 207.0, 167.0, 149.0, 166.0, 141.0, 115.0, 78.0, 91.0, 77.0, 51.0, 30.0, 38.0, 36.0, 20.0, 19.0, 14.0, 9.0, 9.0, 13.0, 11.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.3359375, -3.231597900390625, -3.12725830078125, -3.022918701171875, -2.9185791015625, -2.814239501953125, -2.70989990234375, -2.605560302734375, -2.501220703125, -2.396881103515625, -2.29254150390625, -2.188201904296875, -2.0838623046875, -1.979522705078125, -1.87518310546875, -1.770843505859375, -1.66650390625, -1.562164306640625, -1.45782470703125, -1.353485107421875, -1.2491455078125, -1.144805908203125, -1.04046630859375, -0.936126708984375, -0.831787109375, -0.727447509765625, -0.62310791015625, -0.518768310546875, -0.4144287109375, -0.310089111328125, -0.20574951171875, -0.101409912109375, 0.0029296875, 0.107269287109375, 0.21160888671875, 0.315948486328125, 0.4202880859375, 0.524627685546875, 0.62896728515625, 0.733306884765625, 0.837646484375, 0.941986083984375, 1.04632568359375, 1.150665283203125, 1.2550048828125, 1.359344482421875, 1.46368408203125, 1.568023681640625, 1.67236328125, 1.776702880859375, 1.88104248046875, 1.985382080078125, 2.0897216796875, 2.194061279296875, 2.29840087890625, 2.402740478515625, 2.507080078125, 2.611419677734375, 2.71575927734375, 2.820098876953125, 2.9244384765625, 3.028778076171875, 3.13311767578125, 3.237457275390625, 3.341796875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 6.0, 7.0, 13.0, 15.0, 15.0, 20.0, 18.0, 24.0, 23.0, 32.0, 36.0, 43.0, 45.0, 35.0, 44.0, 44.0, 58.0, 45.0, 55.0, 47.0, 38.0, 47.0, 37.0, 37.0, 35.0, 23.0, 22.0, 16.0, 20.0, 26.0, 16.0, 14.0, 11.0, 9.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.941447734832764, -7.678990364074707, -7.41653299331665, -7.154075622558594, -6.891618251800537, -6.6291608810424805, -6.366703033447266, -6.104246139526367, -5.841788291931152, -5.579330921173096, -5.316873550415039, -5.054416179656982, -4.791958808898926, -4.529501438140869, -4.2670440673828125, -4.004586219787598, -3.742129325866699, -3.4796719551086426, -3.217214584350586, -2.9547572135925293, -2.6922998428344727, -2.429842472076416, -2.1673848628997803, -1.9049274921417236, -1.642470121383667, -1.3800127506256104, -1.1175553798675537, -0.8550978899002075, -0.5926405191421509, -0.33018314838409424, -0.06772565841674805, 0.1947317123413086, 0.45718860626220703, 0.7196459770202637, 0.9821034073829651, 1.2445608377456665, 1.5070182085037231, 1.7694755792617798, 2.031933069229126, 2.2943904399871826, 2.5568478107452393, 2.819305181503296, 3.0817625522613525, 3.3442201614379883, 3.606677532196045, 3.8691349029541016, 4.131592273712158, 4.394049644470215, 4.6565070152282715, 4.918964385986328, 5.181421756744385, 5.443879127502441, 5.706336498260498, 5.968793869018555, 6.2312517166137695, 6.493708610534668, 6.756166458129883, 7.0186238288879395, 7.281081199645996, 7.543538570404053, 7.805995941162109, 8.068453788757324, 8.330910682678223, 8.593368530273438, 8.855825424194336]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 7.0, 12.0, 12.0, 12.0, 13.0, 13.0, 12.0, 17.0, 20.0, 31.0, 18.0, 22.0, 38.0, 31.0, 35.0, 21.0, 30.0, 54.0, 41.0, 36.0, 50.0, 43.0, 36.0, 31.0, 46.0, 36.0, 38.0, 29.0, 29.0, 24.0, 27.0, 19.0, 23.0, 19.0, 17.0, 10.0, 8.0, 9.0, 7.0, 5.0, 1.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9827880859375, -6.728200912475586, -6.47361421585083, -6.219027042388916, -5.96444034576416, -5.709853172302246, -5.455265998840332, -5.200678825378418, -4.946092128753662, -4.691504955291748, -4.436918258666992, -4.182331085205078, -3.927744150161743, -3.673157215118408, -3.418570041656494, -3.163983106613159, -2.909396171569824, -2.6548092365264893, -2.4002223014831543, -2.1456351280212402, -1.8910481929779053, -1.6364612579345703, -1.3818742036819458, -1.1272871494293213, -0.8727002143859863, -0.6181132197380066, -0.36352622509002686, -0.10893923044204712, 0.14564776420593262, 0.4002346992492676, 0.6548217535018921, 0.9094088077545166, 1.1639947891235352, 1.4185817241668701, 1.6731687784194946, 1.9277558326721191, 2.182342767715454, 2.436929702758789, 2.691516876220703, 2.946103811264038, 3.200690746307373, 3.455277681350708, 3.709864616394043, 3.964451789855957, 4.219038963317871, 4.473625659942627, 4.728212833404541, 4.982799530029297, 5.237386703491211, 5.491973876953125, 5.746560573577881, 6.001147747039795, 6.255734443664551, 6.510321617126465, 6.764908790588379, 7.019495964050293, 7.274082660675049, 7.528669834136963, 7.783256530761719, 8.037843704223633, 8.292430877685547, 8.547018051147461, 8.801604270935059, 9.056191444396973, 9.310778617858887]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 3.0, 6.0, 10.0, 12.0, 21.0, 45.0, 67.0, 77.0, 119.0, 171.0, 244.0, 378.0, 598.0, 927.0, 1522.0, 2431.0, 4330.0, 7148.0, 12947.0, 22910.0, 42222.0, 77621.0, 138308.0, 210174.0, 210523.0, 139726.0, 78831.0, 42568.0, 23396.0, 12838.0, 7375.0, 4251.0, 2612.0, 1483.0, 888.0, 618.0, 384.0, 241.0, 183.0, 112.0, 70.0, 42.0, 27.0, 31.0, 16.0, 17.0, 12.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 2.0], "bins": [-5.55078125, -5.3875732421875, -5.224365234375, -5.0611572265625, -4.89794921875, -4.7347412109375, -4.571533203125, -4.4083251953125, -4.2451171875, -4.0819091796875, -3.918701171875, -3.7554931640625, -3.59228515625, -3.4290771484375, -3.265869140625, -3.1026611328125, -2.939453125, -2.7762451171875, -2.613037109375, -2.4498291015625, -2.28662109375, -2.1234130859375, -1.960205078125, -1.7969970703125, -1.6337890625, -1.4705810546875, -1.307373046875, -1.1441650390625, -0.98095703125, -0.8177490234375, -0.654541015625, -0.4913330078125, -0.328125, -0.1649169921875, -0.001708984375, 0.1614990234375, 0.32470703125, 0.4879150390625, 0.651123046875, 0.8143310546875, 0.9775390625, 1.1407470703125, 1.303955078125, 1.4671630859375, 1.63037109375, 1.7935791015625, 1.956787109375, 2.1199951171875, 2.283203125, 2.4464111328125, 2.609619140625, 2.7728271484375, 2.93603515625, 3.0992431640625, 3.262451171875, 3.4256591796875, 3.5888671875, 3.7520751953125, 3.915283203125, 4.0784912109375, 4.24169921875, 4.4049072265625, 4.568115234375, 4.7313232421875, 4.89453125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 9.0, 12.0, 15.0, 14.0, 22.0, 9.0, 14.0, 20.0, 24.0, 31.0, 22.0, 35.0, 35.0, 42.0, 34.0, 56.0, 42.0, 31.0, 37.0, 48.0, 40.0, 50.0, 49.0, 26.0, 33.0, 35.0, 25.0, 29.0, 20.0, 20.0, 19.0, 18.0, 20.0, 11.0, 10.0, 6.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.3433837890625, -6.069580078125, -5.7957763671875, -5.52197265625, -5.2481689453125, -4.974365234375, -4.7005615234375, -4.4267578125, -4.1529541015625, -3.879150390625, -3.6053466796875, -3.33154296875, -3.0577392578125, -2.783935546875, -2.5101318359375, -2.236328125, -1.9625244140625, -1.688720703125, -1.4149169921875, -1.14111328125, -0.8673095703125, -0.593505859375, -0.3197021484375, -0.0458984375, 0.2279052734375, 0.501708984375, 0.7755126953125, 1.04931640625, 1.3231201171875, 1.596923828125, 1.8707275390625, 2.14453125, 2.4183349609375, 2.692138671875, 2.9659423828125, 3.23974609375, 3.5135498046875, 3.787353515625, 4.0611572265625, 4.3349609375, 4.6087646484375, 4.882568359375, 5.1563720703125, 5.43017578125, 5.7039794921875, 5.977783203125, 6.2515869140625, 6.525390625, 6.7991943359375, 7.072998046875, 7.3468017578125, 7.62060546875, 7.8944091796875, 8.168212890625, 8.4420166015625, 8.7158203125, 8.9896240234375, 9.263427734375, 9.5372314453125, 9.81103515625, 10.0848388671875, 10.358642578125, 10.6324462890625, 10.90625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 11.0, 6.0, 15.0, 28.0, 41.0, 63.0, 102.0, 156.0, 221.0, 399.0, 658.0, 1169.0, 2010.0, 3671.0, 7133.0, 14503.0, 31347.0, 74337.0, 183183.0, 346571.0, 220725.0, 89680.0, 37784.0, 16953.0, 8155.0, 4245.0, 2229.0, 1232.0, 767.0, 436.0, 257.0, 180.0, 111.0, 67.0, 33.0, 33.0, 17.0, 21.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91796875, -5.71807861328125, -5.5181884765625, -5.31829833984375, -5.118408203125, -4.91851806640625, -4.7186279296875, -4.51873779296875, -4.31884765625, -4.11895751953125, -3.9190673828125, -3.71917724609375, -3.519287109375, -3.31939697265625, -3.1195068359375, -2.91961669921875, -2.7197265625, -2.51983642578125, -2.3199462890625, -2.12005615234375, -1.920166015625, -1.72027587890625, -1.5203857421875, -1.32049560546875, -1.12060546875, -0.92071533203125, -0.7208251953125, -0.52093505859375, -0.321044921875, -0.12115478515625, 0.0787353515625, 0.27862548828125, 0.478515625, 0.67840576171875, 0.8782958984375, 1.07818603515625, 1.278076171875, 1.47796630859375, 1.6778564453125, 1.87774658203125, 2.07763671875, 2.27752685546875, 2.4774169921875, 2.67730712890625, 2.877197265625, 3.07708740234375, 3.2769775390625, 3.47686767578125, 3.6767578125, 3.87664794921875, 4.0765380859375, 4.27642822265625, 4.476318359375, 4.67620849609375, 4.8760986328125, 5.07598876953125, 5.27587890625, 5.47576904296875, 5.6756591796875, 5.87554931640625, 6.075439453125, 6.27532958984375, 6.4752197265625, 6.67510986328125, 6.875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 3.0, 2.0, 6.0, 15.0, 11.0, 10.0, 18.0, 13.0, 15.0, 12.0, 17.0, 32.0, 26.0, 36.0, 29.0, 32.0, 35.0, 48.0, 48.0, 36.0, 41.0, 29.0, 45.0, 40.0, 38.0, 41.0, 30.0, 32.0, 31.0, 36.0, 28.0, 30.0, 18.0, 19.0, 16.0, 18.0, 11.0, 6.0, 8.0, 8.0, 12.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.31500244140625, -5.1221923828125, -4.92938232421875, -4.736572265625, -4.54376220703125, -4.3509521484375, -4.15814208984375, -3.96533203125, -3.77252197265625, -3.5797119140625, -3.38690185546875, -3.194091796875, -3.00128173828125, -2.8084716796875, -2.61566162109375, -2.4228515625, -2.23004150390625, -2.0372314453125, -1.84442138671875, -1.651611328125, -1.45880126953125, -1.2659912109375, -1.07318115234375, -0.88037109375, -0.68756103515625, -0.4947509765625, -0.30194091796875, -0.109130859375, 0.08367919921875, 0.2764892578125, 0.46929931640625, 0.662109375, 0.85491943359375, 1.0477294921875, 1.24053955078125, 1.433349609375, 1.62615966796875, 1.8189697265625, 2.01177978515625, 2.20458984375, 2.39739990234375, 2.5902099609375, 2.78302001953125, 2.975830078125, 3.16864013671875, 3.3614501953125, 3.55426025390625, 3.7470703125, 3.93988037109375, 4.1326904296875, 4.32550048828125, 4.518310546875, 4.71112060546875, 4.9039306640625, 5.09674072265625, 5.28955078125, 5.48236083984375, 5.6751708984375, 5.86798095703125, 6.060791015625, 6.25360107421875, 6.4464111328125, 6.63922119140625, 6.83203125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 9.0, 4.0, 3.0, 7.0, 17.0, 15.0, 22.0, 31.0, 37.0, 58.0, 78.0, 129.0, 172.0, 252.0, 337.0, 468.0, 737.0, 1143.0, 1678.0, 2769.0, 4610.0, 7883.0, 15336.0, 34486.0, 112671.0, 462943.0, 284121.0, 66118.0, 24173.0, 11473.0, 6338.0, 3690.0, 2275.0, 1429.0, 967.0, 573.0, 434.0, 320.0, 209.0, 146.0, 105.0, 96.0, 53.0, 38.0, 34.0, 23.0, 13.0, 13.0, 7.0, 9.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.806640625, -2.71246337890625, -2.6182861328125, -2.52410888671875, -2.429931640625, -2.33575439453125, -2.2415771484375, -2.14739990234375, -2.05322265625, -1.95904541015625, -1.8648681640625, -1.77069091796875, -1.676513671875, -1.58233642578125, -1.4881591796875, -1.39398193359375, -1.2998046875, -1.20562744140625, -1.1114501953125, -1.01727294921875, -0.923095703125, -0.82891845703125, -0.7347412109375, -0.64056396484375, -0.54638671875, -0.45220947265625, -0.3580322265625, -0.26385498046875, -0.169677734375, -0.07550048828125, 0.0186767578125, 0.11285400390625, 0.20703125, 0.30120849609375, 0.3953857421875, 0.48956298828125, 0.583740234375, 0.67791748046875, 0.7720947265625, 0.86627197265625, 0.96044921875, 1.05462646484375, 1.1488037109375, 1.24298095703125, 1.337158203125, 1.43133544921875, 1.5255126953125, 1.61968994140625, 1.7138671875, 1.80804443359375, 1.9022216796875, 1.99639892578125, 2.090576171875, 2.18475341796875, 2.2789306640625, 2.37310791015625, 2.46728515625, 2.56146240234375, 2.6556396484375, 2.74981689453125, 2.843994140625, 2.93817138671875, 3.0323486328125, 3.12652587890625, 3.220703125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 7.0, 12.0, 13.0, 17.0, 26.0, 41.0, 69.0, 78.0, 110.0, 133.0, 125.0, 103.0, 57.0, 48.0, 29.0, 20.0, 22.0, 14.0, 18.0, 8.0, 4.0, 9.0, 4.0, 8.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003237724304199219, -0.00031254813075065613, -0.0003013238310813904, -0.00029009953141212463, -0.0002788752317428589, -0.00026765093207359314, -0.0002564266324043274, -0.00024520233273506165, -0.0002339780330657959, -0.00022275373339653015, -0.0002115294337272644, -0.00020030513405799866, -0.0001890808343887329, -0.00017785653471946716, -0.00016663223505020142, -0.00015540793538093567, -0.00014418363571166992, -0.00013295933604240417, -0.00012173503637313843, -0.00011051073670387268, -9.928643703460693e-05, -8.806213736534119e-05, -7.683783769607544e-05, -6.561353802680969e-05, -5.4389238357543945e-05, -4.31649386882782e-05, -3.194063901901245e-05, -2.0716339349746704e-05, -9.492039680480957e-06, 1.73225998878479e-06, 1.2956559658050537e-05, 2.4180859327316284e-05, 3.540515899658203e-05, 4.662945866584778e-05, 5.7853758335113525e-05, 6.907805800437927e-05, 8.030235767364502e-05, 9.152665734291077e-05, 0.00010275095701217651, 0.00011397525668144226, 0.000125199556350708, 0.00013642385601997375, 0.0001476481556892395, 0.00015887245535850525, 0.000170096755027771, 0.00018132105469703674, 0.0001925453543663025, 0.00020376965403556824, 0.00021499395370483398, 0.00022621825337409973, 0.00023744255304336548, 0.0002486668527126312, 0.00025989115238189697, 0.0002711154520511627, 0.00028233975172042847, 0.0002935640513896942, 0.00030478835105895996, 0.0003160126507282257, 0.00032723695039749146, 0.0003384612500667572, 0.00034968554973602295, 0.0003609098494052887, 0.00037213414907455444, 0.0003833584487438202, 0.00039458274841308594]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 13.0, 18.0, 22.0, 37.0, 38.0, 61.0, 69.0, 93.0, 124.0, 175.0, 248.0, 310.0, 415.0, 658.0, 897.0, 1411.0, 2079.0, 3192.0, 5133.0, 8916.0, 17284.0, 36545.0, 80115.0, 174188.0, 293419.0, 220492.0, 104820.0, 47331.0, 22047.0, 11211.0, 6104.0, 3568.0, 2345.0, 1471.0, 1001.0, 745.0, 523.0, 383.0, 294.0, 198.0, 136.0, 96.0, 97.0, 60.0, 40.0, 39.0, 20.0, 22.0, 17.0, 8.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.515625, -2.436187744140625, -2.35675048828125, -2.277313232421875, -2.1978759765625, -2.118438720703125, -2.03900146484375, -1.959564208984375, -1.880126953125, -1.800689697265625, -1.72125244140625, -1.641815185546875, -1.5623779296875, -1.482940673828125, -1.40350341796875, -1.324066162109375, -1.24462890625, -1.165191650390625, -1.08575439453125, -1.006317138671875, -0.9268798828125, -0.847442626953125, -0.76800537109375, -0.688568115234375, -0.609130859375, -0.529693603515625, -0.45025634765625, -0.370819091796875, -0.2913818359375, -0.211944580078125, -0.13250732421875, -0.053070068359375, 0.0263671875, 0.105804443359375, 0.18524169921875, 0.264678955078125, 0.3441162109375, 0.423553466796875, 0.50299072265625, 0.582427978515625, 0.661865234375, 0.741302490234375, 0.82073974609375, 0.900177001953125, 0.9796142578125, 1.059051513671875, 1.13848876953125, 1.217926025390625, 1.29736328125, 1.376800537109375, 1.45623779296875, 1.535675048828125, 1.6151123046875, 1.694549560546875, 1.77398681640625, 1.853424072265625, 1.932861328125, 2.012298583984375, 2.09173583984375, 2.171173095703125, 2.2506103515625, 2.330047607421875, 2.40948486328125, 2.488922119140625, 2.568359375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 5.0, 2.0, 3.0, 5.0, 6.0, 13.0, 9.0, 18.0, 31.0, 48.0, 57.0, 80.0, 97.0, 100.0, 109.0, 103.0, 84.0, 62.0, 51.0, 27.0, 34.0, 18.0, 9.0, 3.0, 2.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.5068359375, -1.4614105224609375, -1.415985107421875, -1.3705596923828125, -1.32513427734375, -1.2797088623046875, -1.234283447265625, -1.1888580322265625, -1.1434326171875, -1.0980072021484375, -1.052581787109375, -1.0071563720703125, -0.96173095703125, -0.9163055419921875, -0.870880126953125, -0.8254547119140625, -0.780029296875, -0.7346038818359375, -0.689178466796875, -0.6437530517578125, -0.59832763671875, -0.5529022216796875, -0.507476806640625, -0.4620513916015625, -0.4166259765625, -0.3712005615234375, -0.325775146484375, -0.2803497314453125, -0.23492431640625, -0.1894989013671875, -0.144073486328125, -0.0986480712890625, -0.05322265625, -0.0077972412109375, 0.037628173828125, 0.0830535888671875, 0.12847900390625, 0.1739044189453125, 0.219329833984375, 0.2647552490234375, 0.3101806640625, 0.3556060791015625, 0.401031494140625, 0.4464569091796875, 0.49188232421875, 0.5373077392578125, 0.582733154296875, 0.6281585693359375, 0.673583984375, 0.7190093994140625, 0.764434814453125, 0.8098602294921875, 0.85528564453125, 0.9007110595703125, 0.946136474609375, 0.9915618896484375, 1.0369873046875, 1.0824127197265625, 1.127838134765625, 1.1732635498046875, 1.21868896484375, 1.2641143798828125, 1.309539794921875, 1.3549652099609375, 1.400390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 6.0, 7.0, 6.0, 7.0, 8.0, 12.0, 16.0, 18.0, 21.0, 20.0, 23.0, 33.0, 31.0, 34.0, 39.0, 37.0, 47.0, 52.0, 41.0, 55.0, 46.0, 48.0, 41.0, 43.0, 40.0, 34.0, 38.0, 24.0, 32.0, 21.0, 18.0, 15.0, 23.0, 20.0, 8.0, 13.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.071625709533691, -7.82106876373291, -7.570511817932129, -7.319954872131348, -7.069397926330566, -6.818840980529785, -6.568284511566162, -6.317727565765381, -6.0671706199646, -5.816613674163818, -5.566056728363037, -5.315499782562256, -5.064943313598633, -4.814386367797852, -4.56382942199707, -4.313272476196289, -4.062715530395508, -3.8121585845947266, -3.5616016387939453, -3.311044931411743, -3.060487985610962, -2.8099310398101807, -2.5593743324279785, -2.3088173866271973, -2.058260440826416, -1.8077034950256348, -1.557146668434143, -1.3065898418426514, -1.0560328960418701, -0.8054759502410889, -0.5549191236495972, -0.30436229705810547, -0.053804874420166016, 0.19675201177597046, 0.44730889797210693, 0.6978657841682434, 0.9484226703643799, 1.1989796161651611, 1.4495364427566528, 1.7000932693481445, 1.9506502151489258, 2.201207160949707, 2.4517641067504883, 2.7023208141326904, 2.9528777599334717, 3.203434705734253, 3.453991413116455, 3.7045483589172363, 3.9551053047180176, 4.205662250518799, 4.45621919631958, 4.706776142120361, 4.957332611083984, 5.207889556884766, 5.458446502685547, 5.709003448486328, 5.959560394287109, 6.210117340087891, 6.460674285888672, 6.711231231689453, 6.961788177490234, 7.212345123291016, 7.462901592254639, 7.71345853805542, 7.964015483856201]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 9.0, 8.0, 16.0, 14.0, 16.0, 10.0, 12.0, 21.0, 24.0, 19.0, 28.0, 31.0, 40.0, 26.0, 32.0, 19.0, 41.0, 46.0, 41.0, 43.0, 50.0, 36.0, 39.0, 32.0, 46.0, 34.0, 28.0, 33.0, 34.0, 23.0, 20.0, 17.0, 26.0, 17.0, 9.0, 6.0, 11.0, 8.0, 6.0, 5.0, 1.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.755190849304199, -6.502392292022705, -6.249593734741211, -5.996794700622559, -5.7439961433410645, -5.49119758605957, -5.238398551940918, -4.985599994659424, -4.73280143737793, -4.4800028800964355, -4.227204322814941, -3.974405288696289, -3.721606731414795, -3.468808174133301, -3.2160093784332275, -2.9632105827331543, -2.71041202545166, -2.457613468170166, -2.2048146724700928, -1.952015995979309, -1.6992173194885254, -1.4464186429977417, -1.193619966506958, -0.9408212900161743, -0.6880226135253906, -0.43522393703460693, -0.18242526054382324, 0.07037341594696045, 0.32317209243774414, 0.5759707689285278, 0.8287694454193115, 1.0815681219100952, 1.3343658447265625, 1.5871645212173462, 1.8399631977081299, 2.092761993408203, 2.3455605506896973, 2.5983591079711914, 2.8511579036712646, 3.103956699371338, 3.356755256652832, 3.609553813934326, 3.8623526096343994, 4.115151405334473, 4.367949962615967, 4.620748519897461, 4.873547554016113, 5.126346111297607, 5.379144668579102, 5.631943225860596, 5.88474178314209, 6.137540817260742, 6.390339374542236, 6.6431379318237305, 6.895936965942383, 7.148735523223877, 7.401534080505371, 7.654332637786865, 7.907131195068359, 8.159930229187012, 8.412729263305664, 8.66552734375, 8.918326377868652, 9.171124458312988, 9.42392349243164]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 11.0, 17.0, 23.0, 45.0, 89.0, 110.0, 213.0, 367.0, 600.0, 1051.0, 1736.0, 2973.0, 5025.0, 8724.0, 14738.0, 23977.0, 38701.0, 60266.0, 87980.0, 116988.0, 138069.0, 141657.0, 125495.0, 97117.0, 68233.0, 44850.0, 27876.0, 16824.0, 10285.0, 6048.0, 3524.0, 1967.0, 1233.0, 685.0, 418.0, 246.0, 147.0, 80.0, 59.0, 35.0, 26.0, 22.0, 8.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.40625, -8.107666015625, -7.80908203125, -7.510498046875, -7.2119140625, -6.913330078125, -6.61474609375, -6.316162109375, -6.017578125, -5.718994140625, -5.42041015625, -5.121826171875, -4.8232421875, -4.524658203125, -4.22607421875, -3.927490234375, -3.62890625, -3.330322265625, -3.03173828125, -2.733154296875, -2.4345703125, -2.135986328125, -1.83740234375, -1.538818359375, -1.240234375, -0.941650390625, -0.64306640625, -0.344482421875, -0.0458984375, 0.252685546875, 0.55126953125, 0.849853515625, 1.1484375, 1.447021484375, 1.74560546875, 2.044189453125, 2.3427734375, 2.641357421875, 2.93994140625, 3.238525390625, 3.537109375, 3.835693359375, 4.13427734375, 4.432861328125, 4.7314453125, 5.030029296875, 5.32861328125, 5.627197265625, 5.92578125, 6.224365234375, 6.52294921875, 6.821533203125, 7.1201171875, 7.418701171875, 7.71728515625, 8.015869140625, 8.314453125, 8.613037109375, 8.91162109375, 9.210205078125, 9.5087890625, 9.807373046875, 10.10595703125, 10.404541015625, 10.703125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 12.0, 12.0, 15.0, 14.0, 19.0, 15.0, 24.0, 31.0, 30.0, 30.0, 26.0, 32.0, 42.0, 41.0, 34.0, 43.0, 51.0, 56.0, 42.0, 35.0, 51.0, 30.0, 32.0, 36.0, 36.0, 31.0, 27.0, 22.0, 22.0, 18.0, 13.0, 7.0, 13.0, 10.0, 4.0, 5.0, 3.0, 6.0, 6.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.28515625, -7.02728271484375, -6.7694091796875, -6.51153564453125, -6.253662109375, -5.99578857421875, -5.7379150390625, -5.48004150390625, -5.22216796875, -4.96429443359375, -4.7064208984375, -4.44854736328125, -4.190673828125, -3.93280029296875, -3.6749267578125, -3.41705322265625, -3.1591796875, -2.90130615234375, -2.6434326171875, -2.38555908203125, -2.127685546875, -1.86981201171875, -1.6119384765625, -1.35406494140625, -1.09619140625, -0.83831787109375, -0.5804443359375, -0.32257080078125, -0.064697265625, 0.19317626953125, 0.4510498046875, 0.70892333984375, 0.966796875, 1.22467041015625, 1.4825439453125, 1.74041748046875, 1.998291015625, 2.25616455078125, 2.5140380859375, 2.77191162109375, 3.02978515625, 3.28765869140625, 3.5455322265625, 3.80340576171875, 4.061279296875, 4.31915283203125, 4.5770263671875, 4.83489990234375, 5.0927734375, 5.35064697265625, 5.6085205078125, 5.86639404296875, 6.124267578125, 6.38214111328125, 6.6400146484375, 6.89788818359375, 7.15576171875, 7.41363525390625, 7.6715087890625, 7.92938232421875, 8.187255859375, 8.44512939453125, 8.7030029296875, 8.96087646484375, 9.21875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 15.0, 18.0, 27.0, 49.0, 77.0, 96.0, 154.0, 251.0, 330.0, 476.0, 798.0, 1154.0, 1710.0, 2608.0, 3852.0, 5778.0, 8269.0, 12216.0, 17765.0, 25193.0, 35375.0, 47567.0, 62315.0, 77712.0, 91441.0, 99662.0, 102235.0, 96736.0, 85382.0, 70974.0, 56182.0, 42089.0, 31235.0, 21725.0, 15234.0, 10450.0, 6947.0, 4637.0, 3225.0, 2173.0, 1469.0, 973.0, 632.0, 463.0, 307.0, 217.0, 119.0, 87.0, 70.0, 32.0, 18.0, 14.0, 9.0, 4.0, 6.0, 3.0, 3.0], "bins": [-6.71875, -6.51690673828125, -6.3150634765625, -6.11322021484375, -5.911376953125, -5.70953369140625, -5.5076904296875, -5.30584716796875, -5.10400390625, -4.90216064453125, -4.7003173828125, -4.49847412109375, -4.296630859375, -4.09478759765625, -3.8929443359375, -3.69110107421875, -3.4892578125, -3.28741455078125, -3.0855712890625, -2.88372802734375, -2.681884765625, -2.48004150390625, -2.2781982421875, -2.07635498046875, -1.87451171875, -1.67266845703125, -1.4708251953125, -1.26898193359375, -1.067138671875, -0.86529541015625, -0.6634521484375, -0.46160888671875, -0.259765625, -0.05792236328125, 0.1439208984375, 0.34576416015625, 0.547607421875, 0.74945068359375, 0.9512939453125, 1.15313720703125, 1.35498046875, 1.55682373046875, 1.7586669921875, 1.96051025390625, 2.162353515625, 2.36419677734375, 2.5660400390625, 2.76788330078125, 2.9697265625, 3.17156982421875, 3.3734130859375, 3.57525634765625, 3.777099609375, 3.97894287109375, 4.1807861328125, 4.38262939453125, 4.58447265625, 4.78631591796875, 4.9881591796875, 5.19000244140625, 5.391845703125, 5.59368896484375, 5.7955322265625, 5.99737548828125, 6.19921875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 7.0, 7.0, 6.0, 5.0, 16.0, 18.0, 21.0, 22.0, 18.0, 27.0, 25.0, 25.0, 24.0, 37.0, 52.0, 34.0, 31.0, 46.0, 35.0, 39.0, 41.0, 39.0, 24.0, 25.0, 44.0, 36.0, 30.0, 23.0, 26.0, 25.0, 20.0, 15.0, 23.0, 13.0, 21.0, 21.0, 16.0, 5.0, 9.0, 9.0, 6.0, 7.0, 3.0, 3.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.54296875, -4.39447021484375, -4.2459716796875, -4.09747314453125, -3.948974609375, -3.80047607421875, -3.6519775390625, -3.50347900390625, -3.35498046875, -3.20648193359375, -3.0579833984375, -2.90948486328125, -2.760986328125, -2.61248779296875, -2.4639892578125, -2.31549072265625, -2.1669921875, -2.01849365234375, -1.8699951171875, -1.72149658203125, -1.572998046875, -1.42449951171875, -1.2760009765625, -1.12750244140625, -0.97900390625, -0.83050537109375, -0.6820068359375, -0.53350830078125, -0.385009765625, -0.23651123046875, -0.0880126953125, 0.06048583984375, 0.208984375, 0.35748291015625, 0.5059814453125, 0.65447998046875, 0.802978515625, 0.95147705078125, 1.0999755859375, 1.24847412109375, 1.39697265625, 1.54547119140625, 1.6939697265625, 1.84246826171875, 1.990966796875, 2.13946533203125, 2.2879638671875, 2.43646240234375, 2.5849609375, 2.73345947265625, 2.8819580078125, 3.03045654296875, 3.178955078125, 3.32745361328125, 3.4759521484375, 3.62445068359375, 3.77294921875, 3.92144775390625, 4.0699462890625, 4.21844482421875, 4.366943359375, 4.51544189453125, 4.6639404296875, 4.81243896484375, 4.9609375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 12.0, 11.0, 18.0, 21.0, 33.0, 44.0, 79.0, 83.0, 149.0, 235.0, 311.0, 411.0, 557.0, 829.0, 1233.0, 1801.0, 2893.0, 5055.0, 9258.0, 18845.0, 42101.0, 97659.0, 204579.0, 278957.0, 203078.0, 97064.0, 41670.0, 18663.0, 9183.0, 5007.0, 2939.0, 1733.0, 1229.0, 800.0, 583.0, 429.0, 289.0, 220.0, 135.0, 102.0, 91.0, 53.0, 33.0, 31.0, 15.0, 12.0, 8.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-9.71875, -9.4285888671875, -9.138427734375, -8.8482666015625, -8.55810546875, -8.2679443359375, -7.977783203125, -7.6876220703125, -7.3974609375, -7.1072998046875, -6.817138671875, -6.5269775390625, -6.23681640625, -5.9466552734375, -5.656494140625, -5.3663330078125, -5.076171875, -4.7860107421875, -4.495849609375, -4.2056884765625, -3.91552734375, -3.6253662109375, -3.335205078125, -3.0450439453125, -2.7548828125, -2.4647216796875, -2.174560546875, -1.8843994140625, -1.59423828125, -1.3040771484375, -1.013916015625, -0.7237548828125, -0.43359375, -0.1434326171875, 0.146728515625, 0.4368896484375, 0.72705078125, 1.0172119140625, 1.307373046875, 1.5975341796875, 1.8876953125, 2.1778564453125, 2.468017578125, 2.7581787109375, 3.04833984375, 3.3385009765625, 3.628662109375, 3.9188232421875, 4.208984375, 4.4991455078125, 4.789306640625, 5.0794677734375, 5.36962890625, 5.6597900390625, 5.949951171875, 6.2401123046875, 6.5302734375, 6.8204345703125, 7.110595703125, 7.4007568359375, 7.69091796875, 7.9810791015625, 8.271240234375, 8.5614013671875, 8.8515625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 9.0, 7.0, 4.0, 14.0, 31.0, 35.0, 55.0, 91.0, 109.0, 145.0, 135.0, 98.0, 83.0, 67.0, 42.0, 23.0, 16.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015497207641601562, -0.0015099048614501953, -0.0014700889587402344, -0.0014302730560302734, -0.0013904571533203125, -0.0013506412506103516, -0.0013108253479003906, -0.0012710094451904297, -0.0012311935424804688, -0.0011913776397705078, -0.0011515617370605469, -0.001111745834350586, -0.001071929931640625, -0.001032114028930664, -0.0009922981262207031, -0.0009524822235107422, -0.0009126663208007812, -0.0008728504180908203, -0.0008330345153808594, -0.0007932186126708984, -0.0007534027099609375, -0.0007135868072509766, -0.0006737709045410156, -0.0006339550018310547, -0.0005941390991210938, -0.0005543231964111328, -0.0005145072937011719, -0.00047469139099121094, -0.00043487548828125, -0.00039505958557128906, -0.0003552436828613281, -0.0003154277801513672, -0.00027561187744140625, -0.0002357959747314453, -0.00019598007202148438, -0.00015616416931152344, -0.0001163482666015625, -7.653236389160156e-05, -3.6716461181640625e-05, 3.0994415283203125e-06, 4.291534423828125e-05, 8.273124694824219e-05, 0.00012254714965820312, 0.00016236305236816406, 0.000202178955078125, 0.00024199485778808594, 0.0002818107604980469, 0.0003216266632080078, 0.00036144256591796875, 0.0004012584686279297, 0.0004410743713378906, 0.00048089027404785156, 0.0005207061767578125, 0.0005605220794677734, 0.0006003379821777344, 0.0006401538848876953, 0.0006799697875976562, 0.0007197856903076172, 0.0007596015930175781, 0.0007994174957275391, 0.0008392333984375, 0.0008790493011474609, 0.0009188652038574219, 0.0009586811065673828, 0.0009984970092773438]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 6.0, 11.0, 10.0, 21.0, 23.0, 29.0, 56.0, 72.0, 137.0, 199.0, 275.0, 532.0, 788.0, 1313.0, 2308.0, 4029.0, 7374.0, 13386.0, 25029.0, 46471.0, 83079.0, 136043.0, 184393.0, 190830.0, 146600.0, 91977.0, 51617.0, 27861.0, 15063.0, 8216.0, 4349.0, 2586.0, 1438.0, 904.0, 551.0, 312.0, 216.0, 154.0, 91.0, 71.0, 43.0, 24.0, 18.0, 21.0, 16.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.54296875, -5.3587646484375, -5.174560546875, -4.9903564453125, -4.80615234375, -4.6219482421875, -4.437744140625, -4.2535400390625, -4.0693359375, -3.8851318359375, -3.700927734375, -3.5167236328125, -3.33251953125, -3.1483154296875, -2.964111328125, -2.7799072265625, -2.595703125, -2.4114990234375, -2.227294921875, -2.0430908203125, -1.85888671875, -1.6746826171875, -1.490478515625, -1.3062744140625, -1.1220703125, -0.9378662109375, -0.753662109375, -0.5694580078125, -0.38525390625, -0.2010498046875, -0.016845703125, 0.1673583984375, 0.3515625, 0.5357666015625, 0.719970703125, 0.9041748046875, 1.08837890625, 1.2725830078125, 1.456787109375, 1.6409912109375, 1.8251953125, 2.0093994140625, 2.193603515625, 2.3778076171875, 2.56201171875, 2.7462158203125, 2.930419921875, 3.1146240234375, 3.298828125, 3.4830322265625, 3.667236328125, 3.8514404296875, 4.03564453125, 4.2198486328125, 4.404052734375, 4.5882568359375, 4.7724609375, 4.9566650390625, 5.140869140625, 5.3250732421875, 5.50927734375, 5.6934814453125, 5.877685546875, 6.0618896484375, 6.24609375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 4.0, 13.0, 18.0, 12.0, 25.0, 27.0, 43.0, 39.0, 61.0, 54.0, 69.0, 91.0, 76.0, 67.0, 83.0, 62.0, 55.0, 34.0, 44.0, 27.0, 25.0, 10.0, 19.0, 10.0, 5.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.896484375, -2.812164306640625, -2.72784423828125, -2.643524169921875, -2.5592041015625, -2.474884033203125, -2.39056396484375, -2.306243896484375, -2.221923828125, -2.137603759765625, -2.05328369140625, -1.968963623046875, -1.8846435546875, -1.800323486328125, -1.71600341796875, -1.631683349609375, -1.54736328125, -1.463043212890625, -1.37872314453125, -1.294403076171875, -1.2100830078125, -1.125762939453125, -1.04144287109375, -0.957122802734375, -0.872802734375, -0.788482666015625, -0.70416259765625, -0.619842529296875, -0.5355224609375, -0.451202392578125, -0.36688232421875, -0.282562255859375, -0.1982421875, -0.113922119140625, -0.02960205078125, 0.054718017578125, 0.1390380859375, 0.223358154296875, 0.30767822265625, 0.391998291015625, 0.476318359375, 0.560638427734375, 0.64495849609375, 0.729278564453125, 0.8135986328125, 0.897918701171875, 0.98223876953125, 1.066558837890625, 1.15087890625, 1.235198974609375, 1.31951904296875, 1.403839111328125, 1.4881591796875, 1.572479248046875, 1.65679931640625, 1.741119384765625, 1.825439453125, 1.909759521484375, 1.99407958984375, 2.078399658203125, 2.1627197265625, 2.247039794921875, 2.33135986328125, 2.415679931640625, 2.5]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 9.0, 7.0, 8.0, 10.0, 8.0, 11.0, 21.0, 19.0, 23.0, 28.0, 23.0, 27.0, 45.0, 23.0, 40.0, 39.0, 45.0, 35.0, 48.0, 47.0, 48.0, 43.0, 45.0, 46.0, 27.0, 32.0, 34.0, 34.0, 27.0, 23.0, 34.0, 18.0, 17.0, 8.0, 10.0, 6.0, 7.0, 4.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.42365837097168, -8.180757522583008, -7.937856197357178, -7.694955348968506, -7.452054023742676, -7.209153175354004, -6.966252326965332, -6.72335147857666, -6.48045015335083, -6.237549304962158, -5.994647979736328, -5.751747131347656, -5.508846282958984, -5.265944957733154, -5.023044109344482, -4.780142784118652, -4.5372419357299805, -4.294341087341309, -4.0514397621154785, -3.8085389137268066, -3.5656378269195557, -3.3227367401123047, -3.079835891723633, -2.836934804916382, -2.594033718109131, -2.35113263130188, -2.108231544494629, -1.865330696105957, -1.622429609298706, -1.379528522491455, -1.1366275548934937, -0.8937265872955322, -0.650825023651123, -0.40792399644851685, -0.16502296924591064, 0.07787805795669556, 0.32077908515930176, 0.5636801719665527, 0.8065811395645142, 1.0494821071624756, 1.2923831939697266, 1.5352842807769775, 1.778185248374939, 2.0210862159729004, 2.2639873027801514, 2.5068883895874023, 2.749789237976074, 2.992690324783325, 3.235591411590576, 3.478492498397827, 3.721393585205078, 3.96429443359375, 4.207195281982422, 4.450096607208252, 4.692997455596924, 4.935898780822754, 5.178799629211426, 5.421700477600098, 5.664601802825928, 5.9075026512146, 6.15040397644043, 6.393304824829102, 6.636205673217773, 6.879106521606445, 7.122007846832275]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 7.0, 4.0, 8.0, 6.0, 11.0, 13.0, 13.0, 14.0, 18.0, 22.0, 16.0, 31.0, 26.0, 30.0, 29.0, 42.0, 27.0, 28.0, 39.0, 37.0, 38.0, 45.0, 49.0, 38.0, 41.0, 28.0, 38.0, 37.0, 41.0, 41.0, 23.0, 21.0, 25.0, 26.0, 18.0, 19.0, 9.0, 11.0, 11.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.072776794433594, -7.809809684753418, -7.546842098236084, -7.283874988555908, -7.020907402038574, -6.757940292358398, -6.494973182678223, -6.232005596160889, -5.969038009643555, -5.706070899963379, -5.443103313446045, -5.180136203765869, -4.917168617248535, -4.654201507568359, -4.391234397888184, -4.12826681137085, -3.865299701690674, -3.602332353591919, -3.339365005493164, -3.0763978958129883, -2.8134303092956543, -2.5504631996154785, -2.2874958515167236, -2.0245285034179688, -1.7615611553192139, -1.498593807220459, -1.235626459121704, -0.9726592302322388, -0.7096918821334839, -0.446724534034729, -0.18375730514526367, 0.07921004295349121, 0.3421773910522461, 0.605144739151001, 0.8681120276451111, 1.1310793161392212, 1.394046664237976, 1.657014012336731, 1.9199812412261963, 2.182948589324951, 2.445915937423706, 2.708883285522461, 2.971850633621216, 3.2348179817199707, 3.4977850914001465, 3.7607526779174805, 4.023719787597656, 4.286686897277832, 4.549654483795166, 4.812621593475342, 5.075589179992676, 5.338556289672852, 5.6015238761901855, 5.864490985870361, 6.127458572387695, 6.390425682067871, 6.653392791748047, 6.916359901428223, 7.179327487945557, 7.442294597625732, 7.705262184143066, 7.968229293823242, 8.231196403503418, 8.494163513183594, 8.757131576538086]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 27.0, 44.0, 53.0, 111.0, 167.0, 259.0, 409.0, 726.0, 1113.0, 1902.0, 3114.0, 4905.0, 8250.0, 13421.0, 22077.0, 35381.0, 57423.0, 91219.0, 142091.0, 214527.0, 310892.0, 419515.0, 512880.0, 549256.0, 510015.0, 415673.0, 305555.0, 209431.0, 137638.0, 87592.0, 54458.0, 33164.0, 20404.0, 12031.0, 7428.0, 4380.0, 2647.0, 1582.0, 946.0, 625.0, 382.0, 238.0, 137.0, 88.0, 38.0, 28.0, 12.0, 7.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.921875, -5.733642578125, -5.54541015625, -5.357177734375, -5.1689453125, -4.980712890625, -4.79248046875, -4.604248046875, -4.416015625, -4.227783203125, -4.03955078125, -3.851318359375, -3.6630859375, -3.474853515625, -3.28662109375, -3.098388671875, -2.91015625, -2.721923828125, -2.53369140625, -2.345458984375, -2.1572265625, -1.968994140625, -1.78076171875, -1.592529296875, -1.404296875, -1.216064453125, -1.02783203125, -0.839599609375, -0.6513671875, -0.463134765625, -0.27490234375, -0.086669921875, 0.1015625, 0.289794921875, 0.47802734375, 0.666259765625, 0.8544921875, 1.042724609375, 1.23095703125, 1.419189453125, 1.607421875, 1.795654296875, 1.98388671875, 2.172119140625, 2.3603515625, 2.548583984375, 2.73681640625, 2.925048828125, 3.11328125, 3.301513671875, 3.48974609375, 3.677978515625, 3.8662109375, 4.054443359375, 4.24267578125, 4.430908203125, 4.619140625, 4.807373046875, 4.99560546875, 5.183837890625, 5.3720703125, 5.560302734375, 5.74853515625, 5.936767578125, 6.125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 3.0, 7.0, 15.0, 8.0, 16.0, 17.0, 16.0, 23.0, 19.0, 23.0, 31.0, 36.0, 32.0, 30.0, 34.0, 40.0, 30.0, 39.0, 47.0, 54.0, 36.0, 33.0, 36.0, 44.0, 43.0, 39.0, 27.0, 38.0, 25.0, 22.0, 32.0, 19.0, 21.0, 15.0, 13.0, 7.0, 5.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7734375, -5.58453369140625, -5.3956298828125, -5.20672607421875, -5.017822265625, -4.82891845703125, -4.6400146484375, -4.45111083984375, -4.26220703125, -4.07330322265625, -3.8843994140625, -3.69549560546875, -3.506591796875, -3.31768798828125, -3.1287841796875, -2.93988037109375, -2.7509765625, -2.56207275390625, -2.3731689453125, -2.18426513671875, -1.995361328125, -1.80645751953125, -1.6175537109375, -1.42864990234375, -1.23974609375, -1.05084228515625, -0.8619384765625, -0.67303466796875, -0.484130859375, -0.29522705078125, -0.1063232421875, 0.08258056640625, 0.271484375, 0.46038818359375, 0.6492919921875, 0.83819580078125, 1.027099609375, 1.21600341796875, 1.4049072265625, 1.59381103515625, 1.78271484375, 1.97161865234375, 2.1605224609375, 2.34942626953125, 2.538330078125, 2.72723388671875, 2.9161376953125, 3.10504150390625, 3.2939453125, 3.48284912109375, 3.6717529296875, 3.86065673828125, 4.049560546875, 4.23846435546875, 4.4273681640625, 4.61627197265625, 4.80517578125, 4.99407958984375, 5.1829833984375, 5.37188720703125, 5.560791015625, 5.74969482421875, 5.9385986328125, 6.12750244140625, 6.31640625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 14.0, 46.0, 74.0, 138.0, 285.0, 460.0, 840.0, 1538.0, 2738.0, 5111.0, 9224.0, 16474.0, 28424.0, 49403.0, 83600.0, 135133.0, 212145.0, 312334.0, 422144.0, 515785.0, 554884.0, 521337.0, 432298.0, 321517.0, 219883.0, 141813.0, 87237.0, 51559.0, 29683.0, 16948.0, 9417.0, 5214.0, 2985.0, 1598.0, 888.0, 531.0, 268.0, 137.0, 77.0, 40.0, 22.0, 20.0, 11.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.73931884765625, -5.5450439453125, -5.35076904296875, -5.156494140625, -4.96221923828125, -4.7679443359375, -4.57366943359375, -4.37939453125, -4.18511962890625, -3.9908447265625, -3.79656982421875, -3.602294921875, -3.40802001953125, -3.2137451171875, -3.01947021484375, -2.8251953125, -2.63092041015625, -2.4366455078125, -2.24237060546875, -2.048095703125, -1.85382080078125, -1.6595458984375, -1.46527099609375, -1.27099609375, -1.07672119140625, -0.8824462890625, -0.68817138671875, -0.493896484375, -0.29962158203125, -0.1053466796875, 0.08892822265625, 0.283203125, 0.47747802734375, 0.6717529296875, 0.86602783203125, 1.060302734375, 1.25457763671875, 1.4488525390625, 1.64312744140625, 1.83740234375, 2.03167724609375, 2.2259521484375, 2.42022705078125, 2.614501953125, 2.80877685546875, 3.0030517578125, 3.19732666015625, 3.3916015625, 3.58587646484375, 3.7801513671875, 3.97442626953125, 4.168701171875, 4.36297607421875, 4.5572509765625, 4.75152587890625, 4.94580078125, 5.14007568359375, 5.3343505859375, 5.52862548828125, 5.722900390625, 5.91717529296875, 6.1114501953125, 6.30572509765625, 6.5]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 9.0, 14.0, 19.0, 17.0, 20.0, 25.0, 28.0, 57.0, 49.0, 56.0, 76.0, 77.0, 91.0, 100.0, 104.0, 127.0, 138.0, 160.0, 162.0, 151.0, 174.0, 193.0, 176.0, 193.0, 191.0, 178.0, 155.0, 174.0, 146.0, 131.0, 123.0, 115.0, 90.0, 72.0, 79.0, 71.0, 51.0, 63.0, 42.0, 34.0, 23.0, 22.0, 20.0, 14.0, 20.0, 7.0, 9.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0], "bins": [-2.33984375, -2.266265869140625, -2.19268798828125, -2.119110107421875, -2.0455322265625, -1.971954345703125, -1.89837646484375, -1.824798583984375, -1.751220703125, -1.677642822265625, -1.60406494140625, -1.530487060546875, -1.4569091796875, -1.383331298828125, -1.30975341796875, -1.236175537109375, -1.16259765625, -1.089019775390625, -1.01544189453125, -0.941864013671875, -0.8682861328125, -0.794708251953125, -0.72113037109375, -0.647552490234375, -0.573974609375, -0.500396728515625, -0.42681884765625, -0.353240966796875, -0.2796630859375, -0.206085205078125, -0.13250732421875, -0.058929443359375, 0.0146484375, 0.088226318359375, 0.16180419921875, 0.235382080078125, 0.3089599609375, 0.382537841796875, 0.45611572265625, 0.529693603515625, 0.603271484375, 0.676849365234375, 0.75042724609375, 0.824005126953125, 0.8975830078125, 0.971160888671875, 1.04473876953125, 1.118316650390625, 1.19189453125, 1.265472412109375, 1.33905029296875, 1.412628173828125, 1.4862060546875, 1.559783935546875, 1.63336181640625, 1.706939697265625, 1.780517578125, 1.854095458984375, 1.92767333984375, 2.001251220703125, 2.0748291015625, 2.148406982421875, 2.22198486328125, 2.295562744140625, 2.369140625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 8.0, 7.0, 5.0, 13.0, 17.0, 16.0, 19.0, 29.0, 28.0, 23.0, 21.0, 41.0, 34.0, 36.0, 44.0, 39.0, 52.0, 42.0, 49.0, 53.0, 51.0, 28.0, 36.0, 42.0, 36.0, 35.0, 31.0, 27.0, 21.0, 24.0, 14.0, 12.0, 17.0, 18.0, 6.0, 4.0, 4.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0], "bins": [-8.455150604248047, -8.24014663696289, -8.025141716003418, -7.8101372718811035, -7.595132827758789, -7.380128860473633, -7.165124416351318, -6.950119972229004, -6.7351155281066895, -6.520111083984375, -6.3051066398620605, -6.090102195739746, -5.87509822845459, -5.660093307495117, -5.445089340209961, -5.2300848960876465, -5.015080451965332, -4.800076007843018, -4.585071563720703, -4.370067119598389, -4.155062675476074, -3.940058469772339, -3.7250542640686035, -3.510049819946289, -3.2950453758239746, -3.08004093170166, -2.8650364875793457, -2.6500322818756104, -2.435027837753296, -2.2200233936309814, -2.005019187927246, -1.7900147438049316, -1.5750102996826172, -1.3600058555603027, -1.1450015306472778, -0.9299971461296082, -0.7149927616119385, -0.499988317489624, -0.2849839925765991, -0.06997966766357422, 0.14502477645874023, 0.3600291609764099, 0.5750335454940796, 0.7900379300117493, 1.005042314529419, 1.2200467586517334, 1.4350510835647583, 1.6500554084777832, 1.8650598526000977, 2.080064296722412, 2.2950687408447266, 2.510072946548462, 2.7250773906707764, 2.940081834793091, 3.155086040496826, 3.3700904846191406, 3.585094928741455, 3.8000993728637695, 4.015103816986084, 4.230108261108398, 4.445112228393555, 4.660117149353027, 4.875121116638184, 5.090125560760498, 5.3051300048828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 6.0, 15.0, 10.0, 12.0, 11.0, 15.0, 20.0, 20.0, 19.0, 29.0, 29.0, 30.0, 34.0, 32.0, 30.0, 30.0, 32.0, 42.0, 41.0, 35.0, 35.0, 46.0, 36.0, 41.0, 36.0, 34.0, 27.0, 34.0, 29.0, 17.0, 17.0, 25.0, 23.0, 18.0, 15.0, 13.0, 15.0, 9.0, 5.0, 6.0, 4.0, 5.0, 6.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.844540119171143, -5.646524429321289, -5.448508262634277, -5.250492572784424, -5.05247688293457, -4.854460716247559, -4.656445026397705, -4.458429336547852, -4.26041316986084, -4.062397480010986, -3.8643813133239746, -3.666365623474121, -3.4683496952056885, -3.270333766937256, -3.0723180770874023, -2.8743021488189697, -2.676286220550537, -2.4782702922821045, -2.280254364013672, -2.0822386741638184, -1.8842227458953857, -1.6862068176269531, -1.48819100856781, -1.290175199508667, -1.0921592712402344, -0.8941434025764465, -0.6961275339126587, -0.49811166524887085, -0.300095796585083, -0.10207992792129517, 0.09593594074249268, 0.29395174980163574, 0.49196720123291016, 0.689983069896698, 0.8879989385604858, 1.086014747619629, 1.2840306758880615, 1.4820466041564941, 1.6800624132156372, 1.8780782222747803, 2.076094150543213, 2.2741100788116455, 2.472126007080078, 2.6701416969299316, 2.8681576251983643, 3.066173553466797, 3.2641892433166504, 3.462205171585083, 3.6602210998535156, 3.8582370281219482, 4.056252956390381, 4.254268646240234, 4.452284812927246, 4.6503005027771, 4.848316192626953, 5.046332359313965, 5.244348049163818, 5.442363739013672, 5.640379905700684, 5.838395595550537, 6.036411285400391, 6.234427452087402, 6.432443141937256, 6.630458831787109, 6.828474998474121]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 4.0, 5.0, 6.0, 13.0, 19.0, 32.0, 35.0, 48.0, 78.0, 92.0, 129.0, 191.0, 264.0, 406.0, 628.0, 907.0, 1614.0, 2726.0, 5006.0, 9125.0, 17896.0, 38153.0, 87868.0, 203328.0, 314818.0, 201427.0, 86826.0, 37860.0, 17842.0, 9213.0, 4822.0, 2693.0, 1547.0, 965.0, 632.0, 368.0, 283.0, 192.0, 144.0, 97.0, 68.0, 44.0, 43.0, 28.0, 21.0, 19.0, 13.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.98046875, -4.817138671875, -4.65380859375, -4.490478515625, -4.3271484375, -4.163818359375, -4.00048828125, -3.837158203125, -3.673828125, -3.510498046875, -3.34716796875, -3.183837890625, -3.0205078125, -2.857177734375, -2.69384765625, -2.530517578125, -2.3671875, -2.203857421875, -2.04052734375, -1.877197265625, -1.7138671875, -1.550537109375, -1.38720703125, -1.223876953125, -1.060546875, -0.897216796875, -0.73388671875, -0.570556640625, -0.4072265625, -0.243896484375, -0.08056640625, 0.082763671875, 0.24609375, 0.409423828125, 0.57275390625, 0.736083984375, 0.8994140625, 1.062744140625, 1.22607421875, 1.389404296875, 1.552734375, 1.716064453125, 1.87939453125, 2.042724609375, 2.2060546875, 2.369384765625, 2.53271484375, 2.696044921875, 2.859375, 3.022705078125, 3.18603515625, 3.349365234375, 3.5126953125, 3.676025390625, 3.83935546875, 4.002685546875, 4.166015625, 4.329345703125, 4.49267578125, 4.656005859375, 4.8193359375, 4.982666015625, 5.14599609375, 5.309326171875, 5.47265625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 4.0, 10.0, 16.0, 19.0, 11.0, 17.0, 24.0, 25.0, 26.0, 31.0, 33.0, 29.0, 43.0, 33.0, 49.0, 47.0, 37.0, 38.0, 50.0, 50.0, 47.0, 53.0, 50.0, 23.0, 27.0, 25.0, 23.0, 22.0, 20.0, 17.0, 24.0, 15.0, 13.0, 10.0, 7.0, 12.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.5146484375, -6.279296875, -6.0439453125, -5.80859375, -5.5732421875, -5.337890625, -5.1025390625, -4.8671875, -4.6318359375, -4.396484375, -4.1611328125, -3.92578125, -3.6904296875, -3.455078125, -3.2197265625, -2.984375, -2.7490234375, -2.513671875, -2.2783203125, -2.04296875, -1.8076171875, -1.572265625, -1.3369140625, -1.1015625, -0.8662109375, -0.630859375, -0.3955078125, -0.16015625, 0.0751953125, 0.310546875, 0.5458984375, 0.78125, 1.0166015625, 1.251953125, 1.4873046875, 1.72265625, 1.9580078125, 2.193359375, 2.4287109375, 2.6640625, 2.8994140625, 3.134765625, 3.3701171875, 3.60546875, 3.8408203125, 4.076171875, 4.3115234375, 4.546875, 4.7822265625, 5.017578125, 5.2529296875, 5.48828125, 5.7236328125, 5.958984375, 6.1943359375, 6.4296875, 6.6650390625, 6.900390625, 7.1357421875, 7.37109375, 7.6064453125, 7.841796875, 8.0771484375, 8.3125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 9.0, 2.0, 7.0, 16.0, 25.0, 27.0, 49.0, 66.0, 107.0, 146.0, 258.0, 306.0, 477.0, 703.0, 1140.0, 1769.0, 2843.0, 4743.0, 8378.0, 15658.0, 30501.0, 63207.0, 134710.0, 268071.0, 260065.0, 129856.0, 59985.0, 29652.0, 15223.0, 8131.0, 4647.0, 2800.0, 1793.0, 1047.0, 697.0, 446.0, 307.0, 208.0, 141.0, 116.0, 76.0, 43.0, 40.0, 20.0, 16.0, 11.0, 8.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.41796875, -4.27978515625, -4.1416015625, -4.00341796875, -3.865234375, -3.72705078125, -3.5888671875, -3.45068359375, -3.3125, -3.17431640625, -3.0361328125, -2.89794921875, -2.759765625, -2.62158203125, -2.4833984375, -2.34521484375, -2.20703125, -2.06884765625, -1.9306640625, -1.79248046875, -1.654296875, -1.51611328125, -1.3779296875, -1.23974609375, -1.1015625, -0.96337890625, -0.8251953125, -0.68701171875, -0.548828125, -0.41064453125, -0.2724609375, -0.13427734375, 0.00390625, 0.14208984375, 0.2802734375, 0.41845703125, 0.556640625, 0.69482421875, 0.8330078125, 0.97119140625, 1.109375, 1.24755859375, 1.3857421875, 1.52392578125, 1.662109375, 1.80029296875, 1.9384765625, 2.07666015625, 2.21484375, 2.35302734375, 2.4912109375, 2.62939453125, 2.767578125, 2.90576171875, 3.0439453125, 3.18212890625, 3.3203125, 3.45849609375, 3.5966796875, 3.73486328125, 3.873046875, 4.01123046875, 4.1494140625, 4.28759765625, 4.42578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 9.0, 5.0, 15.0, 14.0, 12.0, 12.0, 18.0, 21.0, 22.0, 26.0, 29.0, 39.0, 31.0, 30.0, 39.0, 39.0, 58.0, 50.0, 40.0, 44.0, 46.0, 35.0, 49.0, 23.0, 35.0, 42.0, 29.0, 29.0, 23.0, 21.0, 18.0, 15.0, 14.0, 12.0, 10.0, 12.0, 4.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.654052734375, -4.48779296875, -4.321533203125, -4.1552734375, -3.989013671875, -3.82275390625, -3.656494140625, -3.490234375, -3.323974609375, -3.15771484375, -2.991455078125, -2.8251953125, -2.658935546875, -2.49267578125, -2.326416015625, -2.16015625, -1.993896484375, -1.82763671875, -1.661376953125, -1.4951171875, -1.328857421875, -1.16259765625, -0.996337890625, -0.830078125, -0.663818359375, -0.49755859375, -0.331298828125, -0.1650390625, 0.001220703125, 0.16748046875, 0.333740234375, 0.5, 0.666259765625, 0.83251953125, 0.998779296875, 1.1650390625, 1.331298828125, 1.49755859375, 1.663818359375, 1.830078125, 1.996337890625, 2.16259765625, 2.328857421875, 2.4951171875, 2.661376953125, 2.82763671875, 2.993896484375, 3.16015625, 3.326416015625, 3.49267578125, 3.658935546875, 3.8251953125, 3.991455078125, 4.15771484375, 4.323974609375, 4.490234375, 4.656494140625, 4.82275390625, 4.989013671875, 5.1552734375, 5.321533203125, 5.48779296875, 5.654052734375, 5.8203125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 10.0, 8.0, 23.0, 27.0, 29.0, 44.0, 64.0, 71.0, 119.0, 124.0, 220.0, 294.0, 467.0, 704.0, 1076.0, 1890.0, 3328.0, 6422.0, 14407.0, 38550.0, 133476.0, 449396.0, 280903.0, 71967.0, 23807.0, 9884.0, 4665.0, 2495.0, 1406.0, 842.0, 545.0, 385.0, 248.0, 166.0, 151.0, 87.0, 63.0, 56.0, 36.0, 22.0, 21.0, 14.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.125, -2.060150146484375, -1.99530029296875, -1.930450439453125, -1.8656005859375, -1.800750732421875, -1.73590087890625, -1.671051025390625, -1.606201171875, -1.541351318359375, -1.47650146484375, -1.411651611328125, -1.3468017578125, -1.281951904296875, -1.21710205078125, -1.152252197265625, -1.08740234375, -1.022552490234375, -0.95770263671875, -0.892852783203125, -0.8280029296875, -0.763153076171875, -0.69830322265625, -0.633453369140625, -0.568603515625, -0.503753662109375, -0.43890380859375, -0.374053955078125, -0.3092041015625, -0.244354248046875, -0.17950439453125, -0.114654541015625, -0.0498046875, 0.015045166015625, 0.07989501953125, 0.144744873046875, 0.2095947265625, 0.274444580078125, 0.33929443359375, 0.404144287109375, 0.468994140625, 0.533843994140625, 0.59869384765625, 0.663543701171875, 0.7283935546875, 0.793243408203125, 0.85809326171875, 0.922943115234375, 0.98779296875, 1.052642822265625, 1.11749267578125, 1.182342529296875, 1.2471923828125, 1.312042236328125, 1.37689208984375, 1.441741943359375, 1.506591796875, 1.571441650390625, 1.63629150390625, 1.701141357421875, 1.7659912109375, 1.830841064453125, 1.89569091796875, 1.960540771484375, 2.025390625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 1.0, 2.0, 2.0, 6.0, 6.0, 14.0, 21.0, 23.0, 40.0, 44.0, 56.0, 94.0, 92.0, 114.0, 117.0, 87.0, 71.0, 63.0, 39.0, 32.0, 18.0, 12.0, 9.0, 11.0, 6.0, 5.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000286102294921875, -0.00027739256620407104, -0.0002686828374862671, -0.00025997310876846313, -0.0002512633800506592, -0.00024255365133285522, -0.00023384392261505127, -0.00022513419389724731, -0.00021642446517944336, -0.0002077147364616394, -0.00019900500774383545, -0.0001902952790260315, -0.00018158555030822754, -0.00017287582159042358, -0.00016416609287261963, -0.00015545636415481567, -0.00014674663543701172, -0.00013803690671920776, -0.0001293271780014038, -0.00012061744928359985, -0.0001119077205657959, -0.00010319799184799194, -9.448826313018799e-05, -8.577853441238403e-05, -7.706880569458008e-05, -6.835907697677612e-05, -5.964934825897217e-05, -5.093961954116821e-05, -4.222989082336426e-05, -3.35201621055603e-05, -2.4810433387756348e-05, -1.6100704669952393e-05, -7.3909759521484375e-06, 1.3187527656555176e-06, 1.0028481483459473e-05, 1.8738210201263428e-05, 2.7447938919067383e-05, 3.615766763687134e-05, 4.486739635467529e-05, 5.357712507247925e-05, 6.22868537902832e-05, 7.099658250808716e-05, 7.970631122589111e-05, 8.841603994369507e-05, 9.712576866149902e-05, 0.00010583549737930298, 0.00011454522609710693, 0.0001232549548149109, 0.00013196468353271484, 0.0001406744122505188, 0.00014938414096832275, 0.0001580938696861267, 0.00016680359840393066, 0.00017551332712173462, 0.00018422305583953857, 0.00019293278455734253, 0.00020164251327514648, 0.00021035224199295044, 0.0002190619707107544, 0.00022777169942855835, 0.0002364814281463623, 0.00024519115686416626, 0.0002539008855819702, 0.00026261061429977417, 0.0002713203430175781]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 9.0, 10.0, 10.0, 22.0, 15.0, 16.0, 24.0, 36.0, 61.0, 82.0, 124.0, 164.0, 205.0, 279.0, 396.0, 522.0, 715.0, 1081.0, 1525.0, 2449.0, 4024.0, 7335.0, 14552.0, 29786.0, 63854.0, 135293.0, 257002.0, 259982.0, 138892.0, 64920.0, 30834.0, 14785.0, 7415.0, 4194.0, 2533.0, 1575.0, 1060.0, 749.0, 558.0, 379.0, 271.0, 206.0, 187.0, 113.0, 90.0, 61.0, 48.0, 41.0, 29.0, 21.0, 7.0, 13.0, 3.0, 5.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.5224609375, -1.47174072265625, -1.4210205078125, -1.37030029296875, -1.319580078125, -1.26885986328125, -1.2181396484375, -1.16741943359375, -1.11669921875, -1.06597900390625, -1.0152587890625, -0.96453857421875, -0.913818359375, -0.86309814453125, -0.8123779296875, -0.76165771484375, -0.7109375, -0.66021728515625, -0.6094970703125, -0.55877685546875, -0.508056640625, -0.45733642578125, -0.4066162109375, -0.35589599609375, -0.30517578125, -0.25445556640625, -0.2037353515625, -0.15301513671875, -0.102294921875, -0.05157470703125, -0.0008544921875, 0.04986572265625, 0.1005859375, 0.15130615234375, 0.2020263671875, 0.25274658203125, 0.303466796875, 0.35418701171875, 0.4049072265625, 0.45562744140625, 0.50634765625, 0.55706787109375, 0.6077880859375, 0.65850830078125, 0.709228515625, 0.75994873046875, 0.8106689453125, 0.86138916015625, 0.912109375, 0.96282958984375, 1.0135498046875, 1.06427001953125, 1.114990234375, 1.16571044921875, 1.2164306640625, 1.26715087890625, 1.31787109375, 1.36859130859375, 1.4193115234375, 1.47003173828125, 1.520751953125, 1.57147216796875, 1.6221923828125, 1.67291259765625, 1.7236328125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 7.0, 3.0, 2.0, 3.0, 7.0, 9.0, 8.0, 13.0, 10.0, 15.0, 21.0, 25.0, 37.0, 40.0, 60.0, 79.0, 101.0, 79.0, 90.0, 85.0, 68.0, 59.0, 41.0, 36.0, 26.0, 14.0, 14.0, 7.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.445556640625, -0.4300956726074219, -0.41463470458984375, -0.3991737365722656, -0.3837127685546875, -0.3682518005371094, -0.35279083251953125, -0.3373298645019531, -0.321868896484375, -0.3064079284667969, -0.29094696044921875, -0.2754859924316406, -0.2600250244140625, -0.24456405639648438, -0.22910308837890625, -0.21364212036132812, -0.19818115234375, -0.18272018432617188, -0.16725921630859375, -0.15179824829101562, -0.1363372802734375, -0.12087631225585938, -0.10541534423828125, -0.08995437622070312, -0.074493408203125, -0.059032440185546875, -0.04357147216796875, -0.028110504150390625, -0.0126495361328125, 0.002811431884765625, 0.01827239990234375, 0.033733367919921875, 0.0491943359375, 0.06465530395507812, 0.08011627197265625, 0.09557723999023438, 0.1110382080078125, 0.12649917602539062, 0.14196014404296875, 0.15742111206054688, 0.172882080078125, 0.18834304809570312, 0.20380401611328125, 0.21926498413085938, 0.2347259521484375, 0.2501869201660156, 0.26564788818359375, 0.2811088562011719, 0.29656982421875, 0.3120307922363281, 0.32749176025390625, 0.3429527282714844, 0.3584136962890625, 0.3738746643066406, 0.38933563232421875, 0.4047966003417969, 0.420257568359375, 0.4357185363769531, 0.45117950439453125, 0.4666404724121094, 0.4821014404296875, 0.4975624084472656, 0.5130233764648438, 0.5284843444824219, 0.5439453125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 8.0, 3.0, 5.0, 9.0, 17.0, 7.0, 12.0, 18.0, 21.0, 23.0, 21.0, 30.0, 38.0, 27.0, 28.0, 36.0, 44.0, 35.0, 58.0, 43.0, 58.0, 35.0, 32.0, 49.0, 32.0, 33.0, 42.0, 32.0, 35.0, 35.0, 18.0, 16.0, 20.0, 16.0, 10.0, 13.0, 9.0, 12.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-7.860047340393066, -7.652993679046631, -7.445939540863037, -7.238885879516602, -7.031831741333008, -6.824778079986572, -6.617724418640137, -6.410670280456543, -6.203616142272949, -5.996562480926514, -5.78950834274292, -5.582454681396484, -5.375400543212891, -5.168346881866455, -4.9612932205200195, -4.754239082336426, -4.54718542098999, -4.340131759643555, -4.133077621459961, -3.9260239601135254, -3.7189698219299316, -3.511916160583496, -3.3048622608184814, -3.097808361053467, -2.890754461288452, -2.6837005615234375, -2.476646661758423, -2.269592761993408, -2.0625391006469727, -1.8554850816726685, -1.6484313011169434, -1.4413774013519287, -1.234323501586914, -1.0272696018218994, -0.8202157616615295, -0.6131619215011597, -0.406108021736145, -0.19905412197113037, 0.007999658584594727, 0.21505355834960938, 0.422107458114624, 0.6291613578796387, 0.8362151980400085, 1.0432690382003784, 1.250322937965393, 1.4573768377304077, 1.6644306182861328, 1.8714845180511475, 2.078538417816162, 2.2855923175811768, 2.4926462173461914, 2.699699878692627, 2.9067540168762207, 3.1138076782226562, 3.320861577987671, 3.5279154777526855, 3.7349693775177, 3.942023277282715, 4.14907693862915, 4.356131076812744, 4.56318473815918, 4.770238876342773, 4.977292537689209, 5.1843461990356445, 5.391400337219238]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 5.0, 13.0, 10.0, 15.0, 13.0, 20.0, 16.0, 21.0, 26.0, 31.0, 30.0, 31.0, 27.0, 41.0, 28.0, 35.0, 38.0, 39.0, 37.0, 32.0, 44.0, 42.0, 37.0, 48.0, 34.0, 28.0, 33.0, 30.0, 19.0, 23.0, 21.0, 17.0, 19.0, 19.0, 13.0, 18.0, 8.0, 3.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.081484794616699, -5.878680229187012, -5.675875663757324, -5.473071575164795, -5.270267009735107, -5.06746244430542, -4.864658355712891, -4.661853790283203, -4.459049224853516, -4.256244659423828, -4.053440093994141, -3.8506360054016113, -3.647831439971924, -3.4450268745422363, -3.242222547531128, -3.0394182205200195, -2.836613655090332, -2.6338090896606445, -2.431004762649536, -2.2282004356384277, -2.0253958702087402, -1.8225914239883423, -1.6197869777679443, -1.4169825315475464, -1.2141780853271484, -1.0113736391067505, -0.8085691928863525, -0.6057647466659546, -0.40296030044555664, -0.2001558542251587, 0.002648591995239258, 0.2054530382156372, 0.40825700759887695, 0.6110614538192749, 0.8138659000396729, 1.0166703462600708, 1.2194747924804688, 1.4222792387008667, 1.6250836849212646, 1.8278881311416626, 2.0306925773620605, 2.233497142791748, 2.4363014698028564, 2.639105796813965, 2.8419103622436523, 3.04471492767334, 3.2475192546844482, 3.4503235816955566, 3.653128147125244, 3.8559327125549316, 4.058736801147461, 4.261541366577148, 4.464345932006836, 4.667150497436523, 4.869955062866211, 5.07275915145874, 5.275563716888428, 5.478368282318115, 5.6811723709106445, 5.883976936340332, 6.0867815017700195, 6.289586067199707, 6.4923906326293945, 6.695194721221924, 6.897999286651611]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 2.0, 3.0, 13.0, 20.0, 21.0, 36.0, 54.0, 74.0, 151.0, 249.0, 384.0, 572.0, 888.0, 1377.0, 2075.0, 3233.0, 4985.0, 7645.0, 11464.0, 17669.0, 26127.0, 38172.0, 54058.0, 72846.0, 93122.0, 110361.0, 118361.0, 114424.0, 99391.0, 79837.0, 59853.0, 42874.0, 29599.0, 20275.0, 13269.0, 8781.0, 5599.0, 3773.0, 2448.0, 1612.0, 985.0, 660.0, 436.0, 287.0, 175.0, 105.0, 87.0, 45.0, 28.0, 26.0, 13.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.98046875, -5.77886962890625, -5.5772705078125, -5.37567138671875, -5.174072265625, -4.97247314453125, -4.7708740234375, -4.56927490234375, -4.36767578125, -4.16607666015625, -3.9644775390625, -3.76287841796875, -3.561279296875, -3.35968017578125, -3.1580810546875, -2.95648193359375, -2.7548828125, -2.55328369140625, -2.3516845703125, -2.15008544921875, -1.948486328125, -1.74688720703125, -1.5452880859375, -1.34368896484375, -1.14208984375, -0.94049072265625, -0.7388916015625, -0.53729248046875, -0.335693359375, -0.13409423828125, 0.0675048828125, 0.26910400390625, 0.470703125, 0.67230224609375, 0.8739013671875, 1.07550048828125, 1.277099609375, 1.47869873046875, 1.6802978515625, 1.88189697265625, 2.08349609375, 2.28509521484375, 2.4866943359375, 2.68829345703125, 2.889892578125, 3.09149169921875, 3.2930908203125, 3.49468994140625, 3.6962890625, 3.89788818359375, 4.0994873046875, 4.30108642578125, 4.502685546875, 4.70428466796875, 4.9058837890625, 5.10748291015625, 5.30908203125, 5.51068115234375, 5.7122802734375, 5.91387939453125, 6.115478515625, 6.31707763671875, 6.5186767578125, 6.72027587890625, 6.921875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 5.0, 5.0, 7.0, 10.0, 12.0, 19.0, 14.0, 16.0, 18.0, 21.0, 13.0, 23.0, 18.0, 33.0, 33.0, 40.0, 44.0, 35.0, 41.0, 37.0, 38.0, 37.0, 41.0, 50.0, 53.0, 33.0, 38.0, 31.0, 37.0, 14.0, 18.0, 23.0, 26.0, 24.0, 19.0, 18.0, 13.0, 8.0, 7.0, 12.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.69921875, -5.49676513671875, -5.2943115234375, -5.09185791015625, -4.889404296875, -4.68695068359375, -4.4844970703125, -4.28204345703125, -4.07958984375, -3.87713623046875, -3.6746826171875, -3.47222900390625, -3.269775390625, -3.06732177734375, -2.8648681640625, -2.66241455078125, -2.4599609375, -2.25750732421875, -2.0550537109375, -1.85260009765625, -1.650146484375, -1.44769287109375, -1.2452392578125, -1.04278564453125, -0.84033203125, -0.63787841796875, -0.4354248046875, -0.23297119140625, -0.030517578125, 0.17193603515625, 0.3743896484375, 0.57684326171875, 0.779296875, 0.98175048828125, 1.1842041015625, 1.38665771484375, 1.589111328125, 1.79156494140625, 1.9940185546875, 2.19647216796875, 2.39892578125, 2.60137939453125, 2.8038330078125, 3.00628662109375, 3.208740234375, 3.41119384765625, 3.6136474609375, 3.81610107421875, 4.0185546875, 4.22100830078125, 4.4234619140625, 4.62591552734375, 4.828369140625, 5.03082275390625, 5.2332763671875, 5.43572998046875, 5.63818359375, 5.84063720703125, 6.0430908203125, 6.24554443359375, 6.447998046875, 6.65045166015625, 6.8529052734375, 7.05535888671875, 7.2578125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 13.0, 14.0, 15.0, 33.0, 48.0, 58.0, 88.0, 169.0, 248.0, 390.0, 645.0, 933.0, 1494.0, 2386.0, 3960.0, 6423.0, 10240.0, 16329.0, 25033.0, 38327.0, 55614.0, 76587.0, 99278.0, 118077.0, 125707.0, 118652.0, 100884.0, 78923.0, 57271.0, 39365.0, 26182.0, 16862.0, 10647.0, 6673.0, 4171.0, 2582.0, 1584.0, 962.0, 607.0, 402.0, 245.0, 168.0, 76.0, 75.0, 32.0, 33.0, 16.0, 11.0, 13.0, 10.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.4609375, -6.268310546875, -6.07568359375, -5.883056640625, -5.6904296875, -5.497802734375, -5.30517578125, -5.112548828125, -4.919921875, -4.727294921875, -4.53466796875, -4.342041015625, -4.1494140625, -3.956787109375, -3.76416015625, -3.571533203125, -3.37890625, -3.186279296875, -2.99365234375, -2.801025390625, -2.6083984375, -2.415771484375, -2.22314453125, -2.030517578125, -1.837890625, -1.645263671875, -1.45263671875, -1.260009765625, -1.0673828125, -0.874755859375, -0.68212890625, -0.489501953125, -0.296875, -0.104248046875, 0.08837890625, 0.281005859375, 0.4736328125, 0.666259765625, 0.85888671875, 1.051513671875, 1.244140625, 1.436767578125, 1.62939453125, 1.822021484375, 2.0146484375, 2.207275390625, 2.39990234375, 2.592529296875, 2.78515625, 2.977783203125, 3.17041015625, 3.363037109375, 3.5556640625, 3.748291015625, 3.94091796875, 4.133544921875, 4.326171875, 4.518798828125, 4.71142578125, 4.904052734375, 5.0966796875, 5.289306640625, 5.48193359375, 5.674560546875, 5.8671875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 4.0, 7.0, 11.0, 8.0, 12.0, 17.0, 15.0, 17.0, 22.0, 27.0, 15.0, 21.0, 18.0, 29.0, 26.0, 22.0, 31.0, 33.0, 26.0, 31.0, 33.0, 35.0, 38.0, 40.0, 33.0, 48.0, 27.0, 36.0, 39.0, 30.0, 20.0, 31.0, 16.0, 27.0, 22.0, 12.0, 20.0, 10.0, 14.0, 6.0, 9.0, 13.0, 5.0, 6.0, 11.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.623046875, -3.510498046875, -3.39794921875, -3.285400390625, -3.1728515625, -3.060302734375, -2.94775390625, -2.835205078125, -2.72265625, -2.610107421875, -2.49755859375, -2.385009765625, -2.2724609375, -2.159912109375, -2.04736328125, -1.934814453125, -1.822265625, -1.709716796875, -1.59716796875, -1.484619140625, -1.3720703125, -1.259521484375, -1.14697265625, -1.034423828125, -0.921875, -0.809326171875, -0.69677734375, -0.584228515625, -0.4716796875, -0.359130859375, -0.24658203125, -0.134033203125, -0.021484375, 0.091064453125, 0.20361328125, 0.316162109375, 0.4287109375, 0.541259765625, 0.65380859375, 0.766357421875, 0.87890625, 0.991455078125, 1.10400390625, 1.216552734375, 1.3291015625, 1.441650390625, 1.55419921875, 1.666748046875, 1.779296875, 1.891845703125, 2.00439453125, 2.116943359375, 2.2294921875, 2.342041015625, 2.45458984375, 2.567138671875, 2.6796875, 2.792236328125, 2.90478515625, 3.017333984375, 3.1298828125, 3.242431640625, 3.35498046875, 3.467529296875, 3.580078125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 10.0, 22.0, 34.0, 43.0, 79.0, 88.0, 126.0, 222.0, 296.0, 408.0, 592.0, 881.0, 1298.0, 2082.0, 3162.0, 5043.0, 7792.0, 13233.0, 22418.0, 39640.0, 69585.0, 118601.0, 175295.0, 195425.0, 156233.0, 98996.0, 56521.0, 32015.0, 18502.0, 10965.0, 6704.0, 4113.0, 2636.0, 1861.0, 1109.0, 833.0, 554.0, 356.0, 245.0, 168.0, 124.0, 85.0, 58.0, 40.0, 20.0, 16.0, 13.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.1070556640625, -4.932861328125, -4.7586669921875, -4.58447265625, -4.4102783203125, -4.236083984375, -4.0618896484375, -3.8876953125, -3.7135009765625, -3.539306640625, -3.3651123046875, -3.19091796875, -3.0167236328125, -2.842529296875, -2.6683349609375, -2.494140625, -2.3199462890625, -2.145751953125, -1.9715576171875, -1.79736328125, -1.6231689453125, -1.448974609375, -1.2747802734375, -1.1005859375, -0.9263916015625, -0.752197265625, -0.5780029296875, -0.40380859375, -0.2296142578125, -0.055419921875, 0.1187744140625, 0.29296875, 0.4671630859375, 0.641357421875, 0.8155517578125, 0.98974609375, 1.1639404296875, 1.338134765625, 1.5123291015625, 1.6865234375, 1.8607177734375, 2.034912109375, 2.2091064453125, 2.38330078125, 2.5574951171875, 2.731689453125, 2.9058837890625, 3.080078125, 3.2542724609375, 3.428466796875, 3.6026611328125, 3.77685546875, 3.9510498046875, 4.125244140625, 4.2994384765625, 4.4736328125, 4.6478271484375, 4.822021484375, 4.9962158203125, 5.17041015625, 5.3446044921875, 5.518798828125, 5.6929931640625, 5.8671875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 14.0, 14.0, 23.0, 20.0, 42.0, 38.0, 73.0, 73.0, 103.0, 110.0, 84.0, 81.0, 81.0, 51.0, 42.0, 44.0, 16.0, 21.0, 9.0, 12.0, 7.0, 0.0, 3.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0006756782531738281, -0.0006514415144920349, -0.0006272047758102417, -0.0006029680371284485, -0.0005787312984466553, -0.0005544945597648621, -0.0005302578210830688, -0.0005060210824012756, -0.0004817843437194824, -0.0004575476050376892, -0.000433310866355896, -0.0004090741276741028, -0.00038483738899230957, -0.00036060065031051636, -0.00033636391162872314, -0.00031212717294692993, -0.0002878904342651367, -0.0002636536955833435, -0.0002394169569015503, -0.00021518021821975708, -0.00019094347953796387, -0.00016670674085617065, -0.00014247000217437744, -0.00011823326349258423, -9.399652481079102e-05, -6.97597861289978e-05, -4.552304744720459e-05, -2.1286308765411377e-05, 2.950429916381836e-06, 2.718716859817505e-05, 5.142390727996826e-05, 7.566064596176147e-05, 9.989738464355469e-05, 0.0001241341233253479, 0.0001483708620071411, 0.00017260760068893433, 0.00019684433937072754, 0.00022108107805252075, 0.00024531781673431396, 0.0002695545554161072, 0.0002937912940979004, 0.0003180280327796936, 0.0003422647714614868, 0.00036650151014328003, 0.00039073824882507324, 0.00041497498750686646, 0.00043921172618865967, 0.0004634484648704529, 0.0004876852035522461, 0.0005119219422340393, 0.0005361586809158325, 0.0005603954195976257, 0.0005846321582794189, 0.0006088688969612122, 0.0006331056356430054, 0.0006573423743247986, 0.0006815791130065918, 0.000705815851688385, 0.0007300525903701782, 0.0007542893290519714, 0.0007785260677337646, 0.0008027628064155579, 0.0008269995450973511, 0.0008512362837791443, 0.0008754730224609375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 6.0, 14.0, 16.0, 24.0, 34.0, 67.0, 110.0, 195.0, 269.0, 467.0, 761.0, 1331.0, 2188.0, 3681.0, 6487.0, 10809.0, 18712.0, 32730.0, 55909.0, 91564.0, 136814.0, 172101.0, 169960.0, 131984.0, 86580.0, 52615.0, 30614.0, 17700.0, 10216.0, 5899.0, 3498.0, 2111.0, 1199.0, 738.0, 434.0, 280.0, 166.0, 112.0, 64.0, 41.0, 28.0, 14.0, 10.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.15234375, -5.00054931640625, -4.8487548828125, -4.69696044921875, -4.545166015625, -4.39337158203125, -4.2415771484375, -4.08978271484375, -3.93798828125, -3.78619384765625, -3.6343994140625, -3.48260498046875, -3.330810546875, -3.17901611328125, -3.0272216796875, -2.87542724609375, -2.7236328125, -2.57183837890625, -2.4200439453125, -2.26824951171875, -2.116455078125, -1.96466064453125, -1.8128662109375, -1.66107177734375, -1.50927734375, -1.35748291015625, -1.2056884765625, -1.05389404296875, -0.902099609375, -0.75030517578125, -0.5985107421875, -0.44671630859375, -0.294921875, -0.14312744140625, 0.0086669921875, 0.16046142578125, 0.312255859375, 0.46405029296875, 0.6158447265625, 0.76763916015625, 0.91943359375, 1.07122802734375, 1.2230224609375, 1.37481689453125, 1.526611328125, 1.67840576171875, 1.8302001953125, 1.98199462890625, 2.1337890625, 2.28558349609375, 2.4373779296875, 2.58917236328125, 2.740966796875, 2.89276123046875, 3.0445556640625, 3.19635009765625, 3.34814453125, 3.49993896484375, 3.6517333984375, 3.80352783203125, 3.955322265625, 4.10711669921875, 4.2589111328125, 4.41070556640625, 4.5625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 5.0, 8.0, 7.0, 2.0, 13.0, 8.0, 13.0, 13.0, 27.0, 30.0, 37.0, 27.0, 40.0, 39.0, 43.0, 49.0, 67.0, 61.0, 46.0, 51.0, 37.0, 61.0, 51.0, 41.0, 34.0, 39.0, 20.0, 29.0, 22.0, 22.0, 11.0, 8.0, 7.0, 5.0, 10.0, 2.0, 9.0, 0.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.439453125, -1.38922119140625, -1.3389892578125, -1.28875732421875, -1.238525390625, -1.18829345703125, -1.1380615234375, -1.08782958984375, -1.03759765625, -0.98736572265625, -0.9371337890625, -0.88690185546875, -0.836669921875, -0.78643798828125, -0.7362060546875, -0.68597412109375, -0.6357421875, -0.58551025390625, -0.5352783203125, -0.48504638671875, -0.434814453125, -0.38458251953125, -0.3343505859375, -0.28411865234375, -0.23388671875, -0.18365478515625, -0.1334228515625, -0.08319091796875, -0.032958984375, 0.01727294921875, 0.0675048828125, 0.11773681640625, 0.16796875, 0.21820068359375, 0.2684326171875, 0.31866455078125, 0.368896484375, 0.41912841796875, 0.4693603515625, 0.51959228515625, 0.56982421875, 0.62005615234375, 0.6702880859375, 0.72052001953125, 0.770751953125, 0.82098388671875, 0.8712158203125, 0.92144775390625, 0.9716796875, 1.02191162109375, 1.0721435546875, 1.12237548828125, 1.172607421875, 1.22283935546875, 1.2730712890625, 1.32330322265625, 1.37353515625, 1.42376708984375, 1.4739990234375, 1.52423095703125, 1.574462890625, 1.62469482421875, 1.6749267578125, 1.72515869140625, 1.775390625]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 5.0, 10.0, 10.0, 17.0, 17.0, 22.0, 20.0, 12.0, 26.0, 27.0, 28.0, 39.0, 37.0, 47.0, 28.0, 44.0, 40.0, 38.0, 45.0, 45.0, 35.0, 43.0, 33.0, 27.0, 47.0, 34.0, 24.0, 31.0, 26.0, 22.0, 20.0, 20.0, 16.0, 8.0, 5.0, 5.0, 12.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.479530334472656, -6.284248352050781, -6.088966369628906, -5.893684387207031, -5.698402404785156, -5.503120422363281, -5.307838439941406, -5.112556457519531, -4.917274475097656, -4.721992492675781, -4.526710510253906, -4.331428527832031, -4.136146545410156, -3.9408645629882812, -3.7455828189849854, -3.5503008365631104, -3.3550190925598145, -3.1597371101379395, -2.9644551277160645, -2.7691731452941895, -2.5738911628723145, -2.3786091804504395, -2.1833274364471436, -1.9880454540252686, -1.7927634716033936, -1.5974814891815186, -1.4021995067596436, -1.206917643547058, -1.011635661125183, -0.8163536787033081, -0.6210718154907227, -0.42578983306884766, -0.23050785064697266, -0.035225898027420044, 0.16005605459213257, 0.3553379774093628, 0.5506199598312378, 0.7459019422531128, 0.9411838054656982, 1.1364657878875732, 1.3317477703094482, 1.5270297527313232, 1.7223117351531982, 1.9175935983657837, 2.112875461578369, 2.308157444000244, 2.503439426422119, 2.698721408843994, 2.894003391265869, 3.089285373687744, 3.284567356109619, 3.479849338531494, 3.675131320953369, 3.870413303375244, 4.065694808959961, 4.260976791381836, 4.456258773803711, 4.651540756225586, 4.846822738647461, 5.042104721069336, 5.237386703491211, 5.432668685913086, 5.627950668334961, 5.823232650756836, 6.018514633178711]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 11.0, 8.0, 11.0, 19.0, 7.0, 11.0, 18.0, 16.0, 19.0, 27.0, 34.0, 28.0, 27.0, 45.0, 34.0, 34.0, 42.0, 31.0, 48.0, 37.0, 37.0, 41.0, 29.0, 44.0, 42.0, 30.0, 28.0, 29.0, 21.0, 19.0, 20.0, 30.0, 23.0, 14.0, 11.0, 14.0, 6.0, 9.0, 4.0, 9.0, 7.0, 6.0, 3.0, 4.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.31535530090332, -6.115519046783447, -5.915683269500732, -5.715847015380859, -5.5160112380981445, -5.3161749839782715, -5.116338729858398, -4.916502952575684, -4.716667175292969, -4.516830921173096, -4.316995143890381, -4.117158889770508, -3.917323112487793, -3.71748685836792, -3.517650842666626, -3.317814826965332, -3.117978572845459, -2.918142557144165, -2.718306541442871, -2.518470287322998, -2.318634510040283, -2.11879825592041, -1.9189622402191162, -1.7191262245178223, -1.5192902088165283, -1.3194541931152344, -1.1196181774139404, -0.9197820425033569, -0.719946026802063, -0.520110011100769, -0.32027387619018555, -0.1204378604888916, 0.07939815521240234, 0.2792342007160187, 0.479070246219635, 0.6789063215255737, 0.8787423372268677, 1.0785783529281616, 1.2784144878387451, 1.478250503540039, 1.678086519241333, 1.877922534942627, 2.077758550643921, 2.277594566345215, 2.477430820465088, 2.6772665977478027, 2.877102851867676, 3.0769388675689697, 3.2767748832702637, 3.4766108989715576, 3.6764469146728516, 3.8762831687927246, 4.0761189460754395, 4.2759552001953125, 4.475790977478027, 4.6756272315979, 4.875463485717773, 5.0752997398376465, 5.275135517120361, 5.474971771240234, 5.674807548522949, 5.874643802642822, 6.074480056762695, 6.27431583404541, 6.474151611328125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 22.0, 31.0, 50.0, 81.0, 146.0, 262.0, 415.0, 730.0, 1156.0, 2016.0, 3335.0, 5570.0, 9185.0, 15603.0, 25678.0, 42449.0, 69456.0, 111847.0, 174882.0, 263494.0, 377036.0, 491772.0, 562186.0, 551537.0, 468678.0, 350936.0, 244050.0, 160267.0, 101067.0, 63202.0, 38463.0, 23391.0, 14072.0, 8584.0, 4981.0, 3046.0, 1837.0, 1087.0, 615.0, 422.0, 245.0, 163.0, 93.0, 55.0, 33.0, 24.0, 16.0, 4.0, 1.0, 8.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.955322265625, -4.78955078125, -4.623779296875, -4.4580078125, -4.292236328125, -4.12646484375, -3.960693359375, -3.794921875, -3.629150390625, -3.46337890625, -3.297607421875, -3.1318359375, -2.966064453125, -2.80029296875, -2.634521484375, -2.46875, -2.302978515625, -2.13720703125, -1.971435546875, -1.8056640625, -1.639892578125, -1.47412109375, -1.308349609375, -1.142578125, -0.976806640625, -0.81103515625, -0.645263671875, -0.4794921875, -0.313720703125, -0.14794921875, 0.017822265625, 0.18359375, 0.349365234375, 0.51513671875, 0.680908203125, 0.8466796875, 1.012451171875, 1.17822265625, 1.343994140625, 1.509765625, 1.675537109375, 1.84130859375, 2.007080078125, 2.1728515625, 2.338623046875, 2.50439453125, 2.670166015625, 2.8359375, 3.001708984375, 3.16748046875, 3.333251953125, 3.4990234375, 3.664794921875, 3.83056640625, 3.996337890625, 4.162109375, 4.327880859375, 4.49365234375, 4.659423828125, 4.8251953125, 4.990966796875, 5.15673828125, 5.322509765625, 5.48828125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 7.0, 11.0, 7.0, 9.0, 7.0, 14.0, 8.0, 17.0, 21.0, 19.0, 34.0, 24.0, 25.0, 34.0, 33.0, 33.0, 32.0, 43.0, 35.0, 35.0, 48.0, 47.0, 44.0, 33.0, 54.0, 42.0, 30.0, 26.0, 27.0, 22.0, 20.0, 18.0, 24.0, 12.0, 19.0, 17.0, 16.0, 5.0, 11.0, 6.0, 6.0, 13.0, 4.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.58203125, -4.44244384765625, -4.3028564453125, -4.16326904296875, -4.023681640625, -3.88409423828125, -3.7445068359375, -3.60491943359375, -3.46533203125, -3.32574462890625, -3.1861572265625, -3.04656982421875, -2.906982421875, -2.76739501953125, -2.6278076171875, -2.48822021484375, -2.3486328125, -2.20904541015625, -2.0694580078125, -1.92987060546875, -1.790283203125, -1.65069580078125, -1.5111083984375, -1.37152099609375, -1.23193359375, -1.09234619140625, -0.9527587890625, -0.81317138671875, -0.673583984375, -0.53399658203125, -0.3944091796875, -0.25482177734375, -0.115234375, 0.02435302734375, 0.1639404296875, 0.30352783203125, 0.443115234375, 0.58270263671875, 0.7222900390625, 0.86187744140625, 1.00146484375, 1.14105224609375, 1.2806396484375, 1.42022705078125, 1.559814453125, 1.69940185546875, 1.8389892578125, 1.97857666015625, 2.1181640625, 2.25775146484375, 2.3973388671875, 2.53692626953125, 2.676513671875, 2.81610107421875, 2.9556884765625, 3.09527587890625, 3.23486328125, 3.37445068359375, 3.5140380859375, 3.65362548828125, 3.793212890625, 3.93280029296875, 4.0723876953125, 4.21197509765625, 4.3515625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 9.0, 10.0, 9.0, 17.0, 23.0, 49.0, 69.0, 95.0, 194.0, 277.0, 476.0, 795.0, 1261.0, 2038.0, 3443.0, 5729.0, 9173.0, 15008.0, 24613.0, 39365.0, 62148.0, 96176.0, 144659.0, 208137.0, 285420.0, 368808.0, 438058.0, 477240.0, 467962.0, 416973.0, 339991.0, 256634.0, 182807.0, 125141.0, 82441.0, 52821.0, 33218.0, 20500.0, 12721.0, 7697.0, 4771.0, 2749.0, 1756.0, 1041.0, 658.0, 422.0, 275.0, 144.0, 110.0, 57.0, 44.0, 27.0, 9.0, 14.0, 4.0, 7.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-4.3359375, -4.19525146484375, -4.0545654296875, -3.91387939453125, -3.773193359375, -3.63250732421875, -3.4918212890625, -3.35113525390625, -3.21044921875, -3.06976318359375, -2.9290771484375, -2.78839111328125, -2.647705078125, -2.50701904296875, -2.3663330078125, -2.22564697265625, -2.0849609375, -1.94427490234375, -1.8035888671875, -1.66290283203125, -1.522216796875, -1.38153076171875, -1.2408447265625, -1.10015869140625, -0.95947265625, -0.81878662109375, -0.6781005859375, -0.53741455078125, -0.396728515625, -0.25604248046875, -0.1153564453125, 0.02532958984375, 0.166015625, 0.30670166015625, 0.4473876953125, 0.58807373046875, 0.728759765625, 0.86944580078125, 1.0101318359375, 1.15081787109375, 1.29150390625, 1.43218994140625, 1.5728759765625, 1.71356201171875, 1.854248046875, 1.99493408203125, 2.1356201171875, 2.27630615234375, 2.4169921875, 2.55767822265625, 2.6983642578125, 2.83905029296875, 2.979736328125, 3.12042236328125, 3.2611083984375, 3.40179443359375, 3.54248046875, 3.68316650390625, 3.8238525390625, 3.96453857421875, 4.105224609375, 4.24591064453125, 4.3865966796875, 4.52728271484375, 4.66796875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 10.0, 11.0, 15.0, 20.0, 24.0, 32.0, 44.0, 60.0, 65.0, 78.0, 104.0, 102.0, 134.0, 148.0, 148.0, 168.0, 179.0, 160.0, 179.0, 215.0, 234.0, 208.0, 217.0, 192.0, 169.0, 155.0, 141.0, 155.0, 125.0, 102.0, 88.0, 70.0, 66.0, 49.0, 44.0, 30.0, 35.0, 20.0, 18.0, 16.0, 12.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.392578125, -2.3249969482421875, -2.257415771484375, -2.1898345947265625, -2.12225341796875, -2.0546722412109375, -1.987091064453125, -1.9195098876953125, -1.8519287109375, -1.7843475341796875, -1.716766357421875, -1.6491851806640625, -1.58160400390625, -1.5140228271484375, -1.446441650390625, -1.3788604736328125, -1.311279296875, -1.2436981201171875, -1.176116943359375, -1.1085357666015625, -1.04095458984375, -0.9733734130859375, -0.905792236328125, -0.8382110595703125, -0.7706298828125, -0.7030487060546875, -0.635467529296875, -0.5678863525390625, -0.50030517578125, -0.4327239990234375, -0.365142822265625, -0.2975616455078125, -0.22998046875, -0.1623992919921875, -0.094818115234375, -0.0272369384765625, 0.04034423828125, 0.1079254150390625, 0.175506591796875, 0.2430877685546875, 0.3106689453125, 0.3782501220703125, 0.445831298828125, 0.5134124755859375, 0.58099365234375, 0.6485748291015625, 0.716156005859375, 0.7837371826171875, 0.851318359375, 0.9188995361328125, 0.986480712890625, 1.0540618896484375, 1.12164306640625, 1.1892242431640625, 1.256805419921875, 1.3243865966796875, 1.3919677734375, 1.4595489501953125, 1.527130126953125, 1.5947113037109375, 1.66229248046875, 1.7298736572265625, 1.797454833984375, 1.8650360107421875, 1.9326171875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 9.0, 16.0, 15.0, 21.0, 21.0, 24.0, 27.0, 34.0, 25.0, 32.0, 40.0, 38.0, 54.0, 53.0, 41.0, 58.0, 49.0, 43.0, 34.0, 43.0, 29.0, 37.0, 31.0, 37.0, 27.0, 28.0, 16.0, 16.0, 15.0, 18.0, 11.0, 9.0, 8.0, 11.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.5608696937561035, -6.3761887550354, -6.191507339477539, -6.006826400756836, -5.822145462036133, -5.63746452331543, -5.452783584594727, -5.268102169036865, -5.083421230316162, -4.898740291595459, -4.714058876037598, -4.5293779373168945, -4.344696998596191, -4.160016059875488, -3.975334882736206, -3.790653705596924, -3.6059727668762207, -3.4212918281555176, -3.2366106510162354, -3.051929473876953, -2.86724853515625, -2.682567596435547, -2.4978864192962646, -2.3132052421569824, -2.1285243034362793, -1.9438432455062866, -1.759162187576294, -1.5744811296463013, -1.3898000717163086, -1.205119013786316, -1.0204379558563232, -0.8357568979263306, -0.6510753631591797, -0.466394305229187, -0.28171324729919434, -0.09703218936920166, 0.08764886856079102, 0.2723299264907837, 0.45701098442077637, 0.641692042350769, 0.8263731002807617, 1.0110541582107544, 1.195735216140747, 1.3804162740707397, 1.5650973320007324, 1.749778389930725, 1.9344594478607178, 2.119140625, 2.303821563720703, 2.4885025024414062, 2.6731836795806885, 2.8578648567199707, 3.042545795440674, 3.227226734161377, 3.411907911300659, 3.5965890884399414, 3.7812700271606445, 3.9659509658813477, 4.150631904602051, 4.335313320159912, 4.519994258880615, 4.704675197601318, 4.88935661315918, 5.074037551879883, 5.258718490600586]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 5.0, 8.0, 12.0, 12.0, 14.0, 15.0, 23.0, 29.0, 21.0, 25.0, 27.0, 30.0, 33.0, 39.0, 36.0, 41.0, 41.0, 36.0, 57.0, 58.0, 30.0, 37.0, 34.0, 38.0, 35.0, 37.0, 27.0, 27.0, 24.0, 22.0, 19.0, 14.0, 23.0, 14.0, 14.0, 12.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.529987335205078, -5.351332664489746, -5.172677993774414, -4.994023323059082, -4.81536865234375, -4.636713981628418, -4.458059310913086, -4.279405117034912, -4.10075044631958, -3.922095775604248, -3.743441104888916, -3.564786434173584, -3.386132001876831, -3.207477331161499, -3.028822660446167, -2.850168228149414, -2.671513319015503, -2.492858648300171, -2.314203977584839, -2.135549545288086, -1.956894874572754, -1.7782402038574219, -1.5995855331420898, -1.4209309816360474, -1.2422763109207153, -1.0636216402053833, -0.8849670886993408, -0.7063124179840088, -0.5276578068733215, -0.3490031957626343, -0.17034852504730225, 0.008306026458740234, 0.18696069717407227, 0.3656153082847595, 0.5442699193954468, 0.7229245901107788, 0.9015792012214661, 1.0802338123321533, 1.2588884830474854, 1.4375430345535278, 1.6161977052688599, 1.794852375984192, 1.9735069274902344, 2.1521615982055664, 2.3308162689208984, 2.5094709396362305, 2.6881256103515625, 2.8667800426483154, 3.0454347133636475, 3.2240893840789795, 3.4027440547943115, 3.5813984870910645, 3.7600531578063965, 3.9387078285217285, 4.1173624992370605, 4.296017169952393, 4.474671840667725, 4.653326511383057, 4.831981182098389, 5.010635852813721, 5.189290523529053, 5.367944717407227, 5.546599388122559, 5.725254058837891, 5.903908729553223]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 7.0, 13.0, 17.0, 18.0, 28.0, 35.0, 51.0, 70.0, 96.0, 144.0, 175.0, 245.0, 371.0, 598.0, 904.0, 1372.0, 2571.0, 4798.0, 10501.0, 24477.0, 64006.0, 173748.0, 349918.0, 252346.0, 96102.0, 36260.0, 14681.0, 6650.0, 3294.0, 1787.0, 1116.0, 696.0, 430.0, 303.0, 212.0, 135.0, 121.0, 67.0, 51.0, 41.0, 23.0, 19.0, 26.0, 11.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.05859375, -4.9039306640625, -4.749267578125, -4.5946044921875, -4.43994140625, -4.2852783203125, -4.130615234375, -3.9759521484375, -3.8212890625, -3.6666259765625, -3.511962890625, -3.3572998046875, -3.20263671875, -3.0479736328125, -2.893310546875, -2.7386474609375, -2.583984375, -2.4293212890625, -2.274658203125, -2.1199951171875, -1.96533203125, -1.8106689453125, -1.656005859375, -1.5013427734375, -1.3466796875, -1.1920166015625, -1.037353515625, -0.8826904296875, -0.72802734375, -0.5733642578125, -0.418701171875, -0.2640380859375, -0.109375, 0.0452880859375, 0.199951171875, 0.3546142578125, 0.50927734375, 0.6639404296875, 0.818603515625, 0.9732666015625, 1.1279296875, 1.2825927734375, 1.437255859375, 1.5919189453125, 1.74658203125, 1.9012451171875, 2.055908203125, 2.2105712890625, 2.365234375, 2.5198974609375, 2.674560546875, 2.8292236328125, 2.98388671875, 3.1385498046875, 3.293212890625, 3.4478759765625, 3.6025390625, 3.7572021484375, 3.911865234375, 4.0665283203125, 4.22119140625, 4.3758544921875, 4.530517578125, 4.6851806640625, 4.83984375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 7.0, 9.0, 15.0, 11.0, 21.0, 19.0, 13.0, 19.0, 20.0, 22.0, 29.0, 28.0, 23.0, 32.0, 40.0, 32.0, 33.0, 46.0, 33.0, 40.0, 33.0, 33.0, 44.0, 42.0, 32.0, 27.0, 40.0, 35.0, 34.0, 23.0, 26.0, 17.0, 17.0, 20.0, 13.0, 11.0, 10.0, 10.0, 11.0, 11.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.27716064453125, -5.1051025390625, -4.93304443359375, -4.760986328125, -4.58892822265625, -4.4168701171875, -4.24481201171875, -4.07275390625, -3.90069580078125, -3.7286376953125, -3.55657958984375, -3.384521484375, -3.21246337890625, -3.0404052734375, -2.86834716796875, -2.6962890625, -2.52423095703125, -2.3521728515625, -2.18011474609375, -2.008056640625, -1.83599853515625, -1.6639404296875, -1.49188232421875, -1.31982421875, -1.14776611328125, -0.9757080078125, -0.80364990234375, -0.631591796875, -0.45953369140625, -0.2874755859375, -0.11541748046875, 0.056640625, 0.22869873046875, 0.4007568359375, 0.57281494140625, 0.744873046875, 0.91693115234375, 1.0889892578125, 1.26104736328125, 1.43310546875, 1.60516357421875, 1.7772216796875, 1.94927978515625, 2.121337890625, 2.29339599609375, 2.4654541015625, 2.63751220703125, 2.8095703125, 2.98162841796875, 3.1536865234375, 3.32574462890625, 3.497802734375, 3.66986083984375, 3.8419189453125, 4.01397705078125, 4.18603515625, 4.35809326171875, 4.5301513671875, 4.70220947265625, 4.874267578125, 5.04632568359375, 5.2183837890625, 5.39044189453125, 5.5625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 10.0, 8.0, 18.0, 16.0, 30.0, 48.0, 73.0, 78.0, 117.0, 179.0, 259.0, 449.0, 668.0, 1156.0, 2064.0, 3815.0, 7884.0, 17075.0, 41079.0, 106241.0, 263490.0, 336590.0, 158982.0, 61215.0, 24660.0, 10819.0, 5048.0, 2643.0, 1457.0, 830.0, 513.0, 350.0, 237.0, 159.0, 87.0, 64.0, 50.0, 30.0, 20.0, 11.0, 10.0, 8.0, 7.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.0574951171875, -3.927490234375, -3.7974853515625, -3.66748046875, -3.5374755859375, -3.407470703125, -3.2774658203125, -3.1474609375, -3.0174560546875, -2.887451171875, -2.7574462890625, -2.62744140625, -2.4974365234375, -2.367431640625, -2.2374267578125, -2.107421875, -1.9774169921875, -1.847412109375, -1.7174072265625, -1.58740234375, -1.4573974609375, -1.327392578125, -1.1973876953125, -1.0673828125, -0.9373779296875, -0.807373046875, -0.6773681640625, -0.54736328125, -0.4173583984375, -0.287353515625, -0.1573486328125, -0.02734375, 0.1026611328125, 0.232666015625, 0.3626708984375, 0.49267578125, 0.6226806640625, 0.752685546875, 0.8826904296875, 1.0126953125, 1.1427001953125, 1.272705078125, 1.4027099609375, 1.53271484375, 1.6627197265625, 1.792724609375, 1.9227294921875, 2.052734375, 2.1827392578125, 2.312744140625, 2.4427490234375, 2.57275390625, 2.7027587890625, 2.832763671875, 2.9627685546875, 3.0927734375, 3.2227783203125, 3.352783203125, 3.4827880859375, 3.61279296875, 3.7427978515625, 3.872802734375, 4.0028076171875, 4.1328125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 4.0, 5.0, 4.0, 12.0, 10.0, 5.0, 19.0, 16.0, 16.0, 20.0, 29.0, 19.0, 34.0, 39.0, 38.0, 34.0, 50.0, 45.0, 42.0, 38.0, 44.0, 58.0, 48.0, 36.0, 39.0, 41.0, 25.0, 36.0, 24.0, 22.0, 17.0, 21.0, 21.0, 15.0, 14.0, 19.0, 8.0, 13.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.9923095703125, -3.859619140625, -3.7269287109375, -3.59423828125, -3.4615478515625, -3.328857421875, -3.1961669921875, -3.0634765625, -2.9307861328125, -2.798095703125, -2.6654052734375, -2.53271484375, -2.4000244140625, -2.267333984375, -2.1346435546875, -2.001953125, -1.8692626953125, -1.736572265625, -1.6038818359375, -1.47119140625, -1.3385009765625, -1.205810546875, -1.0731201171875, -0.9404296875, -0.8077392578125, -0.675048828125, -0.5423583984375, -0.40966796875, -0.2769775390625, -0.144287109375, -0.0115966796875, 0.12109375, 0.2537841796875, 0.386474609375, 0.5191650390625, 0.65185546875, 0.7845458984375, 0.917236328125, 1.0499267578125, 1.1826171875, 1.3153076171875, 1.447998046875, 1.5806884765625, 1.71337890625, 1.8460693359375, 1.978759765625, 2.1114501953125, 2.244140625, 2.3768310546875, 2.509521484375, 2.6422119140625, 2.77490234375, 2.9075927734375, 3.040283203125, 3.1729736328125, 3.3056640625, 3.4383544921875, 3.571044921875, 3.7037353515625, 3.83642578125, 3.9691162109375, 4.101806640625, 4.2344970703125, 4.3671875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 10.0, 9.0, 15.0, 16.0, 30.0, 49.0, 48.0, 73.0, 96.0, 142.0, 188.0, 266.0, 339.0, 486.0, 669.0, 996.0, 1451.0, 2169.0, 3456.0, 5673.0, 10423.0, 21694.0, 53081.0, 159501.0, 400863.0, 245899.0, 78763.0, 29388.0, 13384.0, 7099.0, 4103.0, 2568.0, 1672.0, 1122.0, 789.0, 562.0, 399.0, 264.0, 226.0, 149.0, 129.0, 88.0, 53.0, 45.0, 31.0, 28.0, 20.0, 10.0, 9.0, 6.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.0888671875, -1.0555572509765625, -1.022247314453125, -0.9889373779296875, -0.95562744140625, -0.9223175048828125, -0.889007568359375, -0.8556976318359375, -0.8223876953125, -0.7890777587890625, -0.755767822265625, -0.7224578857421875, -0.68914794921875, -0.6558380126953125, -0.622528076171875, -0.5892181396484375, -0.555908203125, -0.5225982666015625, -0.489288330078125, -0.4559783935546875, -0.42266845703125, -0.3893585205078125, -0.356048583984375, -0.3227386474609375, -0.2894287109375, -0.2561187744140625, -0.222808837890625, -0.1894989013671875, -0.15618896484375, -0.1228790283203125, -0.089569091796875, -0.0562591552734375, -0.02294921875, 0.0103607177734375, 0.043670654296875, 0.0769805908203125, 0.11029052734375, 0.1436004638671875, 0.176910400390625, 0.2102203369140625, 0.2435302734375, 0.2768402099609375, 0.310150146484375, 0.3434600830078125, 0.37677001953125, 0.4100799560546875, 0.443389892578125, 0.4766998291015625, 0.510009765625, 0.5433197021484375, 0.576629638671875, 0.6099395751953125, 0.64324951171875, 0.6765594482421875, 0.709869384765625, 0.7431793212890625, 0.7764892578125, 0.8097991943359375, 0.843109130859375, 0.8764190673828125, 0.90972900390625, 0.9430389404296875, 0.976348876953125, 1.0096588134765625, 1.04296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 10.0, 8.0, 9.0, 10.0, 10.0, 23.0, 33.0, 44.0, 48.0, 69.0, 91.0, 86.0, 99.0, 105.0, 88.0, 74.0, 54.0, 40.0, 22.0, 22.0, 18.0, 13.0, 6.0, 3.0, 6.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012350082397460938, -0.00011969637125730515, -0.00011589191854000092, -0.00011208746582269669, -0.00010828301310539246, -0.00010447856038808823, -0.000100674107670784, -9.686965495347977e-05, -9.306520223617554e-05, -8.926074951887131e-05, -8.545629680156708e-05, -8.165184408426285e-05, -7.784739136695862e-05, -7.404293864965439e-05, -7.023848593235016e-05, -6.643403321504593e-05, -6.26295804977417e-05, -5.882512778043747e-05, -5.502067506313324e-05, -5.121622234582901e-05, -4.741176962852478e-05, -4.360731691122055e-05, -3.980286419391632e-05, -3.599841147661209e-05, -3.219395875930786e-05, -2.838950604200363e-05, -2.4585053324699402e-05, -2.0780600607395172e-05, -1.6976147890090942e-05, -1.3171695172786713e-05, -9.367242455482483e-06, -5.562789738178253e-06, -1.7583370208740234e-06, 2.0461156964302063e-06, 5.850568413734436e-06, 9.655021131038666e-06, 1.3459473848342896e-05, 1.7263926565647125e-05, 2.1068379282951355e-05, 2.4872832000255585e-05, 2.8677284717559814e-05, 3.2481737434864044e-05, 3.6286190152168274e-05, 4.0090642869472504e-05, 4.3895095586776733e-05, 4.769954830408096e-05, 5.150400102138519e-05, 5.530845373868942e-05, 5.911290645599365e-05, 6.291735917329788e-05, 6.672181189060211e-05, 7.052626460790634e-05, 7.433071732521057e-05, 7.81351700425148e-05, 8.193962275981903e-05, 8.574407547712326e-05, 8.954852819442749e-05, 9.335298091173172e-05, 9.715743362903595e-05, 0.00010096188634634018, 0.00010476633906364441, 0.00010857079178094864, 0.00011237524449825287, 0.0001161796972155571, 0.00011998414993286133]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 7.0, 11.0, 19.0, 22.0, 27.0, 43.0, 38.0, 61.0, 91.0, 134.0, 160.0, 203.0, 305.0, 406.0, 525.0, 756.0, 1008.0, 1632.0, 2283.0, 3567.0, 5841.0, 9607.0, 17331.0, 32988.0, 64740.0, 128320.0, 229697.0, 245669.0, 144317.0, 73078.0, 37175.0, 19305.0, 10723.0, 6382.0, 3849.0, 2440.0, 1729.0, 1160.0, 752.0, 552.0, 440.0, 301.0, 202.0, 180.0, 134.0, 93.0, 76.0, 52.0, 41.0, 27.0, 26.0, 6.0, 7.0, 13.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.0458984375, -1.011138916015625, -0.97637939453125, -0.941619873046875, -0.9068603515625, -0.872100830078125, -0.83734130859375, -0.802581787109375, -0.767822265625, -0.733062744140625, -0.69830322265625, -0.663543701171875, -0.6287841796875, -0.594024658203125, -0.55926513671875, -0.524505615234375, -0.48974609375, -0.454986572265625, -0.42022705078125, -0.385467529296875, -0.3507080078125, -0.315948486328125, -0.28118896484375, -0.246429443359375, -0.211669921875, -0.176910400390625, -0.14215087890625, -0.107391357421875, -0.0726318359375, -0.037872314453125, -0.00311279296875, 0.031646728515625, 0.06640625, 0.101165771484375, 0.13592529296875, 0.170684814453125, 0.2054443359375, 0.240203857421875, 0.27496337890625, 0.309722900390625, 0.344482421875, 0.379241943359375, 0.41400146484375, 0.448760986328125, 0.4835205078125, 0.518280029296875, 0.55303955078125, 0.587799072265625, 0.62255859375, 0.657318115234375, 0.69207763671875, 0.726837158203125, 0.7615966796875, 0.796356201171875, 0.83111572265625, 0.865875244140625, 0.900634765625, 0.935394287109375, 0.97015380859375, 1.004913330078125, 1.0396728515625, 1.074432373046875, 1.10919189453125, 1.143951416015625, 1.1787109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 8.0, 0.0, 8.0, 5.0, 10.0, 12.0, 12.0, 25.0, 28.0, 35.0, 48.0, 63.0, 81.0, 79.0, 102.0, 108.0, 84.0, 70.0, 45.0, 44.0, 40.0, 20.0, 22.0, 13.0, 10.0, 6.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.50537109375, -0.4903450012207031, -0.47531890869140625, -0.4602928161621094, -0.4452667236328125, -0.4302406311035156, -0.41521453857421875, -0.4001884460449219, -0.385162353515625, -0.3701362609863281, -0.35511016845703125, -0.3400840759277344, -0.3250579833984375, -0.3100318908691406, -0.29500579833984375, -0.2799797058105469, -0.26495361328125, -0.24992752075195312, -0.23490142822265625, -0.21987533569335938, -0.2048492431640625, -0.18982315063476562, -0.17479705810546875, -0.15977096557617188, -0.144744873046875, -0.12971878051757812, -0.11469268798828125, -0.09966659545898438, -0.0846405029296875, -0.06961441040039062, -0.05458831787109375, -0.039562225341796875, -0.0245361328125, -0.009510040283203125, 0.00551605224609375, 0.020542144775390625, 0.0355682373046875, 0.050594329833984375, 0.06562042236328125, 0.08064651489257812, 0.095672607421875, 0.11069869995117188, 0.12572479248046875, 0.14075088500976562, 0.1557769775390625, 0.17080307006835938, 0.18582916259765625, 0.20085525512695312, 0.21588134765625, 0.23090744018554688, 0.24593353271484375, 0.2609596252441406, 0.2759857177734375, 0.2910118103027344, 0.30603790283203125, 0.3210639953613281, 0.336090087890625, 0.3511161804199219, 0.36614227294921875, 0.3811683654785156, 0.3961944580078125, 0.4112205505371094, 0.42624664306640625, 0.4412727355957031, 0.456298828125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 8.0, 15.0, 17.0, 22.0, 19.0, 21.0, 33.0, 28.0, 33.0, 23.0, 43.0, 48.0, 36.0, 55.0, 41.0, 53.0, 53.0, 40.0, 44.0, 28.0, 32.0, 30.0, 37.0, 30.0, 36.0, 29.0, 25.0, 20.0, 13.0, 13.0, 13.0, 12.0, 9.0, 7.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.5756964683532715, -6.394256591796875, -6.212817192077637, -6.03137731552124, -5.849937438964844, -5.6684980392456055, -5.487058162689209, -5.3056182861328125, -5.124178886413574, -4.942739009857178, -4.7612996101379395, -4.579859733581543, -4.398420333862305, -4.216980457305908, -4.035540580749512, -3.8541009426116943, -3.672661304473877, -3.4912216663360596, -3.309782028198242, -3.1283421516418457, -2.9469025135040283, -2.765462875366211, -2.5840229988098145, -2.402583360671997, -2.2211437225341797, -2.0397040843963623, -1.8582643270492554, -1.6768245697021484, -1.495384931564331, -1.3139452934265137, -1.1325055360794067, -0.9510657787322998, -0.7696256637573242, -0.5881859660148621, -0.4067462682723999, -0.22530657052993774, -0.043866872787475586, 0.13757282495498657, 0.31901252269744873, 0.5004522800445557, 0.681891918182373, 0.8633316159248352, 1.0447713136672974, 1.2262110710144043, 1.4076507091522217, 1.589090347290039, 1.770530104637146, 1.951969861984253, 2.1334095001220703, 2.3148491382598877, 2.496288776397705, 2.6777286529541016, 2.859168291091919, 3.0406079292297363, 3.222047805786133, 3.40348744392395, 3.5849270820617676, 3.766366720199585, 3.9478063583374023, 4.129246234893799, 4.310686111450195, 4.492125511169434, 4.67356538772583, 4.855005264282227, 5.036444664001465]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 4.0, 5.0, 5.0, 8.0, 7.0, 15.0, 11.0, 16.0, 23.0, 24.0, 22.0, 22.0, 35.0, 24.0, 31.0, 37.0, 35.0, 39.0, 40.0, 39.0, 43.0, 59.0, 46.0, 35.0, 37.0, 29.0, 44.0, 36.0, 32.0, 22.0, 27.0, 23.0, 23.0, 12.0, 21.0, 22.0, 15.0, 9.0, 9.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.604013919830322, -5.424798011779785, -5.24558162689209, -5.066365718841553, -4.887149333953857, -4.70793342590332, -4.528717041015625, -4.349501132965088, -4.170285224914551, -3.9910690784454346, -3.8118529319763184, -3.6326370239257812, -3.453420639038086, -3.274204730987549, -3.0949885845184326, -2.9157724380493164, -2.736556053161621, -2.557339906692505, -2.3781237602233887, -2.1989078521728516, -2.0196914672851562, -1.8404754400253296, -1.661259412765503, -1.4820432662963867, -1.3028271198272705, -1.1236109733581543, -0.9443948864936829, -0.7651787996292114, -0.5859626531600952, -0.406746506690979, -0.22753047943115234, -0.04831433296203613, 0.13090229034423828, 0.3101184070110321, 0.4893345236778259, 0.6685506105422974, 0.8477667570114136, 1.0269829034805298, 1.2061989307403564, 1.3854150772094727, 1.5646312236785889, 1.743847370147705, 1.9230635166168213, 2.1022796630859375, 2.2814955711364746, 2.46071195602417, 2.639927864074707, 2.8191440105438232, 2.9983601570129395, 3.1775763034820557, 3.356792449951172, 3.536008358001709, 3.7152247428894043, 3.8944406509399414, 4.073657035827637, 4.252872943878174, 4.432088851928711, 4.611304759979248, 4.790521144866943, 4.9697370529174805, 5.148953437805176, 5.328169345855713, 5.50738525390625, 5.686601638793945, 5.865818023681641]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 3.0, 14.0, 17.0, 24.0, 33.0, 37.0, 86.0, 132.0, 169.0, 262.0, 477.0, 788.0, 1236.0, 1972.0, 3265.0, 5606.0, 9238.0, 15469.0, 25577.0, 41001.0, 62779.0, 90609.0, 119055.0, 137678.0, 139233.0, 121674.0, 94394.0, 65618.0, 43505.0, 27366.0, 16489.0, 9908.0, 5971.0, 3452.0, 2047.0, 1288.0, 803.0, 450.0, 312.0, 192.0, 118.0, 78.0, 48.0, 30.0, 17.0, 11.0, 10.0, 10.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94140625, -5.7501220703125, -5.558837890625, -5.3675537109375, -5.17626953125, -4.9849853515625, -4.793701171875, -4.6024169921875, -4.4111328125, -4.2198486328125, -4.028564453125, -3.8372802734375, -3.64599609375, -3.4547119140625, -3.263427734375, -3.0721435546875, -2.880859375, -2.6895751953125, -2.498291015625, -2.3070068359375, -2.11572265625, -1.9244384765625, -1.733154296875, -1.5418701171875, -1.3505859375, -1.1593017578125, -0.968017578125, -0.7767333984375, -0.58544921875, -0.3941650390625, -0.202880859375, -0.0115966796875, 0.1796875, 0.3709716796875, 0.562255859375, 0.7535400390625, 0.94482421875, 1.1361083984375, 1.327392578125, 1.5186767578125, 1.7099609375, 1.9012451171875, 2.092529296875, 2.2838134765625, 2.47509765625, 2.6663818359375, 2.857666015625, 3.0489501953125, 3.240234375, 3.4315185546875, 3.622802734375, 3.8140869140625, 4.00537109375, 4.1966552734375, 4.387939453125, 4.5792236328125, 4.7705078125, 4.9617919921875, 5.153076171875, 5.3443603515625, 5.53564453125, 5.7269287109375, 5.918212890625, 6.1094970703125, 6.30078125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 7.0, 4.0, 11.0, 11.0, 17.0, 16.0, 16.0, 18.0, 17.0, 25.0, 32.0, 33.0, 32.0, 24.0, 32.0, 45.0, 31.0, 33.0, 48.0, 52.0, 45.0, 40.0, 39.0, 35.0, 43.0, 34.0, 41.0, 21.0, 28.0, 25.0, 16.0, 13.0, 24.0, 17.0, 23.0, 8.0, 8.0, 11.0, 11.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.078125, -4.9033203125, -4.728515625, -4.5537109375, -4.37890625, -4.2041015625, -4.029296875, -3.8544921875, -3.6796875, -3.5048828125, -3.330078125, -3.1552734375, -2.98046875, -2.8056640625, -2.630859375, -2.4560546875, -2.28125, -2.1064453125, -1.931640625, -1.7568359375, -1.58203125, -1.4072265625, -1.232421875, -1.0576171875, -0.8828125, -0.7080078125, -0.533203125, -0.3583984375, -0.18359375, -0.0087890625, 0.166015625, 0.3408203125, 0.515625, 0.6904296875, 0.865234375, 1.0400390625, 1.21484375, 1.3896484375, 1.564453125, 1.7392578125, 1.9140625, 2.0888671875, 2.263671875, 2.4384765625, 2.61328125, 2.7880859375, 2.962890625, 3.1376953125, 3.3125, 3.4873046875, 3.662109375, 3.8369140625, 4.01171875, 4.1865234375, 4.361328125, 4.5361328125, 4.7109375, 4.8857421875, 5.060546875, 5.2353515625, 5.41015625, 5.5849609375, 5.759765625, 5.9345703125, 6.109375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 15.0, 26.0, 31.0, 55.0, 71.0, 108.0, 173.0, 218.0, 395.0, 601.0, 973.0, 1429.0, 2191.0, 3311.0, 5269.0, 7809.0, 12381.0, 18808.0, 27763.0, 40668.0, 57069.0, 76065.0, 96171.0, 111492.0, 116690.0, 111153.0, 96825.0, 77508.0, 58174.0, 41556.0, 28509.0, 19147.0, 12526.0, 8270.0, 5270.0, 3426.0, 2218.0, 1451.0, 989.0, 606.0, 392.0, 258.0, 164.0, 122.0, 52.0, 64.0, 36.0, 24.0, 10.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.81640625, -4.6683349609375, -4.520263671875, -4.3721923828125, -4.22412109375, -4.0760498046875, -3.927978515625, -3.7799072265625, -3.6318359375, -3.4837646484375, -3.335693359375, -3.1876220703125, -3.03955078125, -2.8914794921875, -2.743408203125, -2.5953369140625, -2.447265625, -2.2991943359375, -2.151123046875, -2.0030517578125, -1.85498046875, -1.7069091796875, -1.558837890625, -1.4107666015625, -1.2626953125, -1.1146240234375, -0.966552734375, -0.8184814453125, -0.67041015625, -0.5223388671875, -0.374267578125, -0.2261962890625, -0.078125, 0.0699462890625, 0.218017578125, 0.3660888671875, 0.51416015625, 0.6622314453125, 0.810302734375, 0.9583740234375, 1.1064453125, 1.2545166015625, 1.402587890625, 1.5506591796875, 1.69873046875, 1.8468017578125, 1.994873046875, 2.1429443359375, 2.291015625, 2.4390869140625, 2.587158203125, 2.7352294921875, 2.88330078125, 3.0313720703125, 3.179443359375, 3.3275146484375, 3.4755859375, 3.6236572265625, 3.771728515625, 3.9197998046875, 4.06787109375, 4.2159423828125, 4.364013671875, 4.5120849609375, 4.66015625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 10.0, 4.0, 5.0, 15.0, 22.0, 11.0, 10.0, 21.0, 19.0, 29.0, 35.0, 27.0, 29.0, 33.0, 35.0, 41.0, 51.0, 40.0, 34.0, 32.0, 34.0, 39.0, 33.0, 36.0, 30.0, 29.0, 35.0, 39.0, 24.0, 26.0, 31.0, 24.0, 21.0, 18.0, 10.0, 10.0, 9.0, 5.0, 4.0, 10.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 4.0], "bins": [-3.7734375, -3.66619873046875, -3.5589599609375, -3.45172119140625, -3.344482421875, -3.23724365234375, -3.1300048828125, -3.02276611328125, -2.91552734375, -2.80828857421875, -2.7010498046875, -2.59381103515625, -2.486572265625, -2.37933349609375, -2.2720947265625, -2.16485595703125, -2.0576171875, -1.95037841796875, -1.8431396484375, -1.73590087890625, -1.628662109375, -1.52142333984375, -1.4141845703125, -1.30694580078125, -1.19970703125, -1.09246826171875, -0.9852294921875, -0.87799072265625, -0.770751953125, -0.66351318359375, -0.5562744140625, -0.44903564453125, -0.341796875, -0.23455810546875, -0.1273193359375, -0.02008056640625, 0.087158203125, 0.19439697265625, 0.3016357421875, 0.40887451171875, 0.51611328125, 0.62335205078125, 0.7305908203125, 0.83782958984375, 0.945068359375, 1.05230712890625, 1.1595458984375, 1.26678466796875, 1.3740234375, 1.48126220703125, 1.5885009765625, 1.69573974609375, 1.802978515625, 1.91021728515625, 2.0174560546875, 2.12469482421875, 2.23193359375, 2.33917236328125, 2.4464111328125, 2.55364990234375, 2.660888671875, 2.76812744140625, 2.8753662109375, 2.98260498046875, 3.08984375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 9.0, 10.0, 18.0, 15.0, 25.0, 33.0, 57.0, 74.0, 114.0, 139.0, 204.0, 324.0, 483.0, 729.0, 1255.0, 1996.0, 3381.0, 5745.0, 10218.0, 18590.0, 33975.0, 61869.0, 106587.0, 162622.0, 195225.0, 172138.0, 117357.0, 68702.0, 38048.0, 20977.0, 11563.0, 6444.0, 3676.0, 2193.0, 1317.0, 789.0, 536.0, 340.0, 229.0, 170.0, 120.0, 86.0, 51.0, 43.0, 30.0, 13.0, 18.0, 12.0, 4.0, 6.0, 4.0, 1.0, 1.0, 4.0], "bins": [-4.62109375, -4.487518310546875, -4.35394287109375, -4.220367431640625, -4.0867919921875, -3.953216552734375, -3.81964111328125, -3.686065673828125, -3.552490234375, -3.418914794921875, -3.28533935546875, -3.151763916015625, -3.0181884765625, -2.884613037109375, -2.75103759765625, -2.617462158203125, -2.48388671875, -2.350311279296875, -2.21673583984375, -2.083160400390625, -1.9495849609375, -1.816009521484375, -1.68243408203125, -1.548858642578125, -1.415283203125, -1.281707763671875, -1.14813232421875, -1.014556884765625, -0.8809814453125, -0.747406005859375, -0.61383056640625, -0.480255126953125, -0.3466796875, -0.213104248046875, -0.07952880859375, 0.054046630859375, 0.1876220703125, 0.321197509765625, 0.45477294921875, 0.588348388671875, 0.721923828125, 0.855499267578125, 0.98907470703125, 1.122650146484375, 1.2562255859375, 1.389801025390625, 1.52337646484375, 1.656951904296875, 1.79052734375, 1.924102783203125, 2.05767822265625, 2.191253662109375, 2.3248291015625, 2.458404541015625, 2.59197998046875, 2.725555419921875, 2.859130859375, 2.992706298828125, 3.12628173828125, 3.259857177734375, 3.3934326171875, 3.527008056640625, 3.66058349609375, 3.794158935546875, 3.927734375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 1.0, 4.0, 7.0, 16.0, 13.0, 18.0, 30.0, 28.0, 45.0, 52.0, 55.0, 57.0, 65.0, 65.0, 56.0, 83.0, 66.0, 68.0, 58.0, 36.0, 41.0, 40.0, 24.0, 13.0, 17.0, 12.0, 7.0, 4.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004124641418457031, -0.00039836764335632324, -0.00038427114486694336, -0.0003701746463775635, -0.0003560781478881836, -0.0003419816493988037, -0.00032788515090942383, -0.00031378865242004395, -0.00029969215393066406, -0.0002855956554412842, -0.0002714991569519043, -0.0002574026584625244, -0.00024330615997314453, -0.00022920966148376465, -0.00021511316299438477, -0.00020101666450500488, -0.000186920166015625, -0.00017282366752624512, -0.00015872716903686523, -0.00014463067054748535, -0.00013053417205810547, -0.00011643767356872559, -0.0001023411750793457, -8.824467658996582e-05, -7.414817810058594e-05, -6.0051679611206055e-05, -4.595518112182617e-05, -3.185868263244629e-05, -1.7762184143066406e-05, -3.6656856536865234e-06, 1.043081283569336e-05, 2.4527311325073242e-05, 3.8623809814453125e-05, 5.272030830383301e-05, 6.681680679321289e-05, 8.091330528259277e-05, 9.500980377197266e-05, 0.00010910630226135254, 0.00012320280075073242, 0.0001372992992401123, 0.0001513957977294922, 0.00016549229621887207, 0.00017958879470825195, 0.00019368529319763184, 0.00020778179168701172, 0.0002218782901763916, 0.00023597478866577148, 0.00025007128715515137, 0.00026416778564453125, 0.00027826428413391113, 0.000292360782623291, 0.0003064572811126709, 0.0003205537796020508, 0.00033465027809143066, 0.00034874677658081055, 0.00036284327507019043, 0.0003769397735595703, 0.0003910362720489502, 0.0004051327705383301, 0.00041922926902770996, 0.00043332576751708984, 0.0004474222660064697, 0.0004615187644958496, 0.0004756152629852295, 0.0004897117614746094]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 13.0, 18.0, 18.0, 37.0, 42.0, 64.0, 91.0, 129.0, 181.0, 317.0, 500.0, 751.0, 1343.0, 2279.0, 3984.0, 7205.0, 13245.0, 25492.0, 48172.0, 87704.0, 142916.0, 190700.0, 190661.0, 142441.0, 87242.0, 47828.0, 25163.0, 13379.0, 7054.0, 3896.0, 2219.0, 1326.0, 730.0, 465.0, 297.0, 217.0, 120.0, 97.0, 44.0, 41.0, 32.0, 24.0, 26.0, 14.0, 5.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0, -3.86663818359375, -3.7332763671875, -3.59991455078125, -3.466552734375, -3.33319091796875, -3.1998291015625, -3.06646728515625, -2.93310546875, -2.79974365234375, -2.6663818359375, -2.53302001953125, -2.399658203125, -2.26629638671875, -2.1329345703125, -1.99957275390625, -1.8662109375, -1.73284912109375, -1.5994873046875, -1.46612548828125, -1.332763671875, -1.19940185546875, -1.0660400390625, -0.93267822265625, -0.79931640625, -0.66595458984375, -0.5325927734375, -0.39923095703125, -0.265869140625, -0.13250732421875, 0.0008544921875, 0.13421630859375, 0.267578125, 0.40093994140625, 0.5343017578125, 0.66766357421875, 0.801025390625, 0.93438720703125, 1.0677490234375, 1.20111083984375, 1.33447265625, 1.46783447265625, 1.6011962890625, 1.73455810546875, 1.867919921875, 2.00128173828125, 2.1346435546875, 2.26800537109375, 2.4013671875, 2.53472900390625, 2.6680908203125, 2.80145263671875, 2.934814453125, 3.06817626953125, 3.2015380859375, 3.33489990234375, 3.46826171875, 3.60162353515625, 3.7349853515625, 3.86834716796875, 4.001708984375, 4.13507080078125, 4.2684326171875, 4.40179443359375, 4.53515625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 8.0, 8.0, 14.0, 18.0, 24.0, 30.0, 45.0, 44.0, 58.0, 65.0, 64.0, 93.0, 71.0, 84.0, 76.0, 59.0, 42.0, 37.0, 36.0, 32.0, 19.0, 19.0, 17.0, 9.0, 9.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.6955718994140625, -1.641143798828125, -1.5867156982421875, -1.53228759765625, -1.4778594970703125, -1.423431396484375, -1.3690032958984375, -1.3145751953125, -1.2601470947265625, -1.205718994140625, -1.1512908935546875, -1.09686279296875, -1.0424346923828125, -0.988006591796875, -0.9335784912109375, -0.879150390625, -0.8247222900390625, -0.770294189453125, -0.7158660888671875, -0.66143798828125, -0.6070098876953125, -0.552581787109375, -0.4981536865234375, -0.4437255859375, -0.3892974853515625, -0.334869384765625, -0.2804412841796875, -0.22601318359375, -0.1715850830078125, -0.117156982421875, -0.0627288818359375, -0.00830078125, 0.0461273193359375, 0.100555419921875, 0.1549835205078125, 0.20941162109375, 0.2638397216796875, 0.318267822265625, 0.3726959228515625, 0.4271240234375, 0.4815521240234375, 0.535980224609375, 0.5904083251953125, 0.64483642578125, 0.6992645263671875, 0.753692626953125, 0.8081207275390625, 0.862548828125, 0.9169769287109375, 0.971405029296875, 1.0258331298828125, 1.08026123046875, 1.1346893310546875, 1.189117431640625, 1.2435455322265625, 1.2979736328125, 1.3524017333984375, 1.406829833984375, 1.4612579345703125, 1.51568603515625, 1.5701141357421875, 1.624542236328125, 1.6789703369140625, 1.7333984375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 4.0, 6.0, 10.0, 13.0, 15.0, 17.0, 23.0, 24.0, 21.0, 34.0, 24.0, 28.0, 40.0, 47.0, 51.0, 50.0, 66.0, 48.0, 54.0, 47.0, 45.0, 43.0, 48.0, 33.0, 31.0, 26.0, 32.0, 27.0, 18.0, 17.0, 11.0, 10.0, 10.0, 9.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-7.919622898101807, -7.723224639892578, -7.52682638168335, -7.330428123474121, -7.134030342102051, -6.937632083892822, -6.741233825683594, -6.544835567474365, -6.348437309265137, -6.152039051055908, -5.95564079284668, -5.759242534637451, -5.562844276428223, -5.366446495056152, -5.170048236846924, -4.973649978637695, -4.777251720428467, -4.580853462219238, -4.38445520401001, -4.188056945800781, -3.991658926010132, -3.7952606678009033, -3.598862648010254, -3.4024643898010254, -3.206066131591797, -3.0096678733825684, -2.81326961517334, -2.6168715953826904, -2.420473337173462, -2.2240750789642334, -2.027677059173584, -1.8312788009643555, -1.6348800659179688, -1.4384818077087402, -1.2420836687088013, -1.0456855297088623, -0.8492872714996338, -0.65288907289505, -0.4564908742904663, -0.26009273529052734, -0.06369447708129883, 0.1327037215232849, 0.32910192012786865, 0.5255001187324524, 0.7218983173370361, 0.9182965159416199, 1.1146947145462036, 1.3110928535461426, 1.507491111755371, 1.7038893699645996, 1.9002875089645386, 2.0966856479644775, 2.293083906173706, 2.4894821643829346, 2.685880184173584, 2.8822784423828125, 3.078676700592041, 3.2750749588012695, 3.471473217010498, 3.6678712368011475, 3.864269495010376, 4.060667514801025, 4.257065773010254, 4.453464031219482, 4.649862289428711]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 10.0, 8.0, 11.0, 11.0, 16.0, 20.0, 22.0, 19.0, 20.0, 20.0, 33.0, 19.0, 36.0, 32.0, 35.0, 34.0, 42.0, 39.0, 40.0, 35.0, 41.0, 32.0, 25.0, 28.0, 28.0, 40.0, 42.0, 18.0, 43.0, 20.0, 23.0, 18.0, 17.0, 16.0, 13.0, 17.0, 13.0, 15.0, 6.0, 7.0, 8.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.544193267822266, -5.378626823425293, -5.213059902191162, -5.0474934577941895, -4.881927013397217, -4.716360092163086, -4.550793647766113, -4.385227203369141, -4.219660758972168, -4.054094314575195, -3.8885276317596436, -3.722960948944092, -3.557394504547119, -3.3918278217315674, -3.2262611389160156, -3.060694694519043, -2.895127773284912, -2.7295610904693604, -2.5639946460723877, -2.398427963256836, -2.2328615188598633, -2.0672948360443115, -1.9017281532287598, -1.7361615896224976, -1.5705950260162354, -1.4050284624099731, -1.239461898803711, -1.0738952159881592, -0.908328652381897, -0.7427620887756348, -0.5771954655647278, -0.4116288423538208, -0.2460622787475586, -0.080495685338974, 0.0850709080696106, 0.2506375014781952, 0.4162040948867798, 0.581770658493042, 0.747337281703949, 0.912903904914856, 1.0784704685211182, 1.2440370321273804, 1.4096035957336426, 1.5751702785491943, 1.7407368421554565, 1.9063034057617188, 2.0718700885772705, 2.2374367713928223, 2.403003215789795, 2.5685698986053467, 2.7341363430023193, 2.899703025817871, 3.0652694702148438, 3.2308361530303955, 3.3964028358459473, 3.56196928024292, 3.7275359630584717, 3.8931026458740234, 4.058669090270996, 4.224235534667969, 4.3898024559021, 4.555368900299072, 4.720935344696045, 4.886502265930176, 5.052068710327148]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [8.0, 7.0, 8.0, 5.0, 14.0, 13.0, 52.0, 58.0, 98.0, 156.0, 223.0, 396.0, 591.0, 811.0, 1396.0, 2036.0, 3118.0, 4806.0, 7309.0, 11159.0, 17077.0, 26776.0, 40149.0, 60661.0, 91525.0, 134014.0, 193893.0, 267564.0, 351267.0, 428887.0, 477266.0, 474320.0, 422897.0, 344463.0, 260691.0, 186002.0, 129344.0, 87301.0, 57964.0, 38154.0, 25114.0, 16420.0, 10732.0, 6904.0, 4524.0, 2877.0, 1831.0, 1224.0, 788.0, 502.0, 274.0, 228.0, 160.0, 100.0, 51.0, 31.0, 18.0, 12.0, 11.0, 10.0, 6.0, 2.0, 4.0, 2.0], "bins": [-3.66015625, -3.541900634765625, -3.42364501953125, -3.305389404296875, -3.1871337890625, -3.068878173828125, -2.95062255859375, -2.832366943359375, -2.714111328125, -2.595855712890625, -2.47760009765625, -2.359344482421875, -2.2410888671875, -2.122833251953125, -2.00457763671875, -1.886322021484375, -1.76806640625, -1.649810791015625, -1.53155517578125, -1.413299560546875, -1.2950439453125, -1.176788330078125, -1.05853271484375, -0.940277099609375, -0.822021484375, -0.703765869140625, -0.58551025390625, -0.467254638671875, -0.3489990234375, -0.230743408203125, -0.11248779296875, 0.005767822265625, 0.1240234375, 0.242279052734375, 0.36053466796875, 0.478790283203125, 0.5970458984375, 0.715301513671875, 0.83355712890625, 0.951812744140625, 1.070068359375, 1.188323974609375, 1.30657958984375, 1.424835205078125, 1.5430908203125, 1.661346435546875, 1.77960205078125, 1.897857666015625, 2.01611328125, 2.134368896484375, 2.25262451171875, 2.370880126953125, 2.4891357421875, 2.607391357421875, 2.72564697265625, 2.843902587890625, 2.962158203125, 3.080413818359375, 3.19866943359375, 3.316925048828125, 3.4351806640625, 3.553436279296875, 3.67169189453125, 3.789947509765625, 3.908203125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 7.0, 11.0, 17.0, 13.0, 10.0, 17.0, 26.0, 17.0, 20.0, 24.0, 28.0, 38.0, 34.0, 30.0, 32.0, 45.0, 42.0, 41.0, 40.0, 27.0, 36.0, 39.0, 29.0, 39.0, 27.0, 42.0, 29.0, 35.0, 21.0, 19.0, 30.0, 19.0, 20.0, 19.0, 13.0, 10.0, 6.0, 14.0, 3.0, 8.0, 2.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.748046875, -3.62872314453125, -3.5093994140625, -3.39007568359375, -3.270751953125, -3.15142822265625, -3.0321044921875, -2.91278076171875, -2.79345703125, -2.67413330078125, -2.5548095703125, -2.43548583984375, -2.316162109375, -2.19683837890625, -2.0775146484375, -1.95819091796875, -1.8388671875, -1.71954345703125, -1.6002197265625, -1.48089599609375, -1.361572265625, -1.24224853515625, -1.1229248046875, -1.00360107421875, -0.88427734375, -0.76495361328125, -0.6456298828125, -0.52630615234375, -0.406982421875, -0.28765869140625, -0.1683349609375, -0.04901123046875, 0.0703125, 0.18963623046875, 0.3089599609375, 0.42828369140625, 0.547607421875, 0.66693115234375, 0.7862548828125, 0.90557861328125, 1.02490234375, 1.14422607421875, 1.2635498046875, 1.38287353515625, 1.502197265625, 1.62152099609375, 1.7408447265625, 1.86016845703125, 1.9794921875, 2.09881591796875, 2.2181396484375, 2.33746337890625, 2.456787109375, 2.57611083984375, 2.6954345703125, 2.81475830078125, 2.93408203125, 3.05340576171875, 3.1727294921875, 3.29205322265625, 3.411376953125, 3.53070068359375, 3.6500244140625, 3.76934814453125, 3.888671875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 8.0, 14.0, 13.0, 34.0, 55.0, 84.0, 129.0, 217.0, 323.0, 588.0, 1044.0, 1817.0, 3112.0, 5305.0, 9064.0, 15331.0, 25985.0, 44236.0, 73050.0, 117546.0, 182669.0, 270217.0, 373409.0, 469857.0, 531857.0, 526974.0, 461360.0, 361883.0, 259574.0, 175520.0, 111576.0, 69633.0, 42012.0, 24676.0, 14561.0, 8490.0, 4968.0, 2958.0, 1693.0, 941.0, 628.0, 362.0, 222.0, 109.0, 71.0, 38.0, 35.0, 14.0, 9.0, 9.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.4140625, -4.28009033203125, -4.1461181640625, -4.01214599609375, -3.878173828125, -3.74420166015625, -3.6102294921875, -3.47625732421875, -3.34228515625, -3.20831298828125, -3.0743408203125, -2.94036865234375, -2.806396484375, -2.67242431640625, -2.5384521484375, -2.40447998046875, -2.2705078125, -2.13653564453125, -2.0025634765625, -1.86859130859375, -1.734619140625, -1.60064697265625, -1.4666748046875, -1.33270263671875, -1.19873046875, -1.06475830078125, -0.9307861328125, -0.79681396484375, -0.662841796875, -0.52886962890625, -0.3948974609375, -0.26092529296875, -0.126953125, 0.00701904296875, 0.1409912109375, 0.27496337890625, 0.408935546875, 0.54290771484375, 0.6768798828125, 0.81085205078125, 0.94482421875, 1.07879638671875, 1.2127685546875, 1.34674072265625, 1.480712890625, 1.61468505859375, 1.7486572265625, 1.88262939453125, 2.0166015625, 2.15057373046875, 2.2845458984375, 2.41851806640625, 2.552490234375, 2.68646240234375, 2.8204345703125, 2.95440673828125, 3.08837890625, 3.22235107421875, 3.3563232421875, 3.49029541015625, 3.624267578125, 3.75823974609375, 3.8922119140625, 4.02618408203125, 4.16015625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 6.0, 13.0, 13.0, 19.0, 21.0, 26.0, 33.0, 48.0, 63.0, 68.0, 71.0, 92.0, 119.0, 121.0, 144.0, 147.0, 166.0, 166.0, 175.0, 197.0, 205.0, 186.0, 184.0, 183.0, 181.0, 164.0, 151.0, 171.0, 132.0, 115.0, 132.0, 110.0, 77.0, 65.0, 60.0, 50.0, 38.0, 34.0, 33.0, 21.0, 18.0, 14.0, 8.0, 7.0, 6.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 3.0], "bins": [-1.8291015625, -1.7745361328125, -1.719970703125, -1.6654052734375, -1.61083984375, -1.5562744140625, -1.501708984375, -1.4471435546875, -1.392578125, -1.3380126953125, -1.283447265625, -1.2288818359375, -1.17431640625, -1.1197509765625, -1.065185546875, -1.0106201171875, -0.9560546875, -0.9014892578125, -0.846923828125, -0.7923583984375, -0.73779296875, -0.6832275390625, -0.628662109375, -0.5740966796875, -0.51953125, -0.4649658203125, -0.410400390625, -0.3558349609375, -0.30126953125, -0.2467041015625, -0.192138671875, -0.1375732421875, -0.0830078125, -0.0284423828125, 0.026123046875, 0.0806884765625, 0.13525390625, 0.1898193359375, 0.244384765625, 0.2989501953125, 0.353515625, 0.4080810546875, 0.462646484375, 0.5172119140625, 0.57177734375, 0.6263427734375, 0.680908203125, 0.7354736328125, 0.7900390625, 0.8446044921875, 0.899169921875, 0.9537353515625, 1.00830078125, 1.0628662109375, 1.117431640625, 1.1719970703125, 1.2265625, 1.2811279296875, 1.335693359375, 1.3902587890625, 1.44482421875, 1.4993896484375, 1.553955078125, 1.6085205078125, 1.6630859375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 7.0, 10.0, 12.0, 10.0, 9.0, 28.0, 24.0, 26.0, 22.0, 37.0, 45.0, 31.0, 45.0, 45.0, 52.0, 41.0, 40.0, 50.0, 62.0, 53.0, 45.0, 41.0, 31.0, 35.0, 33.0, 34.0, 20.0, 21.0, 15.0, 14.0, 19.0, 13.0, 8.0, 7.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.178255558013916, -5.010586738586426, -4.8429179191589355, -4.675249099731445, -4.507580280303955, -4.339911460876465, -4.172242641448975, -4.004573822021484, -3.836905002593994, -3.669236183166504, -3.5015673637390137, -3.3338985443115234, -3.166229724884033, -2.998560905456543, -2.8308920860290527, -2.6632232666015625, -2.4955546855926514, -2.327885866165161, -2.160217046737671, -1.9925482273101807, -1.8248794078826904, -1.6572105884552002, -1.4895418882369995, -1.3218730688095093, -1.154204249382019, -0.9865354299545288, -0.8188666105270386, -0.6511978507041931, -0.4835290312767029, -0.31586021184921265, -0.1481914520263672, 0.019477367401123047, 0.18714618682861328, 0.3548150062561035, 0.5224838256835938, 0.6901525855064392, 0.8578214049339294, 1.0254902839660645, 1.1931589841842651, 1.3608278036117554, 1.5284966230392456, 1.6961654424667358, 1.863834261894226, 2.0315029621124268, 2.199171781539917, 2.3668406009674072, 2.5345094203948975, 2.7021782398223877, 2.869847059249878, 3.037515878677368, 3.2051846981048584, 3.3728535175323486, 3.540522336959839, 3.708191156387329, 3.8758597373962402, 4.0435285568237305, 4.211197376251221, 4.378866195678711, 4.546535015106201, 4.714203834533691, 4.881872653961182, 5.049541473388672, 5.217210292816162, 5.384879112243652, 5.552547931671143]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 9.0, 7.0, 7.0, 8.0, 8.0, 10.0, 16.0, 19.0, 22.0, 17.0, 22.0, 23.0, 26.0, 29.0, 32.0, 31.0, 30.0, 39.0, 33.0, 45.0, 44.0, 41.0, 44.0, 32.0, 26.0, 44.0, 43.0, 27.0, 35.0, 28.0, 26.0, 30.0, 24.0, 14.0, 22.0, 15.0, 9.0, 11.0, 8.0, 13.0, 12.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.264418601989746, -4.119522571563721, -3.9746267795562744, -3.829730987548828, -3.6848349571228027, -3.5399389266967773, -3.395043134689331, -3.2501473426818848, -3.1052513122558594, -2.960355281829834, -2.8154594898223877, -2.6705636978149414, -2.525667667388916, -2.3807716369628906, -2.2358758449554443, -2.090980052947998, -1.9460840225219727, -1.8011881113052368, -1.656292200088501, -1.5113962888717651, -1.3665003776550293, -1.2216044664382935, -1.0767085552215576, -0.9318126440048218, -0.7869167327880859, -0.6420208215713501, -0.49712491035461426, -0.3522289991378784, -0.20733308792114258, -0.06243717670440674, 0.0824587345123291, 0.22735464572906494, 0.372251033782959, 0.5171469449996948, 0.6620428562164307, 0.8069387674331665, 0.9518346786499023, 1.0967305898666382, 1.241626501083374, 1.3865224123001099, 1.5314183235168457, 1.6763142347335815, 1.8212101459503174, 1.9661060571670532, 2.111001968383789, 2.2558979988098145, 2.4007937908172607, 2.545689582824707, 2.6905856132507324, 2.835481643676758, 2.980377435684204, 3.1252732276916504, 3.270169258117676, 3.415065288543701, 3.5599610805511475, 3.7048568725585938, 3.849752902984619, 3.9946489334106445, 4.139544486999512, 4.284440517425537, 4.4293365478515625, 4.574232578277588, 4.719128608703613, 4.8640241622924805, 5.008920192718506]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 8.0, 17.0, 19.0, 35.0, 49.0, 79.0, 78.0, 164.0, 246.0, 390.0, 617.0, 981.0, 1567.0, 2569.0, 4105.0, 7184.0, 12706.0, 23323.0, 42424.0, 77954.0, 137226.0, 204136.0, 207571.0, 142366.0, 81437.0, 44936.0, 24304.0, 13383.0, 7532.0, 4411.0, 2559.0, 1549.0, 934.0, 584.0, 373.0, 269.0, 164.0, 120.0, 51.0, 42.0, 33.0, 25.0, 6.0, 3.0, 14.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.083984375, -2.020904541015625, -1.95782470703125, -1.894744873046875, -1.8316650390625, -1.768585205078125, -1.70550537109375, -1.642425537109375, -1.579345703125, -1.516265869140625, -1.45318603515625, -1.390106201171875, -1.3270263671875, -1.263946533203125, -1.20086669921875, -1.137786865234375, -1.07470703125, -1.011627197265625, -0.94854736328125, -0.885467529296875, -0.8223876953125, -0.759307861328125, -0.69622802734375, -0.633148193359375, -0.570068359375, -0.506988525390625, -0.44390869140625, -0.380828857421875, -0.3177490234375, -0.254669189453125, -0.19158935546875, -0.128509521484375, -0.0654296875, -0.002349853515625, 0.06072998046875, 0.123809814453125, 0.1868896484375, 0.249969482421875, 0.31304931640625, 0.376129150390625, 0.439208984375, 0.502288818359375, 0.56536865234375, 0.628448486328125, 0.6915283203125, 0.754608154296875, 0.81768798828125, 0.880767822265625, 0.94384765625, 1.006927490234375, 1.07000732421875, 1.133087158203125, 1.1961669921875, 1.259246826171875, 1.32232666015625, 1.385406494140625, 1.448486328125, 1.511566162109375, 1.57464599609375, 1.637725830078125, 1.7008056640625, 1.763885498046875, 1.82696533203125, 1.890045166015625, 1.953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 6.0, 9.0, 9.0, 9.0, 10.0, 13.0, 14.0, 18.0, 23.0, 22.0, 23.0, 28.0, 29.0, 41.0, 35.0, 38.0, 27.0, 43.0, 55.0, 28.0, 42.0, 51.0, 35.0, 33.0, 37.0, 37.0, 43.0, 26.0, 31.0, 27.0, 29.0, 19.0, 14.0, 11.0, 13.0, 7.0, 13.0, 7.0, 12.0, 7.0, 6.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.151123046875, -3.99365234375, -3.836181640625, -3.6787109375, -3.521240234375, -3.36376953125, -3.206298828125, -3.048828125, -2.891357421875, -2.73388671875, -2.576416015625, -2.4189453125, -2.261474609375, -2.10400390625, -1.946533203125, -1.7890625, -1.631591796875, -1.47412109375, -1.316650390625, -1.1591796875, -1.001708984375, -0.84423828125, -0.686767578125, -0.529296875, -0.371826171875, -0.21435546875, -0.056884765625, 0.1005859375, 0.258056640625, 0.41552734375, 0.572998046875, 0.73046875, 0.887939453125, 1.04541015625, 1.202880859375, 1.3603515625, 1.517822265625, 1.67529296875, 1.832763671875, 1.990234375, 2.147705078125, 2.30517578125, 2.462646484375, 2.6201171875, 2.777587890625, 2.93505859375, 3.092529296875, 3.25, 3.407470703125, 3.56494140625, 3.722412109375, 3.8798828125, 4.037353515625, 4.19482421875, 4.352294921875, 4.509765625, 4.667236328125, 4.82470703125, 4.982177734375, 5.1396484375, 5.297119140625, 5.45458984375, 5.612060546875, 5.76953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 5.0, 10.0, 19.0, 25.0, 40.0, 50.0, 74.0, 103.0, 195.0, 253.0, 380.0, 566.0, 869.0, 1376.0, 2172.0, 3795.0, 6442.0, 11190.0, 20342.0, 37651.0, 70602.0, 130578.0, 218400.0, 228648.0, 143218.0, 77818.0, 41187.0, 22456.0, 12468.0, 6969.0, 3958.0, 2424.0, 1540.0, 954.0, 589.0, 385.0, 274.0, 185.0, 97.0, 53.0, 64.0, 39.0, 24.0, 22.0, 18.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.271484375, -2.20672607421875, -2.1419677734375, -2.07720947265625, -2.012451171875, -1.94769287109375, -1.8829345703125, -1.81817626953125, -1.75341796875, -1.68865966796875, -1.6239013671875, -1.55914306640625, -1.494384765625, -1.42962646484375, -1.3648681640625, -1.30010986328125, -1.2353515625, -1.17059326171875, -1.1058349609375, -1.04107666015625, -0.976318359375, -0.91156005859375, -0.8468017578125, -0.78204345703125, -0.71728515625, -0.65252685546875, -0.5877685546875, -0.52301025390625, -0.458251953125, -0.39349365234375, -0.3287353515625, -0.26397705078125, -0.19921875, -0.13446044921875, -0.0697021484375, -0.00494384765625, 0.059814453125, 0.12457275390625, 0.1893310546875, 0.25408935546875, 0.31884765625, 0.38360595703125, 0.4483642578125, 0.51312255859375, 0.577880859375, 0.64263916015625, 0.7073974609375, 0.77215576171875, 0.8369140625, 0.90167236328125, 0.9664306640625, 1.03118896484375, 1.095947265625, 1.16070556640625, 1.2254638671875, 1.29022216796875, 1.35498046875, 1.41973876953125, 1.4844970703125, 1.54925537109375, 1.614013671875, 1.67877197265625, 1.7435302734375, 1.80828857421875, 1.873046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 4.0, 4.0, 9.0, 13.0, 18.0, 16.0, 17.0, 21.0, 23.0, 25.0, 31.0, 34.0, 30.0, 31.0, 37.0, 38.0, 34.0, 43.0, 43.0, 44.0, 44.0, 36.0, 47.0, 37.0, 39.0, 30.0, 33.0, 19.0, 34.0, 28.0, 20.0, 17.0, 15.0, 17.0, 10.0, 8.0, 10.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.12890625, -3.024261474609375, -2.91961669921875, -2.814971923828125, -2.7103271484375, -2.605682373046875, -2.50103759765625, -2.396392822265625, -2.291748046875, -2.187103271484375, -2.08245849609375, -1.977813720703125, -1.8731689453125, -1.768524169921875, -1.66387939453125, -1.559234619140625, -1.45458984375, -1.349945068359375, -1.24530029296875, -1.140655517578125, -1.0360107421875, -0.931365966796875, -0.82672119140625, -0.722076416015625, -0.617431640625, -0.512786865234375, -0.40814208984375, -0.303497314453125, -0.1988525390625, -0.094207763671875, 0.01043701171875, 0.115081787109375, 0.2197265625, 0.324371337890625, 0.42901611328125, 0.533660888671875, 0.6383056640625, 0.742950439453125, 0.84759521484375, 0.952239990234375, 1.056884765625, 1.161529541015625, 1.26617431640625, 1.370819091796875, 1.4754638671875, 1.580108642578125, 1.68475341796875, 1.789398193359375, 1.89404296875, 1.998687744140625, 2.10333251953125, 2.207977294921875, 2.3126220703125, 2.417266845703125, 2.52191162109375, 2.626556396484375, 2.731201171875, 2.835845947265625, 2.94049072265625, 3.045135498046875, 3.1497802734375, 3.254425048828125, 3.35906982421875, 3.463714599609375, 3.568359375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 16.0, 18.0, 26.0, 38.0, 36.0, 44.0, 99.0, 107.0, 174.0, 229.0, 305.0, 429.0, 630.0, 919.0, 1305.0, 2078.0, 3287.0, 5706.0, 10211.0, 20468.0, 46733.0, 123996.0, 312612.0, 306869.0, 120550.0, 46255.0, 19974.0, 10146.0, 5476.0, 3297.0, 1968.0, 1390.0, 919.0, 645.0, 453.0, 326.0, 232.0, 156.0, 119.0, 76.0, 64.0, 40.0, 31.0, 30.0, 16.0, 13.0, 9.0, 11.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.61279296875, -0.593017578125, -0.5732421875, -0.553466796875, -0.53369140625, -0.513916015625, -0.494140625, -0.474365234375, -0.45458984375, -0.434814453125, -0.4150390625, -0.395263671875, -0.37548828125, -0.355712890625, -0.3359375, -0.316162109375, -0.29638671875, -0.276611328125, -0.2568359375, -0.237060546875, -0.21728515625, -0.197509765625, -0.177734375, -0.157958984375, -0.13818359375, -0.118408203125, -0.0986328125, -0.078857421875, -0.05908203125, -0.039306640625, -0.01953125, 0.000244140625, 0.02001953125, 0.039794921875, 0.0595703125, 0.079345703125, 0.09912109375, 0.118896484375, 0.138671875, 0.158447265625, 0.17822265625, 0.197998046875, 0.2177734375, 0.237548828125, 0.25732421875, 0.277099609375, 0.296875, 0.316650390625, 0.33642578125, 0.356201171875, 0.3759765625, 0.395751953125, 0.41552734375, 0.435302734375, 0.455078125, 0.474853515625, 0.49462890625, 0.514404296875, 0.5341796875, 0.553955078125, 0.57373046875, 0.593505859375, 0.61328125, 0.633056640625, 0.65283203125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 4.0, 7.0, 5.0, 12.0, 12.0, 21.0, 23.0, 19.0, 21.0, 41.0, 45.0, 57.0, 52.0, 65.0, 78.0, 56.0, 64.0, 55.0, 55.0, 58.0, 44.0, 35.0, 35.0, 26.0, 15.0, 16.0, 17.0, 10.0, 11.0, 5.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.519390106201172e-05, -5.347840487957001e-05, -5.1762908697128296e-05, -5.0047412514686584e-05, -4.833191633224487e-05, -4.661642014980316e-05, -4.490092396736145e-05, -4.318542778491974e-05, -4.146993160247803e-05, -3.9754435420036316e-05, -3.8038939237594604e-05, -3.632344305515289e-05, -3.460794687271118e-05, -3.289245069026947e-05, -3.117695450782776e-05, -2.9461458325386047e-05, -2.7745962142944336e-05, -2.6030465960502625e-05, -2.4314969778060913e-05, -2.25994735956192e-05, -2.088397741317749e-05, -1.916848123073578e-05, -1.7452985048294067e-05, -1.5737488865852356e-05, -1.4021992683410645e-05, -1.2306496500968933e-05, -1.0591000318527222e-05, -8.87550413608551e-06, -7.160007953643799e-06, -5.444511771202087e-06, -3.729015588760376e-06, -2.0135194063186646e-06, -2.980232238769531e-07, 1.4174729585647583e-06, 3.1329691410064697e-06, 4.848465323448181e-06, 6.563961505889893e-06, 8.279457688331604e-06, 9.994953870773315e-06, 1.1710450053215027e-05, 1.3425946235656738e-05, 1.514144241809845e-05, 1.685693860054016e-05, 1.8572434782981873e-05, 2.0287930965423584e-05, 2.2003427147865295e-05, 2.3718923330307007e-05, 2.5434419512748718e-05, 2.714991569519043e-05, 2.886541187763214e-05, 3.058090806007385e-05, 3.2296404242515564e-05, 3.4011900424957275e-05, 3.572739660739899e-05, 3.74428927898407e-05, 3.915838897228241e-05, 4.087388515472412e-05, 4.258938133716583e-05, 4.4304877519607544e-05, 4.6020373702049255e-05, 4.773586988449097e-05, 4.945136606693268e-05, 5.116686224937439e-05, 5.28823584318161e-05, 5.459785461425781e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 10.0, 17.0, 24.0, 25.0, 41.0, 45.0, 62.0, 96.0, 173.0, 203.0, 276.0, 384.0, 665.0, 926.0, 1485.0, 2246.0, 3446.0, 5546.0, 8981.0, 15172.0, 26152.0, 46037.0, 82259.0, 142008.0, 210570.0, 199360.0, 127944.0, 73295.0, 41403.0, 23460.0, 13699.0, 8092.0, 5075.0, 3127.0, 2078.0, 1351.0, 891.0, 670.0, 371.0, 278.0, 180.0, 136.0, 93.0, 55.0, 56.0, 31.0, 22.0, 20.0, 9.0, 7.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5885238647460938, -0.5681610107421875, -0.5477981567382812, -0.527435302734375, -0.5070724487304688, -0.4867095947265625, -0.46634674072265625, -0.44598388671875, -0.42562103271484375, -0.4052581787109375, -0.38489532470703125, -0.364532470703125, -0.34416961669921875, -0.3238067626953125, -0.30344390869140625, -0.2830810546875, -0.26271820068359375, -0.2423553466796875, -0.22199249267578125, -0.201629638671875, -0.18126678466796875, -0.1609039306640625, -0.14054107666015625, -0.12017822265625, -0.09981536865234375, -0.0794525146484375, -0.05908966064453125, -0.038726806640625, -0.01836395263671875, 0.0019989013671875, 0.02236175537109375, 0.042724609375, 0.06308746337890625, 0.0834503173828125, 0.10381317138671875, 0.124176025390625, 0.14453887939453125, 0.1649017333984375, 0.18526458740234375, 0.20562744140625, 0.22599029541015625, 0.2463531494140625, 0.26671600341796875, 0.287078857421875, 0.30744171142578125, 0.3278045654296875, 0.34816741943359375, 0.3685302734375, 0.38889312744140625, 0.4092559814453125, 0.42961883544921875, 0.449981689453125, 0.47034454345703125, 0.4907073974609375, 0.5110702514648438, 0.53143310546875, 0.5517959594726562, 0.5721588134765625, 0.5925216674804688, 0.612884521484375, 0.6332473754882812, 0.6536102294921875, 0.6739730834960938, 0.6943359375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 1.0, 5.0, 12.0, 13.0, 16.0, 17.0, 16.0, 28.0, 40.0, 27.0, 42.0, 52.0, 54.0, 74.0, 69.0, 71.0, 66.0, 69.0, 58.0, 46.0, 45.0, 28.0, 29.0, 20.0, 13.0, 15.0, 14.0, 9.0, 11.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2198486328125, -0.2130279541015625, -0.206207275390625, -0.1993865966796875, -0.19256591796875, -0.1857452392578125, -0.178924560546875, -0.1721038818359375, -0.165283203125, -0.1584625244140625, -0.151641845703125, -0.1448211669921875, -0.13800048828125, -0.1311798095703125, -0.124359130859375, -0.1175384521484375, -0.1107177734375, -0.1038970947265625, -0.097076416015625, -0.0902557373046875, -0.08343505859375, -0.0766143798828125, -0.069793701171875, -0.0629730224609375, -0.05615234375, -0.0493316650390625, -0.042510986328125, -0.0356903076171875, -0.02886962890625, -0.0220489501953125, -0.015228271484375, -0.0084075927734375, -0.0015869140625, 0.0052337646484375, 0.012054443359375, 0.0188751220703125, 0.02569580078125, 0.0325164794921875, 0.039337158203125, 0.0461578369140625, 0.052978515625, 0.0597991943359375, 0.066619873046875, 0.0734405517578125, 0.08026123046875, 0.0870819091796875, 0.093902587890625, 0.1007232666015625, 0.1075439453125, 0.1143646240234375, 0.121185302734375, 0.1280059814453125, 0.13482666015625, 0.1416473388671875, 0.148468017578125, 0.1552886962890625, 0.162109375, 0.1689300537109375, 0.175750732421875, 0.1825714111328125, 0.18939208984375, 0.1962127685546875, 0.203033447265625, 0.2098541259765625, 0.2166748046875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 10.0, 18.0, 11.0, 15.0, 17.0, 20.0, 33.0, 27.0, 40.0, 38.0, 39.0, 43.0, 59.0, 36.0, 37.0, 52.0, 35.0, 61.0, 51.0, 40.0, 42.0, 34.0, 41.0, 23.0, 33.0, 26.0, 23.0, 12.0, 12.0, 18.0, 15.0, 7.0, 4.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.248227119445801, -5.083939552307129, -4.919651508331299, -4.755363464355469, -4.591075897216797, -4.426788330078125, -4.262500286102295, -4.098212242126465, -3.933924674987793, -3.769636869430542, -3.605349063873291, -3.44106125831604, -3.276773452758789, -3.112485647201538, -2.948197841644287, -2.783910036087036, -2.619622230529785, -2.455334424972534, -2.291046619415283, -2.1267588138580322, -1.9624710083007812, -1.7981832027435303, -1.6338953971862793, -1.4696075916290283, -1.3053197860717773, -1.1410319805145264, -0.9767441749572754, -0.8124563694000244, -0.6481685638427734, -0.48388075828552246, -0.3195929527282715, -0.1553051471710205, 0.008982181549072266, 0.17326998710632324, 0.3375577926635742, 0.5018455982208252, 0.6661334037780762, 0.8304212093353271, 0.9947090148925781, 1.158996820449829, 1.32328462600708, 1.487572431564331, 1.651860237121582, 1.816148042678833, 1.980435848236084, 2.144723653793335, 2.309011459350586, 2.473299264907837, 2.637587070465088, 2.801874876022339, 2.96616268157959, 3.130450487136841, 3.294738292694092, 3.4590260982513428, 3.6233139038085938, 3.7876017093658447, 3.9518895149230957, 4.116177558898926, 4.280465126037598, 4.4447526931762695, 4.6090407371521, 4.77332878112793, 4.937616348266602, 5.101903915405273, 5.2661919593811035]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 11.0, 4.0, 7.0, 7.0, 10.0, 14.0, 21.0, 19.0, 18.0, 21.0, 27.0, 26.0, 29.0, 26.0, 34.0, 35.0, 34.0, 33.0, 45.0, 42.0, 47.0, 48.0, 31.0, 22.0, 40.0, 51.0, 33.0, 35.0, 22.0, 27.0, 29.0, 23.0, 18.0, 21.0, 14.0, 11.0, 7.0, 10.0, 14.0, 11.0, 5.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.327061176300049, -4.181493282318115, -4.035924911499023, -3.89035701751709, -3.7447891235351562, -3.5992212295532227, -3.45365309715271, -3.3080849647521973, -3.1625170707702637, -3.01694917678833, -2.8713810443878174, -2.7258129119873047, -2.580245018005371, -2.4346771240234375, -2.289108991622925, -2.143540859222412, -1.9979729652404785, -1.8524049520492554, -1.7068369388580322, -1.561268925666809, -1.415700912475586, -1.2701328992843628, -1.1245648860931396, -0.9789968729019165, -0.8334288597106934, -0.6878608465194702, -0.5422928333282471, -0.3967248201370239, -0.2511568069458008, -0.10558879375457764, 0.03997921943664551, 0.18554723262786865, 0.3311147689819336, 0.47668278217315674, 0.6222507953643799, 0.767818808555603, 0.9133868217468262, 1.0589548349380493, 1.2045228481292725, 1.3500908613204956, 1.4956588745117188, 1.641226887702942, 1.786794900894165, 1.9323629140853882, 2.0779309272766113, 2.223498821258545, 2.3690669536590576, 2.5146350860595703, 2.660202980041504, 2.8057708740234375, 2.95133900642395, 3.096907138824463, 3.2424750328063965, 3.38804292678833, 3.5336110591888428, 3.6791791915893555, 3.824747085571289, 3.9703149795532227, 4.115882873535156, 4.261451244354248, 4.407019138336182, 4.552587032318115, 4.698155403137207, 4.843723297119141, 4.989291191101074]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 5.0, 2.0, 0.0, 6.0, 11.0, 23.0, 24.0, 40.0, 76.0, 77.0, 135.0, 188.0, 282.0, 417.0, 620.0, 945.0, 1359.0, 2097.0, 3189.0, 4773.0, 6813.0, 10266.0, 15195.0, 21969.0, 31517.0, 44045.0, 59240.0, 76087.0, 92153.0, 103142.0, 107787.0, 102919.0, 90846.0, 74648.0, 57896.0, 42975.0, 30584.0, 21502.0, 14478.0, 9941.0, 6728.0, 4440.0, 3008.0, 1984.0, 1376.0, 910.0, 571.0, 420.0, 301.0, 167.0, 134.0, 66.0, 57.0, 40.0, 35.0, 22.0, 12.0, 9.0, 6.0, 5.0, 3.0, 4.0], "bins": [-3.833984375, -3.715850830078125, -3.59771728515625, -3.479583740234375, -3.3614501953125, -3.243316650390625, -3.12518310546875, -3.007049560546875, -2.888916015625, -2.770782470703125, -2.65264892578125, -2.534515380859375, -2.4163818359375, -2.298248291015625, -2.18011474609375, -2.061981201171875, -1.94384765625, -1.825714111328125, -1.70758056640625, -1.589447021484375, -1.4713134765625, -1.353179931640625, -1.23504638671875, -1.116912841796875, -0.998779296875, -0.880645751953125, -0.76251220703125, -0.644378662109375, -0.5262451171875, -0.408111572265625, -0.28997802734375, -0.171844482421875, -0.0537109375, 0.064422607421875, 0.18255615234375, 0.300689697265625, 0.4188232421875, 0.536956787109375, 0.65509033203125, 0.773223876953125, 0.891357421875, 1.009490966796875, 1.12762451171875, 1.245758056640625, 1.3638916015625, 1.482025146484375, 1.60015869140625, 1.718292236328125, 1.83642578125, 1.954559326171875, 2.07269287109375, 2.190826416015625, 2.3089599609375, 2.427093505859375, 2.54522705078125, 2.663360595703125, 2.781494140625, 2.899627685546875, 3.01776123046875, 3.135894775390625, 3.2540283203125, 3.372161865234375, 3.49029541015625, 3.608428955078125, 3.7265625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 9.0, 5.0, 7.0, 5.0, 13.0, 8.0, 21.0, 14.0, 21.0, 20.0, 14.0, 29.0, 20.0, 39.0, 38.0, 45.0, 38.0, 34.0, 44.0, 34.0, 25.0, 38.0, 33.0, 33.0, 47.0, 43.0, 43.0, 37.0, 26.0, 26.0, 27.0, 23.0, 13.0, 16.0, 16.0, 20.0, 10.0, 15.0, 12.0, 10.0, 7.0, 3.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.04296875, -3.89892578125, -3.7548828125, -3.61083984375, -3.466796875, -3.32275390625, -3.1787109375, -3.03466796875, -2.890625, -2.74658203125, -2.6025390625, -2.45849609375, -2.314453125, -2.17041015625, -2.0263671875, -1.88232421875, -1.73828125, -1.59423828125, -1.4501953125, -1.30615234375, -1.162109375, -1.01806640625, -0.8740234375, -0.72998046875, -0.5859375, -0.44189453125, -0.2978515625, -0.15380859375, -0.009765625, 0.13427734375, 0.2783203125, 0.42236328125, 0.56640625, 0.71044921875, 0.8544921875, 0.99853515625, 1.142578125, 1.28662109375, 1.4306640625, 1.57470703125, 1.71875, 1.86279296875, 2.0068359375, 2.15087890625, 2.294921875, 2.43896484375, 2.5830078125, 2.72705078125, 2.87109375, 3.01513671875, 3.1591796875, 3.30322265625, 3.447265625, 3.59130859375, 3.7353515625, 3.87939453125, 4.0234375, 4.16748046875, 4.3115234375, 4.45556640625, 4.599609375, 4.74365234375, 4.8876953125, 5.03173828125, 5.17578125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 12.0, 24.0, 37.0, 54.0, 84.0, 132.0, 221.0, 306.0, 436.0, 761.0, 1084.0, 1658.0, 2592.0, 3894.0, 5928.0, 9003.0, 13415.0, 20108.0, 29169.0, 41199.0, 56743.0, 74054.0, 90834.0, 104175.0, 109676.0, 106413.0, 95213.0, 78014.0, 60498.0, 45014.0, 31820.0, 21812.0, 15024.0, 9878.0, 6755.0, 4392.0, 2786.0, 1860.0, 1223.0, 740.0, 489.0, 361.0, 231.0, 148.0, 93.0, 69.0, 45.0, 23.0, 23.0, 5.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-3.787109375, -3.6710205078125, -3.554931640625, -3.4388427734375, -3.32275390625, -3.2066650390625, -3.090576171875, -2.9744873046875, -2.8583984375, -2.7423095703125, -2.626220703125, -2.5101318359375, -2.39404296875, -2.2779541015625, -2.161865234375, -2.0457763671875, -1.9296875, -1.8135986328125, -1.697509765625, -1.5814208984375, -1.46533203125, -1.3492431640625, -1.233154296875, -1.1170654296875, -1.0009765625, -0.8848876953125, -0.768798828125, -0.6527099609375, -0.53662109375, -0.4205322265625, -0.304443359375, -0.1883544921875, -0.072265625, 0.0438232421875, 0.159912109375, 0.2760009765625, 0.39208984375, 0.5081787109375, 0.624267578125, 0.7403564453125, 0.8564453125, 0.9725341796875, 1.088623046875, 1.2047119140625, 1.32080078125, 1.4368896484375, 1.552978515625, 1.6690673828125, 1.78515625, 1.9012451171875, 2.017333984375, 2.1334228515625, 2.24951171875, 2.3656005859375, 2.481689453125, 2.5977783203125, 2.7138671875, 2.8299560546875, 2.946044921875, 3.0621337890625, 3.17822265625, 3.2943115234375, 3.410400390625, 3.5264892578125, 3.642578125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 8.0, 7.0, 14.0, 9.0, 17.0, 19.0, 23.0, 34.0, 28.0, 26.0, 31.0, 36.0, 50.0, 38.0, 46.0, 55.0, 41.0, 50.0, 37.0, 42.0, 45.0, 49.0, 38.0, 34.0, 40.0, 29.0, 25.0, 18.0, 25.0, 16.0, 12.0, 10.0, 11.0, 14.0, 7.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0078125, -2.899658203125, -2.79150390625, -2.683349609375, -2.5751953125, -2.467041015625, -2.35888671875, -2.250732421875, -2.142578125, -2.034423828125, -1.92626953125, -1.818115234375, -1.7099609375, -1.601806640625, -1.49365234375, -1.385498046875, -1.27734375, -1.169189453125, -1.06103515625, -0.952880859375, -0.8447265625, -0.736572265625, -0.62841796875, -0.520263671875, -0.412109375, -0.303955078125, -0.19580078125, -0.087646484375, 0.0205078125, 0.128662109375, 0.23681640625, 0.344970703125, 0.453125, 0.561279296875, 0.66943359375, 0.777587890625, 0.8857421875, 0.993896484375, 1.10205078125, 1.210205078125, 1.318359375, 1.426513671875, 1.53466796875, 1.642822265625, 1.7509765625, 1.859130859375, 1.96728515625, 2.075439453125, 2.18359375, 2.291748046875, 2.39990234375, 2.508056640625, 2.6162109375, 2.724365234375, 2.83251953125, 2.940673828125, 3.048828125, 3.156982421875, 3.26513671875, 3.373291015625, 3.4814453125, 3.589599609375, 3.69775390625, 3.805908203125, 3.9140625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 10.0, 8.0, 25.0, 37.0, 45.0, 71.0, 97.0, 182.0, 243.0, 396.0, 581.0, 944.0, 1488.0, 2507.0, 4147.0, 7152.0, 12263.0, 21417.0, 37253.0, 62918.0, 101103.0, 145714.0, 171785.0, 161789.0, 122323.0, 79764.0, 47994.0, 27655.0, 15565.0, 9343.0, 5225.0, 3172.0, 1928.0, 1193.0, 805.0, 482.0, 333.0, 193.0, 132.0, 91.0, 57.0, 46.0, 26.0, 17.0, 11.0, 12.0, 2.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.549041748046875, -2.46331787109375, -2.377593994140625, -2.2918701171875, -2.206146240234375, -2.12042236328125, -2.034698486328125, -1.948974609375, -1.863250732421875, -1.77752685546875, -1.691802978515625, -1.6060791015625, -1.520355224609375, -1.43463134765625, -1.348907470703125, -1.26318359375, -1.177459716796875, -1.09173583984375, -1.006011962890625, -0.9202880859375, -0.834564208984375, -0.74884033203125, -0.663116455078125, -0.577392578125, -0.491668701171875, -0.40594482421875, -0.320220947265625, -0.2344970703125, -0.148773193359375, -0.06304931640625, 0.022674560546875, 0.1083984375, 0.194122314453125, 0.27984619140625, 0.365570068359375, 0.4512939453125, 0.537017822265625, 0.62274169921875, 0.708465576171875, 0.794189453125, 0.879913330078125, 0.96563720703125, 1.051361083984375, 1.1370849609375, 1.222808837890625, 1.30853271484375, 1.394256591796875, 1.47998046875, 1.565704345703125, 1.65142822265625, 1.737152099609375, 1.8228759765625, 1.908599853515625, 1.99432373046875, 2.080047607421875, 2.165771484375, 2.251495361328125, 2.33721923828125, 2.422943115234375, 2.5086669921875, 2.594390869140625, 2.68011474609375, 2.765838623046875, 2.8515625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 3.0, 7.0, 3.0, 5.0, 6.0, 5.0, 12.0, 12.0, 6.0, 18.0, 23.0, 24.0, 35.0, 41.0, 40.0, 41.0, 51.0, 59.0, 61.0, 54.0, 60.0, 52.0, 63.0, 38.0, 53.0, 32.0, 32.0, 31.0, 24.0, 28.0, 17.0, 14.0, 20.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002551078796386719, -0.00024754181504249573, -0.00023997575044631958, -0.00023240968585014343, -0.00022484362125396729, -0.00021727755665779114, -0.000209711492061615, -0.00020214542746543884, -0.0001945793628692627, -0.00018701329827308655, -0.0001794472336769104, -0.00017188116908073425, -0.0001643151044845581, -0.00015674903988838196, -0.0001491829752922058, -0.00014161691069602966, -0.00013405084609985352, -0.00012648478150367737, -0.00011891871690750122, -0.00011135265231132507, -0.00010378658771514893, -9.622052311897278e-05, -8.865445852279663e-05, -8.108839392662048e-05, -7.352232933044434e-05, -6.595626473426819e-05, -5.839020013809204e-05, -5.0824135541915894e-05, -4.3258070945739746e-05, -3.56920063495636e-05, -2.812594175338745e-05, -2.0559877157211304e-05, -1.2993812561035156e-05, -5.427747964859009e-06, 2.1383166313171387e-06, 9.704381227493286e-06, 1.7270445823669434e-05, 2.483651041984558e-05, 3.240257501602173e-05, 3.9968639612197876e-05, 4.7534704208374023e-05, 5.510076880455017e-05, 6.266683340072632e-05, 7.023289799690247e-05, 7.779896259307861e-05, 8.536502718925476e-05, 9.293109178543091e-05, 0.00010049715638160706, 0.0001080632209777832, 0.00011562928557395935, 0.0001231953501701355, 0.00013076141476631165, 0.0001383274793624878, 0.00014589354395866394, 0.0001534596085548401, 0.00016102567315101624, 0.00016859173774719238, 0.00017615780234336853, 0.00018372386693954468, 0.00019128993153572083, 0.00019885599613189697, 0.00020642206072807312, 0.00021398812532424927, 0.00022155418992042542, 0.00022912025451660156]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 11.0, 9.0, 22.0, 36.0, 56.0, 65.0, 97.0, 172.0, 279.0, 447.0, 735.0, 1197.0, 1823.0, 3111.0, 4954.0, 7966.0, 13319.0, 21613.0, 35395.0, 56829.0, 87006.0, 122160.0, 148828.0, 152391.0, 129923.0, 94236.0, 63026.0, 39798.0, 24426.0, 14958.0, 9077.0, 5437.0, 3439.0, 2082.0, 1298.0, 820.0, 541.0, 333.0, 185.0, 154.0, 98.0, 73.0, 38.0, 31.0, 19.0, 13.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.4140625, -2.33648681640625, -2.2589111328125, -2.18133544921875, -2.103759765625, -2.02618408203125, -1.9486083984375, -1.87103271484375, -1.79345703125, -1.71588134765625, -1.6383056640625, -1.56072998046875, -1.483154296875, -1.40557861328125, -1.3280029296875, -1.25042724609375, -1.1728515625, -1.09527587890625, -1.0177001953125, -0.94012451171875, -0.862548828125, -0.78497314453125, -0.7073974609375, -0.62982177734375, -0.55224609375, -0.47467041015625, -0.3970947265625, -0.31951904296875, -0.241943359375, -0.16436767578125, -0.0867919921875, -0.00921630859375, 0.068359375, 0.14593505859375, 0.2235107421875, 0.30108642578125, 0.378662109375, 0.45623779296875, 0.5338134765625, 0.61138916015625, 0.68896484375, 0.76654052734375, 0.8441162109375, 0.92169189453125, 0.999267578125, 1.07684326171875, 1.1544189453125, 1.23199462890625, 1.3095703125, 1.38714599609375, 1.4647216796875, 1.54229736328125, 1.619873046875, 1.69744873046875, 1.7750244140625, 1.85260009765625, 1.93017578125, 2.00775146484375, 2.0853271484375, 2.16290283203125, 2.240478515625, 2.31805419921875, 2.3956298828125, 2.47320556640625, 2.55078125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 5.0, 9.0, 13.0, 11.0, 28.0, 8.0, 34.0, 26.0, 50.0, 48.0, 44.0, 77.0, 63.0, 75.0, 64.0, 70.0, 60.0, 46.0, 57.0, 45.0, 29.0, 24.0, 28.0, 12.0, 16.0, 11.0, 11.0, 7.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1107330322265625, -1.070098876953125, -1.0294647216796875, -0.98883056640625, -0.9481964111328125, -0.907562255859375, -0.8669281005859375, -0.8262939453125, -0.7856597900390625, -0.745025634765625, -0.7043914794921875, -0.66375732421875, -0.6231231689453125, -0.582489013671875, -0.5418548583984375, -0.501220703125, -0.4605865478515625, -0.419952392578125, -0.3793182373046875, -0.33868408203125, -0.2980499267578125, -0.257415771484375, -0.2167816162109375, -0.1761474609375, -0.1355133056640625, -0.094879150390625, -0.0542449951171875, -0.01361083984375, 0.0270233154296875, 0.067657470703125, 0.1082916259765625, 0.14892578125, 0.1895599365234375, 0.230194091796875, 0.2708282470703125, 0.31146240234375, 0.3520965576171875, 0.392730712890625, 0.4333648681640625, 0.4739990234375, 0.5146331787109375, 0.555267333984375, 0.5959014892578125, 0.63653564453125, 0.6771697998046875, 0.717803955078125, 0.7584381103515625, 0.799072265625, 0.8397064208984375, 0.880340576171875, 0.9209747314453125, 0.96160888671875, 1.0022430419921875, 1.042877197265625, 1.0835113525390625, 1.1241455078125, 1.1647796630859375, 1.205413818359375, 1.2460479736328125, 1.28668212890625, 1.3273162841796875, 1.367950439453125, 1.4085845947265625, 1.44921875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 4.0, 11.0, 13.0, 12.0, 12.0, 17.0, 25.0, 14.0, 23.0, 28.0, 30.0, 40.0, 43.0, 35.0, 44.0, 39.0, 29.0, 39.0, 45.0, 37.0, 40.0, 38.0, 39.0, 41.0, 39.0, 26.0, 27.0, 28.0, 30.0, 20.0, 13.0, 15.0, 21.0, 14.0, 6.0, 13.0, 7.0, 8.0, 2.0, 5.0, 3.0, 9.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.625288486480713, -4.487185001373291, -4.349081516265869, -4.210978031158447, -4.072874546051025, -3.9347710609436035, -3.7966675758361816, -3.6585640907287598, -3.520460605621338, -3.382357120513916, -3.244253635406494, -3.1061501502990723, -2.9680466651916504, -2.8299431800842285, -2.6918396949768066, -2.5537362098693848, -2.415632486343384, -2.277529001235962, -2.13942551612854, -2.001322031021118, -1.8632185459136963, -1.7251150608062744, -1.587011456489563, -1.4489079713821411, -1.3108044862747192, -1.1727010011672974, -1.0345975160598755, -0.8964939713478088, -0.758390486240387, -0.6202870011329651, -0.48218345642089844, -0.34407997131347656, -0.2059764862060547, -0.06787298619747162, 0.07023051381111145, 0.2083340287208557, 0.3464375138282776, 0.48454099893569946, 0.6226445436477661, 0.760748028755188, 0.8988515138626099, 1.0369549989700317, 1.1750584840774536, 1.313162088394165, 1.451265573501587, 1.5893690586090088, 1.7274725437164307, 1.8655760288238525, 2.0036795139312744, 2.1417829990386963, 2.279886484146118, 2.41798996925354, 2.556093454360962, 2.694196939468384, 2.8323006629943848, 2.9704041481018066, 3.1085076332092285, 3.2466111183166504, 3.3847146034240723, 3.522818088531494, 3.660921573638916, 3.799025058746338, 3.9371285438537598, 4.075232028961182, 4.2133355140686035]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 3.0, 11.0, 7.0, 5.0, 12.0, 19.0, 19.0, 16.0, 18.0, 20.0, 24.0, 24.0, 30.0, 39.0, 24.0, 36.0, 45.0, 52.0, 29.0, 38.0, 38.0, 35.0, 30.0, 45.0, 29.0, 32.0, 35.0, 34.0, 26.0, 27.0, 28.0, 23.0, 19.0, 24.0, 15.0, 10.0, 17.0, 5.0, 11.0, 11.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.939199924468994, -4.793707370758057, -4.648214817047119, -4.502722263336182, -4.357229709625244, -4.211736679077148, -4.066244125366211, -3.9207515716552734, -3.775259017944336, -3.6297664642333984, -3.484273910522461, -3.3387813568115234, -3.193288564682007, -3.0477960109710693, -2.902303457260132, -2.7568106651306152, -2.611318349838257, -2.4658257961273193, -2.320333242416382, -2.1748404502868652, -2.0293478965759277, -1.8838553428649902, -1.7383627891540527, -1.5928701162338257, -1.4473775625228882, -1.3018850088119507, -1.1563923358917236, -1.0108997821807861, -0.8654071688652039, -0.7199145555496216, -0.5744220018386841, -0.42892932891845703, -0.28343677520751953, -0.13794417679309845, 0.007548421621322632, 0.15304100513458252, 0.2985336184501648, 0.44402623176574707, 0.5895187854766846, 0.7350114583969116, 0.8805040121078491, 1.0259965658187866, 1.1714892387390137, 1.3169817924499512, 1.4624743461608887, 1.6079670190811157, 1.7534595727920532, 1.8989522457122803, 2.0444447994232178, 2.1899373531341553, 2.3354299068450928, 2.4809226989746094, 2.626415252685547, 2.7719078063964844, 2.917400360107422, 3.0628929138183594, 3.208385467529297, 3.3538780212402344, 3.499370574951172, 3.6448631286621094, 3.790355920791626, 3.9358484745025635, 4.081340789794922, 4.226833820343018, 4.372326374053955]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 10.0, 11.0, 21.0, 42.0, 77.0, 137.0, 223.0, 412.0, 687.0, 1153.0, 1932.0, 3500.0, 6239.0, 10840.0, 18707.0, 32467.0, 55675.0, 94401.0, 156813.0, 251611.0, 378619.0, 520103.0, 612259.0, 605244.0, 498200.0, 359886.0, 234455.0, 144688.0, 86616.0, 50737.0, 29072.0, 16876.0, 9715.0, 5440.0, 3115.0, 1775.0, 1063.0, 616.0, 371.0, 207.0, 97.0, 73.0, 38.0, 23.0, 17.0, 9.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.998046875, -3.864471435546875, -3.73089599609375, -3.597320556640625, -3.4637451171875, -3.330169677734375, -3.19659423828125, -3.063018798828125, -2.929443359375, -2.795867919921875, -2.66229248046875, -2.528717041015625, -2.3951416015625, -2.261566162109375, -2.12799072265625, -1.994415283203125, -1.86083984375, -1.727264404296875, -1.59368896484375, -1.460113525390625, -1.3265380859375, -1.192962646484375, -1.05938720703125, -0.925811767578125, -0.792236328125, -0.658660888671875, -0.52508544921875, -0.391510009765625, -0.2579345703125, -0.124359130859375, 0.00921630859375, 0.142791748046875, 0.2763671875, 0.409942626953125, 0.54351806640625, 0.677093505859375, 0.8106689453125, 0.944244384765625, 1.07781982421875, 1.211395263671875, 1.344970703125, 1.478546142578125, 1.61212158203125, 1.745697021484375, 1.8792724609375, 2.012847900390625, 2.14642333984375, 2.279998779296875, 2.41357421875, 2.547149658203125, 2.68072509765625, 2.814300537109375, 2.9478759765625, 3.081451416015625, 3.21502685546875, 3.348602294921875, 3.482177734375, 3.615753173828125, 3.74932861328125, 3.882904052734375, 4.0164794921875, 4.150054931640625, 4.28363037109375, 4.417205810546875, 4.55078125]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 4.0, 6.0, 10.0, 9.0, 13.0, 6.0, 14.0, 13.0, 10.0, 12.0, 25.0, 18.0, 24.0, 19.0, 23.0, 25.0, 39.0, 32.0, 35.0, 41.0, 42.0, 47.0, 32.0, 51.0, 38.0, 27.0, 28.0, 21.0, 31.0, 44.0, 31.0, 25.0, 25.0, 23.0, 19.0, 24.0, 12.0, 15.0, 16.0, 10.0, 15.0, 7.0, 11.0, 5.0, 5.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.337890625, -3.24005126953125, -3.1422119140625, -3.04437255859375, -2.946533203125, -2.84869384765625, -2.7508544921875, -2.65301513671875, -2.55517578125, -2.45733642578125, -2.3594970703125, -2.26165771484375, -2.163818359375, -2.06597900390625, -1.9681396484375, -1.87030029296875, -1.7724609375, -1.67462158203125, -1.5767822265625, -1.47894287109375, -1.381103515625, -1.28326416015625, -1.1854248046875, -1.08758544921875, -0.98974609375, -0.89190673828125, -0.7940673828125, -0.69622802734375, -0.598388671875, -0.50054931640625, -0.4027099609375, -0.30487060546875, -0.20703125, -0.10919189453125, -0.0113525390625, 0.08648681640625, 0.184326171875, 0.28216552734375, 0.3800048828125, 0.47784423828125, 0.57568359375, 0.67352294921875, 0.7713623046875, 0.86920166015625, 0.967041015625, 1.06488037109375, 1.1627197265625, 1.26055908203125, 1.3583984375, 1.45623779296875, 1.5540771484375, 1.65191650390625, 1.749755859375, 1.84759521484375, 1.9454345703125, 2.04327392578125, 2.14111328125, 2.23895263671875, 2.3367919921875, 2.43463134765625, 2.532470703125, 2.63031005859375, 2.7281494140625, 2.82598876953125, 2.923828125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 6.0, 12.0, 11.0, 13.0, 31.0, 32.0, 66.0, 119.0, 180.0, 317.0, 500.0, 758.0, 1212.0, 2027.0, 3130.0, 5075.0, 8057.0, 13031.0, 20460.0, 32339.0, 50469.0, 78087.0, 118143.0, 173938.0, 244297.0, 324446.0, 405598.0, 462091.0, 476591.0, 444366.0, 377277.0, 295354.0, 217030.0, 152261.0, 102356.0, 67707.0, 43272.0, 27489.0, 17356.0, 10618.0, 6830.0, 4159.0, 2678.0, 1653.0, 1072.0, 705.0, 391.0, 241.0, 163.0, 107.0, 65.0, 50.0, 20.0, 14.0, 9.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0], "bins": [-3.2890625, -3.184051513671875, -3.07904052734375, -2.974029541015625, -2.8690185546875, -2.764007568359375, -2.65899658203125, -2.553985595703125, -2.448974609375, -2.343963623046875, -2.23895263671875, -2.133941650390625, -2.0289306640625, -1.923919677734375, -1.81890869140625, -1.713897705078125, -1.60888671875, -1.503875732421875, -1.39886474609375, -1.293853759765625, -1.1888427734375, -1.083831787109375, -0.97882080078125, -0.873809814453125, -0.768798828125, -0.663787841796875, -0.55877685546875, -0.453765869140625, -0.3487548828125, -0.243743896484375, -0.13873291015625, -0.033721923828125, 0.0712890625, 0.176300048828125, 0.28131103515625, 0.386322021484375, 0.4913330078125, 0.596343994140625, 0.70135498046875, 0.806365966796875, 0.911376953125, 1.016387939453125, 1.12139892578125, 1.226409912109375, 1.3314208984375, 1.436431884765625, 1.54144287109375, 1.646453857421875, 1.75146484375, 1.856475830078125, 1.96148681640625, 2.066497802734375, 2.1715087890625, 2.276519775390625, 2.38153076171875, 2.486541748046875, 2.591552734375, 2.696563720703125, 2.80157470703125, 2.906585693359375, 3.0115966796875, 3.116607666015625, 3.22161865234375, 3.326629638671875, 3.431640625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 9.0, 7.0, 8.0, 18.0, 26.0, 23.0, 41.0, 51.0, 81.0, 71.0, 91.0, 88.0, 123.0, 161.0, 146.0, 193.0, 198.0, 211.0, 219.0, 188.0, 204.0, 211.0, 217.0, 216.0, 215.0, 188.0, 127.0, 147.0, 105.0, 88.0, 69.0, 63.0, 56.0, 45.0, 36.0, 30.0, 30.0, 18.0, 9.0, 13.0, 7.0, 12.0, 6.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6845703125, -1.6304779052734375, -1.576385498046875, -1.5222930908203125, -1.46820068359375, -1.4141082763671875, -1.360015869140625, -1.3059234619140625, -1.2518310546875, -1.1977386474609375, -1.143646240234375, -1.0895538330078125, -1.03546142578125, -0.9813690185546875, -0.927276611328125, -0.8731842041015625, -0.819091796875, -0.7649993896484375, -0.710906982421875, -0.6568145751953125, -0.60272216796875, -0.5486297607421875, -0.494537353515625, -0.4404449462890625, -0.3863525390625, -0.3322601318359375, -0.278167724609375, -0.2240753173828125, -0.16998291015625, -0.1158905029296875, -0.061798095703125, -0.0077056884765625, 0.04638671875, 0.1004791259765625, 0.154571533203125, 0.2086639404296875, 0.26275634765625, 0.3168487548828125, 0.370941162109375, 0.4250335693359375, 0.4791259765625, 0.5332183837890625, 0.587310791015625, 0.6414031982421875, 0.69549560546875, 0.7495880126953125, 0.803680419921875, 0.8577728271484375, 0.911865234375, 0.9659576416015625, 1.020050048828125, 1.0741424560546875, 1.12823486328125, 1.1823272705078125, 1.236419677734375, 1.2905120849609375, 1.3446044921875, 1.3986968994140625, 1.452789306640625, 1.5068817138671875, 1.56097412109375, 1.6150665283203125, 1.669158935546875, 1.7232513427734375, 1.77734375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 8.0, 8.0, 10.0, 10.0, 9.0, 14.0, 23.0, 17.0, 29.0, 25.0, 34.0, 37.0, 37.0, 29.0, 55.0, 42.0, 54.0, 48.0, 36.0, 51.0, 47.0, 60.0, 35.0, 35.0, 34.0, 30.0, 26.0, 22.0, 25.0, 19.0, 20.0, 19.0, 15.0, 9.0, 7.0, 7.0, 5.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.819105625152588, -4.674719333648682, -4.530333518981934, -4.385947227478027, -4.241560935974121, -4.097175121307373, -3.952788829803467, -3.8084027767181396, -3.6640167236328125, -3.5196306705474854, -3.375244379043579, -3.230858325958252, -3.086472272872925, -2.9420862197875977, -2.7976999282836914, -2.6533138751983643, -2.508927583694458, -2.364541530609131, -2.2201552391052246, -2.0757691860198975, -1.9313831329345703, -1.7869969606399536, -1.642610788345337, -1.4982247352600098, -1.353838562965393, -1.2094523906707764, -1.0650663375854492, -0.9206801652908325, -0.7762940526008606, -0.6319079399108887, -0.487521767616272, -0.3431357145309448, -0.19874954223632812, -0.05436341464519501, 0.09002271294593811, 0.23440885543823242, 0.37879496812820435, 0.5231810808181763, 0.667567253112793, 0.8119533061981201, 0.9563394784927368, 1.1007256507873535, 1.2451117038726807, 1.3894978761672974, 1.533884048461914, 1.6782701015472412, 1.822656273841858, 1.967042326927185, 2.1114284992218018, 2.255814552307129, 2.400200843811035, 2.5445868968963623, 2.6889729499816895, 2.8333592414855957, 2.977745294570923, 3.12213134765625, 3.2665176391601562, 3.4109036922454834, 3.5552899837493896, 3.699676036834717, 3.844062089920044, 3.988448143005371, 4.132834434509277, 4.277220726013184, 4.421606540679932]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 4.0, 9.0, 11.0, 12.0, 16.0, 11.0, 10.0, 11.0, 20.0, 25.0, 21.0, 27.0, 37.0, 28.0, 36.0, 26.0, 40.0, 39.0, 38.0, 43.0, 50.0, 40.0, 37.0, 36.0, 39.0, 36.0, 28.0, 30.0, 26.0, 33.0, 24.0, 17.0, 15.0, 19.0, 19.0, 19.0, 10.0, 7.0, 8.0, 10.0, 9.0, 5.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.7706501483917236, -3.647010326385498, -3.5233705043792725, -3.399730682373047, -3.2760908603668213, -3.1524510383605957, -3.028810977935791, -2.9051713943481445, -2.78153133392334, -2.6578915119171143, -2.5342516899108887, -2.410611867904663, -2.2869720458984375, -2.163332223892212, -2.0396924018859863, -1.9160524606704712, -1.7924127578735352, -1.6687729358673096, -1.545133113861084, -1.4214932918548584, -1.2978534698486328, -1.1742136478424072, -1.050573706626892, -0.9269338846206665, -0.8032940626144409, -0.6796542406082153, -0.5560144186019897, -0.4323745369911194, -0.3087347149848938, -0.1850948929786682, -0.06145501136779785, 0.062184810638427734, 0.18582439422607422, 0.3094642162322998, 0.4331040680408478, 0.5567439198493958, 0.6803837418556213, 0.8040235638618469, 0.9276634454727173, 1.0513032674789429, 1.1749430894851685, 1.298582911491394, 1.4222227334976196, 1.5458626747131348, 1.6695024967193604, 1.793142318725586, 1.9167821407318115, 2.040421962738037, 2.1640617847442627, 2.2877016067504883, 2.411341428756714, 2.5349812507629395, 2.658621072769165, 2.7822608947753906, 2.9059009552001953, 3.029540538787842, 3.1531805992126465, 3.276820421218872, 3.4004602432250977, 3.5241000652313232, 3.647739887237549, 3.7713797092437744, 3.89501953125, 4.018659591674805, 4.142299175262451]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 11.0, 17.0, 13.0, 19.0, 36.0, 56.0, 73.0, 81.0, 143.0, 169.0, 274.0, 419.0, 625.0, 969.0, 1542.0, 2369.0, 4174.0, 7077.0, 12552.0, 22807.0, 43383.0, 84183.0, 160593.0, 244975.0, 210279.0, 118248.0, 61228.0, 31773.0, 17134.0, 9273.0, 5320.0, 3135.0, 1982.0, 1179.0, 786.0, 567.0, 309.0, 243.0, 143.0, 106.0, 81.0, 69.0, 38.0, 23.0, 25.0, 13.0, 17.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 4.0], "bins": [-1.99609375, -1.9369659423828125, -1.877838134765625, -1.8187103271484375, -1.75958251953125, -1.7004547119140625, -1.641326904296875, -1.5821990966796875, -1.5230712890625, -1.4639434814453125, -1.404815673828125, -1.3456878662109375, -1.28656005859375, -1.2274322509765625, -1.168304443359375, -1.1091766357421875, -1.050048828125, -0.9909210205078125, -0.931793212890625, -0.8726654052734375, -0.81353759765625, -0.7544097900390625, -0.695281982421875, -0.6361541748046875, -0.5770263671875, -0.5178985595703125, -0.458770751953125, -0.3996429443359375, -0.34051513671875, -0.2813873291015625, -0.222259521484375, -0.1631317138671875, -0.10400390625, -0.0448760986328125, 0.014251708984375, 0.0733795166015625, 0.13250732421875, 0.1916351318359375, 0.250762939453125, 0.3098907470703125, 0.3690185546875, 0.4281463623046875, 0.487274169921875, 0.5464019775390625, 0.60552978515625, 0.6646575927734375, 0.723785400390625, 0.7829132080078125, 0.842041015625, 0.9011688232421875, 0.960296630859375, 1.0194244384765625, 1.07855224609375, 1.1376800537109375, 1.196807861328125, 1.2559356689453125, 1.3150634765625, 1.3741912841796875, 1.433319091796875, 1.4924468994140625, 1.55157470703125, 1.6107025146484375, 1.669830322265625, 1.7289581298828125, 1.7880859375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 8.0, 2.0, 6.0, 5.0, 16.0, 13.0, 10.0, 8.0, 17.0, 15.0, 15.0, 20.0, 23.0, 28.0, 34.0, 32.0, 33.0, 43.0, 51.0, 33.0, 42.0, 40.0, 45.0, 41.0, 48.0, 33.0, 29.0, 38.0, 33.0, 27.0, 20.0, 31.0, 23.0, 19.0, 16.0, 18.0, 13.0, 16.0, 9.0, 13.0, 11.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.1484375, -4.01617431640625, -3.8839111328125, -3.75164794921875, -3.619384765625, -3.48712158203125, -3.3548583984375, -3.22259521484375, -3.09033203125, -2.95806884765625, -2.8258056640625, -2.69354248046875, -2.561279296875, -2.42901611328125, -2.2967529296875, -2.16448974609375, -2.0322265625, -1.89996337890625, -1.7677001953125, -1.63543701171875, -1.503173828125, -1.37091064453125, -1.2386474609375, -1.10638427734375, -0.97412109375, -0.84185791015625, -0.7095947265625, -0.57733154296875, -0.445068359375, -0.31280517578125, -0.1805419921875, -0.04827880859375, 0.083984375, 0.21624755859375, 0.3485107421875, 0.48077392578125, 0.613037109375, 0.74530029296875, 0.8775634765625, 1.00982666015625, 1.14208984375, 1.27435302734375, 1.4066162109375, 1.53887939453125, 1.671142578125, 1.80340576171875, 1.9356689453125, 2.06793212890625, 2.2001953125, 2.33245849609375, 2.4647216796875, 2.59698486328125, 2.729248046875, 2.86151123046875, 2.9937744140625, 3.12603759765625, 3.25830078125, 3.39056396484375, 3.5228271484375, 3.65509033203125, 3.787353515625, 3.91961669921875, 4.0518798828125, 4.18414306640625, 4.31640625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 11.0, 11.0, 19.0, 14.0, 31.0, 21.0, 35.0, 64.0, 66.0, 137.0, 171.0, 245.0, 392.0, 608.0, 1161.0, 1899.0, 3716.0, 7588.0, 17482.0, 42386.0, 113389.0, 283702.0, 332670.0, 146509.0, 54852.0, 21789.0, 9272.0, 4557.0, 2333.0, 1223.0, 790.0, 461.0, 307.0, 183.0, 143.0, 93.0, 54.0, 48.0, 29.0, 24.0, 17.0, 14.0, 10.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.431640625, -2.35595703125, -2.2802734375, -2.20458984375, -2.12890625, -2.05322265625, -1.9775390625, -1.90185546875, -1.826171875, -1.75048828125, -1.6748046875, -1.59912109375, -1.5234375, -1.44775390625, -1.3720703125, -1.29638671875, -1.220703125, -1.14501953125, -1.0693359375, -0.99365234375, -0.91796875, -0.84228515625, -0.7666015625, -0.69091796875, -0.615234375, -0.53955078125, -0.4638671875, -0.38818359375, -0.3125, -0.23681640625, -0.1611328125, -0.08544921875, -0.009765625, 0.06591796875, 0.1416015625, 0.21728515625, 0.29296875, 0.36865234375, 0.4443359375, 0.52001953125, 0.595703125, 0.67138671875, 0.7470703125, 0.82275390625, 0.8984375, 0.97412109375, 1.0498046875, 1.12548828125, 1.201171875, 1.27685546875, 1.3525390625, 1.42822265625, 1.50390625, 1.57958984375, 1.6552734375, 1.73095703125, 1.806640625, 1.88232421875, 1.9580078125, 2.03369140625, 2.109375, 2.18505859375, 2.2607421875, 2.33642578125, 2.412109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 8.0, 3.0, 2.0, 5.0, 12.0, 9.0, 11.0, 16.0, 12.0, 21.0, 29.0, 22.0, 21.0, 27.0, 32.0, 33.0, 26.0, 26.0, 27.0, 31.0, 34.0, 41.0, 38.0, 42.0, 41.0, 50.0, 46.0, 43.0, 36.0, 30.0, 27.0, 30.0, 25.0, 19.0, 22.0, 16.0, 15.0, 15.0, 12.0, 10.0, 4.0, 4.0, 9.0, 8.0, 4.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.310546875, -2.22967529296875, -2.1488037109375, -2.06793212890625, -1.987060546875, -1.90618896484375, -1.8253173828125, -1.74444580078125, -1.66357421875, -1.58270263671875, -1.5018310546875, -1.42095947265625, -1.340087890625, -1.25921630859375, -1.1783447265625, -1.09747314453125, -1.0166015625, -0.93572998046875, -0.8548583984375, -0.77398681640625, -0.693115234375, -0.61224365234375, -0.5313720703125, -0.45050048828125, -0.36962890625, -0.28875732421875, -0.2078857421875, -0.12701416015625, -0.046142578125, 0.03472900390625, 0.1156005859375, 0.19647216796875, 0.27734375, 0.35821533203125, 0.4390869140625, 0.51995849609375, 0.600830078125, 0.68170166015625, 0.7625732421875, 0.84344482421875, 0.92431640625, 1.00518798828125, 1.0860595703125, 1.16693115234375, 1.247802734375, 1.32867431640625, 1.4095458984375, 1.49041748046875, 1.5712890625, 1.65216064453125, 1.7330322265625, 1.81390380859375, 1.894775390625, 1.97564697265625, 2.0565185546875, 2.13739013671875, 2.21826171875, 2.29913330078125, 2.3800048828125, 2.46087646484375, 2.541748046875, 2.62261962890625, 2.7034912109375, 2.78436279296875, 2.865234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 9.0, 16.0, 28.0, 19.0, 44.0, 42.0, 82.0, 117.0, 173.0, 238.0, 372.0, 607.0, 1076.0, 2059.0, 4284.0, 11494.0, 43125.0, 315176.0, 563615.0, 77991.0, 16611.0, 5612.0, 2509.0, 1260.0, 720.0, 427.0, 252.0, 164.0, 121.0, 87.0, 58.0, 34.0, 48.0, 15.0, 13.0, 15.0, 10.0, 2.0, 5.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0], "bins": [-1.35546875, -1.316925048828125, -1.27838134765625, -1.239837646484375, -1.2012939453125, -1.162750244140625, -1.12420654296875, -1.085662841796875, -1.047119140625, -1.008575439453125, -0.97003173828125, -0.931488037109375, -0.8929443359375, -0.854400634765625, -0.81585693359375, -0.777313232421875, -0.73876953125, -0.700225830078125, -0.66168212890625, -0.623138427734375, -0.5845947265625, -0.546051025390625, -0.50750732421875, -0.468963623046875, -0.430419921875, -0.391876220703125, -0.35333251953125, -0.314788818359375, -0.2762451171875, -0.237701416015625, -0.19915771484375, -0.160614013671875, -0.1220703125, -0.083526611328125, -0.04498291015625, -0.006439208984375, 0.0321044921875, 0.070648193359375, 0.10919189453125, 0.147735595703125, 0.186279296875, 0.224822998046875, 0.26336669921875, 0.301910400390625, 0.3404541015625, 0.378997802734375, 0.41754150390625, 0.456085205078125, 0.49462890625, 0.533172607421875, 0.57171630859375, 0.610260009765625, 0.6488037109375, 0.687347412109375, 0.72589111328125, 0.764434814453125, 0.802978515625, 0.841522216796875, 0.88006591796875, 0.918609619140625, 0.9571533203125, 0.995697021484375, 1.03424072265625, 1.072784423828125, 1.111328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 0.0, 5.0, 8.0, 5.0, 6.0, 9.0, 15.0, 25.0, 36.0, 53.0, 87.0, 138.0, 135.0, 141.0, 99.0, 79.0, 51.0, 30.0, 14.0, 12.0, 8.0, 4.0, 5.0, 5.0, 6.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.641315460205078e-05, -7.365085184574127e-05, -7.088854908943176e-05, -6.812624633312225e-05, -6.536394357681274e-05, -6.260164082050323e-05, -5.9839338064193726e-05, -5.7077035307884216e-05, -5.431473255157471e-05, -5.15524297952652e-05, -4.879012703895569e-05, -4.602782428264618e-05, -4.326552152633667e-05, -4.050321877002716e-05, -3.774091601371765e-05, -3.497861325740814e-05, -3.221631050109863e-05, -2.9454007744789124e-05, -2.6691704988479614e-05, -2.3929402232170105e-05, -2.1167099475860596e-05, -1.8404796719551086e-05, -1.5642493963241577e-05, -1.2880191206932068e-05, -1.0117888450622559e-05, -7.355585694313049e-06, -4.59328293800354e-06, -1.8309801816940308e-06, 9.313225746154785e-07, 3.693625330924988e-06, 6.455928087234497e-06, 9.218230843544006e-06, 1.1980533599853516e-05, 1.4742836356163025e-05, 1.7505139112472534e-05, 2.0267441868782043e-05, 2.3029744625091553e-05, 2.5792047381401062e-05, 2.855435013771057e-05, 3.131665289402008e-05, 3.407895565032959e-05, 3.68412584066391e-05, 3.960356116294861e-05, 4.236586391925812e-05, 4.512816667556763e-05, 4.7890469431877136e-05, 5.0652772188186646e-05, 5.3415074944496155e-05, 5.6177377700805664e-05, 5.893968045711517e-05, 6.170198321342468e-05, 6.446428596973419e-05, 6.72265887260437e-05, 6.998889148235321e-05, 7.275119423866272e-05, 7.551349699497223e-05, 7.827579975128174e-05, 8.103810250759125e-05, 8.380040526390076e-05, 8.656270802021027e-05, 8.932501077651978e-05, 9.208731353282928e-05, 9.48496162891388e-05, 9.76119190454483e-05, 0.00010037422180175781]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 13.0, 17.0, 23.0, 26.0, 43.0, 58.0, 97.0, 124.0, 213.0, 358.0, 538.0, 984.0, 1713.0, 3066.0, 5630.0, 11636.0, 25582.0, 61652.0, 156718.0, 338886.0, 259111.0, 103585.0, 41623.0, 18297.0, 8599.0, 4193.0, 2374.0, 1347.0, 760.0, 455.0, 286.0, 166.0, 134.0, 60.0, 60.0, 34.0, 31.0, 20.0, 5.0, 7.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83642578125, -0.8083419799804688, -0.7802581787109375, -0.7521743774414062, -0.724090576171875, -0.6960067749023438, -0.6679229736328125, -0.6398391723632812, -0.61175537109375, -0.5836715698242188, -0.5555877685546875, -0.5275039672851562, -0.499420166015625, -0.47133636474609375, -0.4432525634765625, -0.41516876220703125, -0.3870849609375, -0.35900115966796875, -0.3309173583984375, -0.30283355712890625, -0.274749755859375, -0.24666595458984375, -0.2185821533203125, -0.19049835205078125, -0.16241455078125, -0.13433074951171875, -0.1062469482421875, -0.07816314697265625, -0.050079345703125, -0.02199554443359375, 0.0060882568359375, 0.03417205810546875, 0.062255859375, 0.09033966064453125, 0.1184234619140625, 0.14650726318359375, 0.174591064453125, 0.20267486572265625, 0.2307586669921875, 0.25884246826171875, 0.28692626953125, 0.31501007080078125, 0.3430938720703125, 0.37117767333984375, 0.399261474609375, 0.42734527587890625, 0.4554290771484375, 0.48351287841796875, 0.5115966796875, 0.5396804809570312, 0.5677642822265625, 0.5958480834960938, 0.623931884765625, 0.6520156860351562, 0.6800994873046875, 0.7081832885742188, 0.73626708984375, 0.7643508911132812, 0.7924346923828125, 0.8205184936523438, 0.848602294921875, 0.8766860961914062, 0.9047698974609375, 0.9328536987304688, 0.9609375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 8.0, 8.0, 14.0, 7.0, 10.0, 20.0, 30.0, 30.0, 55.0, 54.0, 84.0, 102.0, 102.0, 121.0, 81.0, 70.0, 58.0, 34.0, 29.0, 25.0, 11.0, 8.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.1250152587890625, -0.118927001953125, -0.1128387451171875, -0.10675048828125, -0.1006622314453125, -0.094573974609375, -0.0884857177734375, -0.0823974609375, -0.0763092041015625, -0.070220947265625, -0.0641326904296875, -0.05804443359375, -0.0519561767578125, -0.045867919921875, -0.0397796630859375, -0.03369140625, -0.0276031494140625, -0.021514892578125, -0.0154266357421875, -0.00933837890625, -0.0032501220703125, 0.002838134765625, 0.0089263916015625, 0.0150146484375, 0.0211029052734375, 0.027191162109375, 0.0332794189453125, 0.03936767578125, 0.0454559326171875, 0.051544189453125, 0.0576324462890625, 0.063720703125, 0.0698089599609375, 0.075897216796875, 0.0819854736328125, 0.08807373046875, 0.0941619873046875, 0.100250244140625, 0.1063385009765625, 0.1124267578125, 0.1185150146484375, 0.124603271484375, 0.1306915283203125, 0.13677978515625, 0.1428680419921875, 0.148956298828125, 0.1550445556640625, 0.1611328125, 0.1672210693359375, 0.173309326171875, 0.1793975830078125, 0.18548583984375, 0.1915740966796875, 0.197662353515625, 0.2037506103515625, 0.2098388671875, 0.2159271240234375, 0.222015380859375, 0.2281036376953125, 0.23419189453125, 0.2402801513671875, 0.246368408203125, 0.2524566650390625, 0.258544921875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 11.0, 9.0, 13.0, 15.0, 13.0, 19.0, 22.0, 22.0, 26.0, 30.0, 45.0, 29.0, 41.0, 42.0, 49.0, 45.0, 48.0, 33.0, 52.0, 54.0, 54.0, 45.0, 28.0, 26.0, 32.0, 18.0, 29.0, 25.0, 17.0, 23.0, 15.0, 19.0, 8.0, 8.0, 7.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.821465015411377, -4.6818156242370605, -4.542166233062744, -4.4025163650512695, -4.262866973876953, -4.123217582702637, -3.9835681915283203, -3.843918800354004, -3.7042691707611084, -3.564619779586792, -3.4249701499938965, -3.28532075881958, -3.1456713676452637, -3.006021738052368, -2.8663723468780518, -2.7267227172851562, -2.58707332611084, -2.4474239349365234, -2.307774305343628, -2.1681249141693115, -2.028475284576416, -1.8888258934020996, -1.7491765022277832, -1.6095269918441772, -1.4698774814605713, -1.3302279710769653, -1.1905784606933594, -1.050929069519043, -0.911279559135437, -0.771630048751831, -0.6319805979728699, -0.4923311471939087, -0.35268115997314453, -0.21303167939186096, -0.07338219881057739, 0.06626728177070618, 0.20591676235198975, 0.3455662727355957, 0.4852157235145569, 0.6248651742935181, 0.764514684677124, 0.90416419506073, 1.043813705444336, 1.1834630966186523, 1.3231126070022583, 1.4627621173858643, 1.6024115085601807, 1.7420610189437866, 1.8817105293273926, 2.021359920501709, 2.1610095500946045, 2.300658941268921, 2.4403085708618164, 2.579957962036133, 2.719607353210449, 2.8592567443847656, 2.998906373977661, 3.1385557651519775, 3.278205394744873, 3.4178547859191895, 3.557504177093506, 3.6971538066864014, 3.8368031978607178, 3.9764528274536133, 4.11610221862793]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 13.0, 13.0, 13.0, 11.0, 13.0, 9.0, 20.0, 23.0, 21.0, 29.0, 36.0, 28.0, 39.0, 26.0, 36.0, 39.0, 39.0, 42.0, 50.0, 41.0, 40.0, 34.0, 42.0, 38.0, 23.0, 34.0, 29.0, 32.0, 22.0, 16.0, 16.0, 18.0, 24.0, 14.0, 11.0, 6.0, 7.0, 15.0, 5.0, 6.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.8153915405273438, -3.6913139820098877, -3.5672361850738525, -3.4431586265563965, -3.3190808296203613, -3.1950032711029053, -3.070925712585449, -2.946847915649414, -2.822770357131958, -2.698692798614502, -2.574615001678467, -2.4505374431610107, -2.3264596462249756, -2.2023820877075195, -2.0783042907714844, -1.9542267322540283, -1.8301490545272827, -1.706071376800537, -1.5819936990737915, -1.457916021347046, -1.3338384628295898, -1.2097607851028442, -1.0856831073760986, -0.9616054892539978, -0.8375278115272522, -0.7134501338005066, -0.5893725156784058, -0.46529483795166016, -0.34121719002723694, -0.21713954210281372, -0.09306186437606812, 0.031015753746032715, 0.15509343147277832, 0.27917107939720154, 0.40324872732162476, 0.5273264050483704, 0.6514040231704712, 0.7754817008972168, 0.8995593786239624, 1.023637056350708, 1.147714614868164, 1.2717922925949097, 1.3958699703216553, 1.5199475288391113, 1.644025206565857, 1.7681028842926025, 1.8921805620193481, 2.0162582397460938, 2.140336036682129, 2.264413595199585, 2.38849139213562, 2.512568950653076, 2.6366467475891113, 2.7607243061065674, 2.8848018646240234, 3.0088796615600586, 3.1329572200775146, 3.2570347785949707, 3.381112575531006, 3.505190134048462, 3.629267930984497, 3.753345489501953, 3.8774232864379883, 4.001500606536865, 4.1255784034729]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 20.0, 34.0, 41.0, 61.0, 132.0, 193.0, 307.0, 446.0, 745.0, 1153.0, 1936.0, 3158.0, 5036.0, 8045.0, 12823.0, 20019.0, 30268.0, 44357.0, 62118.0, 82452.0, 101335.0, 115692.0, 118678.0, 109897.0, 93381.0, 73500.0, 54472.0, 38251.0, 25597.0, 16495.0, 10553.0, 6744.0, 4052.0, 2549.0, 1528.0, 892.0, 590.0, 384.0, 219.0, 140.0, 99.0, 73.0, 33.0, 24.0, 10.0, 5.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.626953125, -3.514617919921875, -3.40228271484375, -3.289947509765625, -3.1776123046875, -3.065277099609375, -2.95294189453125, -2.840606689453125, -2.728271484375, -2.615936279296875, -2.50360107421875, -2.391265869140625, -2.2789306640625, -2.166595458984375, -2.05426025390625, -1.941925048828125, -1.82958984375, -1.717254638671875, -1.60491943359375, -1.492584228515625, -1.3802490234375, -1.267913818359375, -1.15557861328125, -1.043243408203125, -0.930908203125, -0.818572998046875, -0.70623779296875, -0.593902587890625, -0.4815673828125, -0.369232177734375, -0.25689697265625, -0.144561767578125, -0.0322265625, 0.080108642578125, 0.19244384765625, 0.304779052734375, 0.4171142578125, 0.529449462890625, 0.64178466796875, 0.754119873046875, 0.866455078125, 0.978790283203125, 1.09112548828125, 1.203460693359375, 1.3157958984375, 1.428131103515625, 1.54046630859375, 1.652801513671875, 1.76513671875, 1.877471923828125, 1.98980712890625, 2.102142333984375, 2.2144775390625, 2.326812744140625, 2.43914794921875, 2.551483154296875, 2.663818359375, 2.776153564453125, 2.88848876953125, 3.000823974609375, 3.1131591796875, 3.225494384765625, 3.33782958984375, 3.450164794921875, 3.5625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 1.0, 4.0, 7.0, 8.0, 14.0, 5.0, 16.0, 23.0, 10.0, 22.0, 26.0, 23.0, 33.0, 33.0, 23.0, 36.0, 42.0, 43.0, 41.0, 49.0, 41.0, 34.0, 48.0, 49.0, 37.0, 28.0, 46.0, 39.0, 26.0, 28.0, 26.0, 18.0, 17.0, 13.0, 15.0, 20.0, 13.0, 12.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.2109375, -4.07501220703125, -3.9390869140625, -3.80316162109375, -3.667236328125, -3.53131103515625, -3.3953857421875, -3.25946044921875, -3.12353515625, -2.98760986328125, -2.8516845703125, -2.71575927734375, -2.579833984375, -2.44390869140625, -2.3079833984375, -2.17205810546875, -2.0361328125, -1.90020751953125, -1.7642822265625, -1.62835693359375, -1.492431640625, -1.35650634765625, -1.2205810546875, -1.08465576171875, -0.94873046875, -0.81280517578125, -0.6768798828125, -0.54095458984375, -0.405029296875, -0.26910400390625, -0.1331787109375, 0.00274658203125, 0.138671875, 0.27459716796875, 0.4105224609375, 0.54644775390625, 0.682373046875, 0.81829833984375, 0.9542236328125, 1.09014892578125, 1.22607421875, 1.36199951171875, 1.4979248046875, 1.63385009765625, 1.769775390625, 1.90570068359375, 2.0416259765625, 2.17755126953125, 2.3134765625, 2.44940185546875, 2.5853271484375, 2.72125244140625, 2.857177734375, 2.99310302734375, 3.1290283203125, 3.26495361328125, 3.40087890625, 3.53680419921875, 3.6727294921875, 3.80865478515625, 3.944580078125, 4.08050537109375, 4.2164306640625, 4.35235595703125, 4.48828125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 14.0, 5.0, 9.0, 13.0, 34.0, 55.0, 98.0, 149.0, 193.0, 365.0, 588.0, 930.0, 1481.0, 2533.0, 4052.0, 6559.0, 10735.0, 16769.0, 26363.0, 39743.0, 57721.0, 79107.0, 100017.0, 116183.0, 122269.0, 116165.0, 99936.0, 78730.0, 57199.0, 39986.0, 26146.0, 16874.0, 10595.0, 6441.0, 4096.0, 2460.0, 1541.0, 893.0, 572.0, 353.0, 215.0, 132.0, 81.0, 58.0, 42.0, 28.0, 18.0, 3.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.78515625, -3.672149658203125, -3.55914306640625, -3.446136474609375, -3.3331298828125, -3.220123291015625, -3.10711669921875, -2.994110107421875, -2.881103515625, -2.768096923828125, -2.65509033203125, -2.542083740234375, -2.4290771484375, -2.316070556640625, -2.20306396484375, -2.090057373046875, -1.97705078125, -1.864044189453125, -1.75103759765625, -1.638031005859375, -1.5250244140625, -1.412017822265625, -1.29901123046875, -1.186004638671875, -1.072998046875, -0.959991455078125, -0.84698486328125, -0.733978271484375, -0.6209716796875, -0.507965087890625, -0.39495849609375, -0.281951904296875, -0.1689453125, -0.055938720703125, 0.05706787109375, 0.170074462890625, 0.2830810546875, 0.396087646484375, 0.50909423828125, 0.622100830078125, 0.735107421875, 0.848114013671875, 0.96112060546875, 1.074127197265625, 1.1871337890625, 1.300140380859375, 1.41314697265625, 1.526153564453125, 1.63916015625, 1.752166748046875, 1.86517333984375, 1.978179931640625, 2.0911865234375, 2.204193115234375, 2.31719970703125, 2.430206298828125, 2.543212890625, 2.656219482421875, 2.76922607421875, 2.882232666015625, 2.9952392578125, 3.108245849609375, 3.22125244140625, 3.334259033203125, 3.447265625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 8.0, 18.0, 8.0, 17.0, 16.0, 12.0, 19.0, 39.0, 26.0, 36.0, 45.0, 36.0, 42.0, 49.0, 49.0, 35.0, 35.0, 46.0, 40.0, 35.0, 37.0, 43.0, 27.0, 45.0, 35.0, 36.0, 23.0, 25.0, 25.0, 16.0, 12.0, 8.0, 11.0, 5.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.70703125, -2.62249755859375, -2.5379638671875, -2.45343017578125, -2.368896484375, -2.28436279296875, -2.1998291015625, -2.11529541015625, -2.03076171875, -1.94622802734375, -1.8616943359375, -1.77716064453125, -1.692626953125, -1.60809326171875, -1.5235595703125, -1.43902587890625, -1.3544921875, -1.26995849609375, -1.1854248046875, -1.10089111328125, -1.016357421875, -0.93182373046875, -0.8472900390625, -0.76275634765625, -0.67822265625, -0.59368896484375, -0.5091552734375, -0.42462158203125, -0.340087890625, -0.25555419921875, -0.1710205078125, -0.08648681640625, -0.001953125, 0.08258056640625, 0.1671142578125, 0.25164794921875, 0.336181640625, 0.42071533203125, 0.5052490234375, 0.58978271484375, 0.67431640625, 0.75885009765625, 0.8433837890625, 0.92791748046875, 1.012451171875, 1.09698486328125, 1.1815185546875, 1.26605224609375, 1.3505859375, 1.43511962890625, 1.5196533203125, 1.60418701171875, 1.688720703125, 1.77325439453125, 1.8577880859375, 1.94232177734375, 2.02685546875, 2.11138916015625, 2.1959228515625, 2.28045654296875, 2.364990234375, 2.44952392578125, 2.5340576171875, 2.61859130859375, 2.703125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 11.0, 22.0, 18.0, 36.0, 71.0, 104.0, 153.0, 210.0, 316.0, 497.0, 765.0, 1133.0, 1740.0, 2640.0, 4000.0, 6005.0, 9515.0, 14408.0, 21811.0, 32973.0, 49259.0, 70284.0, 95331.0, 118810.0, 132446.0, 126556.0, 106579.0, 80457.0, 57639.0, 38957.0, 26070.0, 17233.0, 11101.0, 7265.0, 4893.0, 3147.0, 2077.0, 1352.0, 904.0, 637.0, 385.0, 256.0, 171.0, 110.0, 69.0, 52.0, 31.0, 18.0, 19.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0], "bins": [-1.8662109375, -1.81085205078125, -1.7554931640625, -1.70013427734375, -1.644775390625, -1.58941650390625, -1.5340576171875, -1.47869873046875, -1.42333984375, -1.36798095703125, -1.3126220703125, -1.25726318359375, -1.201904296875, -1.14654541015625, -1.0911865234375, -1.03582763671875, -0.98046875, -0.92510986328125, -0.8697509765625, -0.81439208984375, -0.759033203125, -0.70367431640625, -0.6483154296875, -0.59295654296875, -0.53759765625, -0.48223876953125, -0.4268798828125, -0.37152099609375, -0.316162109375, -0.26080322265625, -0.2054443359375, -0.15008544921875, -0.0947265625, -0.03936767578125, 0.0159912109375, 0.07135009765625, 0.126708984375, 0.18206787109375, 0.2374267578125, 0.29278564453125, 0.34814453125, 0.40350341796875, 0.4588623046875, 0.51422119140625, 0.569580078125, 0.62493896484375, 0.6802978515625, 0.73565673828125, 0.791015625, 0.84637451171875, 0.9017333984375, 0.95709228515625, 1.012451171875, 1.06781005859375, 1.1231689453125, 1.17852783203125, 1.23388671875, 1.28924560546875, 1.3446044921875, 1.39996337890625, 1.455322265625, 1.51068115234375, 1.5660400390625, 1.62139892578125, 1.6767578125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 7.0, 9.0, 9.0, 9.0, 16.0, 9.0, 27.0, 31.0, 28.0, 41.0, 43.0, 43.0, 46.0, 62.0, 57.0, 75.0, 51.0, 66.0, 62.0, 57.0, 39.0, 42.0, 25.0, 33.0, 24.0, 22.0, 17.0, 16.0, 8.0, 6.0, 4.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015878677368164062, -0.0001522749662399292, -0.00014576315879821777, -0.00013925135135650635, -0.00013273954391479492, -0.0001262277364730835, -0.00011971592903137207, -0.00011320412158966064, -0.00010669231414794922, -0.00010018050670623779, -9.366869926452637e-05, -8.715689182281494e-05, -8.064508438110352e-05, -7.413327693939209e-05, -6.762146949768066e-05, -6.110966205596924e-05, -5.459785461425781e-05, -4.808604717254639e-05, -4.157423973083496e-05, -3.5062432289123535e-05, -2.855062484741211e-05, -2.2038817405700684e-05, -1.5527009963989258e-05, -9.015202522277832e-06, -2.5033950805664062e-06, 4.0084123611450195e-06, 1.0520219802856445e-05, 1.703202724456787e-05, 2.3543834686279297e-05, 3.0055642127990723e-05, 3.656744956970215e-05, 4.3079257011413574e-05, 4.9591064453125e-05, 5.6102871894836426e-05, 6.261467933654785e-05, 6.912648677825928e-05, 7.56382942199707e-05, 8.215010166168213e-05, 8.866190910339355e-05, 9.517371654510498e-05, 0.0001016855239868164, 0.00010819733142852783, 0.00011470913887023926, 0.00012122094631195068, 0.0001277327537536621, 0.00013424456119537354, 0.00014075636863708496, 0.0001472681760787964, 0.0001537799835205078, 0.00016029179096221924, 0.00016680359840393066, 0.0001733154058456421, 0.00017982721328735352, 0.00018633902072906494, 0.00019285082817077637, 0.0001993626356124878, 0.00020587444305419922, 0.00021238625049591064, 0.00021889805793762207, 0.0002254098653793335, 0.00023192167282104492, 0.00023843348026275635, 0.0002449452877044678, 0.0002514570951461792, 0.0002579689025878906]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 11.0, 7.0, 21.0, 29.0, 53.0, 97.0, 148.0, 167.0, 304.0, 458.0, 695.0, 1056.0, 1659.0, 2720.0, 4286.0, 6512.0, 10001.0, 15293.0, 23190.0, 35399.0, 52523.0, 74330.0, 98998.0, 122149.0, 132145.0, 123992.0, 103083.0, 77138.0, 54781.0, 37077.0, 24535.0, 16108.0, 10507.0, 6778.0, 4423.0, 2851.0, 1789.0, 1174.0, 731.0, 472.0, 312.0, 190.0, 133.0, 76.0, 51.0, 31.0, 17.0, 15.0, 16.0, 9.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-1.7177734375, -1.6633453369140625, -1.608917236328125, -1.5544891357421875, -1.50006103515625, -1.4456329345703125, -1.391204833984375, -1.3367767333984375, -1.2823486328125, -1.2279205322265625, -1.173492431640625, -1.1190643310546875, -1.06463623046875, -1.0102081298828125, -0.955780029296875, -0.9013519287109375, -0.846923828125, -0.7924957275390625, -0.738067626953125, -0.6836395263671875, -0.62921142578125, -0.5747833251953125, -0.520355224609375, -0.4659271240234375, -0.4114990234375, -0.3570709228515625, -0.302642822265625, -0.2482147216796875, -0.19378662109375, -0.1393585205078125, -0.084930419921875, -0.0305023193359375, 0.02392578125, 0.0783538818359375, 0.132781982421875, 0.1872100830078125, 0.24163818359375, 0.2960662841796875, 0.350494384765625, 0.4049224853515625, 0.4593505859375, 0.5137786865234375, 0.568206787109375, 0.6226348876953125, 0.67706298828125, 0.7314910888671875, 0.785919189453125, 0.8403472900390625, 0.894775390625, 0.9492034912109375, 1.003631591796875, 1.0580596923828125, 1.11248779296875, 1.1669158935546875, 1.221343994140625, 1.2757720947265625, 1.3302001953125, 1.3846282958984375, 1.439056396484375, 1.4934844970703125, 1.54791259765625, 1.6023406982421875, 1.656768798828125, 1.7111968994140625, 1.765625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 10.0, 5.0, 6.0, 10.0, 7.0, 8.0, 20.0, 22.0, 40.0, 25.0, 43.0, 49.0, 39.0, 52.0, 52.0, 46.0, 57.0, 57.0, 55.0, 59.0, 43.0, 54.0, 28.0, 33.0, 35.0, 21.0, 24.0, 18.0, 17.0, 11.0, 17.0, 16.0, 4.0, 4.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.83251953125, -0.8074798583984375, -0.782440185546875, -0.7574005126953125, -0.73236083984375, -0.7073211669921875, -0.682281494140625, -0.6572418212890625, -0.6322021484375, -0.6071624755859375, -0.582122802734375, -0.5570831298828125, -0.53204345703125, -0.5070037841796875, -0.481964111328125, -0.4569244384765625, -0.431884765625, -0.4068450927734375, -0.381805419921875, -0.3567657470703125, -0.33172607421875, -0.3066864013671875, -0.281646728515625, -0.2566070556640625, -0.2315673828125, -0.2065277099609375, -0.181488037109375, -0.1564483642578125, -0.13140869140625, -0.1063690185546875, -0.081329345703125, -0.0562896728515625, -0.03125, -0.0062103271484375, 0.018829345703125, 0.0438690185546875, 0.06890869140625, 0.0939483642578125, 0.118988037109375, 0.1440277099609375, 0.1690673828125, 0.1941070556640625, 0.219146728515625, 0.2441864013671875, 0.26922607421875, 0.2942657470703125, 0.319305419921875, 0.3443450927734375, 0.369384765625, 0.3944244384765625, 0.419464111328125, 0.4445037841796875, 0.46954345703125, 0.4945831298828125, 0.519622802734375, 0.5446624755859375, 0.5697021484375, 0.5947418212890625, 0.619781494140625, 0.6448211669921875, 0.66986083984375, 0.6949005126953125, 0.719940185546875, 0.7449798583984375, 0.77001953125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 4.0, 10.0, 15.0, 17.0, 17.0, 12.0, 22.0, 23.0, 20.0, 36.0, 33.0, 41.0, 36.0, 37.0, 52.0, 44.0, 47.0, 46.0, 58.0, 45.0, 41.0, 49.0, 33.0, 28.0, 36.0, 29.0, 19.0, 19.0, 25.0, 16.0, 13.0, 14.0, 8.0, 11.0, 8.0, 7.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-4.887038707733154, -4.752031326293945, -4.617023468017578, -4.482016086578369, -4.34700870513916, -4.212000846862793, -4.076993465423584, -3.941985845565796, -3.806978225708008, -3.6719706058502197, -3.5369632244110107, -3.4019556045532227, -3.2669479846954346, -3.1319403648376465, -2.9969329833984375, -2.8619253635406494, -2.7269179821014404, -2.5919103622436523, -2.4569029808044434, -2.3218953609466553, -2.186887741088867, -2.051880359649658, -1.9168727397918701, -1.781865119934082, -1.6468576192855835, -1.511850118637085, -1.3768424987792969, -1.2418349981307983, -1.1068274974822998, -0.9718198776245117, -0.8368123769760132, -0.7018048167228699, -0.5667974948883057, -0.43178993463516235, -0.29678240418434143, -0.1617748737335205, -0.026767313480377197, 0.10824024677276611, 0.24324774742126465, 0.37825530767440796, 0.5132628679275513, 0.6482704281806946, 0.7832779884338379, 0.9182854890823364, 1.053292989730835, 1.188300609588623, 1.3233081102371216, 1.4583156108856201, 1.5933232307434082, 1.7283307313919067, 1.8633383512496948, 1.9983458518981934, 2.1333534717559814, 2.2683610916137695, 2.4033684730529785, 2.5383760929107666, 2.6733837127685547, 2.8083913326263428, 2.9433987140655518, 3.07840633392334, 3.213413953781128, 3.348421573638916, 3.483428955078125, 3.618436574935913, 3.753443956375122]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 7.0, 17.0, 13.0, 6.0, 10.0, 9.0, 22.0, 9.0, 16.0, 34.0, 20.0, 26.0, 32.0, 29.0, 28.0, 40.0, 31.0, 41.0, 54.0, 45.0, 40.0, 35.0, 38.0, 52.0, 46.0, 23.0, 40.0, 22.0, 34.0, 30.0, 25.0, 24.0, 14.0, 16.0, 16.0, 10.0, 8.0, 7.0, 7.0, 6.0, 5.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.141263008117676, -4.004789352416992, -3.868316173553467, -3.7318427562713623, -3.595369338989258, -3.458895683288574, -3.3224222660064697, -3.1859488487243652, -3.0494754314422607, -2.9130020141601562, -2.7765285968780518, -2.6400551795959473, -2.5035815238952637, -2.3671083450317383, -2.2306346893310547, -2.09416127204895, -1.9576878547668457, -1.8212144374847412, -1.6847410202026367, -1.5482674837112427, -1.4117940664291382, -1.2753206491470337, -1.1388471126556396, -1.0023736953735352, -0.8659002780914307, -0.7294268608093262, -0.5929533839225769, -0.45647993683815, -0.32000648975372314, -0.18353307247161865, -0.047059595584869385, 0.08941388130187988, 0.22588729858398438, 0.36236074566841125, 0.49883419275283813, 0.6353076696395874, 0.7717810869216919, 0.9082545042037964, 1.0447280406951904, 1.181201457977295, 1.3176748752593994, 1.454148292541504, 1.5906217098236084, 1.7270952463150024, 1.863568663597107, 2.000041961669922, 2.1365156173706055, 2.27298903465271, 2.4094624519348145, 2.545935869216919, 2.6824092864990234, 2.818882703781128, 2.9553561210632324, 3.091829776763916, 3.2283031940460205, 3.364776611328125, 3.5012500286102295, 3.637723445892334, 3.7741968631744385, 3.910670280456543, 4.047143936157227, 4.183617115020752, 4.3200907707214355, 4.456563949584961, 4.5930376052856445]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 9.0, 12.0, 13.0, 27.0, 40.0, 48.0, 105.0, 163.0, 257.0, 364.0, 571.0, 954.0, 1529.0, 2465.0, 4006.0, 6484.0, 10564.0, 17160.0, 28220.0, 45401.0, 73009.0, 114654.0, 177974.0, 266038.0, 373071.0, 481595.0, 549084.0, 540207.0, 460123.0, 348884.0, 245233.0, 163451.0, 105382.0, 66405.0, 41657.0, 26266.0, 16048.0, 9896.0, 6230.0, 3942.0, 2434.0, 1608.0, 952.0, 598.0, 412.0, 270.0, 164.0, 122.0, 69.0, 46.0, 27.0, 19.0, 14.0, 7.0, 8.0, 0.0, 1.0, 2.0], "bins": [-3.484375, -3.37847900390625, -3.2725830078125, -3.16668701171875, -3.060791015625, -2.95489501953125, -2.8489990234375, -2.74310302734375, -2.63720703125, -2.53131103515625, -2.4254150390625, -2.31951904296875, -2.213623046875, -2.10772705078125, -2.0018310546875, -1.89593505859375, -1.7900390625, -1.68414306640625, -1.5782470703125, -1.47235107421875, -1.366455078125, -1.26055908203125, -1.1546630859375, -1.04876708984375, -0.94287109375, -0.83697509765625, -0.7310791015625, -0.62518310546875, -0.519287109375, -0.41339111328125, -0.3074951171875, -0.20159912109375, -0.095703125, 0.01019287109375, 0.1160888671875, 0.22198486328125, 0.327880859375, 0.43377685546875, 0.5396728515625, 0.64556884765625, 0.75146484375, 0.85736083984375, 0.9632568359375, 1.06915283203125, 1.175048828125, 1.28094482421875, 1.3868408203125, 1.49273681640625, 1.5986328125, 1.70452880859375, 1.8104248046875, 1.91632080078125, 2.022216796875, 2.12811279296875, 2.2340087890625, 2.33990478515625, 2.44580078125, 2.55169677734375, 2.6575927734375, 2.76348876953125, 2.869384765625, 2.97528076171875, 3.0811767578125, 3.18707275390625, 3.29296875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 11.0, 9.0, 10.0, 10.0, 10.0, 11.0, 18.0, 14.0, 24.0, 24.0, 32.0, 20.0, 32.0, 26.0, 45.0, 52.0, 40.0, 45.0, 36.0, 47.0, 48.0, 29.0, 47.0, 51.0, 43.0, 38.0, 26.0, 33.0, 28.0, 35.0, 24.0, 14.0, 11.0, 8.0, 16.0, 11.0, 7.0, 2.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.578125, -3.47442626953125, -3.3707275390625, -3.26702880859375, -3.163330078125, -3.05963134765625, -2.9559326171875, -2.85223388671875, -2.74853515625, -2.64483642578125, -2.5411376953125, -2.43743896484375, -2.333740234375, -2.23004150390625, -2.1263427734375, -2.02264404296875, -1.9189453125, -1.81524658203125, -1.7115478515625, -1.60784912109375, -1.504150390625, -1.40045166015625, -1.2967529296875, -1.19305419921875, -1.08935546875, -0.98565673828125, -0.8819580078125, -0.77825927734375, -0.674560546875, -0.57086181640625, -0.4671630859375, -0.36346435546875, -0.259765625, -0.15606689453125, -0.0523681640625, 0.05133056640625, 0.155029296875, 0.25872802734375, 0.3624267578125, 0.46612548828125, 0.56982421875, 0.67352294921875, 0.7772216796875, 0.88092041015625, 0.984619140625, 1.08831787109375, 1.1920166015625, 1.29571533203125, 1.3994140625, 1.50311279296875, 1.6068115234375, 1.71051025390625, 1.814208984375, 1.91790771484375, 2.0216064453125, 2.12530517578125, 2.22900390625, 2.33270263671875, 2.4364013671875, 2.54010009765625, 2.643798828125, 2.74749755859375, 2.8511962890625, 2.95489501953125, 3.05859375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 8.0, 6.0, 5.0, 11.0, 28.0, 24.0, 53.0, 96.0, 145.0, 220.0, 393.0, 578.0, 1032.0, 1600.0, 2704.0, 4465.0, 7310.0, 12206.0, 19967.0, 33422.0, 53356.0, 86183.0, 134525.0, 201663.0, 288954.0, 385446.0, 466623.0, 512614.0, 499270.0, 434345.0, 340429.0, 246924.0, 169025.0, 110199.0, 69893.0, 43527.0, 26216.0, 16233.0, 9469.0, 5955.0, 3481.0, 2141.0, 1316.0, 840.0, 540.0, 317.0, 197.0, 114.0, 96.0, 50.0, 27.0, 15.0, 23.0, 9.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.970703125, -2.867462158203125, -2.76422119140625, -2.660980224609375, -2.5577392578125, -2.454498291015625, -2.35125732421875, -2.248016357421875, -2.144775390625, -2.041534423828125, -1.93829345703125, -1.835052490234375, -1.7318115234375, -1.628570556640625, -1.52532958984375, -1.422088623046875, -1.31884765625, -1.215606689453125, -1.11236572265625, -1.009124755859375, -0.9058837890625, -0.802642822265625, -0.69940185546875, -0.596160888671875, -0.492919921875, -0.389678955078125, -0.28643798828125, -0.183197021484375, -0.0799560546875, 0.023284912109375, 0.12652587890625, 0.229766845703125, 0.3330078125, 0.436248779296875, 0.53948974609375, 0.642730712890625, 0.7459716796875, 0.849212646484375, 0.95245361328125, 1.055694580078125, 1.158935546875, 1.262176513671875, 1.36541748046875, 1.468658447265625, 1.5718994140625, 1.675140380859375, 1.77838134765625, 1.881622314453125, 1.98486328125, 2.088104248046875, 2.19134521484375, 2.294586181640625, 2.3978271484375, 2.501068115234375, 2.60430908203125, 2.707550048828125, 2.810791015625, 2.914031982421875, 3.01727294921875, 3.120513916015625, 3.2237548828125, 3.326995849609375, 3.43023681640625, 3.533477783203125, 3.63671875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 0.0, 4.0, 13.0, 9.0, 17.0, 17.0, 22.0, 29.0, 37.0, 35.0, 58.0, 62.0, 66.0, 81.0, 109.0, 130.0, 139.0, 123.0, 152.0, 173.0, 206.0, 173.0, 192.0, 213.0, 196.0, 209.0, 173.0, 153.0, 176.0, 165.0, 159.0, 115.0, 121.0, 112.0, 97.0, 65.0, 54.0, 51.0, 37.0, 31.0, 21.0, 13.0, 12.0, 18.0, 8.0, 8.0, 4.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.264678955078125, -1.22076416015625, -1.176849365234375, -1.1329345703125, -1.089019775390625, -1.04510498046875, -1.001190185546875, -0.957275390625, -0.913360595703125, -0.86944580078125, -0.825531005859375, -0.7816162109375, -0.737701416015625, -0.69378662109375, -0.649871826171875, -0.60595703125, -0.562042236328125, -0.51812744140625, -0.474212646484375, -0.4302978515625, -0.386383056640625, -0.34246826171875, -0.298553466796875, -0.254638671875, -0.210723876953125, -0.16680908203125, -0.122894287109375, -0.0789794921875, -0.035064697265625, 0.00885009765625, 0.052764892578125, 0.0966796875, 0.140594482421875, 0.18450927734375, 0.228424072265625, 0.2723388671875, 0.316253662109375, 0.36016845703125, 0.404083251953125, 0.447998046875, 0.491912841796875, 0.53582763671875, 0.579742431640625, 0.6236572265625, 0.667572021484375, 0.71148681640625, 0.755401611328125, 0.79931640625, 0.843231201171875, 0.88714599609375, 0.931060791015625, 0.9749755859375, 1.018890380859375, 1.06280517578125, 1.106719970703125, 1.150634765625, 1.194549560546875, 1.23846435546875, 1.282379150390625, 1.3262939453125, 1.370208740234375, 1.41412353515625, 1.458038330078125, 1.501953125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 1.0, 1.0, 5.0, 4.0, 6.0, 11.0, 12.0, 12.0, 24.0, 27.0, 25.0, 24.0, 40.0, 35.0, 46.0, 53.0, 51.0, 60.0, 42.0, 52.0, 44.0, 44.0, 52.0, 43.0, 28.0, 31.0, 32.0, 30.0, 24.0, 29.0, 14.0, 12.0, 19.0, 14.0, 9.0, 7.0, 5.0, 7.0, 9.0, 4.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.032153606414795, -3.8995118141174316, -3.7668702602386475, -3.634228467941284, -3.5015869140625, -3.3689451217651367, -3.2363033294677734, -3.10366153717041, -2.971019983291626, -2.8383781909942627, -2.7057366371154785, -2.5730948448181152, -2.440453052520752, -2.3078114986419678, -2.1751697063446045, -2.0425281524658203, -1.909886360168457, -1.7772446870803833, -1.6446030139923096, -1.5119612216949463, -1.3793195486068726, -1.2466778755187988, -1.1140360832214355, -0.9813944101333618, -0.8487527370452881, -0.7161110639572144, -0.5834693312644958, -0.45082762837409973, -0.3181859254837036, -0.18554425239562988, -0.05290251970291138, 0.07973921298980713, 0.21238040924072266, 0.3450221121311188, 0.4776638150215149, 0.6103055477142334, 0.7429472208023071, 0.8755888938903809, 1.0082306861877441, 1.1408723592758179, 1.2735140323638916, 1.4061557054519653, 1.538797378540039, 1.6714391708374023, 1.804080843925476, 1.9367225170135498, 2.069364309310913, 2.2020058631896973, 2.3346476554870605, 2.467289447784424, 2.599931001663208, 2.7325727939605713, 2.8652143478393555, 2.9978561401367188, 3.130497932434082, 3.2631397247314453, 3.3957812786102295, 3.5284230709075928, 3.661064624786377, 3.7937064170837402, 3.9263482093811035, 4.058989524841309, 4.191631317138672, 4.324273109436035, 4.456914901733398]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 5.0, 13.0, 10.0, 15.0, 19.0, 12.0, 20.0, 19.0, 15.0, 32.0, 34.0, 32.0, 38.0, 31.0, 40.0, 39.0, 40.0, 35.0, 41.0, 49.0, 39.0, 41.0, 33.0, 42.0, 34.0, 41.0, 28.0, 22.0, 25.0, 26.0, 22.0, 17.0, 9.0, 14.0, 17.0, 11.0, 12.0, 7.0, 2.0, 6.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.9306440353393555, -3.8147025108337402, -3.698760986328125, -3.5828194618225098, -3.4668779373168945, -3.3509364128112793, -3.234994888305664, -3.119053363800049, -3.0031118392944336, -2.8871703147888184, -2.771228790283203, -2.655287265777588, -2.5393457412719727, -2.4234042167663574, -2.307462692260742, -2.191521167755127, -2.0755794048309326, -1.9596378803253174, -1.8436963558197021, -1.727754831314087, -1.6118133068084717, -1.4958717823028564, -1.3799301385879517, -1.2639886140823364, -1.1480470895767212, -1.032105565071106, -0.9161640405654907, -0.8002224564552307, -0.6842809319496155, -0.5683394074440002, -0.45239782333374023, -0.336456298828125, -0.22051477432250977, -0.10457323491573334, 0.01136830449104309, 0.1273098587989807, 0.24325138330459595, 0.3591929078102112, 0.4751344919204712, 0.5910760164260864, 0.7070175409317017, 0.8229590654373169, 0.9389005899429321, 1.054842233657837, 1.1707837581634521, 1.2867252826690674, 1.4026668071746826, 1.5186083316802979, 1.634549856185913, 1.7504913806915283, 1.8664329051971436, 1.9823744297027588, 2.098315954208374, 2.2142574787139893, 2.3301992416381836, 2.446140766143799, 2.562082290649414, 2.6780238151550293, 2.7939653396606445, 2.9099068641662598, 3.025848388671875, 3.1417899131774902, 3.2577314376831055, 3.3736729621887207, 3.489614486694336]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 11.0, 9.0, 14.0, 26.0, 43.0, 57.0, 91.0, 155.0, 236.0, 378.0, 539.0, 886.0, 1402.0, 2332.0, 3793.0, 6372.0, 10418.0, 17856.0, 30960.0, 54319.0, 95036.0, 158327.0, 209708.0, 182052.0, 115813.0, 66219.0, 37784.0, 21677.0, 12654.0, 7529.0, 4538.0, 2768.0, 1679.0, 1048.0, 669.0, 399.0, 271.0, 169.0, 93.0, 80.0, 51.0, 31.0, 29.0, 12.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.122528076171875, -1.08197021484375, -1.041412353515625, -1.0008544921875, -0.960296630859375, -0.91973876953125, -0.879180908203125, -0.838623046875, -0.798065185546875, -0.75750732421875, -0.716949462890625, -0.6763916015625, -0.635833740234375, -0.59527587890625, -0.554718017578125, -0.51416015625, -0.473602294921875, -0.43304443359375, -0.392486572265625, -0.3519287109375, -0.311370849609375, -0.27081298828125, -0.230255126953125, -0.189697265625, -0.149139404296875, -0.10858154296875, -0.068023681640625, -0.0274658203125, 0.013092041015625, 0.05364990234375, 0.094207763671875, 0.134765625, 0.175323486328125, 0.21588134765625, 0.256439208984375, 0.2969970703125, 0.337554931640625, 0.37811279296875, 0.418670654296875, 0.459228515625, 0.499786376953125, 0.54034423828125, 0.580902099609375, 0.6214599609375, 0.662017822265625, 0.70257568359375, 0.743133544921875, 0.78369140625, 0.824249267578125, 0.86480712890625, 0.905364990234375, 0.9459228515625, 0.986480712890625, 1.02703857421875, 1.067596435546875, 1.108154296875, 1.148712158203125, 1.18927001953125, 1.229827880859375, 1.2703857421875, 1.310943603515625, 1.35150146484375, 1.392059326171875, 1.4326171875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 6.0, 11.0, 19.0, 12.0, 17.0, 23.0, 31.0, 33.0, 28.0, 53.0, 45.0, 39.0, 43.0, 50.0, 45.0, 36.0, 51.0, 41.0, 53.0, 50.0, 36.0, 38.0, 35.0, 29.0, 21.0, 20.0, 26.0, 27.0, 11.0, 18.0, 8.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.46051025390625, -4.3194580078125, -4.17840576171875, -4.037353515625, -3.89630126953125, -3.7552490234375, -3.61419677734375, -3.47314453125, -3.33209228515625, -3.1910400390625, -3.04998779296875, -2.908935546875, -2.76788330078125, -2.6268310546875, -2.48577880859375, -2.3447265625, -2.20367431640625, -2.0626220703125, -1.92156982421875, -1.780517578125, -1.63946533203125, -1.4984130859375, -1.35736083984375, -1.21630859375, -1.07525634765625, -0.9342041015625, -0.79315185546875, -0.652099609375, -0.51104736328125, -0.3699951171875, -0.22894287109375, -0.087890625, 0.05316162109375, 0.1942138671875, 0.33526611328125, 0.476318359375, 0.61737060546875, 0.7584228515625, 0.89947509765625, 1.04052734375, 1.18157958984375, 1.3226318359375, 1.46368408203125, 1.604736328125, 1.74578857421875, 1.8868408203125, 2.02789306640625, 2.1689453125, 2.30999755859375, 2.4510498046875, 2.59210205078125, 2.733154296875, 2.87420654296875, 3.0152587890625, 3.15631103515625, 3.29736328125, 3.43841552734375, 3.5794677734375, 3.72052001953125, 3.861572265625, 4.00262451171875, 4.1436767578125, 4.28472900390625, 4.42578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 9.0, 9.0, 24.0, 30.0, 54.0, 64.0, 90.0, 123.0, 202.0, 303.0, 458.0, 687.0, 1136.0, 1607.0, 2710.0, 4542.0, 7414.0, 12589.0, 21773.0, 37904.0, 66151.0, 115320.0, 186329.0, 217344.0, 154586.0, 91540.0, 52169.0, 30146.0, 17332.0, 10178.0, 5902.0, 3675.0, 2174.0, 1359.0, 878.0, 538.0, 370.0, 253.0, 183.0, 120.0, 76.0, 57.0, 44.0, 35.0, 24.0, 14.0, 10.0, 5.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2080078125, -1.17059326171875, -1.1331787109375, -1.09576416015625, -1.058349609375, -1.02093505859375, -0.9835205078125, -0.94610595703125, -0.90869140625, -0.87127685546875, -0.8338623046875, -0.79644775390625, -0.759033203125, -0.72161865234375, -0.6842041015625, -0.64678955078125, -0.609375, -0.57196044921875, -0.5345458984375, -0.49713134765625, -0.459716796875, -0.42230224609375, -0.3848876953125, -0.34747314453125, -0.31005859375, -0.27264404296875, -0.2352294921875, -0.19781494140625, -0.160400390625, -0.12298583984375, -0.0855712890625, -0.04815673828125, -0.0107421875, 0.02667236328125, 0.0640869140625, 0.10150146484375, 0.138916015625, 0.17633056640625, 0.2137451171875, 0.25115966796875, 0.28857421875, 0.32598876953125, 0.3634033203125, 0.40081787109375, 0.438232421875, 0.47564697265625, 0.5130615234375, 0.55047607421875, 0.587890625, 0.62530517578125, 0.6627197265625, 0.70013427734375, 0.737548828125, 0.77496337890625, 0.8123779296875, 0.84979248046875, 0.88720703125, 0.92462158203125, 0.9620361328125, 0.99945068359375, 1.036865234375, 1.07427978515625, 1.1116943359375, 1.14910888671875, 1.1865234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 6.0, 7.0, 13.0, 14.0, 14.0, 14.0, 14.0, 22.0, 21.0, 26.0, 20.0, 24.0, 26.0, 46.0, 34.0, 38.0, 35.0, 41.0, 41.0, 38.0, 35.0, 35.0, 40.0, 39.0, 36.0, 32.0, 48.0, 34.0, 26.0, 17.0, 20.0, 19.0, 14.0, 15.0, 16.0, 17.0, 12.0, 3.0, 10.0, 6.0, 10.0, 6.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.548828125, -2.472991943359375, -2.39715576171875, -2.321319580078125, -2.2454833984375, -2.169647216796875, -2.09381103515625, -2.017974853515625, -1.942138671875, -1.866302490234375, -1.79046630859375, -1.714630126953125, -1.6387939453125, -1.562957763671875, -1.48712158203125, -1.411285400390625, -1.33544921875, -1.259613037109375, -1.18377685546875, -1.107940673828125, -1.0321044921875, -0.956268310546875, -0.88043212890625, -0.804595947265625, -0.728759765625, -0.652923583984375, -0.57708740234375, -0.501251220703125, -0.4254150390625, -0.349578857421875, -0.27374267578125, -0.197906494140625, -0.1220703125, -0.046234130859375, 0.02960205078125, 0.105438232421875, 0.1812744140625, 0.257110595703125, 0.33294677734375, 0.408782958984375, 0.484619140625, 0.560455322265625, 0.63629150390625, 0.712127685546875, 0.7879638671875, 0.863800048828125, 0.93963623046875, 1.015472412109375, 1.09130859375, 1.167144775390625, 1.24298095703125, 1.318817138671875, 1.3946533203125, 1.470489501953125, 1.54632568359375, 1.622161865234375, 1.697998046875, 1.773834228515625, 1.84967041015625, 1.925506591796875, 2.0013427734375, 2.077178955078125, 2.15301513671875, 2.228851318359375, 2.3046875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 8.0, 7.0, 7.0, 12.0, 14.0, 11.0, 21.0, 35.0, 37.0, 39.0, 85.0, 92.0, 162.0, 200.0, 360.0, 518.0, 843.0, 1374.0, 2634.0, 5483.0, 12752.0, 39595.0, 174471.0, 562467.0, 181234.0, 40661.0, 13304.0, 5458.0, 2669.0, 1502.0, 847.0, 549.0, 346.0, 222.0, 138.0, 110.0, 84.0, 51.0, 34.0, 33.0, 19.0, 24.0, 14.0, 10.0, 11.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0], "bins": [-0.8017578125, -0.77783203125, -0.75390625, -0.72998046875, -0.7060546875, -0.68212890625, -0.658203125, -0.63427734375, -0.6103515625, -0.58642578125, -0.5625, -0.53857421875, -0.5146484375, -0.49072265625, -0.466796875, -0.44287109375, -0.4189453125, -0.39501953125, -0.37109375, -0.34716796875, -0.3232421875, -0.29931640625, -0.275390625, -0.25146484375, -0.2275390625, -0.20361328125, -0.1796875, -0.15576171875, -0.1318359375, -0.10791015625, -0.083984375, -0.06005859375, -0.0361328125, -0.01220703125, 0.01171875, 0.03564453125, 0.0595703125, 0.08349609375, 0.107421875, 0.13134765625, 0.1552734375, 0.17919921875, 0.203125, 0.22705078125, 0.2509765625, 0.27490234375, 0.298828125, 0.32275390625, 0.3466796875, 0.37060546875, 0.39453125, 0.41845703125, 0.4423828125, 0.46630859375, 0.490234375, 0.51416015625, 0.5380859375, 0.56201171875, 0.5859375, 0.60986328125, 0.6337890625, 0.65771484375, 0.681640625, 0.70556640625, 0.7294921875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 13.0, 11.0, 30.0, 62.0, 56.0, 95.0, 107.0, 150.0, 111.0, 90.0, 88.0, 60.0, 41.0, 23.0, 20.0, 6.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.537271499633789e-05, -5.3685158491134644e-05, -5.1997601985931396e-05, -5.031004548072815e-05, -4.86224889755249e-05, -4.6934932470321655e-05, -4.524737596511841e-05, -4.355981945991516e-05, -4.1872262954711914e-05, -4.018470644950867e-05, -3.849714994430542e-05, -3.680959343910217e-05, -3.5122036933898926e-05, -3.343448042869568e-05, -3.174692392349243e-05, -3.0059367418289185e-05, -2.8371810913085938e-05, -2.668425440788269e-05, -2.4996697902679443e-05, -2.3309141397476196e-05, -2.162158489227295e-05, -1.9934028387069702e-05, -1.8246471881866455e-05, -1.6558915376663208e-05, -1.4871358871459961e-05, -1.3183802366256714e-05, -1.1496245861053467e-05, -9.80868935585022e-06, -8.121132850646973e-06, -6.433576345443726e-06, -4.7460198402404785e-06, -3.0584633350372314e-06, -1.3709068298339844e-06, 3.166496753692627e-07, 2.0042061805725098e-06, 3.691762685775757e-06, 5.379319190979004e-06, 7.066875696182251e-06, 8.754432201385498e-06, 1.0441988706588745e-05, 1.2129545211791992e-05, 1.381710171699524e-05, 1.5504658222198486e-05, 1.7192214727401733e-05, 1.887977123260498e-05, 2.0567327737808228e-05, 2.2254884243011475e-05, 2.394244074821472e-05, 2.562999725341797e-05, 2.7317553758621216e-05, 2.9005110263824463e-05, 3.069266676902771e-05, 3.238022327423096e-05, 3.4067779779434204e-05, 3.575533628463745e-05, 3.74428927898407e-05, 3.9130449295043945e-05, 4.081800580024719e-05, 4.250556230545044e-05, 4.4193118810653687e-05, 4.5880675315856934e-05, 4.756823182106018e-05, 4.925578832626343e-05, 5.0943344831466675e-05, 5.263090133666992e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 7.0, 14.0, 12.0, 23.0, 23.0, 43.0, 66.0, 101.0, 122.0, 165.0, 227.0, 365.0, 524.0, 878.0, 1317.0, 2067.0, 3317.0, 5831.0, 10568.0, 20755.0, 43896.0, 94692.0, 205153.0, 301555.0, 188150.0, 86300.0, 39014.0, 19180.0, 9882.0, 5491.0, 3107.0, 1896.0, 1203.0, 840.0, 543.0, 367.0, 253.0, 174.0, 106.0, 102.0, 56.0, 44.0, 44.0, 31.0, 11.0, 10.0, 6.0, 4.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.578125, -0.560302734375, -0.54248046875, -0.524658203125, -0.5068359375, -0.489013671875, -0.47119140625, -0.453369140625, -0.435546875, -0.417724609375, -0.39990234375, -0.382080078125, -0.3642578125, -0.346435546875, -0.32861328125, -0.310791015625, -0.29296875, -0.275146484375, -0.25732421875, -0.239501953125, -0.2216796875, -0.203857421875, -0.18603515625, -0.168212890625, -0.150390625, -0.132568359375, -0.11474609375, -0.096923828125, -0.0791015625, -0.061279296875, -0.04345703125, -0.025634765625, -0.0078125, 0.010009765625, 0.02783203125, 0.045654296875, 0.0634765625, 0.081298828125, 0.09912109375, 0.116943359375, 0.134765625, 0.152587890625, 0.17041015625, 0.188232421875, 0.2060546875, 0.223876953125, 0.24169921875, 0.259521484375, 0.27734375, 0.295166015625, 0.31298828125, 0.330810546875, 0.3486328125, 0.366455078125, 0.38427734375, 0.402099609375, 0.419921875, 0.437744140625, 0.45556640625, 0.473388671875, 0.4912109375, 0.509033203125, 0.52685546875, 0.544677734375, 0.5625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 9.0, 9.0, 4.0, 7.0, 14.0, 8.0, 22.0, 14.0, 31.0, 28.0, 35.0, 55.0, 44.0, 74.0, 64.0, 70.0, 52.0, 64.0, 66.0, 51.0, 53.0, 48.0, 32.0, 27.0, 14.0, 18.0, 17.0, 15.0, 11.0, 6.0, 5.0, 7.0, 2.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.1788330078125, -0.17427349090576172, -0.16971397399902344, -0.16515445709228516, -0.16059494018554688, -0.1560354232788086, -0.1514759063720703, -0.14691638946533203, -0.14235687255859375, -0.13779735565185547, -0.1332378387451172, -0.1286783218383789, -0.12411880493164062, -0.11955928802490234, -0.11499977111816406, -0.11044025421142578, -0.1058807373046875, -0.10132122039794922, -0.09676170349121094, -0.09220218658447266, -0.08764266967773438, -0.0830831527709961, -0.07852363586425781, -0.07396411895751953, -0.06940460205078125, -0.06484508514404297, -0.06028556823730469, -0.055726051330566406, -0.051166534423828125, -0.046607017517089844, -0.04204750061035156, -0.03748798370361328, -0.032928466796875, -0.02836894989013672, -0.023809432983398438, -0.019249916076660156, -0.014690399169921875, -0.010130882263183594, -0.0055713653564453125, -0.0010118484497070312, 0.00354766845703125, 0.008107185363769531, 0.012666702270507812, 0.017226219177246094, 0.021785736083984375, 0.026345252990722656, 0.030904769897460938, 0.03546428680419922, 0.0400238037109375, 0.04458332061767578, 0.04914283752441406, 0.053702354431152344, 0.058261871337890625, 0.0628213882446289, 0.06738090515136719, 0.07194042205810547, 0.07649993896484375, 0.08105945587158203, 0.08561897277832031, 0.0901784896850586, 0.09473800659179688, 0.09929752349853516, 0.10385704040527344, 0.10841655731201172, 0.11297607421875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 7.0, 9.0, 9.0, 14.0, 20.0, 15.0, 20.0, 23.0, 32.0, 23.0, 43.0, 31.0, 53.0, 52.0, 58.0, 46.0, 38.0, 54.0, 41.0, 50.0, 40.0, 37.0, 35.0, 25.0, 29.0, 30.0, 26.0, 20.0, 19.0, 11.0, 18.0, 14.0, 12.0, 6.0, 4.0, 7.0, 10.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.079821586608887, -3.952615261077881, -3.825408935546875, -3.69820237159729, -3.570996046066284, -3.4437897205352783, -3.3165831565856934, -3.1893768310546875, -3.0621705055236816, -2.934964179992676, -2.80775785446167, -2.680551290512085, -2.553344964981079, -2.4261386394500732, -2.2989320755004883, -2.1717257499694824, -2.0445194244384766, -1.9173130989074707, -1.7901066541671753, -1.6629002094268799, -1.535693883895874, -1.4084875583648682, -1.2812811136245728, -1.1540746688842773, -1.0268683433532715, -0.8996619582176208, -0.7724555730819702, -0.6452491879463196, -0.518042802810669, -0.3908364176750183, -0.2636300325393677, -0.13642364740371704, -0.009216785430908203, 0.11798959970474243, 0.24519598484039307, 0.3724023699760437, 0.49960875511169434, 0.626815140247345, 0.7540215253829956, 0.8812279105186462, 1.0084342956542969, 1.1356406211853027, 1.2628470659255981, 1.3900535106658936, 1.5172598361968994, 1.6444661617279053, 1.7716726064682007, 1.898879051208496, 2.026085376739502, 2.153291702270508, 2.2804980278015137, 2.4077045917510986, 2.5349109172821045, 2.6621172428131104, 2.7893238067626953, 2.916530132293701, 3.043736457824707, 3.170942783355713, 3.2981491088867188, 3.4253556728363037, 3.5525619983673096, 3.6797683238983154, 3.8069748878479004, 3.9341812133789062, 4.061387538909912]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 15.0, 10.0, 16.0, 17.0, 16.0, 17.0, 19.0, 19.0, 29.0, 38.0, 31.0, 37.0, 33.0, 38.0, 41.0, 31.0, 45.0, 40.0, 50.0, 36.0, 44.0, 31.0, 37.0, 42.0, 32.0, 31.0, 25.0, 21.0, 29.0, 16.0, 18.0, 9.0, 17.0, 16.0, 10.0, 12.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.870497465133667, -3.7558631896972656, -3.6412289142608643, -3.526594638824463, -3.4119601249694824, -3.297325849533081, -3.1826915740966797, -3.0680572986602783, -2.953423023223877, -2.8387887477874756, -2.724154472351074, -2.6095199584960938, -2.4948856830596924, -2.380251407623291, -2.2656171321868896, -2.1509828567504883, -2.036348342895508, -1.9217140674591064, -1.8070796728134155, -1.6924453973770142, -1.5778110027313232, -1.4631767272949219, -1.3485424518585205, -1.2339081764221191, -1.1192737817764282, -1.0046395063400269, -0.8900051116943359, -0.7753708362579346, -0.6607365012168884, -0.5461021661758423, -0.4314678907394409, -0.3168335556983948, -0.20219922065734863, -0.08756490051746368, 0.027069419622421265, 0.14170372486114502, 0.25633805990219116, 0.3709723949432373, 0.48560667037963867, 0.6002410054206848, 0.714875340461731, 0.8295096755027771, 0.9441440105438232, 1.0587782859802246, 1.173412561416626, 1.288046956062317, 1.4026812314987183, 1.5173156261444092, 1.6319499015808105, 1.746584177017212, 1.8612185716629028, 1.9758528470993042, 2.090487241744995, 2.2051215171813965, 2.319755792617798, 2.434390068054199, 2.5490245819091797, 2.663658857345581, 2.7782931327819824, 2.892927646636963, 3.0075619220733643, 3.1221961975097656, 3.236830472946167, 3.3514647483825684, 3.4660990238189697]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 10.0, 9.0, 14.0, 6.0, 19.0, 38.0, 52.0, 79.0, 100.0, 206.0, 326.0, 482.0, 774.0, 1210.0, 1932.0, 3111.0, 4848.0, 7857.0, 12110.0, 18898.0, 28697.0, 41872.0, 58751.0, 78903.0, 97984.0, 113625.0, 119137.0, 112010.0, 96659.0, 76459.0, 56109.0, 39819.0, 27141.0, 17803.0, 11513.0, 7359.0, 4708.0, 2921.0, 1813.0, 1146.0, 813.0, 442.0, 283.0, 179.0, 110.0, 81.0, 56.0, 36.0, 24.0, 12.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0], "bins": [-3.337890625, -3.238067626953125, -3.13824462890625, -3.038421630859375, -2.9385986328125, -2.838775634765625, -2.73895263671875, -2.639129638671875, -2.539306640625, -2.439483642578125, -2.33966064453125, -2.239837646484375, -2.1400146484375, -2.040191650390625, -1.94036865234375, -1.840545654296875, -1.74072265625, -1.640899658203125, -1.54107666015625, -1.441253662109375, -1.3414306640625, -1.241607666015625, -1.14178466796875, -1.041961669921875, -0.942138671875, -0.842315673828125, -0.74249267578125, -0.642669677734375, -0.5428466796875, -0.443023681640625, -0.34320068359375, -0.243377685546875, -0.1435546875, -0.043731689453125, 0.05609130859375, 0.155914306640625, 0.2557373046875, 0.355560302734375, 0.45538330078125, 0.555206298828125, 0.655029296875, 0.754852294921875, 0.85467529296875, 0.954498291015625, 1.0543212890625, 1.154144287109375, 1.25396728515625, 1.353790283203125, 1.45361328125, 1.553436279296875, 1.65325927734375, 1.753082275390625, 1.8529052734375, 1.952728271484375, 2.05255126953125, 2.152374267578125, 2.252197265625, 2.352020263671875, 2.45184326171875, 2.551666259765625, 2.6514892578125, 2.751312255859375, 2.85113525390625, 2.950958251953125, 3.05078125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 11.0, 9.0, 13.0, 10.0, 13.0, 18.0, 20.0, 32.0, 24.0, 30.0, 42.0, 35.0, 39.0, 34.0, 39.0, 32.0, 43.0, 45.0, 56.0, 41.0, 51.0, 38.0, 45.0, 33.0, 33.0, 38.0, 34.0, 24.0, 17.0, 23.0, 8.0, 10.0, 13.0, 10.0, 9.0, 4.0, 4.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.93780517578125, -3.8092041015625, -3.68060302734375, -3.552001953125, -3.42340087890625, -3.2947998046875, -3.16619873046875, -3.03759765625, -2.90899658203125, -2.7803955078125, -2.65179443359375, -2.523193359375, -2.39459228515625, -2.2659912109375, -2.13739013671875, -2.0087890625, -1.88018798828125, -1.7515869140625, -1.62298583984375, -1.494384765625, -1.36578369140625, -1.2371826171875, -1.10858154296875, -0.97998046875, -0.85137939453125, -0.7227783203125, -0.59417724609375, -0.465576171875, -0.33697509765625, -0.2083740234375, -0.07977294921875, 0.048828125, 0.17742919921875, 0.3060302734375, 0.43463134765625, 0.563232421875, 0.69183349609375, 0.8204345703125, 0.94903564453125, 1.07763671875, 1.20623779296875, 1.3348388671875, 1.46343994140625, 1.592041015625, 1.72064208984375, 1.8492431640625, 1.97784423828125, 2.1064453125, 2.23504638671875, 2.3636474609375, 2.49224853515625, 2.620849609375, 2.74945068359375, 2.8780517578125, 3.00665283203125, 3.13525390625, 3.26385498046875, 3.3924560546875, 3.52105712890625, 3.649658203125, 3.77825927734375, 3.9068603515625, 4.03546142578125, 4.1640625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 9.0, 3.0, 19.0, 22.0, 43.0, 58.0, 89.0, 109.0, 179.0, 268.0, 430.0, 672.0, 982.0, 1518.0, 2356.0, 3525.0, 5408.0, 7930.0, 12186.0, 17949.0, 26227.0, 36841.0, 50781.0, 66100.0, 82036.0, 96105.0, 104247.0, 104872.0, 98115.0, 84795.0, 68305.0, 52296.0, 38607.0, 27587.0, 19189.0, 13201.0, 8705.0, 5736.0, 3732.0, 2537.0, 1658.0, 1086.0, 712.0, 451.0, 292.0, 200.0, 150.0, 85.0, 46.0, 41.0, 22.0, 19.0, 12.0, 10.0, 2.0, 5.0, 4.0], "bins": [-3.01171875, -2.92333984375, -2.8349609375, -2.74658203125, -2.658203125, -2.56982421875, -2.4814453125, -2.39306640625, -2.3046875, -2.21630859375, -2.1279296875, -2.03955078125, -1.951171875, -1.86279296875, -1.7744140625, -1.68603515625, -1.59765625, -1.50927734375, -1.4208984375, -1.33251953125, -1.244140625, -1.15576171875, -1.0673828125, -0.97900390625, -0.890625, -0.80224609375, -0.7138671875, -0.62548828125, -0.537109375, -0.44873046875, -0.3603515625, -0.27197265625, -0.18359375, -0.09521484375, -0.0068359375, 0.08154296875, 0.169921875, 0.25830078125, 0.3466796875, 0.43505859375, 0.5234375, 0.61181640625, 0.7001953125, 0.78857421875, 0.876953125, 0.96533203125, 1.0537109375, 1.14208984375, 1.23046875, 1.31884765625, 1.4072265625, 1.49560546875, 1.583984375, 1.67236328125, 1.7607421875, 1.84912109375, 1.9375, 2.02587890625, 2.1142578125, 2.20263671875, 2.291015625, 2.37939453125, 2.4677734375, 2.55615234375, 2.64453125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 8.0, 7.0, 6.0, 7.0, 6.0, 5.0, 10.0, 5.0, 18.0, 16.0, 18.0, 20.0, 22.0, 29.0, 22.0, 36.0, 34.0, 35.0, 44.0, 36.0, 40.0, 29.0, 36.0, 39.0, 38.0, 38.0, 38.0, 29.0, 39.0, 27.0, 25.0, 26.0, 22.0, 21.0, 25.0, 16.0, 21.0, 17.0, 8.0, 17.0, 14.0, 16.0, 9.0, 6.0, 7.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.154296875, -2.08721923828125, -2.0201416015625, -1.95306396484375, -1.885986328125, -1.81890869140625, -1.7518310546875, -1.68475341796875, -1.61767578125, -1.55059814453125, -1.4835205078125, -1.41644287109375, -1.349365234375, -1.28228759765625, -1.2152099609375, -1.14813232421875, -1.0810546875, -1.01397705078125, -0.9468994140625, -0.87982177734375, -0.812744140625, -0.74566650390625, -0.6785888671875, -0.61151123046875, -0.54443359375, -0.47735595703125, -0.4102783203125, -0.34320068359375, -0.276123046875, -0.20904541015625, -0.1419677734375, -0.07489013671875, -0.0078125, 0.05926513671875, 0.1263427734375, 0.19342041015625, 0.260498046875, 0.32757568359375, 0.3946533203125, 0.46173095703125, 0.52880859375, 0.59588623046875, 0.6629638671875, 0.73004150390625, 0.797119140625, 0.86419677734375, 0.9312744140625, 0.99835205078125, 1.0654296875, 1.13250732421875, 1.1995849609375, 1.26666259765625, 1.333740234375, 1.40081787109375, 1.4678955078125, 1.53497314453125, 1.60205078125, 1.66912841796875, 1.7362060546875, 1.80328369140625, 1.870361328125, 1.93743896484375, 2.0045166015625, 2.07159423828125, 2.138671875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 12.0, 13.0, 6.0, 15.0, 22.0, 34.0, 34.0, 66.0, 67.0, 102.0, 127.0, 204.0, 273.0, 384.0, 560.0, 856.0, 1401.0, 2601.0, 5531.0, 13329.0, 37826.0, 110948.0, 267858.0, 329717.0, 175490.0, 62674.0, 21417.0, 8200.0, 3572.0, 1902.0, 1101.0, 680.0, 416.0, 317.0, 207.0, 173.0, 122.0, 69.0, 76.0, 34.0, 27.0, 18.0, 26.0, 8.0, 15.0, 9.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.2890625, -4.1517333984375, -4.014404296875, -3.8770751953125, -3.73974609375, -3.6024169921875, -3.465087890625, -3.3277587890625, -3.1904296875, -3.0531005859375, -2.915771484375, -2.7784423828125, -2.64111328125, -2.5037841796875, -2.366455078125, -2.2291259765625, -2.091796875, -1.9544677734375, -1.817138671875, -1.6798095703125, -1.54248046875, -1.4051513671875, -1.267822265625, -1.1304931640625, -0.9931640625, -0.8558349609375, -0.718505859375, -0.5811767578125, -0.44384765625, -0.3065185546875, -0.169189453125, -0.0318603515625, 0.10546875, 0.2427978515625, 0.380126953125, 0.5174560546875, 0.65478515625, 0.7921142578125, 0.929443359375, 1.0667724609375, 1.2041015625, 1.3414306640625, 1.478759765625, 1.6160888671875, 1.75341796875, 1.8907470703125, 2.028076171875, 2.1654052734375, 2.302734375, 2.4400634765625, 2.577392578125, 2.7147216796875, 2.85205078125, 2.9893798828125, 3.126708984375, 3.2640380859375, 3.4013671875, 3.5386962890625, 3.676025390625, 3.8133544921875, 3.95068359375, 4.0880126953125, 4.225341796875, 4.3626708984375, 4.5]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 6.0, 18.0, 22.0, 28.0, 28.0, 34.0, 41.0, 50.0, 48.0, 69.0, 66.0, 82.0, 76.0, 65.0, 67.0, 57.0, 54.0, 42.0, 25.0, 26.0, 20.0, 16.0, 10.0, 10.0, 8.0, 10.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002682209014892578, -0.00026115216314792633, -0.00025408342480659485, -0.00024701468646526337, -0.00023994594812393188, -0.0002328772097826004, -0.00022580847144126892, -0.00021873973309993744, -0.00021167099475860596, -0.00020460225641727448, -0.000197533518075943, -0.0001904647797346115, -0.00018339604139328003, -0.00017632730305194855, -0.00016925856471061707, -0.00016218982636928558, -0.0001551210880279541, -0.00014805234968662262, -0.00014098361134529114, -0.00013391487300395966, -0.00012684613466262817, -0.00011977739632129669, -0.00011270865797996521, -0.00010563991963863373, -9.857118129730225e-05, -9.150244295597076e-05, -8.443370461463928e-05, -7.73649662733078e-05, -7.029622793197632e-05, -6.322748959064484e-05, -5.6158751249313354e-05, -4.909001290798187e-05, -4.202127456665039e-05, -3.495253622531891e-05, -2.7883797883987427e-05, -2.0815059542655945e-05, -1.3746321201324463e-05, -6.677582859992981e-06, 3.91155481338501e-07, 7.459893822669983e-06, 1.4528632164001465e-05, 2.1597370505332947e-05, 2.866610884666443e-05, 3.573484718799591e-05, 4.280358552932739e-05, 4.9872323870658875e-05, 5.6941062211990356e-05, 6.400980055332184e-05, 7.107853889465332e-05, 7.81472772359848e-05, 8.521601557731628e-05, 9.228475391864777e-05, 9.935349225997925e-05, 0.00010642223060131073, 0.00011349096894264221, 0.0001205597072839737, 0.00012762844562530518, 0.00013469718396663666, 0.00014176592230796814, 0.00014883466064929962, 0.0001559033989906311, 0.00016297213733196259, 0.00017004087567329407, 0.00017710961401462555, 0.00018417835235595703]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 17.0, 21.0, 34.0, 49.0, 67.0, 99.0, 173.0, 257.0, 413.0, 627.0, 950.0, 1866.0, 3266.0, 6103.0, 11141.0, 21380.0, 39749.0, 73145.0, 122362.0, 176700.0, 195466.0, 160266.0, 104396.0, 59653.0, 32476.0, 17151.0, 9084.0, 4851.0, 2772.0, 1547.0, 924.0, 553.0, 326.0, 215.0, 127.0, 98.0, 63.0, 37.0, 24.0, 23.0, 20.0, 13.0, 15.0, 5.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.234375, -2.158203125, -2.08203125, -2.005859375, -1.9296875, -1.853515625, -1.77734375, -1.701171875, -1.625, -1.548828125, -1.47265625, -1.396484375, -1.3203125, -1.244140625, -1.16796875, -1.091796875, -1.015625, -0.939453125, -0.86328125, -0.787109375, -0.7109375, -0.634765625, -0.55859375, -0.482421875, -0.40625, -0.330078125, -0.25390625, -0.177734375, -0.1015625, -0.025390625, 0.05078125, 0.126953125, 0.203125, 0.279296875, 0.35546875, 0.431640625, 0.5078125, 0.583984375, 0.66015625, 0.736328125, 0.8125, 0.888671875, 0.96484375, 1.041015625, 1.1171875, 1.193359375, 1.26953125, 1.345703125, 1.421875, 1.498046875, 1.57421875, 1.650390625, 1.7265625, 1.802734375, 1.87890625, 1.955078125, 2.03125, 2.107421875, 2.18359375, 2.259765625, 2.3359375, 2.412109375, 2.48828125, 2.564453125, 2.640625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 9.0, 2.0, 7.0, 8.0, 8.0, 10.0, 12.0, 16.0, 28.0, 40.0, 44.0, 51.0, 41.0, 54.0, 53.0, 54.0, 66.0, 62.0, 64.0, 65.0, 47.0, 39.0, 37.0, 29.0, 32.0, 30.0, 10.0, 15.0, 17.0, 7.0, 14.0, 7.0, 4.0, 6.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8193359375, -0.793365478515625, -0.76739501953125, -0.741424560546875, -0.7154541015625, -0.689483642578125, -0.66351318359375, -0.637542724609375, -0.611572265625, -0.585601806640625, -0.55963134765625, -0.533660888671875, -0.5076904296875, -0.481719970703125, -0.45574951171875, -0.429779052734375, -0.40380859375, -0.377838134765625, -0.35186767578125, -0.325897216796875, -0.2999267578125, -0.273956298828125, -0.24798583984375, -0.222015380859375, -0.196044921875, -0.170074462890625, -0.14410400390625, -0.118133544921875, -0.0921630859375, -0.066192626953125, -0.04022216796875, -0.014251708984375, 0.01171875, 0.037689208984375, 0.06365966796875, 0.089630126953125, 0.1156005859375, 0.141571044921875, 0.16754150390625, 0.193511962890625, 0.219482421875, 0.245452880859375, 0.27142333984375, 0.297393798828125, 0.3233642578125, 0.349334716796875, 0.37530517578125, 0.401275634765625, 0.42724609375, 0.453216552734375, 0.47918701171875, 0.505157470703125, 0.5311279296875, 0.557098388671875, 0.58306884765625, 0.609039306640625, 0.635009765625, 0.660980224609375, 0.68695068359375, 0.712921142578125, 0.7388916015625, 0.764862060546875, 0.79083251953125, 0.816802978515625, 0.8427734375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 3.0, 5.0, 5.0, 10.0, 12.0, 20.0, 15.0, 22.0, 28.0, 33.0, 27.0, 37.0, 55.0, 65.0, 71.0, 65.0, 55.0, 55.0, 48.0, 47.0, 43.0, 44.0, 32.0, 31.0, 36.0, 26.0, 26.0, 14.0, 13.0, 11.0, 12.0, 9.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.555331707000732, -4.4065141677856445, -4.257696151733398, -4.1088786125183105, -3.9600610733032227, -3.8112432956695557, -3.6624255180358887, -3.513607978820801, -3.364790439605713, -3.215972661972046, -3.067155122756958, -2.918337345123291, -2.769519805908203, -2.620702028274536, -2.471884250640869, -2.3230667114257812, -2.1742489337921143, -2.0254311561584473, -1.8766136169433594, -1.7277958393096924, -1.5789783000946045, -1.4301605224609375, -1.28134286403656, -1.1325252056121826, -0.9837075471878052, -0.8348898887634277, -0.6860722303390503, -0.5372545123100281, -0.38843685388565063, -0.2396191954612732, -0.09080147743225098, 0.058016180992126465, 0.2068338394165039, 0.35565149784088135, 0.5044691562652588, 0.653286874294281, 0.8021045327186584, 0.9509221911430359, 1.099739909172058, 1.2485575675964355, 1.397375226020813, 1.5461928844451904, 1.6950105428695679, 1.8438282012939453, 1.9926459789276123, 2.1414635181427, 2.290281295776367, 2.439098834991455, 2.587916612625122, 2.736734390258789, 2.885551929473877, 3.034369707107544, 3.183187246322632, 3.332005023956299, 3.4808225631713867, 3.6296403408050537, 3.7784581184387207, 3.9272758960723877, 4.076093673706055, 4.224911212921143, 4.3737287521362305, 4.522546291351318, 4.6713643074035645, 4.820181846618652, 4.96899938583374]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 7.0, 10.0, 11.0, 13.0, 16.0, 15.0, 27.0, 18.0, 21.0, 28.0, 39.0, 30.0, 41.0, 38.0, 29.0, 41.0, 39.0, 52.0, 37.0, 43.0, 36.0, 39.0, 32.0, 32.0, 29.0, 32.0, 23.0, 29.0, 27.0, 24.0, 24.0, 17.0, 17.0, 15.0, 8.0, 9.0, 8.0, 10.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.558986186981201, -3.441723585128784, -3.324460983276367, -3.207198143005371, -3.089935541152954, -2.972672939300537, -2.85541033744812, -2.738147735595703, -2.620884895324707, -2.50362229347229, -2.386359691619873, -2.269096851348877, -2.15183424949646, -2.034571647644043, -1.917309045791626, -1.800046443939209, -1.682783842086792, -1.565521240234375, -1.4482585191726685, -1.3309959173202515, -1.213733196258545, -1.096470594406128, -0.9792079925537109, -0.8619453310966492, -0.7446826696395874, -0.6274200081825256, -0.5101573467254639, -0.3928947448730469, -0.2756320834159851, -0.15836942195892334, -0.04110682010650635, 0.07615584135055542, 0.1934185028076172, 0.31068116426467896, 0.42794379591941833, 0.5452064275741577, 0.6624690890312195, 0.7797317504882812, 0.8969943523406982, 1.0142569541931152, 1.1315196752548218, 1.2487822771072388, 1.3660449981689453, 1.4833076000213623, 1.6005702018737793, 1.7178329229354858, 1.8350955247879028, 1.9523582458496094, 2.0696208477020264, 2.1868834495544434, 2.3041460514068604, 2.4214086532592773, 2.5386714935302734, 2.6559340953826904, 2.7731966972351074, 2.8904592990875244, 3.0077219009399414, 3.1249845027923584, 3.2422471046447754, 3.3595099449157715, 3.4767725467681885, 3.5940351486206055, 3.7112977504730225, 3.8285603523254395, 3.9458231925964355]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 10.0, 10.0, 17.0, 27.0, 54.0, 86.0, 146.0, 219.0, 429.0, 763.0, 1333.0, 2330.0, 3988.0, 6909.0, 11629.0, 20361.0, 34729.0, 59911.0, 100155.0, 165651.0, 264069.0, 394725.0, 530670.0, 616171.0, 595042.0, 480297.0, 341455.0, 222888.0, 137684.0, 82995.0, 49087.0, 29032.0, 16956.0, 10097.0, 5908.0, 3496.0, 2038.0, 1225.0, 694.0, 416.0, 246.0, 139.0, 98.0, 45.0, 24.0, 18.0, 10.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16796875, -3.058013916015625, -2.94805908203125, -2.838104248046875, -2.7281494140625, -2.618194580078125, -2.50823974609375, -2.398284912109375, -2.288330078125, -2.178375244140625, -2.06842041015625, -1.958465576171875, -1.8485107421875, -1.738555908203125, -1.62860107421875, -1.518646240234375, -1.40869140625, -1.298736572265625, -1.18878173828125, -1.078826904296875, -0.9688720703125, -0.858917236328125, -0.74896240234375, -0.639007568359375, -0.529052734375, -0.419097900390625, -0.30914306640625, -0.199188232421875, -0.0892333984375, 0.020721435546875, 0.13067626953125, 0.240631103515625, 0.3505859375, 0.460540771484375, 0.57049560546875, 0.680450439453125, 0.7904052734375, 0.900360107421875, 1.01031494140625, 1.120269775390625, 1.230224609375, 1.340179443359375, 1.45013427734375, 1.560089111328125, 1.6700439453125, 1.779998779296875, 1.88995361328125, 1.999908447265625, 2.10986328125, 2.219818115234375, 2.32977294921875, 2.439727783203125, 2.5496826171875, 2.659637451171875, 2.76959228515625, 2.879547119140625, 2.989501953125, 3.099456787109375, 3.20941162109375, 3.319366455078125, 3.4293212890625, 3.539276123046875, 3.64923095703125, 3.759185791015625, 3.869140625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 10.0, 3.0, 9.0, 8.0, 6.0, 16.0, 13.0, 12.0, 15.0, 18.0, 23.0, 34.0, 19.0, 38.0, 28.0, 32.0, 49.0, 39.0, 47.0, 48.0, 40.0, 42.0, 38.0, 32.0, 41.0, 21.0, 40.0, 35.0, 26.0, 25.0, 31.0, 27.0, 22.0, 19.0, 18.0, 11.0, 16.0, 11.0, 8.0, 10.0, 2.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.517578125, -2.433502197265625, -2.34942626953125, -2.265350341796875, -2.1812744140625, -2.097198486328125, -2.01312255859375, -1.929046630859375, -1.844970703125, -1.760894775390625, -1.67681884765625, -1.592742919921875, -1.5086669921875, -1.424591064453125, -1.34051513671875, -1.256439208984375, -1.17236328125, -1.088287353515625, -1.00421142578125, -0.920135498046875, -0.8360595703125, -0.751983642578125, -0.66790771484375, -0.583831787109375, -0.499755859375, -0.415679931640625, -0.33160400390625, -0.247528076171875, -0.1634521484375, -0.079376220703125, 0.00469970703125, 0.088775634765625, 0.1728515625, 0.256927490234375, 0.34100341796875, 0.425079345703125, 0.5091552734375, 0.593231201171875, 0.67730712890625, 0.761383056640625, 0.845458984375, 0.929534912109375, 1.01361083984375, 1.097686767578125, 1.1817626953125, 1.265838623046875, 1.34991455078125, 1.433990478515625, 1.51806640625, 1.602142333984375, 1.68621826171875, 1.770294189453125, 1.8543701171875, 1.938446044921875, 2.02252197265625, 2.106597900390625, 2.190673828125, 2.274749755859375, 2.35882568359375, 2.442901611328125, 2.5269775390625, 2.611053466796875, 2.69512939453125, 2.779205322265625, 2.86328125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 6.0, 9.0, 16.0, 26.0, 58.0, 84.0, 148.0, 266.0, 447.0, 842.0, 1472.0, 2768.0, 5060.0, 9364.0, 17503.0, 32728.0, 59845.0, 108044.0, 187057.0, 305963.0, 455555.0, 593994.0, 649487.0, 589793.0, 451813.0, 302134.0, 184192.0, 105952.0, 59463.0, 32055.0, 17396.0, 9191.0, 5271.0, 2779.0, 1507.0, 831.0, 492.0, 294.0, 153.0, 85.0, 60.0, 38.0, 25.0, 11.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.129180908203125, -3.00640869140625, -2.883636474609375, -2.7608642578125, -2.638092041015625, -2.51531982421875, -2.392547607421875, -2.269775390625, -2.147003173828125, -2.02423095703125, -1.901458740234375, -1.7786865234375, -1.655914306640625, -1.53314208984375, -1.410369873046875, -1.28759765625, -1.164825439453125, -1.04205322265625, -0.919281005859375, -0.7965087890625, -0.673736572265625, -0.55096435546875, -0.428192138671875, -0.305419921875, -0.182647705078125, -0.05987548828125, 0.062896728515625, 0.1856689453125, 0.308441162109375, 0.43121337890625, 0.553985595703125, 0.6767578125, 0.799530029296875, 0.92230224609375, 1.045074462890625, 1.1678466796875, 1.290618896484375, 1.41339111328125, 1.536163330078125, 1.658935546875, 1.781707763671875, 1.90447998046875, 2.027252197265625, 2.1500244140625, 2.272796630859375, 2.39556884765625, 2.518341064453125, 2.64111328125, 2.763885498046875, 2.88665771484375, 3.009429931640625, 3.1322021484375, 3.254974365234375, 3.37774658203125, 3.500518798828125, 3.623291015625, 3.746063232421875, 3.86883544921875, 3.991607666015625, 4.1143798828125, 4.237152099609375, 4.35992431640625, 4.482696533203125, 4.60546875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 5.0, 7.0, 17.0, 18.0, 29.0, 26.0, 42.0, 40.0, 64.0, 104.0, 96.0, 111.0, 139.0, 166.0, 181.0, 197.0, 190.0, 227.0, 221.0, 221.0, 225.0, 226.0, 236.0, 198.0, 159.0, 166.0, 139.0, 122.0, 102.0, 79.0, 66.0, 56.0, 50.0, 35.0, 27.0, 24.0, 15.0, 12.0, 4.0, 9.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.49609375, -1.4499359130859375, -1.403778076171875, -1.3576202392578125, -1.31146240234375, -1.2653045654296875, -1.219146728515625, -1.1729888916015625, -1.1268310546875, -1.0806732177734375, -1.034515380859375, -0.9883575439453125, -0.94219970703125, -0.8960418701171875, -0.849884033203125, -0.8037261962890625, -0.757568359375, -0.7114105224609375, -0.665252685546875, -0.6190948486328125, -0.57293701171875, -0.5267791748046875, -0.480621337890625, -0.4344635009765625, -0.3883056640625, -0.3421478271484375, -0.295989990234375, -0.2498321533203125, -0.20367431640625, -0.1575164794921875, -0.111358642578125, -0.0652008056640625, -0.01904296875, 0.0271148681640625, 0.073272705078125, 0.1194305419921875, 0.16558837890625, 0.2117462158203125, 0.257904052734375, 0.3040618896484375, 0.3502197265625, 0.3963775634765625, 0.442535400390625, 0.4886932373046875, 0.53485107421875, 0.5810089111328125, 0.627166748046875, 0.6733245849609375, 0.719482421875, 0.7656402587890625, 0.811798095703125, 0.8579559326171875, 0.90411376953125, 0.9502716064453125, 0.996429443359375, 1.0425872802734375, 1.0887451171875, 1.1349029541015625, 1.181060791015625, 1.2272186279296875, 1.27337646484375, 1.3195343017578125, 1.365692138671875, 1.4118499755859375, 1.4580078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 4.0, 3.0, 4.0, 13.0, 15.0, 12.0, 14.0, 21.0, 20.0, 18.0, 22.0, 21.0, 37.0, 43.0, 50.0, 51.0, 57.0, 60.0, 66.0, 47.0, 45.0, 65.0, 45.0, 33.0, 44.0, 31.0, 37.0, 25.0, 19.0, 15.0, 14.0, 15.0, 12.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.385538101196289, -4.245887279510498, -4.106236457824707, -3.966585397720337, -3.826934337615967, -3.687283515930176, -3.5476326942443848, -3.4079818725585938, -3.2683308124542236, -3.1286799907684326, -2.9890289306640625, -2.8493781089782715, -2.7097272872924805, -2.5700762271881104, -2.4304254055023193, -2.290774345397949, -2.151123523712158, -2.011472702026367, -1.871821641921997, -1.732170820236206, -1.5925198793411255, -1.452868938446045, -1.313218116760254, -1.1735671758651733, -1.0339162349700928, -0.8942652940750122, -0.7546144127845764, -0.6149635314941406, -0.47531259059906006, -0.3356616497039795, -0.1960107684135437, -0.05635988712310791, 0.08329057693481445, 0.22294148802757263, 0.3625923991203308, 0.5022432804107666, 0.6418942213058472, 0.7815451622009277, 0.9211960434913635, 1.0608469247817993, 1.2004978656768799, 1.3401488065719604, 1.479799747467041, 1.619450569152832, 1.7591015100479126, 1.8987524509429932, 2.038403272628784, 2.1780543327331543, 2.3177051544189453, 2.4573559761047363, 2.5970070362091064, 2.7366578578948975, 2.8763089179992676, 3.0159597396850586, 3.1556105613708496, 3.2952613830566406, 3.4349124431610107, 3.5745632648468018, 3.714214324951172, 3.853865146636963, 3.993515968322754, 4.133167266845703, 4.272818088531494, 4.412468910217285, 4.552119731903076]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 6.0, 7.0, 11.0, 11.0, 14.0, 12.0, 21.0, 19.0, 24.0, 25.0, 31.0, 21.0, 26.0, 34.0, 34.0, 50.0, 42.0, 44.0, 36.0, 37.0, 38.0, 39.0, 43.0, 48.0, 26.0, 30.0, 33.0, 32.0, 21.0, 24.0, 31.0, 16.0, 20.0, 12.0, 10.0, 12.0, 10.0, 8.0, 5.0, 12.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9760704040527344, -2.873430013656616, -2.770789861679077, -2.668149471282959, -2.56550931930542, -2.4628689289093018, -2.3602285385131836, -2.2575883865356445, -2.1549482345581055, -2.0523078441619873, -1.9496676921844482, -1.84702730178833, -1.744387149810791, -1.6417467594146729, -1.5391064882278442, -1.4364662170410156, -1.3338258266448975, -1.2311855554580688, -1.1285452842712402, -1.025904893875122, -0.9232646822929382, -0.8206244111061096, -0.7179840803146362, -0.6153438091278076, -0.512703537940979, -0.4100632667541504, -0.3074229657649994, -0.2047826647758484, -0.10214239358901978, 0.0004978775978088379, 0.10313820838928223, 0.20577847957611084, 0.30841851234436035, 0.41105878353118896, 0.5136990547180176, 0.616339385509491, 0.7189796566963196, 0.8216199278831482, 0.9242602586746216, 1.0269005298614502, 1.1295408010482788, 1.2321810722351074, 1.334821343421936, 1.4374616146087646, 1.5401020050048828, 1.6427421569824219, 1.74538254737854, 1.8480228185653687, 1.9506630897521973, 2.0533034801483154, 2.1559436321258545, 2.2585840225219727, 2.3612241744995117, 2.46386456489563, 2.566504955291748, 2.669145107269287, 2.771785259246826, 2.8744256496429443, 2.9770658016204834, 3.0797061920166016, 3.1823463439941406, 3.284986734390259, 3.387627124786377, 3.490267276763916, 3.592907667160034]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 9.0, 20.0, 23.0, 49.0, 67.0, 104.0, 116.0, 204.0, 290.0, 465.0, 680.0, 1057.0, 1633.0, 2569.0, 4080.0, 6452.0, 10108.0, 16753.0, 27355.0, 45310.0, 74161.0, 118910.0, 171639.0, 186563.0, 142460.0, 92239.0, 56236.0, 34084.0, 20730.0, 12617.0, 7867.0, 4852.0, 3114.0, 2021.0, 1302.0, 848.0, 512.0, 365.0, 219.0, 161.0, 95.0, 71.0, 42.0, 45.0, 17.0, 17.0, 9.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.8894805908203125, -0.859039306640625, -0.8285980224609375, -0.79815673828125, -0.7677154541015625, -0.737274169921875, -0.7068328857421875, -0.6763916015625, -0.6459503173828125, -0.615509033203125, -0.5850677490234375, -0.55462646484375, -0.5241851806640625, -0.493743896484375, -0.4633026123046875, -0.432861328125, -0.4024200439453125, -0.371978759765625, -0.3415374755859375, -0.31109619140625, -0.2806549072265625, -0.250213623046875, -0.2197723388671875, -0.1893310546875, -0.1588897705078125, -0.128448486328125, -0.0980072021484375, -0.06756591796875, -0.0371246337890625, -0.006683349609375, 0.0237579345703125, 0.05419921875, 0.0846405029296875, 0.115081787109375, 0.1455230712890625, 0.17596435546875, 0.2064056396484375, 0.236846923828125, 0.2672882080078125, 0.2977294921875, 0.3281707763671875, 0.358612060546875, 0.3890533447265625, 0.41949462890625, 0.4499359130859375, 0.480377197265625, 0.5108184814453125, 0.541259765625, 0.5717010498046875, 0.602142333984375, 0.6325836181640625, 0.66302490234375, 0.6934661865234375, 0.723907470703125, 0.7543487548828125, 0.7847900390625, 0.8152313232421875, 0.845672607421875, 0.8761138916015625, 0.90655517578125, 0.9369964599609375, 0.967437744140625, 0.9978790283203125, 1.0283203125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 14.0, 11.0, 10.0, 14.0, 24.0, 14.0, 23.0, 27.0, 25.0, 27.0, 29.0, 35.0, 39.0, 33.0, 35.0, 35.0, 42.0, 50.0, 42.0, 43.0, 40.0, 40.0, 25.0, 41.0, 40.0, 37.0, 26.0, 20.0, 21.0, 18.0, 20.0, 11.0, 11.0, 14.0, 13.0, 4.0, 9.0, 9.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24609375, -3.13641357421875, -3.0267333984375, -2.91705322265625, -2.807373046875, -2.69769287109375, -2.5880126953125, -2.47833251953125, -2.36865234375, -2.25897216796875, -2.1492919921875, -2.03961181640625, -1.929931640625, -1.82025146484375, -1.7105712890625, -1.60089111328125, -1.4912109375, -1.38153076171875, -1.2718505859375, -1.16217041015625, -1.052490234375, -0.94281005859375, -0.8331298828125, -0.72344970703125, -0.61376953125, -0.50408935546875, -0.3944091796875, -0.28472900390625, -0.175048828125, -0.06536865234375, 0.0443115234375, 0.15399169921875, 0.263671875, 0.37335205078125, 0.4830322265625, 0.59271240234375, 0.702392578125, 0.81207275390625, 0.9217529296875, 1.03143310546875, 1.14111328125, 1.25079345703125, 1.3604736328125, 1.47015380859375, 1.579833984375, 1.68951416015625, 1.7991943359375, 1.90887451171875, 2.0185546875, 2.12823486328125, 2.2379150390625, 2.34759521484375, 2.457275390625, 2.56695556640625, 2.6766357421875, 2.78631591796875, 2.89599609375, 3.00567626953125, 3.1153564453125, 3.22503662109375, 3.334716796875, 3.44439697265625, 3.5540771484375, 3.66375732421875, 3.7734375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 15.0, 20.0, 25.0, 50.0, 57.0, 84.0, 146.0, 212.0, 319.0, 552.0, 786.0, 1264.0, 2142.0, 3805.0, 6652.0, 12122.0, 22112.0, 41524.0, 77740.0, 146225.0, 236801.0, 220025.0, 127838.0, 68075.0, 36261.0, 18933.0, 10498.0, 5882.0, 3353.0, 1913.0, 1061.0, 739.0, 447.0, 302.0, 184.0, 124.0, 89.0, 51.0, 40.0, 27.0, 17.0, 10.0, 11.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.154296875, -1.1169281005859375, -1.079559326171875, -1.0421905517578125, -1.00482177734375, -0.9674530029296875, -0.930084228515625, -0.8927154541015625, -0.8553466796875, -0.8179779052734375, -0.780609130859375, -0.7432403564453125, -0.70587158203125, -0.6685028076171875, -0.631134033203125, -0.5937652587890625, -0.556396484375, -0.5190277099609375, -0.481658935546875, -0.4442901611328125, -0.40692138671875, -0.3695526123046875, -0.332183837890625, -0.2948150634765625, -0.2574462890625, -0.2200775146484375, -0.182708740234375, -0.1453399658203125, -0.10797119140625, -0.0706024169921875, -0.033233642578125, 0.0041351318359375, 0.04150390625, 0.0788726806640625, 0.116241455078125, 0.1536102294921875, 0.19097900390625, 0.2283477783203125, 0.265716552734375, 0.3030853271484375, 0.3404541015625, 0.3778228759765625, 0.415191650390625, 0.4525604248046875, 0.48992919921875, 0.5272979736328125, 0.564666748046875, 0.6020355224609375, 0.639404296875, 0.6767730712890625, 0.714141845703125, 0.7515106201171875, 0.78887939453125, 0.8262481689453125, 0.863616943359375, 0.9009857177734375, 0.9383544921875, 0.9757232666015625, 1.013092041015625, 1.0504608154296875, 1.08782958984375, 1.1251983642578125, 1.162567138671875, 1.1999359130859375, 1.2373046875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 6.0, 7.0, 11.0, 14.0, 12.0, 18.0, 14.0, 25.0, 32.0, 22.0, 23.0, 18.0, 36.0, 39.0, 32.0, 33.0, 41.0, 44.0, 37.0, 33.0, 36.0, 41.0, 42.0, 27.0, 29.0, 27.0, 34.0, 31.0, 31.0, 25.0, 16.0, 26.0, 19.0, 24.0, 13.0, 15.0, 12.0, 10.0, 4.0, 8.0, 5.0, 7.0, 6.0, 1.0, 0.0, 2.0, 5.0, 0.0, 0.0, 3.0], "bins": [-2.1796875, -2.1142578125, -2.048828125, -1.9833984375, -1.91796875, -1.8525390625, -1.787109375, -1.7216796875, -1.65625, -1.5908203125, -1.525390625, -1.4599609375, -1.39453125, -1.3291015625, -1.263671875, -1.1982421875, -1.1328125, -1.0673828125, -1.001953125, -0.9365234375, -0.87109375, -0.8056640625, -0.740234375, -0.6748046875, -0.609375, -0.5439453125, -0.478515625, -0.4130859375, -0.34765625, -0.2822265625, -0.216796875, -0.1513671875, -0.0859375, -0.0205078125, 0.044921875, 0.1103515625, 0.17578125, 0.2412109375, 0.306640625, 0.3720703125, 0.4375, 0.5029296875, 0.568359375, 0.6337890625, 0.69921875, 0.7646484375, 0.830078125, 0.8955078125, 0.9609375, 1.0263671875, 1.091796875, 1.1572265625, 1.22265625, 1.2880859375, 1.353515625, 1.4189453125, 1.484375, 1.5498046875, 1.615234375, 1.6806640625, 1.74609375, 1.8115234375, 1.876953125, 1.9423828125, 2.0078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 10.0, 6.0, 18.0, 22.0, 41.0, 57.0, 55.0, 69.0, 106.0, 145.0, 218.0, 328.0, 491.0, 706.0, 1139.0, 2088.0, 4571.0, 11869.0, 43029.0, 225615.0, 574687.0, 136557.0, 29170.0, 8968.0, 3665.0, 1838.0, 1036.0, 628.0, 432.0, 282.0, 201.0, 147.0, 95.0, 63.0, 53.0, 29.0, 36.0, 28.0, 9.0, 10.0, 10.0, 3.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.744140625, -0.7211456298828125, -0.698150634765625, -0.6751556396484375, -0.65216064453125, -0.6291656494140625, -0.606170654296875, -0.5831756591796875, -0.5601806640625, -0.5371856689453125, -0.514190673828125, -0.4911956787109375, -0.46820068359375, -0.4452056884765625, -0.422210693359375, -0.3992156982421875, -0.376220703125, -0.3532257080078125, -0.330230712890625, -0.3072357177734375, -0.28424072265625, -0.2612457275390625, -0.238250732421875, -0.2152557373046875, -0.1922607421875, -0.1692657470703125, -0.146270751953125, -0.1232757568359375, -0.10028076171875, -0.0772857666015625, -0.054290771484375, -0.0312957763671875, -0.00830078125, 0.0146942138671875, 0.037689208984375, 0.0606842041015625, 0.08367919921875, 0.1066741943359375, 0.129669189453125, 0.1526641845703125, 0.1756591796875, 0.1986541748046875, 0.221649169921875, 0.2446441650390625, 0.26763916015625, 0.2906341552734375, 0.313629150390625, 0.3366241455078125, 0.359619140625, 0.3826141357421875, 0.405609130859375, 0.4286041259765625, 0.45159912109375, 0.4745941162109375, 0.497589111328125, 0.5205841064453125, 0.5435791015625, 0.5665740966796875, 0.589569091796875, 0.6125640869140625, 0.63555908203125, 0.6585540771484375, 0.681549072265625, 0.7045440673828125, 0.7275390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 10.0, 14.0, 25.0, 33.0, 38.0, 34.0, 56.0, 74.0, 81.0, 73.0, 77.0, 79.0, 86.0, 54.0, 55.0, 35.0, 36.0, 31.0, 21.0, 21.0, 11.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.224611282348633e-05, -3.1286850571632385e-05, -3.0327588319778442e-05, -2.93683260679245e-05, -2.8409063816070557e-05, -2.7449801564216614e-05, -2.649053931236267e-05, -2.5531277060508728e-05, -2.4572014808654785e-05, -2.3612752556800842e-05, -2.26534903049469e-05, -2.1694228053092957e-05, -2.0734965801239014e-05, -1.977570354938507e-05, -1.8816441297531128e-05, -1.7857179045677185e-05, -1.6897916793823242e-05, -1.59386545419693e-05, -1.4979392290115356e-05, -1.4020130038261414e-05, -1.306086778640747e-05, -1.2101605534553528e-05, -1.1142343282699585e-05, -1.0183081030845642e-05, -9.2238187789917e-06, -8.264556527137756e-06, -7.3052942752838135e-06, -6.346032023429871e-06, -5.386769771575928e-06, -4.427507519721985e-06, -3.468245267868042e-06, -2.508983016014099e-06, -1.5497207641601562e-06, -5.904585123062134e-07, 3.688037395477295e-07, 1.3280659914016724e-06, 2.2873282432556152e-06, 3.246590495109558e-06, 4.205852746963501e-06, 5.165114998817444e-06, 6.124377250671387e-06, 7.08363950252533e-06, 8.042901754379272e-06, 9.002164006233215e-06, 9.961426258087158e-06, 1.0920688509941101e-05, 1.1879950761795044e-05, 1.2839213013648987e-05, 1.379847526550293e-05, 1.4757737517356873e-05, 1.5716999769210815e-05, 1.6676262021064758e-05, 1.76355242729187e-05, 1.8594786524772644e-05, 1.9554048776626587e-05, 2.051331102848053e-05, 2.1472573280334473e-05, 2.2431835532188416e-05, 2.339109778404236e-05, 2.43503600358963e-05, 2.5309622287750244e-05, 2.6268884539604187e-05, 2.722814679145813e-05, 2.8187409043312073e-05, 2.9146671295166016e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 13.0, 14.0, 24.0, 29.0, 40.0, 60.0, 63.0, 105.0, 166.0, 224.0, 301.0, 493.0, 759.0, 1158.0, 1947.0, 3335.0, 5687.0, 10510.0, 21169.0, 47046.0, 117903.0, 295628.0, 313971.0, 128497.0, 50694.0, 22481.0, 11090.0, 5940.0, 3455.0, 1991.0, 1284.0, 772.0, 544.0, 352.0, 260.0, 152.0, 118.0, 73.0, 51.0, 41.0, 28.0, 22.0, 12.0, 8.0, 8.0, 8.0, 3.0, 4.0, 5.0, 4.0, 2.0, 2.0], "bins": [-0.59375, -0.5763092041015625, -0.558868408203125, -0.5414276123046875, -0.52398681640625, -0.5065460205078125, -0.489105224609375, -0.4716644287109375, -0.4542236328125, -0.4367828369140625, -0.419342041015625, -0.4019012451171875, -0.38446044921875, -0.3670196533203125, -0.349578857421875, -0.3321380615234375, -0.314697265625, -0.2972564697265625, -0.279815673828125, -0.2623748779296875, -0.24493408203125, -0.2274932861328125, -0.210052490234375, -0.1926116943359375, -0.1751708984375, -0.1577301025390625, -0.140289306640625, -0.1228485107421875, -0.10540771484375, -0.0879669189453125, -0.070526123046875, -0.0530853271484375, -0.03564453125, -0.0182037353515625, -0.000762939453125, 0.0166778564453125, 0.03411865234375, 0.0515594482421875, 0.069000244140625, 0.0864410400390625, 0.1038818359375, 0.1213226318359375, 0.138763427734375, 0.1562042236328125, 0.17364501953125, 0.1910858154296875, 0.208526611328125, 0.2259674072265625, 0.243408203125, 0.2608489990234375, 0.278289794921875, 0.2957305908203125, 0.31317138671875, 0.3306121826171875, 0.348052978515625, 0.3654937744140625, 0.3829345703125, 0.4003753662109375, 0.417816162109375, 0.4352569580078125, 0.45269775390625, 0.4701385498046875, 0.487579345703125, 0.5050201416015625, 0.5224609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 12.0, 7.0, 15.0, 14.0, 28.0, 43.0, 58.0, 69.0, 87.0, 98.0, 93.0, 94.0, 90.0, 67.0, 57.0, 43.0, 29.0, 23.0, 14.0, 10.0, 11.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1844482421875, -0.17952919006347656, -0.17461013793945312, -0.1696910858154297, -0.16477203369140625, -0.1598529815673828, -0.15493392944335938, -0.15001487731933594, -0.1450958251953125, -0.14017677307128906, -0.13525772094726562, -0.1303386688232422, -0.12541961669921875, -0.12050056457519531, -0.11558151245117188, -0.11066246032714844, -0.105743408203125, -0.10082435607910156, -0.09590530395507812, -0.09098625183105469, -0.08606719970703125, -0.08114814758300781, -0.07622909545898438, -0.07131004333496094, -0.0663909912109375, -0.06147193908691406, -0.056552886962890625, -0.05163383483886719, -0.04671478271484375, -0.04179573059082031, -0.036876678466796875, -0.03195762634277344, -0.02703857421875, -0.022119522094726562, -0.017200469970703125, -0.012281417846679688, -0.00736236572265625, -0.0024433135986328125, 0.002475738525390625, 0.0073947906494140625, 0.0123138427734375, 0.017232894897460938, 0.022151947021484375, 0.027070999145507812, 0.03199005126953125, 0.03690910339355469, 0.041828155517578125, 0.04674720764160156, 0.051666259765625, 0.05658531188964844, 0.061504364013671875, 0.06642341613769531, 0.07134246826171875, 0.07626152038574219, 0.08118057250976562, 0.08609962463378906, 0.0910186767578125, 0.09593772888183594, 0.10085678100585938, 0.10577583312988281, 0.11069488525390625, 0.11561393737792969, 0.12053298950195312, 0.12545204162597656, 0.13037109375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 10.0, 10.0, 19.0, 17.0, 13.0, 23.0, 19.0, 25.0, 26.0, 30.0, 41.0, 57.0, 48.0, 69.0, 53.0, 65.0, 49.0, 54.0, 54.0, 52.0, 26.0, 47.0, 29.0, 34.0, 23.0, 17.0, 18.0, 15.0, 16.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.429186820983887, -4.28815221786499, -4.147117614746094, -4.006083011627197, -3.865048408508301, -3.7240138053894043, -3.582979440689087, -3.4419448375701904, -3.300910234451294, -3.1598756313323975, -3.018841028213501, -2.8778064250946045, -2.736772060394287, -2.5957374572753906, -2.454702854156494, -2.3136682510375977, -2.172633647918701, -2.0315990447998047, -1.8905644416809082, -1.7495299577713013, -1.6084953546524048, -1.4674607515335083, -1.3264262676239014, -1.1853916645050049, -1.0443570613861084, -0.9033224582672119, -0.7622879147529602, -0.6212533712387085, -0.480218768119812, -0.3391841650009155, -0.19814962148666382, -0.05711507797241211, 0.08392000198364258, 0.22495457530021667, 0.36598914861679077, 0.5070236921310425, 0.648058295249939, 0.7890928983688354, 0.9301274418830872, 1.0711619853973389, 1.2121965885162354, 1.3532311916351318, 1.4942657947540283, 1.6353002786636353, 1.7763348817825317, 1.9173694849014282, 2.058403968811035, 2.1994385719299316, 2.340473175048828, 2.4815077781677246, 2.622542381286621, 2.7635769844055176, 2.904611587524414, 3.0456461906433105, 3.186680555343628, 3.3277151584625244, 3.468749761581421, 3.6097843647003174, 3.750818967819214, 3.8918535709381104, 4.032887935638428, 4.173922538757324, 4.314957141876221, 4.455991744995117, 4.597026348114014]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 9.0, 7.0, 11.0, 8.0, 10.0, 14.0, 18.0, 17.0, 18.0, 23.0, 34.0, 27.0, 18.0, 31.0, 33.0, 36.0, 47.0, 39.0, 48.0, 34.0, 38.0, 37.0, 41.0, 45.0, 41.0, 30.0, 26.0, 34.0, 30.0, 24.0, 20.0, 33.0, 18.0, 16.0, 15.0, 8.0, 14.0, 9.0, 6.0, 7.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9540483951568604, -2.852355480194092, -2.7506625652313232, -2.6489696502685547, -2.547276496887207, -2.4455835819244385, -2.34389066696167, -2.2421977519989014, -2.140504837036133, -2.0388119220733643, -1.9371188879013062, -1.8354259729385376, -1.7337329387664795, -1.632040023803711, -1.5303471088409424, -1.4286541938781738, -1.3269610404968262, -1.2252681255340576, -1.1235750913619995, -1.021882176399231, -0.9201892018318176, -0.8184962272644043, -0.7168033123016357, -0.6151103377342224, -0.5134173631668091, -0.41172438859939575, -0.3100314438343048, -0.20833849906921387, -0.10664552450180054, -0.004952549934387207, 0.09674036502838135, 0.19843333959579468, 0.300126314163208, 0.40181928873062134, 0.5035122632980347, 0.6052051782608032, 0.7068981528282166, 0.8085911273956299, 0.9102840423583984, 1.011976957321167, 1.113669991493225, 1.2153629064559937, 1.3170559406280518, 1.4187488555908203, 1.5204417705535889, 1.622134804725647, 1.7238277196884155, 1.8255207538604736, 1.9272136688232422, 2.0289065837860107, 2.1305994987487793, 2.232292652130127, 2.3339855670928955, 2.435678482055664, 2.5373713970184326, 2.639064311981201, 2.740757465362549, 2.8424503803253174, 2.944143295288086, 3.0458364486694336, 3.147529363632202, 3.2492222785949707, 3.3509151935577393, 3.452608108520508, 3.5543010234832764]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 13.0, 13.0, 20.0, 28.0, 47.0, 60.0, 99.0, 160.0, 239.0, 393.0, 594.0, 968.0, 1516.0, 2390.0, 3674.0, 5566.0, 8210.0, 12516.0, 18180.0, 26407.0, 36560.0, 50129.0, 64335.0, 79822.0, 93537.0, 101687.0, 102782.0, 96537.0, 85124.0, 69926.0, 54490.0, 40690.0, 29625.0, 20469.0, 14023.0, 9463.0, 6390.0, 4187.0, 2668.0, 1789.0, 1186.0, 732.0, 482.0, 311.0, 192.0, 129.0, 89.0, 41.0, 31.0, 16.0, 11.0, 7.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.13323974609375, -2.0574951171875, -1.98175048828125, -1.906005859375, -1.83026123046875, -1.7545166015625, -1.67877197265625, -1.60302734375, -1.52728271484375, -1.4515380859375, -1.37579345703125, -1.300048828125, -1.22430419921875, -1.1485595703125, -1.07281494140625, -0.9970703125, -0.92132568359375, -0.8455810546875, -0.76983642578125, -0.694091796875, -0.61834716796875, -0.5426025390625, -0.46685791015625, -0.39111328125, -0.31536865234375, -0.2396240234375, -0.16387939453125, -0.088134765625, -0.01239013671875, 0.0633544921875, 0.13909912109375, 0.21484375, 0.29058837890625, 0.3663330078125, 0.44207763671875, 0.517822265625, 0.59356689453125, 0.6693115234375, 0.74505615234375, 0.82080078125, 0.89654541015625, 0.9722900390625, 1.04803466796875, 1.123779296875, 1.19952392578125, 1.2752685546875, 1.35101318359375, 1.4267578125, 1.50250244140625, 1.5782470703125, 1.65399169921875, 1.729736328125, 1.80548095703125, 1.8812255859375, 1.95697021484375, 2.03271484375, 2.10845947265625, 2.1842041015625, 2.25994873046875, 2.335693359375, 2.41143798828125, 2.4871826171875, 2.56292724609375, 2.638671875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 7.0, 13.0, 13.0, 9.0, 15.0, 14.0, 9.0, 19.0, 17.0, 23.0, 22.0, 29.0, 25.0, 36.0, 39.0, 35.0, 31.0, 34.0, 50.0, 47.0, 37.0, 49.0, 34.0, 44.0, 55.0, 42.0, 37.0, 28.0, 27.0, 19.0, 19.0, 19.0, 16.0, 15.0, 15.0, 8.0, 10.0, 7.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.466796875, -3.354156494140625, -3.24151611328125, -3.128875732421875, -3.0162353515625, -2.903594970703125, -2.79095458984375, -2.678314208984375, -2.565673828125, -2.453033447265625, -2.34039306640625, -2.227752685546875, -2.1151123046875, -2.002471923828125, -1.88983154296875, -1.777191162109375, -1.66455078125, -1.551910400390625, -1.43927001953125, -1.326629638671875, -1.2139892578125, -1.101348876953125, -0.98870849609375, -0.876068115234375, -0.763427734375, -0.650787353515625, -0.53814697265625, -0.425506591796875, -0.3128662109375, -0.200225830078125, -0.08758544921875, 0.025054931640625, 0.1376953125, 0.250335693359375, 0.36297607421875, 0.475616455078125, 0.5882568359375, 0.700897216796875, 0.81353759765625, 0.926177978515625, 1.038818359375, 1.151458740234375, 1.26409912109375, 1.376739501953125, 1.4893798828125, 1.602020263671875, 1.71466064453125, 1.827301025390625, 1.93994140625, 2.052581787109375, 2.16522216796875, 2.277862548828125, 2.3905029296875, 2.503143310546875, 2.61578369140625, 2.728424072265625, 2.841064453125, 2.953704833984375, 3.06634521484375, 3.178985595703125, 3.2916259765625, 3.404266357421875, 3.51690673828125, 3.629547119140625, 3.7421875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 16.0, 15.0, 28.0, 35.0, 54.0, 109.0, 148.0, 266.0, 337.0, 493.0, 774.0, 1201.0, 1863.0, 2904.0, 4411.0, 6747.0, 10390.0, 15592.0, 23096.0, 33357.0, 46242.0, 62439.0, 80160.0, 95481.0, 107104.0, 109050.0, 102590.0, 89626.0, 72488.0, 54885.0, 40612.0, 28455.0, 19570.0, 13054.0, 8627.0, 5700.0, 3695.0, 2430.0, 1576.0, 972.0, 674.0, 434.0, 252.0, 203.0, 127.0, 92.0, 62.0, 48.0, 19.0, 16.0, 10.0, 6.0, 4.0, 1.0, 4.0, 1.0, 3.0], "bins": [-2.5390625, -2.460418701171875, -2.38177490234375, -2.303131103515625, -2.2244873046875, -2.145843505859375, -2.06719970703125, -1.988555908203125, -1.909912109375, -1.831268310546875, -1.75262451171875, -1.673980712890625, -1.5953369140625, -1.516693115234375, -1.43804931640625, -1.359405517578125, -1.28076171875, -1.202117919921875, -1.12347412109375, -1.044830322265625, -0.9661865234375, -0.887542724609375, -0.80889892578125, -0.730255126953125, -0.651611328125, -0.572967529296875, -0.49432373046875, -0.415679931640625, -0.3370361328125, -0.258392333984375, -0.17974853515625, -0.101104736328125, -0.0224609375, 0.056182861328125, 0.13482666015625, 0.213470458984375, 0.2921142578125, 0.370758056640625, 0.44940185546875, 0.528045654296875, 0.606689453125, 0.685333251953125, 0.76397705078125, 0.842620849609375, 0.9212646484375, 0.999908447265625, 1.07855224609375, 1.157196044921875, 1.23583984375, 1.314483642578125, 1.39312744140625, 1.471771240234375, 1.5504150390625, 1.629058837890625, 1.70770263671875, 1.786346435546875, 1.864990234375, 1.943634033203125, 2.02227783203125, 2.100921630859375, 2.1795654296875, 2.258209228515625, 2.33685302734375, 2.415496826171875, 2.494140625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 8.0, 6.0, 13.0, 17.0, 11.0, 15.0, 23.0, 24.0, 18.0, 27.0, 26.0, 42.0, 46.0, 47.0, 40.0, 51.0, 50.0, 42.0, 40.0, 47.0, 40.0, 34.0, 50.0, 27.0, 45.0, 36.0, 24.0, 22.0, 18.0, 20.0, 13.0, 20.0, 14.0, 4.0, 12.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.240234375, -2.167510986328125, -2.09478759765625, -2.022064208984375, -1.9493408203125, -1.876617431640625, -1.80389404296875, -1.731170654296875, -1.658447265625, -1.585723876953125, -1.51300048828125, -1.440277099609375, -1.3675537109375, -1.294830322265625, -1.22210693359375, -1.149383544921875, -1.07666015625, -1.003936767578125, -0.93121337890625, -0.858489990234375, -0.7857666015625, -0.713043212890625, -0.64031982421875, -0.567596435546875, -0.494873046875, -0.422149658203125, -0.34942626953125, -0.276702880859375, -0.2039794921875, -0.131256103515625, -0.05853271484375, 0.014190673828125, 0.0869140625, 0.159637451171875, 0.23236083984375, 0.305084228515625, 0.3778076171875, 0.450531005859375, 0.52325439453125, 0.595977783203125, 0.668701171875, 0.741424560546875, 0.81414794921875, 0.886871337890625, 0.9595947265625, 1.032318115234375, 1.10504150390625, 1.177764892578125, 1.25048828125, 1.323211669921875, 1.39593505859375, 1.468658447265625, 1.5413818359375, 1.614105224609375, 1.68682861328125, 1.759552001953125, 1.832275390625, 1.904998779296875, 1.97772216796875, 2.050445556640625, 2.1231689453125, 2.195892333984375, 2.26861572265625, 2.341339111328125, 2.4140625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 3.0, 9.0, 12.0, 26.0, 29.0, 48.0, 74.0, 127.0, 186.0, 281.0, 481.0, 677.0, 1104.0, 1828.0, 3184.0, 5109.0, 8688.0, 14578.0, 24126.0, 39769.0, 63060.0, 93872.0, 126163.0, 148514.0, 147447.0, 123459.0, 90150.0, 60083.0, 37565.0, 23064.0, 13889.0, 8221.0, 4924.0, 2971.0, 1845.0, 1095.0, 674.0, 425.0, 298.0, 169.0, 122.0, 80.0, 55.0, 28.0, 12.0, 10.0, 5.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6416015625, -1.5932464599609375, -1.544891357421875, -1.4965362548828125, -1.44818115234375, -1.3998260498046875, -1.351470947265625, -1.3031158447265625, -1.2547607421875, -1.2064056396484375, -1.158050537109375, -1.1096954345703125, -1.06134033203125, -1.0129852294921875, -0.964630126953125, -0.9162750244140625, -0.867919921875, -0.8195648193359375, -0.771209716796875, -0.7228546142578125, -0.67449951171875, -0.6261444091796875, -0.577789306640625, -0.5294342041015625, -0.4810791015625, -0.4327239990234375, -0.384368896484375, -0.3360137939453125, -0.28765869140625, -0.2393035888671875, -0.190948486328125, -0.1425933837890625, -0.09423828125, -0.0458831787109375, 0.002471923828125, 0.0508270263671875, 0.09918212890625, 0.1475372314453125, 0.195892333984375, 0.2442474365234375, 0.2926025390625, 0.3409576416015625, 0.389312744140625, 0.4376678466796875, 0.48602294921875, 0.5343780517578125, 0.582733154296875, 0.6310882568359375, 0.679443359375, 0.7277984619140625, 0.776153564453125, 0.8245086669921875, 0.87286376953125, 0.9212188720703125, 0.969573974609375, 1.0179290771484375, 1.0662841796875, 1.1146392822265625, 1.162994384765625, 1.2113494873046875, 1.25970458984375, 1.3080596923828125, 1.356414794921875, 1.4047698974609375, 1.453125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 8.0, 9.0, 5.0, 6.0, 7.0, 3.0, 9.0, 19.0, 17.0, 19.0, 20.0, 26.0, 30.0, 41.0, 46.0, 45.0, 52.0, 43.0, 67.0, 51.0, 46.0, 51.0, 55.0, 49.0, 51.0, 43.0, 37.0, 31.0, 31.0, 16.0, 19.0, 16.0, 8.0, 2.0, 7.0, 4.0, 4.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.000171661376953125, -0.00016713328659534454, -0.0001626051962375641, -0.00015807710587978363, -0.00015354901552200317, -0.00014902092516422272, -0.00014449283480644226, -0.0001399647444486618, -0.00013543665409088135, -0.0001309085637331009, -0.00012638047337532043, -0.00012185238301753998, -0.00011732429265975952, -0.00011279620230197906, -0.00010826811194419861, -0.00010374002158641815, -9.92119312286377e-05, -9.468384087085724e-05, -9.015575051307678e-05, -8.562766015529633e-05, -8.109956979751587e-05, -7.657147943973541e-05, -7.204338908195496e-05, -6.75152987241745e-05, -6.298720836639404e-05, -5.8459118008613586e-05, -5.393102765083313e-05, -4.940293729305267e-05, -4.487484693527222e-05, -4.034675657749176e-05, -3.5818666219711304e-05, -3.129057586193085e-05, -2.676248550415039e-05, -2.2234395146369934e-05, -1.7706304788589478e-05, -1.3178214430809021e-05, -8.650124073028564e-06, -4.122033715248108e-06, 4.0605664253234863e-07, 4.934147000312805e-06, 9.462237358093262e-06, 1.3990327715873718e-05, 1.8518418073654175e-05, 2.304650843143463e-05, 2.7574598789215088e-05, 3.2102689146995544e-05, 3.6630779504776e-05, 4.115886986255646e-05, 4.5686960220336914e-05, 5.021505057811737e-05, 5.474314093589783e-05, 5.9271231293678284e-05, 6.379932165145874e-05, 6.83274120092392e-05, 7.285550236701965e-05, 7.738359272480011e-05, 8.191168308258057e-05, 8.643977344036102e-05, 9.096786379814148e-05, 9.549595415592194e-05, 0.00010002404451370239, 0.00010455213487148285, 0.0001090802252292633, 0.00011360831558704376, 0.00011813640594482422]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 10.0, 15.0, 15.0, 44.0, 67.0, 72.0, 142.0, 213.0, 287.0, 480.0, 773.0, 1197.0, 1930.0, 3084.0, 4797.0, 7846.0, 12708.0, 19849.0, 31622.0, 47947.0, 69631.0, 96274.0, 121327.0, 133927.0, 129822.0, 110446.0, 84647.0, 59978.0, 39914.0, 25828.0, 16438.0, 10280.0, 6332.0, 3974.0, 2395.0, 1493.0, 982.0, 631.0, 396.0, 258.0, 180.0, 113.0, 60.0, 51.0, 28.0, 20.0, 10.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2705078125, -1.22784423828125, -1.1851806640625, -1.14251708984375, -1.099853515625, -1.05718994140625, -1.0145263671875, -0.97186279296875, -0.92919921875, -0.88653564453125, -0.8438720703125, -0.80120849609375, -0.758544921875, -0.71588134765625, -0.6732177734375, -0.63055419921875, -0.587890625, -0.54522705078125, -0.5025634765625, -0.45989990234375, -0.417236328125, -0.37457275390625, -0.3319091796875, -0.28924560546875, -0.24658203125, -0.20391845703125, -0.1612548828125, -0.11859130859375, -0.075927734375, -0.03326416015625, 0.0093994140625, 0.05206298828125, 0.0947265625, 0.13739013671875, 0.1800537109375, 0.22271728515625, 0.265380859375, 0.30804443359375, 0.3507080078125, 0.39337158203125, 0.43603515625, 0.47869873046875, 0.5213623046875, 0.56402587890625, 0.606689453125, 0.64935302734375, 0.6920166015625, 0.73468017578125, 0.77734375, 0.82000732421875, 0.8626708984375, 0.90533447265625, 0.947998046875, 0.99066162109375, 1.0333251953125, 1.07598876953125, 1.11865234375, 1.16131591796875, 1.2039794921875, 1.24664306640625, 1.289306640625, 1.33197021484375, 1.3746337890625, 1.41729736328125, 1.4599609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 3.0, 10.0, 5.0, 7.0, 12.0, 18.0, 18.0, 17.0, 16.0, 28.0, 33.0, 29.0, 35.0, 42.0, 41.0, 38.0, 53.0, 48.0, 53.0, 48.0, 44.0, 57.0, 39.0, 44.0, 40.0, 27.0, 27.0, 31.0, 31.0, 20.0, 18.0, 11.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.466064453125, -0.4508399963378906, -0.43561553955078125, -0.4203910827636719, -0.4051666259765625, -0.3899421691894531, -0.37471771240234375, -0.3594932556152344, -0.344268798828125, -0.3290443420410156, -0.31381988525390625, -0.2985954284667969, -0.2833709716796875, -0.2681465148925781, -0.25292205810546875, -0.23769760131835938, -0.22247314453125, -0.20724868774414062, -0.19202423095703125, -0.17679977416992188, -0.1615753173828125, -0.14635086059570312, -0.13112640380859375, -0.11590194702148438, -0.100677490234375, -0.08545303344726562, -0.07022857666015625, -0.055004119873046875, -0.0397796630859375, -0.024555206298828125, -0.00933074951171875, 0.005893707275390625, 0.0211181640625, 0.036342620849609375, 0.05156707763671875, 0.06679153442382812, 0.0820159912109375, 0.09724044799804688, 0.11246490478515625, 0.12768936157226562, 0.142913818359375, 0.15813827514648438, 0.17336273193359375, 0.18858718872070312, 0.2038116455078125, 0.21903610229492188, 0.23426055908203125, 0.24948501586914062, 0.26470947265625, 0.2799339294433594, 0.29515838623046875, 0.3103828430175781, 0.3256072998046875, 0.3408317565917969, 0.35605621337890625, 0.3712806701660156, 0.386505126953125, 0.4017295837402344, 0.41695404052734375, 0.4321784973144531, 0.4474029541015625, 0.4626274108886719, 0.47785186767578125, 0.4930763244628906, 0.50830078125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 7.0, 14.0, 18.0, 12.0, 12.0, 24.0, 16.0, 25.0, 30.0, 36.0, 42.0, 45.0, 57.0, 67.0, 73.0, 69.0, 43.0, 50.0, 44.0, 56.0, 48.0, 29.0, 31.0, 23.0, 34.0, 11.0, 16.0, 17.0, 11.0, 10.0, 7.0, 6.0, 5.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4993062019348145, -4.356599807739258, -4.213893413543701, -4.0711870193481445, -3.928480625152588, -3.7857742309570312, -3.6430678367614746, -3.500361442565918, -3.3576550483703613, -3.2149486541748047, -3.072242259979248, -2.9295358657836914, -2.7868294715881348, -2.644123077392578, -2.5014166831970215, -2.358710289001465, -2.216003894805908, -2.0732975006103516, -1.930591106414795, -1.7878847122192383, -1.6451783180236816, -1.502471923828125, -1.3597655296325684, -1.2170591354370117, -1.074352741241455, -0.9316463470458984, -0.7889399528503418, -0.6462335586547852, -0.5035271644592285, -0.3608207702636719, -0.21811437606811523, -0.0754079818725586, 0.06729841232299805, 0.2100048065185547, 0.35271120071411133, 0.49541759490966797, 0.6381239891052246, 0.7808303833007812, 0.9235367774963379, 1.0662431716918945, 1.2089495658874512, 1.3516559600830078, 1.4943623542785645, 1.637068748474121, 1.7797751426696777, 1.9224815368652344, 2.065187931060791, 2.2078943252563477, 2.3506007194519043, 2.493307113647461, 2.6360135078430176, 2.778719902038574, 2.921426296234131, 3.0641326904296875, 3.206839084625244, 3.349545478820801, 3.4922518730163574, 3.634958267211914, 3.7776646614074707, 3.9203710556030273, 4.063077449798584, 4.205783843994141, 4.348490238189697, 4.491196632385254, 4.6339030265808105]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 8.0, 7.0, 5.0, 2.0, 10.0, 10.0, 17.0, 10.0, 19.0, 33.0, 13.0, 25.0, 19.0, 27.0, 40.0, 32.0, 36.0, 44.0, 38.0, 32.0, 44.0, 45.0, 44.0, 53.0, 41.0, 33.0, 24.0, 46.0, 37.0, 27.0, 21.0, 28.0, 19.0, 19.0, 23.0, 11.0, 19.0, 13.0, 8.0, 12.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.827996015548706, -3.717251777648926, -3.6065077781677246, -3.4957635402679443, -3.385019540786743, -3.274275302886963, -3.1635313034057617, -3.0527870655059814, -2.942042827606201, -2.831298589706421, -2.7205545902252197, -2.6098103523254395, -2.4990663528442383, -2.388322114944458, -2.2775778770446777, -2.1668338775634766, -2.0560898780822754, -1.9453457593917847, -1.834601640701294, -1.7238574028015137, -1.613113284111023, -1.5023691654205322, -1.3916250467300415, -1.2808809280395508, -1.1701366901397705, -1.0593925714492798, -0.9486483931541443, -0.8379042744636536, -0.7271600961685181, -0.6164159774780273, -0.5056718587875366, -0.3949276804924011, -0.2841835021972656, -0.17343935370445251, -0.0626952201128006, 0.04804891347885132, 0.15879306197166443, 0.26953721046447754, 0.38028132915496826, 0.49102550745010376, 0.6017696261405945, 0.7125137448310852, 0.8232579231262207, 0.9340020418167114, 1.0447461605072021, 1.1554903984069824, 1.2662343978881836, 1.3769786357879639, 1.4877227544784546, 1.5984668731689453, 1.709210991859436, 1.8199551105499268, 1.930699348449707, 2.041443347930908, 2.1521875858306885, 2.2629318237304688, 2.37367582321167, 2.48442006111145, 2.5951640605926514, 2.7059082984924316, 2.816652297973633, 2.927396535873413, 3.0381407737731934, 3.1488847732543945, 3.259629011154175]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 12.0, 15.0, 26.0, 53.0, 92.0, 158.0, 243.0, 413.0, 673.0, 1152.0, 1989.0, 3317.0, 5802.0, 9945.0, 17187.0, 29287.0, 50557.0, 86332.0, 143427.0, 232184.0, 357557.0, 502656.0, 613049.0, 622135.0, 519920.0, 377118.0, 246085.0, 153087.0, 91213.0, 53669.0, 31272.0, 18205.0, 10590.0, 6291.0, 3505.0, 2091.0, 1203.0, 713.0, 414.0, 273.0, 155.0, 85.0, 59.0, 33.0, 21.0, 11.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.16796875, -3.062591552734375, -2.95721435546875, -2.851837158203125, -2.7464599609375, -2.641082763671875, -2.53570556640625, -2.430328369140625, -2.324951171875, -2.219573974609375, -2.11419677734375, -2.008819580078125, -1.9034423828125, -1.798065185546875, -1.69268798828125, -1.587310791015625, -1.48193359375, -1.376556396484375, -1.27117919921875, -1.165802001953125, -1.0604248046875, -0.955047607421875, -0.84967041015625, -0.744293212890625, -0.638916015625, -0.533538818359375, -0.42816162109375, -0.322784423828125, -0.2174072265625, -0.112030029296875, -0.00665283203125, 0.098724365234375, 0.2041015625, 0.309478759765625, 0.41485595703125, 0.520233154296875, 0.6256103515625, 0.730987548828125, 0.83636474609375, 0.941741943359375, 1.047119140625, 1.152496337890625, 1.25787353515625, 1.363250732421875, 1.4686279296875, 1.574005126953125, 1.67938232421875, 1.784759521484375, 1.89013671875, 1.995513916015625, 2.10089111328125, 2.206268310546875, 2.3116455078125, 2.417022705078125, 2.52239990234375, 2.627777099609375, 2.733154296875, 2.838531494140625, 2.94390869140625, 3.049285888671875, 3.1546630859375, 3.260040283203125, 3.36541748046875, 3.470794677734375, 3.576171875]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 3.0, 13.0, 21.0, 14.0, 14.0, 14.0, 16.0, 20.0, 22.0, 30.0, 40.0, 30.0, 24.0, 28.0, 33.0, 43.0, 49.0, 34.0, 47.0, 47.0, 45.0, 35.0, 36.0, 35.0, 30.0, 27.0, 27.0, 30.0, 24.0, 21.0, 25.0, 18.0, 14.0, 16.0, 12.0, 17.0, 10.0, 7.0, 7.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.59765625, -2.5228271484375, -2.447998046875, -2.3731689453125, -2.29833984375, -2.2235107421875, -2.148681640625, -2.0738525390625, -1.9990234375, -1.9241943359375, -1.849365234375, -1.7745361328125, -1.69970703125, -1.6248779296875, -1.550048828125, -1.4752197265625, -1.400390625, -1.3255615234375, -1.250732421875, -1.1759033203125, -1.10107421875, -1.0262451171875, -0.951416015625, -0.8765869140625, -0.8017578125, -0.7269287109375, -0.652099609375, -0.5772705078125, -0.50244140625, -0.4276123046875, -0.352783203125, -0.2779541015625, -0.203125, -0.1282958984375, -0.053466796875, 0.0213623046875, 0.09619140625, 0.1710205078125, 0.245849609375, 0.3206787109375, 0.3955078125, 0.4703369140625, 0.545166015625, 0.6199951171875, 0.69482421875, 0.7696533203125, 0.844482421875, 0.9193115234375, 0.994140625, 1.0689697265625, 1.143798828125, 1.2186279296875, 1.29345703125, 1.3682861328125, 1.443115234375, 1.5179443359375, 1.5927734375, 1.6676025390625, 1.742431640625, 1.8172607421875, 1.89208984375, 1.9669189453125, 2.041748046875, 2.1165771484375, 2.19140625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 13.0, 15.0, 27.0, 43.0, 65.0, 136.0, 227.0, 375.0, 669.0, 1131.0, 1916.0, 3373.0, 5776.0, 9928.0, 17186.0, 29097.0, 49376.0, 82893.0, 134111.0, 210538.0, 314124.0, 427678.0, 527078.0, 565871.0, 525521.0, 428977.0, 311747.0, 209951.0, 133905.0, 82772.0, 49824.0, 29164.0, 17147.0, 9958.0, 5679.0, 3312.0, 1938.0, 1136.0, 656.0, 355.0, 236.0, 141.0, 87.0, 49.0, 28.0, 20.0, 16.0, 7.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.185546875, -3.08441162109375, -2.9832763671875, -2.88214111328125, -2.781005859375, -2.67987060546875, -2.5787353515625, -2.47760009765625, -2.37646484375, -2.27532958984375, -2.1741943359375, -2.07305908203125, -1.971923828125, -1.87078857421875, -1.7696533203125, -1.66851806640625, -1.5673828125, -1.46624755859375, -1.3651123046875, -1.26397705078125, -1.162841796875, -1.06170654296875, -0.9605712890625, -0.85943603515625, -0.75830078125, -0.65716552734375, -0.5560302734375, -0.45489501953125, -0.353759765625, -0.25262451171875, -0.1514892578125, -0.05035400390625, 0.05078125, 0.15191650390625, 0.2530517578125, 0.35418701171875, 0.455322265625, 0.55645751953125, 0.6575927734375, 0.75872802734375, 0.85986328125, 0.96099853515625, 1.0621337890625, 1.16326904296875, 1.264404296875, 1.36553955078125, 1.4666748046875, 1.56781005859375, 1.6689453125, 1.77008056640625, 1.8712158203125, 1.97235107421875, 2.073486328125, 2.17462158203125, 2.2757568359375, 2.37689208984375, 2.47802734375, 2.57916259765625, 2.6802978515625, 2.78143310546875, 2.882568359375, 2.98370361328125, 3.0848388671875, 3.18597412109375, 3.287109375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 3.0, 1.0, 4.0, 3.0, 3.0, 7.0, 11.0, 14.0, 8.0, 15.0, 15.0, 31.0, 37.0, 36.0, 59.0, 75.0, 65.0, 82.0, 90.0, 102.0, 117.0, 120.0, 177.0, 179.0, 191.0, 217.0, 196.0, 168.0, 187.0, 200.0, 175.0, 187.0, 167.0, 150.0, 149.0, 142.0, 99.0, 102.0, 102.0, 79.0, 44.0, 56.0, 54.0, 39.0, 30.0, 21.0, 17.0, 12.0, 11.0, 7.0, 4.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-1.1337890625, -1.0983123779296875, -1.062835693359375, -1.0273590087890625, -0.99188232421875, -0.9564056396484375, -0.920928955078125, -0.8854522705078125, -0.8499755859375, -0.8144989013671875, -0.779022216796875, -0.7435455322265625, -0.70806884765625, -0.6725921630859375, -0.637115478515625, -0.6016387939453125, -0.566162109375, -0.5306854248046875, -0.495208740234375, -0.4597320556640625, -0.42425537109375, -0.3887786865234375, -0.353302001953125, -0.3178253173828125, -0.2823486328125, -0.2468719482421875, -0.211395263671875, -0.1759185791015625, -0.14044189453125, -0.1049652099609375, -0.069488525390625, -0.0340118408203125, 0.00146484375, 0.0369415283203125, 0.072418212890625, 0.1078948974609375, 0.14337158203125, 0.1788482666015625, 0.214324951171875, 0.2498016357421875, 0.2852783203125, 0.3207550048828125, 0.356231689453125, 0.3917083740234375, 0.42718505859375, 0.4626617431640625, 0.498138427734375, 0.5336151123046875, 0.569091796875, 0.6045684814453125, 0.640045166015625, 0.6755218505859375, 0.71099853515625, 0.7464752197265625, 0.781951904296875, 0.8174285888671875, 0.8529052734375, 0.8883819580078125, 0.923858642578125, 0.9593353271484375, 0.99481201171875, 1.0302886962890625, 1.065765380859375, 1.1012420654296875, 1.13671875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 4.0, 6.0, 8.0, 13.0, 9.0, 12.0, 18.0, 19.0, 18.0, 27.0, 30.0, 35.0, 33.0, 39.0, 45.0, 51.0, 60.0, 69.0, 47.0, 42.0, 39.0, 55.0, 42.0, 32.0, 29.0, 42.0, 30.0, 25.0, 14.0, 19.0, 15.0, 15.0, 3.0, 14.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.7994987964630127, -3.6804840564727783, -3.561469316482544, -3.4424548149108887, -3.3234400749206543, -3.20442533493042, -3.0854105949401855, -2.966395854949951, -2.847381114959717, -2.7283663749694824, -2.609351634979248, -2.4903368949890137, -2.3713223934173584, -2.252307653427124, -2.1332929134368896, -2.0142781734466553, -1.895263671875, -1.7762489318847656, -1.6572343111038208, -1.5382195711135864, -1.4192049503326416, -1.3001902103424072, -1.1811754703521729, -1.0621607303619385, -0.9431461095809937, -0.824131429195404, -0.7051167488098145, -0.5861020088195801, -0.4670873284339905, -0.3480726480484009, -0.2290579080581665, -0.1100432276725769, 0.008971214294433594, 0.1279859095811844, 0.24700060486793518, 0.36601531505584717, 0.48502999544143677, 0.6040446758270264, 0.7230594158172607, 0.8420740962028503, 0.9610887765884399, 1.0801035165786743, 1.1991181373596191, 1.3181328773498535, 1.437147617340088, 1.5561622381210327, 1.675176978111267, 1.794191598892212, 1.9132063388824463, 2.0322210788726807, 2.151235818862915, 2.2702503204345703, 2.3892650604248047, 2.508279800415039, 2.6272945404052734, 2.746309280395508, 2.865324020385742, 2.9843387603759766, 3.103353500366211, 3.2223682403564453, 3.3413827419281006, 3.460397481918335, 3.5794122219085693, 3.6984269618988037, 3.817441463470459]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 5.0, 5.0, 11.0, 14.0, 13.0, 9.0, 19.0, 20.0, 30.0, 26.0, 38.0, 26.0, 38.0, 41.0, 43.0, 40.0, 41.0, 37.0, 57.0, 39.0, 41.0, 40.0, 35.0, 35.0, 35.0, 27.0, 29.0, 35.0, 25.0, 33.0, 22.0, 12.0, 14.0, 9.0, 12.0, 8.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.504161834716797, -3.406283378601074, -3.3084046840667725, -3.21052622795105, -3.112647533416748, -3.0147690773010254, -2.9168906211853027, -2.819011926651001, -2.7211334705352783, -2.6232550144195557, -2.525376319885254, -2.4274978637695312, -2.3296191692352295, -2.231740713119507, -2.133862018585205, -2.0359835624694824, -1.9381049871444702, -1.840226411819458, -1.7423478364944458, -1.6444692611694336, -1.546590805053711, -1.4487122297286987, -1.3508336544036865, -1.2529551982879639, -1.155076503753662, -1.05719792842865, -0.9593194127082825, -0.8614408373832703, -0.7635623216629028, -0.6656837463378906, -0.5678051710128784, -0.469926655292511, -0.37204813957214355, -0.27416959404945374, -0.17629103362560272, -0.07841247320175171, 0.01946607232093811, 0.11734461784362793, 0.21522319316864014, 0.31310170888900757, 0.4109802842140198, 0.508858859539032, 0.6067373752593994, 0.7046159505844116, 0.8024945259094238, 0.9003730416297913, 0.9982516169548035, 1.096130132675171, 1.194008708000183, 1.2918872833251953, 1.3897658586502075, 1.4876444339752197, 1.5855228900909424, 1.6834014654159546, 1.7812800407409668, 1.8791584968566895, 1.9770371913909912, 2.074915647506714, 2.1727943420410156, 2.2706727981567383, 2.36855149269104, 2.4664299488067627, 2.5643086433410645, 2.662187099456787, 2.7600655555725098]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 12.0, 17.0, 20.0, 36.0, 65.0, 70.0, 112.0, 140.0, 227.0, 306.0, 467.0, 710.0, 1016.0, 1452.0, 2305.0, 3435.0, 5145.0, 7886.0, 12307.0, 19191.0, 30452.0, 49281.0, 78884.0, 122265.0, 167823.0, 174302.0, 133224.0, 87647.0, 55304.0, 33870.0, 21492.0, 13360.0, 8739.0, 5663.0, 3650.0, 2474.0, 1660.0, 1138.0, 758.0, 526.0, 355.0, 237.0, 163.0, 131.0, 82.0, 44.0, 41.0, 23.0, 22.0, 13.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.833984375, -0.8087997436523438, -0.7836151123046875, -0.7584304809570312, -0.733245849609375, -0.7080612182617188, -0.6828765869140625, -0.6576919555664062, -0.63250732421875, -0.6073226928710938, -0.5821380615234375, -0.5569534301757812, -0.531768798828125, -0.5065841674804688, -0.4813995361328125, -0.45621490478515625, -0.4310302734375, -0.40584564208984375, -0.3806610107421875, -0.35547637939453125, -0.330291748046875, -0.30510711669921875, -0.2799224853515625, -0.25473785400390625, -0.22955322265625, -0.20436859130859375, -0.1791839599609375, -0.15399932861328125, -0.128814697265625, -0.10363006591796875, -0.0784454345703125, -0.05326080322265625, -0.028076171875, -0.00289154052734375, 0.0222930908203125, 0.04747772216796875, 0.072662353515625, 0.09784698486328125, 0.1230316162109375, 0.14821624755859375, 0.17340087890625, 0.19858551025390625, 0.2237701416015625, 0.24895477294921875, 0.274139404296875, 0.29932403564453125, 0.3245086669921875, 0.34969329833984375, 0.3748779296875, 0.40006256103515625, 0.4252471923828125, 0.45043182373046875, 0.475616455078125, 0.5008010864257812, 0.5259857177734375, 0.5511703491210938, 0.57635498046875, 0.6015396118164062, 0.6267242431640625, 0.6519088745117188, 0.677093505859375, 0.7022781372070312, 0.7274627685546875, 0.7526473999023438, 0.77783203125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 9.0, 4.0, 5.0, 13.0, 13.0, 16.0, 22.0, 19.0, 16.0, 29.0, 29.0, 27.0, 29.0, 50.0, 38.0, 43.0, 30.0, 49.0, 45.0, 42.0, 37.0, 39.0, 35.0, 31.0, 34.0, 36.0, 25.0, 24.0, 30.0, 18.0, 16.0, 26.0, 18.0, 15.0, 13.0, 12.0, 11.0, 13.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.078125, -2.9798583984375, -2.881591796875, -2.7833251953125, -2.68505859375, -2.5867919921875, -2.488525390625, -2.3902587890625, -2.2919921875, -2.1937255859375, -2.095458984375, -1.9971923828125, -1.89892578125, -1.8006591796875, -1.702392578125, -1.6041259765625, -1.505859375, -1.4075927734375, -1.309326171875, -1.2110595703125, -1.11279296875, -1.0145263671875, -0.916259765625, -0.8179931640625, -0.7197265625, -0.6214599609375, -0.523193359375, -0.4249267578125, -0.32666015625, -0.2283935546875, -0.130126953125, -0.0318603515625, 0.06640625, 0.1646728515625, 0.262939453125, 0.3612060546875, 0.45947265625, 0.5577392578125, 0.656005859375, 0.7542724609375, 0.8525390625, 0.9508056640625, 1.049072265625, 1.1473388671875, 1.24560546875, 1.3438720703125, 1.442138671875, 1.5404052734375, 1.638671875, 1.7369384765625, 1.835205078125, 1.9334716796875, 2.03173828125, 2.1300048828125, 2.228271484375, 2.3265380859375, 2.4248046875, 2.5230712890625, 2.621337890625, 2.7196044921875, 2.81787109375, 2.9161376953125, 3.014404296875, 3.1126708984375, 3.2109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 8.0, 8.0, 18.0, 22.0, 39.0, 63.0, 65.0, 108.0, 126.0, 224.0, 337.0, 472.0, 681.0, 1107.0, 1598.0, 2583.0, 4234.0, 6781.0, 11181.0, 18887.0, 31781.0, 54900.0, 95891.0, 162816.0, 217005.0, 178098.0, 107957.0, 62023.0, 35391.0, 20739.0, 12661.0, 7684.0, 4764.0, 2931.0, 1834.0, 1219.0, 762.0, 484.0, 308.0, 243.0, 162.0, 106.0, 61.0, 59.0, 39.0, 34.0, 19.0, 8.0, 14.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.94140625, -0.91064453125, -0.8798828125, -0.84912109375, -0.818359375, -0.78759765625, -0.7568359375, -0.72607421875, -0.6953125, -0.66455078125, -0.6337890625, -0.60302734375, -0.572265625, -0.54150390625, -0.5107421875, -0.47998046875, -0.44921875, -0.41845703125, -0.3876953125, -0.35693359375, -0.326171875, -0.29541015625, -0.2646484375, -0.23388671875, -0.203125, -0.17236328125, -0.1416015625, -0.11083984375, -0.080078125, -0.04931640625, -0.0185546875, 0.01220703125, 0.04296875, 0.07373046875, 0.1044921875, 0.13525390625, 0.166015625, 0.19677734375, 0.2275390625, 0.25830078125, 0.2890625, 0.31982421875, 0.3505859375, 0.38134765625, 0.412109375, 0.44287109375, 0.4736328125, 0.50439453125, 0.53515625, 0.56591796875, 0.5966796875, 0.62744140625, 0.658203125, 0.68896484375, 0.7197265625, 0.75048828125, 0.78125, 0.81201171875, 0.8427734375, 0.87353515625, 0.904296875, 0.93505859375, 0.9658203125, 0.99658203125, 1.02734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 11.0, 11.0, 10.0, 17.0, 15.0, 18.0, 15.0, 27.0, 24.0, 26.0, 30.0, 29.0, 26.0, 32.0, 38.0, 32.0, 37.0, 42.0, 36.0, 34.0, 39.0, 44.0, 32.0, 38.0, 30.0, 28.0, 25.0, 30.0, 32.0, 22.0, 23.0, 18.0, 14.0, 16.0, 19.0, 10.0, 10.0, 9.0, 11.0, 6.0, 6.0, 5.0, 3.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.921875, -1.8626556396484375, -1.803436279296875, -1.7442169189453125, -1.68499755859375, -1.6257781982421875, -1.566558837890625, -1.5073394775390625, -1.4481201171875, -1.3889007568359375, -1.329681396484375, -1.2704620361328125, -1.21124267578125, -1.1520233154296875, -1.092803955078125, -1.0335845947265625, -0.974365234375, -0.9151458740234375, -0.855926513671875, -0.7967071533203125, -0.73748779296875, -0.6782684326171875, -0.619049072265625, -0.5598297119140625, -0.5006103515625, -0.4413909912109375, -0.382171630859375, -0.3229522705078125, -0.26373291015625, -0.2045135498046875, -0.145294189453125, -0.0860748291015625, -0.02685546875, 0.0323638916015625, 0.091583251953125, 0.1508026123046875, 0.21002197265625, 0.2692413330078125, 0.328460693359375, 0.3876800537109375, 0.4468994140625, 0.5061187744140625, 0.565338134765625, 0.6245574951171875, 0.68377685546875, 0.7429962158203125, 0.802215576171875, 0.8614349365234375, 0.920654296875, 0.9798736572265625, 1.039093017578125, 1.0983123779296875, 1.15753173828125, 1.2167510986328125, 1.275970458984375, 1.3351898193359375, 1.3944091796875, 1.4536285400390625, 1.512847900390625, 1.5720672607421875, 1.63128662109375, 1.6905059814453125, 1.749725341796875, 1.8089447021484375, 1.8681640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 8.0, 13.0, 14.0, 16.0, 24.0, 22.0, 35.0, 72.0, 96.0, 123.0, 176.0, 271.0, 416.0, 703.0, 1188.0, 2144.0, 4150.0, 9138.0, 23399.0, 78105.0, 333980.0, 435057.0, 106859.0, 30248.0, 11240.0, 4948.0, 2509.0, 1332.0, 767.0, 483.0, 342.0, 193.0, 145.0, 103.0, 62.0, 38.0, 33.0, 39.0, 17.0, 17.0, 10.0, 2.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.489990234375, -0.4751930236816406, -0.46039581298828125, -0.4455986022949219, -0.4308013916015625, -0.4160041809082031, -0.40120697021484375, -0.3864097595214844, -0.371612548828125, -0.3568153381347656, -0.34201812744140625, -0.3272209167480469, -0.3124237060546875, -0.2976264953613281, -0.28282928466796875, -0.2680320739746094, -0.25323486328125, -0.23843765258789062, -0.22364044189453125, -0.20884323120117188, -0.1940460205078125, -0.17924880981445312, -0.16445159912109375, -0.14965438842773438, -0.134857177734375, -0.12005996704101562, -0.10526275634765625, -0.09046554565429688, -0.0756683349609375, -0.060871124267578125, -0.04607391357421875, -0.031276702880859375, -0.0164794921875, -0.001682281494140625, 0.01311492919921875, 0.027912139892578125, 0.0427093505859375, 0.057506561279296875, 0.07230377197265625, 0.08710098266601562, 0.101898193359375, 0.11669540405273438, 0.13149261474609375, 0.14628982543945312, 0.1610870361328125, 0.17588424682617188, 0.19068145751953125, 0.20547866821289062, 0.22027587890625, 0.23507308959960938, 0.24987030029296875, 0.2646675109863281, 0.2794647216796875, 0.2942619323730469, 0.30905914306640625, 0.3238563537597656, 0.338653564453125, 0.3534507751464844, 0.36824798583984375, 0.3830451965332031, 0.3978424072265625, 0.4126396179199219, 0.42743682861328125, 0.4422340393066406, 0.45703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 4.0, 10.0, 11.0, 13.0, 17.0, 23.0, 25.0, 24.0, 32.0, 40.0, 43.0, 54.0, 43.0, 63.0, 67.0, 71.0, 56.0, 54.0, 40.0, 40.0, 47.0, 31.0, 33.0, 27.0, 27.0, 13.0, 19.0, 14.0, 8.0, 7.0, 5.0, 6.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8358230590820312e-05, -1.779012382030487e-05, -1.722201704978943e-05, -1.6653910279273987e-05, -1.6085803508758545e-05, -1.5517696738243103e-05, -1.4949589967727661e-05, -1.438148319721222e-05, -1.3813376426696777e-05, -1.3245269656181335e-05, -1.2677162885665894e-05, -1.2109056115150452e-05, -1.154094934463501e-05, -1.0972842574119568e-05, -1.0404735803604126e-05, -9.836629033088684e-06, -9.268522262573242e-06, -8.7004154920578e-06, -8.132308721542358e-06, -7.5642019510269165e-06, -6.996095180511475e-06, -6.427988409996033e-06, -5.859881639480591e-06, -5.291774868965149e-06, -4.723668098449707e-06, -4.155561327934265e-06, -3.5874545574188232e-06, -3.0193477869033813e-06, -2.4512410163879395e-06, -1.8831342458724976e-06, -1.3150274753570557e-06, -7.469207048416138e-07, -1.7881393432617188e-07, 3.8929283618927e-07, 9.57399606704712e-07, 1.5255063772201538e-06, 2.0936131477355957e-06, 2.6617199182510376e-06, 3.2298266887664795e-06, 3.7979334592819214e-06, 4.366040229797363e-06, 4.934147000312805e-06, 5.502253770828247e-06, 6.070360541343689e-06, 6.638467311859131e-06, 7.206574082374573e-06, 7.774680852890015e-06, 8.342787623405457e-06, 8.910894393920898e-06, 9.47900116443634e-06, 1.0047107934951782e-05, 1.0615214705467224e-05, 1.1183321475982666e-05, 1.1751428246498108e-05, 1.231953501701355e-05, 1.2887641787528992e-05, 1.3455748558044434e-05, 1.4023855328559875e-05, 1.4591962099075317e-05, 1.516006886959076e-05, 1.57281756401062e-05, 1.6296282410621643e-05, 1.6864389181137085e-05, 1.7432495951652527e-05, 1.800060272216797e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 7.0, 6.0, 8.0, 10.0, 13.0, 28.0, 38.0, 45.0, 95.0, 154.0, 201.0, 320.0, 493.0, 775.0, 1266.0, 2094.0, 3394.0, 5736.0, 10048.0, 18469.0, 34735.0, 67676.0, 139083.0, 267846.0, 244903.0, 121591.0, 59489.0, 30729.0, 16545.0, 9175.0, 5413.0, 3125.0, 1911.0, 1155.0, 708.0, 459.0, 269.0, 182.0, 109.0, 79.0, 62.0, 41.0, 20.0, 18.0, 17.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.343017578125, -0.33226776123046875, -0.3215179443359375, -0.31076812744140625, -0.300018310546875, -0.28926849365234375, -0.2785186767578125, -0.26776885986328125, -0.25701904296875, -0.24626922607421875, -0.2355194091796875, -0.22476959228515625, -0.214019775390625, -0.20326995849609375, -0.1925201416015625, -0.18177032470703125, -0.1710205078125, -0.16027069091796875, -0.1495208740234375, -0.13877105712890625, -0.128021240234375, -0.11727142333984375, -0.1065216064453125, -0.09577178955078125, -0.08502197265625, -0.07427215576171875, -0.0635223388671875, -0.05277252197265625, -0.042022705078125, -0.03127288818359375, -0.0205230712890625, -0.00977325439453125, 0.0009765625, 0.01172637939453125, 0.0224761962890625, 0.03322601318359375, 0.043975830078125, 0.05472564697265625, 0.0654754638671875, 0.07622528076171875, 0.08697509765625, 0.09772491455078125, 0.1084747314453125, 0.11922454833984375, 0.129974365234375, 0.14072418212890625, 0.1514739990234375, 0.16222381591796875, 0.1729736328125, 0.18372344970703125, 0.1944732666015625, 0.20522308349609375, 0.215972900390625, 0.22672271728515625, 0.2374725341796875, 0.24822235107421875, 0.25897216796875, 0.26972198486328125, 0.2804718017578125, 0.29122161865234375, 0.301971435546875, 0.31272125244140625, 0.3234710693359375, 0.33422088623046875, 0.344970703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 7.0, 6.0, 11.0, 8.0, 17.0, 19.0, 15.0, 16.0, 29.0, 29.0, 55.0, 61.0, 68.0, 92.0, 81.0, 93.0, 86.0, 61.0, 47.0, 46.0, 32.0, 19.0, 21.0, 20.0, 14.0, 8.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0863037109375, -0.0835580825805664, -0.08081245422363281, -0.07806682586669922, -0.07532119750976562, -0.07257556915283203, -0.06982994079589844, -0.06708431243896484, -0.06433868408203125, -0.061593055725097656, -0.05884742736816406, -0.05610179901123047, -0.053356170654296875, -0.05061054229736328, -0.04786491394042969, -0.045119285583496094, -0.0423736572265625, -0.039628028869628906, -0.03688240051269531, -0.03413677215576172, -0.031391143798828125, -0.02864551544189453, -0.025899887084960938, -0.023154258728027344, -0.02040863037109375, -0.017663002014160156, -0.014917373657226562, -0.012171745300292969, -0.009426116943359375, -0.006680488586425781, -0.0039348602294921875, -0.0011892318725585938, 0.001556396484375, 0.004302024841308594, 0.0070476531982421875, 0.009793281555175781, 0.012538909912109375, 0.015284538269042969, 0.018030166625976562, 0.020775794982910156, 0.02352142333984375, 0.026267051696777344, 0.029012680053710938, 0.03175830841064453, 0.034503936767578125, 0.03724956512451172, 0.03999519348144531, 0.042740821838378906, 0.0454864501953125, 0.048232078552246094, 0.05097770690917969, 0.05372333526611328, 0.056468963623046875, 0.05921459197998047, 0.06196022033691406, 0.06470584869384766, 0.06745147705078125, 0.07019710540771484, 0.07294273376464844, 0.07568836212158203, 0.07843399047851562, 0.08117961883544922, 0.08392524719238281, 0.0866708755493164, 0.08941650390625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 3.0, 1.0, 6.0, 3.0, 12.0, 9.0, 11.0, 16.0, 16.0, 19.0, 22.0, 22.0, 35.0, 25.0, 42.0, 39.0, 47.0, 51.0, 62.0, 55.0, 54.0, 47.0, 47.0, 49.0, 40.0, 31.0, 39.0, 39.0, 24.0, 21.0, 17.0, 20.0, 13.0, 16.0, 7.0, 10.0, 2.0, 4.0, 2.0, 5.0, 0.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8380448818206787, -3.71785831451416, -3.5976717472076416, -3.477485179901123, -3.3572986125946045, -3.237112045288086, -3.1169254779815674, -2.996738910675049, -2.8765523433685303, -2.7563657760620117, -2.636179208755493, -2.5159926414489746, -2.395806074142456, -2.2756195068359375, -2.155432939529419, -2.0352463722229004, -1.9150596857070923, -1.7948731184005737, -1.6746865510940552, -1.5544999837875366, -1.434313416481018, -1.31412672996521, -1.1939401626586914, -1.0737535953521729, -0.9535670876502991, -0.8333805203437805, -0.713193953037262, -0.5930073261260986, -0.47282078862190247, -0.3526341915130615, -0.23244762420654297, -0.11226105690002441, 0.00792551040649414, 0.1281120777130127, 0.24829865992069244, 0.3684852421283722, 0.48867180943489075, 0.6088584065437317, 0.7290449738502502, 0.8492315411567688, 0.9694181084632874, 1.0896047353744507, 1.2097913026809692, 1.3299778699874878, 1.4501644372940063, 1.570351004600525, 1.6905375719070435, 1.810724139213562, 1.9309107065200806, 2.0510973930358887, 2.1712839603424072, 2.291470527648926, 2.4116570949554443, 2.531843662261963, 2.6520302295684814, 2.772216796875, 2.8924033641815186, 3.012589931488037, 3.1327764987945557, 3.252963066101074, 3.3731496334075928, 3.4933362007141113, 3.61352276802063, 3.7337093353271484, 3.853895902633667]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 3.0, 8.0, 8.0, 12.0, 16.0, 10.0, 18.0, 22.0, 24.0, 30.0, 35.0, 29.0, 37.0, 39.0, 47.0, 37.0, 43.0, 38.0, 54.0, 40.0, 43.0, 41.0, 35.0, 33.0, 34.0, 29.0, 32.0, 31.0, 27.0, 34.0, 22.0, 10.0, 14.0, 11.0, 10.0, 10.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.5153958797454834, -3.417088270187378, -3.3187808990478516, -3.220473289489746, -3.1221656799316406, -3.023858070373535, -2.925550699234009, -2.8272430896759033, -2.728935718536377, -2.6306281089782715, -2.532320737838745, -2.4340131282806396, -2.335705518722534, -2.237398147583008, -2.1390905380249023, -2.040782928466797, -1.9424753189086914, -1.8441678285598755, -1.74586021900177, -1.647552728652954, -1.5492451190948486, -1.4509376287460327, -1.3526301383972168, -1.2543225288391113, -1.1560150384902954, -1.0577075481414795, -0.959399938583374, -0.8610924482345581, -0.7627848982810974, -0.6644773483276367, -0.5661698579788208, -0.4678623080253601, -0.3695547580718994, -0.2712472081184387, -0.17293968796730042, -0.07463216781616211, 0.023675382137298584, 0.12198293209075928, 0.2202904224395752, 0.3185979723930359, 0.4169055223464966, 0.5152130722999573, 0.613520622253418, 0.7118281126022339, 0.8101356625556946, 0.9084432125091553, 1.0067507028579712, 1.105058193206787, 1.2033658027648926, 1.3016732931137085, 1.399980902671814, 1.4982883930206299, 1.5965960025787354, 1.6949034929275513, 1.7932109832763672, 1.8915185928344727, 1.9898260831832886, 2.0881335735321045, 2.18644118309021, 2.2847485542297363, 2.383056163787842, 2.4813637733459473, 2.5796713829040527, 2.677978754043579, 2.7762863636016846]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 7.0, 4.0, 14.0, 11.0, 16.0, 30.0, 50.0, 65.0, 128.0, 172.0, 267.0, 397.0, 637.0, 1007.0, 1484.0, 2265.0, 3367.0, 5013.0, 7625.0, 10917.0, 15818.0, 22408.0, 31812.0, 43533.0, 56749.0, 70934.0, 85411.0, 95891.0, 101017.0, 98389.0, 90025.0, 76584.0, 61663.0, 47155.0, 35580.0, 25718.0, 18176.0, 12528.0, 8577.0, 5740.0, 3893.0, 2565.0, 1676.0, 1166.0, 733.0, 455.0, 336.0, 194.0, 110.0, 84.0, 64.0, 39.0, 23.0, 12.0, 17.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0], "bins": [-2.17578125, -2.107086181640625, -2.03839111328125, -1.969696044921875, -1.9010009765625, -1.832305908203125, -1.76361083984375, -1.694915771484375, -1.626220703125, -1.557525634765625, -1.48883056640625, -1.420135498046875, -1.3514404296875, -1.282745361328125, -1.21405029296875, -1.145355224609375, -1.07666015625, -1.007965087890625, -0.93927001953125, -0.870574951171875, -0.8018798828125, -0.733184814453125, -0.66448974609375, -0.595794677734375, -0.527099609375, -0.458404541015625, -0.38970947265625, -0.321014404296875, -0.2523193359375, -0.183624267578125, -0.11492919921875, -0.046234130859375, 0.0224609375, 0.091156005859375, 0.15985107421875, 0.228546142578125, 0.2972412109375, 0.365936279296875, 0.43463134765625, 0.503326416015625, 0.572021484375, 0.640716552734375, 0.70941162109375, 0.778106689453125, 0.8468017578125, 0.915496826171875, 0.98419189453125, 1.052886962890625, 1.12158203125, 1.190277099609375, 1.25897216796875, 1.327667236328125, 1.3963623046875, 1.465057373046875, 1.53375244140625, 1.602447509765625, 1.671142578125, 1.739837646484375, 1.80853271484375, 1.877227783203125, 1.9459228515625, 2.014617919921875, 2.08331298828125, 2.152008056640625, 2.220703125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 4.0, 10.0, 7.0, 11.0, 6.0, 13.0, 19.0, 18.0, 21.0, 38.0, 32.0, 36.0, 39.0, 43.0, 44.0, 46.0, 40.0, 40.0, 62.0, 37.0, 44.0, 35.0, 40.0, 43.0, 40.0, 38.0, 23.0, 27.0, 28.0, 20.0, 25.0, 10.0, 17.0, 10.0, 9.0, 6.0, 7.0, 6.0, 0.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-4.10546875, -3.99346923828125, -3.8814697265625, -3.76947021484375, -3.657470703125, -3.54547119140625, -3.4334716796875, -3.32147216796875, -3.20947265625, -3.09747314453125, -2.9854736328125, -2.87347412109375, -2.761474609375, -2.64947509765625, -2.5374755859375, -2.42547607421875, -2.3134765625, -2.20147705078125, -2.0894775390625, -1.97747802734375, -1.865478515625, -1.75347900390625, -1.6414794921875, -1.52947998046875, -1.41748046875, -1.30548095703125, -1.1934814453125, -1.08148193359375, -0.969482421875, -0.85748291015625, -0.7454833984375, -0.63348388671875, -0.521484375, -0.40948486328125, -0.2974853515625, -0.18548583984375, -0.073486328125, 0.03851318359375, 0.1505126953125, 0.26251220703125, 0.37451171875, 0.48651123046875, 0.5985107421875, 0.71051025390625, 0.822509765625, 0.93450927734375, 1.0465087890625, 1.15850830078125, 1.2705078125, 1.38250732421875, 1.4945068359375, 1.60650634765625, 1.718505859375, 1.83050537109375, 1.9425048828125, 2.05450439453125, 2.16650390625, 2.27850341796875, 2.3905029296875, 2.50250244140625, 2.614501953125, 2.72650146484375, 2.8385009765625, 2.95050048828125, 3.0625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 13.0, 19.0, 31.0, 44.0, 75.0, 115.0, 166.0, 222.0, 410.0, 599.0, 917.0, 1367.0, 2247.0, 3362.0, 5108.0, 7698.0, 11426.0, 16656.0, 24384.0, 33506.0, 45886.0, 59661.0, 75141.0, 88416.0, 98057.0, 101351.0, 97561.0, 88268.0, 74427.0, 59582.0, 45154.0, 33209.0, 23755.0, 16436.0, 11110.0, 7459.0, 5098.0, 3282.0, 2272.0, 1386.0, 959.0, 604.0, 401.0, 254.0, 178.0, 105.0, 69.0, 33.0, 23.0, 19.0, 16.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.121795654296875, -2.05218505859375, -1.982574462890625, -1.9129638671875, -1.843353271484375, -1.77374267578125, -1.704132080078125, -1.634521484375, -1.564910888671875, -1.49530029296875, -1.425689697265625, -1.3560791015625, -1.286468505859375, -1.21685791015625, -1.147247314453125, -1.07763671875, -1.008026123046875, -0.93841552734375, -0.868804931640625, -0.7991943359375, -0.729583740234375, -0.65997314453125, -0.590362548828125, -0.520751953125, -0.451141357421875, -0.38153076171875, -0.311920166015625, -0.2423095703125, -0.172698974609375, -0.10308837890625, -0.033477783203125, 0.0361328125, 0.105743408203125, 0.17535400390625, 0.244964599609375, 0.3145751953125, 0.384185791015625, 0.45379638671875, 0.523406982421875, 0.593017578125, 0.662628173828125, 0.73223876953125, 0.801849365234375, 0.8714599609375, 0.941070556640625, 1.01068115234375, 1.080291748046875, 1.14990234375, 1.219512939453125, 1.28912353515625, 1.358734130859375, 1.4283447265625, 1.497955322265625, 1.56756591796875, 1.637176513671875, 1.706787109375, 1.776397705078125, 1.84600830078125, 1.915618896484375, 1.9852294921875, 2.054840087890625, 2.12445068359375, 2.194061279296875, 2.263671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 9.0, 7.0, 9.0, 9.0, 13.0, 11.0, 14.0, 25.0, 16.0, 19.0, 23.0, 27.0, 33.0, 36.0, 46.0, 36.0, 41.0, 41.0, 36.0, 43.0, 44.0, 50.0, 34.0, 37.0, 32.0, 36.0, 36.0, 25.0, 37.0, 27.0, 29.0, 16.0, 16.0, 13.0, 12.0, 20.0, 7.0, 4.0, 4.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.876953125, -1.816009521484375, -1.75506591796875, -1.694122314453125, -1.6331787109375, -1.572235107421875, -1.51129150390625, -1.450347900390625, -1.389404296875, -1.328460693359375, -1.26751708984375, -1.206573486328125, -1.1456298828125, -1.084686279296875, -1.02374267578125, -0.962799072265625, -0.90185546875, -0.840911865234375, -0.77996826171875, -0.719024658203125, -0.6580810546875, -0.597137451171875, -0.53619384765625, -0.475250244140625, -0.414306640625, -0.353363037109375, -0.29241943359375, -0.231475830078125, -0.1705322265625, -0.109588623046875, -0.04864501953125, 0.012298583984375, 0.0732421875, 0.134185791015625, 0.19512939453125, 0.256072998046875, 0.3170166015625, 0.377960205078125, 0.43890380859375, 0.499847412109375, 0.560791015625, 0.621734619140625, 0.68267822265625, 0.743621826171875, 0.8045654296875, 0.865509033203125, 0.92645263671875, 0.987396240234375, 1.04833984375, 1.109283447265625, 1.17022705078125, 1.231170654296875, 1.2921142578125, 1.353057861328125, 1.41400146484375, 1.474945068359375, 1.535888671875, 1.596832275390625, 1.65777587890625, 1.718719482421875, 1.7796630859375, 1.840606689453125, 1.90155029296875, 1.962493896484375, 2.0234375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 8.0, 17.0, 16.0, 31.0, 49.0, 64.0, 104.0, 160.0, 276.0, 417.0, 649.0, 1057.0, 1650.0, 2504.0, 4278.0, 6801.0, 10612.0, 16700.0, 26287.0, 39622.0, 58774.0, 83494.0, 110011.0, 129527.0, 133358.0, 120227.0, 96475.0, 70317.0, 47556.0, 31829.0, 20412.0, 13011.0, 8365.0, 5136.0, 3240.0, 2012.0, 1319.0, 814.0, 504.0, 340.0, 182.0, 118.0, 91.0, 38.0, 41.0, 13.0, 12.0, 14.0, 6.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2255859375, -1.1850433349609375, -1.144500732421875, -1.1039581298828125, -1.06341552734375, -1.0228729248046875, -0.982330322265625, -0.9417877197265625, -0.9012451171875, -0.8607025146484375, -0.820159912109375, -0.7796173095703125, -0.73907470703125, -0.6985321044921875, -0.657989501953125, -0.6174468994140625, -0.576904296875, -0.5363616943359375, -0.495819091796875, -0.4552764892578125, -0.41473388671875, -0.3741912841796875, -0.333648681640625, -0.2931060791015625, -0.2525634765625, -0.2120208740234375, -0.171478271484375, -0.1309356689453125, -0.09039306640625, -0.0498504638671875, -0.009307861328125, 0.0312347412109375, 0.07177734375, 0.1123199462890625, 0.152862548828125, 0.1934051513671875, 0.23394775390625, 0.2744903564453125, 0.315032958984375, 0.3555755615234375, 0.3961181640625, 0.4366607666015625, 0.477203369140625, 0.5177459716796875, 0.55828857421875, 0.5988311767578125, 0.639373779296875, 0.6799163818359375, 0.720458984375, 0.7610015869140625, 0.801544189453125, 0.8420867919921875, 0.88262939453125, 0.9231719970703125, 0.963714599609375, 1.0042572021484375, 1.0447998046875, 1.0853424072265625, 1.125885009765625, 1.1664276123046875, 1.20697021484375, 1.2475128173828125, 1.288055419921875, 1.3285980224609375, 1.369140625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 3.0, 4.0, 2.0, 9.0, 8.0, 12.0, 9.0, 14.0, 20.0, 25.0, 21.0, 29.0, 35.0, 45.0, 31.0, 52.0, 43.0, 57.0, 64.0, 38.0, 58.0, 41.0, 49.0, 51.0, 32.0, 33.0, 28.0, 34.0, 23.0, 28.0, 12.0, 17.0, 9.0, 17.0, 10.0, 9.0, 3.0, 3.0, 0.0, 4.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011819601058959961, -0.00011432264000177383, -0.00011044926941394806, -0.00010657589882612228, -0.00010270252823829651, -9.882915765047073e-05, -9.495578706264496e-05, -9.108241647481918e-05, -8.720904588699341e-05, -8.333567529916763e-05, -7.946230471134186e-05, -7.558893412351608e-05, -7.171556353569031e-05, -6.784219294786453e-05, -6.396882236003876e-05, -6.009545177221298e-05, -5.622208118438721e-05, -5.234871059656143e-05, -4.847534000873566e-05, -4.460196942090988e-05, -4.0728598833084106e-05, -3.685522824525833e-05, -3.2981857657432556e-05, -2.910848706960678e-05, -2.5235116481781006e-05, -2.136174589395523e-05, -1.7488375306129456e-05, -1.361500471830368e-05, -9.741634130477905e-06, -5.86826354265213e-06, -1.994892954826355e-06, 1.8784776329994202e-06, 5.751848220825195e-06, 9.62521880865097e-06, 1.3498589396476746e-05, 1.737195998430252e-05, 2.1245330572128296e-05, 2.511870115995407e-05, 2.8992071747779846e-05, 3.286544233560562e-05, 3.6738812923431396e-05, 4.061218351125717e-05, 4.448555409908295e-05, 4.835892468690872e-05, 5.22322952747345e-05, 5.610566586256027e-05, 5.997903645038605e-05, 6.385240703821182e-05, 6.77257776260376e-05, 7.159914821386337e-05, 7.547251880168915e-05, 7.934588938951492e-05, 8.32192599773407e-05, 8.709263056516647e-05, 9.096600115299225e-05, 9.483937174081802e-05, 9.87127423286438e-05, 0.00010258611291646957, 0.00010645948350429535, 0.00011033285409212112, 0.0001142062246799469, 0.00011807959526777267, 0.00012195296585559845, 0.00012582633644342422, 0.00012969970703125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 12.0, 12.0, 15.0, 26.0, 37.0, 58.0, 83.0, 122.0, 202.0, 338.0, 485.0, 824.0, 1417.0, 2381.0, 4230.0, 7386.0, 13318.0, 23954.0, 41704.0, 69351.0, 107934.0, 147231.0, 167980.0, 154615.0, 117312.0, 77189.0, 47160.0, 27307.0, 15535.0, 8596.0, 4858.0, 2742.0, 1631.0, 951.0, 540.0, 364.0, 239.0, 133.0, 87.0, 62.0, 45.0, 27.0, 16.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.6494140625, -1.598846435546875, -1.54827880859375, -1.497711181640625, -1.4471435546875, -1.396575927734375, -1.34600830078125, -1.295440673828125, -1.244873046875, -1.194305419921875, -1.14373779296875, -1.093170166015625, -1.0426025390625, -0.992034912109375, -0.94146728515625, -0.890899658203125, -0.84033203125, -0.789764404296875, -0.73919677734375, -0.688629150390625, -0.6380615234375, -0.587493896484375, -0.53692626953125, -0.486358642578125, -0.435791015625, -0.385223388671875, -0.33465576171875, -0.284088134765625, -0.2335205078125, -0.182952880859375, -0.13238525390625, -0.081817626953125, -0.03125, 0.019317626953125, 0.06988525390625, 0.120452880859375, 0.1710205078125, 0.221588134765625, 0.27215576171875, 0.322723388671875, 0.373291015625, 0.423858642578125, 0.47442626953125, 0.524993896484375, 0.5755615234375, 0.626129150390625, 0.67669677734375, 0.727264404296875, 0.77783203125, 0.828399658203125, 0.87896728515625, 0.929534912109375, 0.9801025390625, 1.030670166015625, 1.08123779296875, 1.131805419921875, 1.182373046875, 1.232940673828125, 1.28350830078125, 1.334075927734375, 1.3846435546875, 1.435211181640625, 1.48577880859375, 1.536346435546875, 1.5869140625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 8.0, 4.0, 5.0, 9.0, 15.0, 15.0, 15.0, 18.0, 30.0, 22.0, 40.0, 41.0, 56.0, 48.0, 55.0, 51.0, 65.0, 55.0, 57.0, 60.0, 59.0, 48.0, 33.0, 37.0, 23.0, 27.0, 26.0, 18.0, 7.0, 18.0, 10.0, 9.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.52734375, -0.5122222900390625, -0.497100830078125, -0.4819793701171875, -0.46685791015625, -0.4517364501953125, -0.436614990234375, -0.4214935302734375, -0.4063720703125, -0.3912506103515625, -0.376129150390625, -0.3610076904296875, -0.34588623046875, -0.3307647705078125, -0.315643310546875, -0.3005218505859375, -0.285400390625, -0.2702789306640625, -0.255157470703125, -0.2400360107421875, -0.22491455078125, -0.2097930908203125, -0.194671630859375, -0.1795501708984375, -0.1644287109375, -0.1493072509765625, -0.134185791015625, -0.1190643310546875, -0.10394287109375, -0.0888214111328125, -0.073699951171875, -0.0585784912109375, -0.04345703125, -0.0283355712890625, -0.013214111328125, 0.0019073486328125, 0.01702880859375, 0.0321502685546875, 0.047271728515625, 0.0623931884765625, 0.0775146484375, 0.0926361083984375, 0.107757568359375, 0.1228790283203125, 0.13800048828125, 0.1531219482421875, 0.168243408203125, 0.1833648681640625, 0.198486328125, 0.2136077880859375, 0.228729248046875, 0.2438507080078125, 0.25897216796875, 0.2740936279296875, 0.289215087890625, 0.3043365478515625, 0.3194580078125, 0.3345794677734375, 0.349700927734375, 0.3648223876953125, 0.37994384765625, 0.3950653076171875, 0.410186767578125, 0.4253082275390625, 0.4404296875]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 8.0, 5.0, 6.0, 8.0, 14.0, 21.0, 16.0, 19.0, 22.0, 24.0, 25.0, 31.0, 42.0, 47.0, 56.0, 47.0, 35.0, 64.0, 47.0, 54.0, 49.0, 42.0, 35.0, 38.0, 36.0, 36.0, 26.0, 29.0, 20.0, 16.0, 15.0, 18.0, 10.0, 6.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-4.22485876083374, -4.104077339172363, -3.9832959175109863, -3.8625144958496094, -3.7417328357696533, -3.6209514141082764, -3.5001699924468994, -3.3793885707855225, -3.2586071491241455, -3.1378257274627686, -3.0170443058013916, -2.8962626457214355, -2.7754812240600586, -2.6546998023986816, -2.5339183807373047, -2.4131369590759277, -2.292355537414551, -2.171574115753174, -2.050792694091797, -1.9300111532211304, -1.8092297315597534, -1.688448190689087, -1.56766676902771, -1.446885347366333, -1.326103687286377, -1.205322265625, -1.0845407247543335, -0.9637593030929565, -0.8429778814315796, -0.7221964001655579, -0.6014149188995361, -0.4806334972381592, -0.3598520755767822, -0.23907062411308289, -0.11828915774822235, 0.0024923086166381836, 0.12327376008033752, 0.24405521154403687, 0.3648366928100586, 0.48561811447143555, 0.6063995957374573, 0.727181077003479, 0.847962498664856, 0.9687439799308777, 1.0895254611968994, 1.2103068828582764, 1.3310883045196533, 1.4518697261810303, 1.5726512670516968, 1.6934326887130737, 1.8142142295837402, 1.9349956512451172, 2.055777072906494, 2.176558494567871, 2.297339916229248, 2.418121337890625, 2.538902997970581, 2.659684419631958, 2.780465841293335, 2.901247501373291, 3.022028923034668, 3.142810344696045, 3.263591766357422, 3.384373188018799, 3.505154609680176]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 5.0, 13.0, 11.0, 13.0, 11.0, 15.0, 14.0, 10.0, 21.0, 31.0, 17.0, 29.0, 16.0, 23.0, 43.0, 42.0, 46.0, 36.0, 40.0, 43.0, 33.0, 31.0, 36.0, 35.0, 38.0, 28.0, 25.0, 27.0, 29.0, 33.0, 29.0, 31.0, 32.0, 21.0, 21.0, 14.0, 9.0, 7.0, 8.0, 7.0, 4.0, 5.0, 5.0, 1.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.1431915760040283, -3.0495197772979736, -2.95584774017334, -2.862175941467285, -2.7685039043426514, -2.6748321056365967, -2.581160068511963, -2.487488269805908, -2.3938164710998535, -2.300144672393799, -2.206472635269165, -2.1128008365631104, -2.0191287994384766, -1.9254570007324219, -1.8317850828170776, -1.7381131649017334, -1.6444411277770996, -1.5507692098617554, -1.4570972919464111, -1.3634254932403564, -1.2697534561157227, -1.176081657409668, -1.0824097394943237, -0.9887378215789795, -0.8950659036636353, -0.801393985748291, -0.7077220678329468, -0.6140502095222473, -0.5203782916069031, -0.42670637369155884, -0.3330345153808594, -0.23936259746551514, -0.1456906795501709, -0.052018776535987854, 0.04165312647819519, 0.13532501459121704, 0.22899693250656128, 0.3226688504219055, 0.416340708732605, 0.5100126266479492, 0.6036845445632935, 0.6973564624786377, 0.7910283803939819, 0.8847002387046814, 0.9783721566200256, 1.0720441341400146, 1.1657159328460693, 1.2593878507614136, 1.3530597686767578, 1.446731686592102, 1.5404036045074463, 1.634075403213501, 1.7277474403381348, 1.8214192390441895, 1.9150911569595337, 2.008763074874878, 2.1024351119995117, 2.1961069107055664, 2.2897789478302, 2.383450746536255, 2.4771227836608887, 2.5707945823669434, 2.664466381072998, 2.758138418197632, 2.8518102169036865]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 4.0, 20.0, 29.0, 46.0, 79.0, 131.0, 272.0, 391.0, 686.0, 1197.0, 2095.0, 3493.0, 5949.0, 10059.0, 17194.0, 29291.0, 49105.0, 82382.0, 135537.0, 218028.0, 333862.0, 471331.0, 586323.0, 614515.0, 534788.0, 400673.0, 268946.0, 170313.0, 104122.0, 62720.0, 37253.0, 21943.0, 12822.0, 7597.0, 4469.0, 2624.0, 1623.0, 927.0, 583.0, 347.0, 201.0, 127.0, 81.0, 48.0, 19.0, 19.0, 12.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.354217529296875, -3.25335693359375, -3.152496337890625, -3.0516357421875, -2.950775146484375, -2.84991455078125, -2.749053955078125, -2.648193359375, -2.547332763671875, -2.44647216796875, -2.345611572265625, -2.2447509765625, -2.143890380859375, -2.04302978515625, -1.942169189453125, -1.84130859375, -1.740447998046875, -1.63958740234375, -1.538726806640625, -1.4378662109375, -1.337005615234375, -1.23614501953125, -1.135284423828125, -1.034423828125, -0.933563232421875, -0.83270263671875, -0.731842041015625, -0.6309814453125, -0.530120849609375, -0.42926025390625, -0.328399658203125, -0.2275390625, -0.126678466796875, -0.02581787109375, 0.075042724609375, 0.1759033203125, 0.276763916015625, 0.37762451171875, 0.478485107421875, 0.579345703125, 0.680206298828125, 0.78106689453125, 0.881927490234375, 0.9827880859375, 1.083648681640625, 1.18450927734375, 1.285369873046875, 1.38623046875, 1.487091064453125, 1.58795166015625, 1.688812255859375, 1.7896728515625, 1.890533447265625, 1.99139404296875, 2.092254638671875, 2.193115234375, 2.293975830078125, 2.39483642578125, 2.495697021484375, 2.5965576171875, 2.697418212890625, 2.79827880859375, 2.899139404296875, 3.0]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 9.0, 7.0, 8.0, 10.0, 12.0, 14.0, 10.0, 6.0, 26.0, 20.0, 21.0, 24.0, 31.0, 26.0, 27.0, 22.0, 36.0, 36.0, 39.0, 44.0, 29.0, 38.0, 41.0, 41.0, 33.0, 32.0, 34.0, 40.0, 21.0, 23.0, 33.0, 26.0, 38.0, 26.0, 21.0, 14.0, 19.0, 9.0, 14.0, 8.0, 9.0, 6.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.29296875, -2.22369384765625, -2.1544189453125, -2.08514404296875, -2.015869140625, -1.94659423828125, -1.8773193359375, -1.80804443359375, -1.73876953125, -1.66949462890625, -1.6002197265625, -1.53094482421875, -1.461669921875, -1.39239501953125, -1.3231201171875, -1.25384521484375, -1.1845703125, -1.11529541015625, -1.0460205078125, -0.97674560546875, -0.907470703125, -0.83819580078125, -0.7689208984375, -0.69964599609375, -0.63037109375, -0.56109619140625, -0.4918212890625, -0.42254638671875, -0.353271484375, -0.28399658203125, -0.2147216796875, -0.14544677734375, -0.076171875, -0.00689697265625, 0.0623779296875, 0.13165283203125, 0.200927734375, 0.27020263671875, 0.3394775390625, 0.40875244140625, 0.47802734375, 0.54730224609375, 0.6165771484375, 0.68585205078125, 0.755126953125, 0.82440185546875, 0.8936767578125, 0.96295166015625, 1.0322265625, 1.10150146484375, 1.1707763671875, 1.24005126953125, 1.309326171875, 1.37860107421875, 1.4478759765625, 1.51715087890625, 1.58642578125, 1.65570068359375, 1.7249755859375, 1.79425048828125, 1.863525390625, 1.93280029296875, 2.0020751953125, 2.07135009765625, 2.140625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 9.0, 15.0, 31.0, 45.0, 51.0, 89.0, 166.0, 289.0, 402.0, 664.0, 1007.0, 1587.0, 2496.0, 4083.0, 6273.0, 10156.0, 16180.0, 25516.0, 39593.0, 62067.0, 95848.0, 143532.0, 207974.0, 288727.0, 375839.0, 450274.0, 489673.0, 475683.0, 416226.0, 331561.0, 246202.0, 173157.0, 115966.0, 76782.0, 49480.0, 31924.0, 20212.0, 12747.0, 8086.0, 5080.0, 3100.0, 2039.0, 1233.0, 821.0, 543.0, 351.0, 207.0, 117.0, 74.0, 42.0, 35.0, 11.0, 12.0, 7.0, 5.0, 2.0, 1.0], "bins": [-2.947265625, -2.85992431640625, -2.7725830078125, -2.68524169921875, -2.597900390625, -2.51055908203125, -2.4232177734375, -2.33587646484375, -2.24853515625, -2.16119384765625, -2.0738525390625, -1.98651123046875, -1.899169921875, -1.81182861328125, -1.7244873046875, -1.63714599609375, -1.5498046875, -1.46246337890625, -1.3751220703125, -1.28778076171875, -1.200439453125, -1.11309814453125, -1.0257568359375, -0.93841552734375, -0.85107421875, -0.76373291015625, -0.6763916015625, -0.58905029296875, -0.501708984375, -0.41436767578125, -0.3270263671875, -0.23968505859375, -0.15234375, -0.06500244140625, 0.0223388671875, 0.10968017578125, 0.197021484375, 0.28436279296875, 0.3717041015625, 0.45904541015625, 0.54638671875, 0.63372802734375, 0.7210693359375, 0.80841064453125, 0.895751953125, 0.98309326171875, 1.0704345703125, 1.15777587890625, 1.2451171875, 1.33245849609375, 1.4197998046875, 1.50714111328125, 1.594482421875, 1.68182373046875, 1.7691650390625, 1.85650634765625, 1.94384765625, 2.03118896484375, 2.1185302734375, 2.20587158203125, 2.293212890625, 2.38055419921875, 2.4678955078125, 2.55523681640625, 2.642578125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 10.0, 10.0, 17.0, 20.0, 20.0, 35.0, 53.0, 46.0, 58.0, 85.0, 91.0, 110.0, 129.0, 128.0, 147.0, 165.0, 174.0, 198.0, 203.0, 230.0, 232.0, 196.0, 193.0, 205.0, 198.0, 151.0, 165.0, 145.0, 123.0, 97.0, 78.0, 80.0, 59.0, 41.0, 38.0, 33.0, 23.0, 27.0, 17.0, 8.0, 8.0, 7.0, 3.0, 3.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1787109375, -1.141021728515625, -1.10333251953125, -1.065643310546875, -1.0279541015625, -0.990264892578125, -0.95257568359375, -0.914886474609375, -0.877197265625, -0.839508056640625, -0.80181884765625, -0.764129638671875, -0.7264404296875, -0.688751220703125, -0.65106201171875, -0.613372802734375, -0.57568359375, -0.537994384765625, -0.50030517578125, -0.462615966796875, -0.4249267578125, -0.387237548828125, -0.34954833984375, -0.311859130859375, -0.274169921875, -0.236480712890625, -0.19879150390625, -0.161102294921875, -0.1234130859375, -0.085723876953125, -0.04803466796875, -0.010345458984375, 0.02734375, 0.065032958984375, 0.10272216796875, 0.140411376953125, 0.1781005859375, 0.215789794921875, 0.25347900390625, 0.291168212890625, 0.328857421875, 0.366546630859375, 0.40423583984375, 0.441925048828125, 0.4796142578125, 0.517303466796875, 0.55499267578125, 0.592681884765625, 0.63037109375, 0.668060302734375, 0.70574951171875, 0.743438720703125, 0.7811279296875, 0.818817138671875, 0.85650634765625, 0.894195556640625, 0.931884765625, 0.969573974609375, 1.00726318359375, 1.044952392578125, 1.0826416015625, 1.120330810546875, 1.15802001953125, 1.195709228515625, 1.2333984375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 3.0, 5.0, 7.0, 7.0, 13.0, 13.0, 11.0, 12.0, 18.0, 18.0, 35.0, 25.0, 34.0, 36.0, 41.0, 37.0, 53.0, 46.0, 55.0, 55.0, 45.0, 59.0, 46.0, 50.0, 38.0, 32.0, 32.0, 27.0, 25.0, 22.0, 16.0, 21.0, 16.0, 5.0, 7.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.9893364906311035, -3.8648409843444824, -3.7403454780578613, -3.6158499717712402, -3.491354465484619, -3.366858959197998, -3.242363691329956, -3.117868185043335, -2.993372678756714, -2.8688771724700928, -2.7443816661834717, -2.6198861598968506, -2.4953908920288086, -2.3708953857421875, -2.2463998794555664, -2.1219043731689453, -1.9974088668823242, -1.8729133605957031, -1.748417854309082, -1.6239224672317505, -1.4994269609451294, -1.3749314546585083, -1.2504360675811768, -1.1259405612945557, -1.0014450550079346, -0.8769495487213135, -0.7524541020393372, -0.6279586553573608, -0.5034631490707397, -0.37896764278411865, -0.25447219610214233, -0.12997674942016602, -0.005481243133544922, 0.11901423335075378, 0.2435097098350525, 0.3680051863193512, 0.4925006628036499, 0.616996169090271, 0.7414916157722473, 0.8659870624542236, 0.9904825687408447, 1.1149780750274658, 1.239473581314087, 1.3639689683914185, 1.4884644746780396, 1.6129599809646606, 1.7374553680419922, 1.8619508743286133, 1.9864463806152344, 2.1109418869018555, 2.2354373931884766, 2.3599328994750977, 2.4844284057617188, 2.60892391204834, 2.733419179916382, 2.857914686203003, 2.982410192489624, 3.106905698776245, 3.231401205062866, 3.3558967113494873, 3.4803919792175293, 3.6048874855041504, 3.7293829917907715, 3.8538784980773926, 3.9783740043640137]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 7.0, 6.0, 8.0, 11.0, 11.0, 13.0, 13.0, 13.0, 14.0, 22.0, 23.0, 30.0, 31.0, 29.0, 26.0, 24.0, 43.0, 34.0, 41.0, 44.0, 42.0, 52.0, 51.0, 30.0, 36.0, 32.0, 43.0, 36.0, 23.0, 33.0, 26.0, 24.0, 26.0, 20.0, 13.0, 11.0, 15.0, 10.0, 10.0, 5.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.173985004425049, -3.0850977897644043, -2.9962103366851807, -2.907323122024536, -2.8184356689453125, -2.729548454284668, -2.6406612396240234, -2.551774024963379, -2.4628865718841553, -2.3739993572235107, -2.285111904144287, -2.1962246894836426, -2.107337474822998, -2.0184500217437744, -1.9295628070831299, -1.8406754732131958, -1.7517881393432617, -1.6629008054733276, -1.5740134716033936, -1.485126256942749, -1.396238923072815, -1.3073515892028809, -1.2184643745422363, -1.1295770406723022, -1.0406897068023682, -0.9518023729324341, -0.8629150986671448, -0.7740278244018555, -0.6851404905319214, -0.5962531566619873, -0.507365882396698, -0.4184786081314087, -0.3295912742614746, -0.24070397019386292, -0.15181666612625122, -0.06292936205863953, 0.025957942008972168, 0.11484524607658386, 0.20373255014419556, 0.29261982440948486, 0.38150715827941895, 0.47039446234703064, 0.5592817664146423, 0.6481690406799316, 0.7370563745498657, 0.8259437084197998, 0.9148309826850891, 1.0037182569503784, 1.0926055908203125, 1.1814929246902466, 1.2703802585601807, 1.3592674732208252, 1.4481548070907593, 1.5370421409606934, 1.625929355621338, 1.714816689491272, 1.803704023361206, 1.8925913572311401, 1.9814786911010742, 2.0703659057617188, 2.1592531204223633, 2.248140573501587, 2.3370277881622314, 2.425915241241455, 2.5148024559020996]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 8.0, 18.0, 16.0, 29.0, 37.0, 43.0, 73.0, 98.0, 147.0, 217.0, 295.0, 466.0, 684.0, 1017.0, 1496.0, 2210.0, 3470.0, 5429.0, 8524.0, 13658.0, 21833.0, 36445.0, 60588.0, 99224.0, 153998.0, 193685.0, 163860.0, 108491.0, 66615.0, 40262.0, 24327.0, 14573.0, 9328.0, 6025.0, 3902.0, 2444.0, 1580.0, 1082.0, 760.0, 486.0, 341.0, 228.0, 177.0, 108.0, 74.0, 46.0, 49.0, 31.0, 20.0, 15.0, 8.0, 10.0, 7.0, 4.0, 0.0, 3.0, 1.0], "bins": [-0.77490234375, -0.751129150390625, -0.72735595703125, -0.703582763671875, -0.6798095703125, -0.656036376953125, -0.63226318359375, -0.608489990234375, -0.584716796875, -0.560943603515625, -0.53717041015625, -0.513397216796875, -0.4896240234375, -0.465850830078125, -0.44207763671875, -0.418304443359375, -0.39453125, -0.370758056640625, -0.34698486328125, -0.323211669921875, -0.2994384765625, -0.275665283203125, -0.25189208984375, -0.228118896484375, -0.204345703125, -0.180572509765625, -0.15679931640625, -0.133026123046875, -0.1092529296875, -0.085479736328125, -0.06170654296875, -0.037933349609375, -0.01416015625, 0.009613037109375, 0.03338623046875, 0.057159423828125, 0.0809326171875, 0.104705810546875, 0.12847900390625, 0.152252197265625, 0.176025390625, 0.199798583984375, 0.22357177734375, 0.247344970703125, 0.2711181640625, 0.294891357421875, 0.31866455078125, 0.342437744140625, 0.3662109375, 0.389984130859375, 0.41375732421875, 0.437530517578125, 0.4613037109375, 0.485076904296875, 0.50885009765625, 0.532623291015625, 0.556396484375, 0.580169677734375, 0.60394287109375, 0.627716064453125, 0.6514892578125, 0.675262451171875, 0.69903564453125, 0.722808837890625, 0.74658203125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 12.0, 2.0, 10.0, 8.0, 6.0, 11.0, 14.0, 11.0, 25.0, 18.0, 14.0, 23.0, 23.0, 30.0, 30.0, 34.0, 32.0, 26.0, 26.0, 34.0, 42.0, 44.0, 41.0, 35.0, 41.0, 40.0, 39.0, 29.0, 34.0, 33.0, 23.0, 23.0, 25.0, 15.0, 15.0, 19.0, 16.0, 21.0, 12.0, 11.0, 8.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.798828125, -2.71405029296875, -2.6292724609375, -2.54449462890625, -2.459716796875, -2.37493896484375, -2.2901611328125, -2.20538330078125, -2.12060546875, -2.03582763671875, -1.9510498046875, -1.86627197265625, -1.781494140625, -1.69671630859375, -1.6119384765625, -1.52716064453125, -1.4423828125, -1.35760498046875, -1.2728271484375, -1.18804931640625, -1.103271484375, -1.01849365234375, -0.9337158203125, -0.84893798828125, -0.76416015625, -0.67938232421875, -0.5946044921875, -0.50982666015625, -0.425048828125, -0.34027099609375, -0.2554931640625, -0.17071533203125, -0.0859375, -0.00115966796875, 0.0836181640625, 0.16839599609375, 0.253173828125, 0.33795166015625, 0.4227294921875, 0.50750732421875, 0.59228515625, 0.67706298828125, 0.7618408203125, 0.84661865234375, 0.931396484375, 1.01617431640625, 1.1009521484375, 1.18572998046875, 1.2705078125, 1.35528564453125, 1.4400634765625, 1.52484130859375, 1.609619140625, 1.69439697265625, 1.7791748046875, 1.86395263671875, 1.94873046875, 2.03350830078125, 2.1182861328125, 2.20306396484375, 2.287841796875, 2.37261962890625, 2.4573974609375, 2.54217529296875, 2.626953125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 6.0, 14.0, 16.0, 15.0, 41.0, 53.0, 75.0, 79.0, 139.0, 200.0, 289.0, 393.0, 596.0, 909.0, 1461.0, 2286.0, 3582.0, 5956.0, 9560.0, 16144.0, 27563.0, 47569.0, 83497.0, 141846.0, 207312.0, 195011.0, 126615.0, 73590.0, 41948.0, 24468.0, 14294.0, 8506.0, 5291.0, 3288.0, 1994.0, 1298.0, 867.0, 588.0, 351.0, 260.0, 183.0, 116.0, 71.0, 65.0, 43.0, 36.0, 21.0, 13.0, 12.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8525390625, -0.8249359130859375, -0.797332763671875, -0.7697296142578125, -0.74212646484375, -0.7145233154296875, -0.686920166015625, -0.6593170166015625, -0.6317138671875, -0.6041107177734375, -0.576507568359375, -0.5489044189453125, -0.52130126953125, -0.4936981201171875, -0.466094970703125, -0.4384918212890625, -0.410888671875, -0.3832855224609375, -0.355682373046875, -0.3280792236328125, -0.30047607421875, -0.2728729248046875, -0.245269775390625, -0.2176666259765625, -0.1900634765625, -0.1624603271484375, -0.134857177734375, -0.1072540283203125, -0.07965087890625, -0.0520477294921875, -0.024444580078125, 0.0031585693359375, 0.03076171875, 0.0583648681640625, 0.085968017578125, 0.1135711669921875, 0.14117431640625, 0.1687774658203125, 0.196380615234375, 0.2239837646484375, 0.2515869140625, 0.2791900634765625, 0.306793212890625, 0.3343963623046875, 0.36199951171875, 0.3896026611328125, 0.417205810546875, 0.4448089599609375, 0.472412109375, 0.5000152587890625, 0.527618408203125, 0.5552215576171875, 0.58282470703125, 0.6104278564453125, 0.638031005859375, 0.6656341552734375, 0.6932373046875, 0.7208404541015625, 0.748443603515625, 0.7760467529296875, 0.80364990234375, 0.8312530517578125, 0.858856201171875, 0.8864593505859375, 0.9140625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 2.0, 7.0, 5.0, 16.0, 10.0, 16.0, 18.0, 18.0, 16.0, 26.0, 29.0, 30.0, 25.0, 29.0, 34.0, 35.0, 37.0, 36.0, 54.0, 43.0, 53.0, 29.0, 57.0, 41.0, 48.0, 27.0, 33.0, 30.0, 30.0, 22.0, 26.0, 19.0, 18.0, 17.0, 12.0, 8.0, 10.0, 9.0, 9.0, 4.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.6904754638671875, -1.629974365234375, -1.5694732666015625, -1.50897216796875, -1.4484710693359375, -1.387969970703125, -1.3274688720703125, -1.2669677734375, -1.2064666748046875, -1.145965576171875, -1.0854644775390625, -1.02496337890625, -0.9644622802734375, -0.903961181640625, -0.8434600830078125, -0.782958984375, -0.7224578857421875, -0.661956787109375, -0.6014556884765625, -0.54095458984375, -0.4804534912109375, -0.419952392578125, -0.3594512939453125, -0.2989501953125, -0.2384490966796875, -0.177947998046875, -0.1174468994140625, -0.05694580078125, 0.0035552978515625, 0.064056396484375, 0.1245574951171875, 0.18505859375, 0.2455596923828125, 0.306060791015625, 0.3665618896484375, 0.42706298828125, 0.4875640869140625, 0.548065185546875, 0.6085662841796875, 0.6690673828125, 0.7295684814453125, 0.790069580078125, 0.8505706787109375, 0.91107177734375, 0.9715728759765625, 1.032073974609375, 1.0925750732421875, 1.153076171875, 1.2135772705078125, 1.274078369140625, 1.3345794677734375, 1.39508056640625, 1.4555816650390625, 1.516082763671875, 1.5765838623046875, 1.6370849609375, 1.6975860595703125, 1.758087158203125, 1.8185882568359375, 1.87908935546875, 1.9395904541015625, 2.000091552734375, 2.0605926513671875, 2.12109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 12.0, 14.0, 30.0, 30.0, 41.0, 68.0, 91.0, 134.0, 209.0, 318.0, 634.0, 1106.0, 2117.0, 4880.0, 12822.0, 45147.0, 245932.0, 566503.0, 125206.0, 27078.0, 8762.0, 3549.0, 1709.0, 837.0, 464.0, 298.0, 195.0, 106.0, 88.0, 43.0, 33.0, 21.0, 13.0, 9.0, 13.0, 9.0, 9.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.48291015625, -0.46697998046875, -0.4510498046875, -0.43511962890625, -0.419189453125, -0.40325927734375, -0.3873291015625, -0.37139892578125, -0.35546875, -0.33953857421875, -0.3236083984375, -0.30767822265625, -0.291748046875, -0.27581787109375, -0.2598876953125, -0.24395751953125, -0.22802734375, -0.21209716796875, -0.1961669921875, -0.18023681640625, -0.164306640625, -0.14837646484375, -0.1324462890625, -0.11651611328125, -0.1005859375, -0.08465576171875, -0.0687255859375, -0.05279541015625, -0.036865234375, -0.02093505859375, -0.0050048828125, 0.01092529296875, 0.02685546875, 0.04278564453125, 0.0587158203125, 0.07464599609375, 0.090576171875, 0.10650634765625, 0.1224365234375, 0.13836669921875, 0.154296875, 0.17022705078125, 0.1861572265625, 0.20208740234375, 0.218017578125, 0.23394775390625, 0.2498779296875, 0.26580810546875, 0.28173828125, 0.29766845703125, 0.3135986328125, 0.32952880859375, 0.345458984375, 0.36138916015625, 0.3773193359375, 0.39324951171875, 0.4091796875, 0.42510986328125, 0.4410400390625, 0.45697021484375, 0.472900390625, 0.48883056640625, 0.5047607421875, 0.52069091796875, 0.53662109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 6.0, 2.0, 11.0, 13.0, 16.0, 16.0, 34.0, 39.0, 50.0, 70.0, 75.0, 81.0, 82.0, 80.0, 75.0, 72.0, 67.0, 60.0, 33.0, 42.0, 18.0, 20.0, 7.0, 11.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9861927032470703e-05, -2.9025599360466003e-05, -2.8189271688461304e-05, -2.7352944016456604e-05, -2.6516616344451904e-05, -2.5680288672447205e-05, -2.4843961000442505e-05, -2.4007633328437805e-05, -2.3171305656433105e-05, -2.2334977984428406e-05, -2.1498650312423706e-05, -2.0662322640419006e-05, -1.9825994968414307e-05, -1.8989667296409607e-05, -1.8153339624404907e-05, -1.7317011952400208e-05, -1.6480684280395508e-05, -1.5644356608390808e-05, -1.4808028936386108e-05, -1.3971701264381409e-05, -1.3135373592376709e-05, -1.229904592037201e-05, -1.146271824836731e-05, -1.062639057636261e-05, -9.79006290435791e-06, -8.95373523235321e-06, -8.11740756034851e-06, -7.281079888343811e-06, -6.444752216339111e-06, -5.608424544334412e-06, -4.772096872329712e-06, -3.935769200325012e-06, -3.0994415283203125e-06, -2.263113856315613e-06, -1.426786184310913e-06, -5.904585123062134e-07, 2.4586915969848633e-07, 1.082196831703186e-06, 1.9185245037078857e-06, 2.7548521757125854e-06, 3.591179847717285e-06, 4.427507519721985e-06, 5.2638351917266846e-06, 6.100162863731384e-06, 6.936490535736084e-06, 7.772818207740784e-06, 8.609145879745483e-06, 9.445473551750183e-06, 1.0281801223754883e-05, 1.1118128895759583e-05, 1.1954456567764282e-05, 1.2790784239768982e-05, 1.3627111911773682e-05, 1.4463439583778381e-05, 1.529976725578308e-05, 1.613609492778778e-05, 1.697242259979248e-05, 1.780875027179718e-05, 1.864507794380188e-05, 1.948140561580658e-05, 2.031773328781128e-05, 2.115406095981598e-05, 2.199038863182068e-05, 2.282671630382538e-05, 2.3663043975830078e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 5.0, 3.0, 9.0, 13.0, 19.0, 19.0, 32.0, 51.0, 74.0, 98.0, 124.0, 194.0, 251.0, 419.0, 686.0, 1179.0, 2027.0, 3861.0, 7368.0, 15341.0, 32202.0, 75592.0, 184196.0, 327620.0, 225363.0, 94687.0, 39855.0, 17994.0, 8805.0, 4509.0, 2431.0, 1304.0, 785.0, 454.0, 303.0, 207.0, 112.0, 105.0, 80.0, 51.0, 31.0, 39.0, 18.0, 15.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.359130859375, -0.3487586975097656, -0.33838653564453125, -0.3280143737792969, -0.3176422119140625, -0.3072700500488281, -0.29689788818359375, -0.2865257263183594, -0.276153564453125, -0.2657814025878906, -0.25540924072265625, -0.24503707885742188, -0.2346649169921875, -0.22429275512695312, -0.21392059326171875, -0.20354843139648438, -0.19317626953125, -0.18280410766601562, -0.17243194580078125, -0.16205978393554688, -0.1516876220703125, -0.14131546020507812, -0.13094329833984375, -0.12057113647460938, -0.110198974609375, -0.09982681274414062, -0.08945465087890625, -0.07908248901367188, -0.0687103271484375, -0.058338165283203125, -0.04796600341796875, -0.037593841552734375, -0.0272216796875, -0.016849517822265625, -0.00647735595703125, 0.003894805908203125, 0.0142669677734375, 0.024639129638671875, 0.03501129150390625, 0.045383453369140625, 0.055755615234375, 0.06612777709960938, 0.07649993896484375, 0.08687210083007812, 0.0972442626953125, 0.10761642456054688, 0.11798858642578125, 0.12836074829101562, 0.13873291015625, 0.14910507202148438, 0.15947723388671875, 0.16984939575195312, 0.1802215576171875, 0.19059371948242188, 0.20096588134765625, 0.21133804321289062, 0.221710205078125, 0.23208236694335938, 0.24245452880859375, 0.2528266906738281, 0.2631988525390625, 0.2735710144042969, 0.28394317626953125, 0.2943153381347656, 0.3046875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 3.0, 10.0, 16.0, 9.0, 20.0, 21.0, 22.0, 41.0, 35.0, 46.0, 33.0, 59.0, 41.0, 47.0, 63.0, 42.0, 51.0, 46.0, 44.0, 45.0, 38.0, 30.0, 37.0, 22.0, 36.0, 27.0, 15.0, 15.0, 18.0, 8.0, 11.0, 6.0, 2.0, 9.0, 5.0, 3.0, 1.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.058807373046875, -0.05706214904785156, -0.055316925048828125, -0.05357170104980469, -0.05182647705078125, -0.05008125305175781, -0.048336029052734375, -0.04659080505371094, -0.0448455810546875, -0.04310035705566406, -0.041355133056640625, -0.03960990905761719, -0.03786468505859375, -0.03611946105957031, -0.034374237060546875, -0.03262901306152344, -0.0308837890625, -0.029138565063476562, -0.027393341064453125, -0.025648117065429688, -0.02390289306640625, -0.022157669067382812, -0.020412445068359375, -0.018667221069335938, -0.0169219970703125, -0.015176773071289062, -0.013431549072265625, -0.011686325073242188, -0.00994110107421875, -0.008195877075195312, -0.006450653076171875, -0.0047054290771484375, -0.002960205078125, -0.0012149810791015625, 0.000530242919921875, 0.0022754669189453125, 0.00402069091796875, 0.0057659149169921875, 0.007511138916015625, 0.009256362915039062, 0.0110015869140625, 0.012746810913085938, 0.014492034912109375, 0.016237258911132812, 0.01798248291015625, 0.019727706909179688, 0.021472930908203125, 0.023218154907226562, 0.02496337890625, 0.026708602905273438, 0.028453826904296875, 0.030199050903320312, 0.03194427490234375, 0.03368949890136719, 0.035434722900390625, 0.03717994689941406, 0.0389251708984375, 0.04067039489746094, 0.042415618896484375, 0.04416084289550781, 0.04590606689453125, 0.04765129089355469, 0.049396514892578125, 0.05114173889160156, 0.052886962890625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 4.0, 5.0, 6.0, 6.0, 13.0, 10.0, 16.0, 10.0, 18.0, 22.0, 26.0, 32.0, 32.0, 40.0, 39.0, 41.0, 51.0, 44.0, 54.0, 60.0, 52.0, 58.0, 44.0, 50.0, 31.0, 32.0, 34.0, 26.0, 28.0, 17.0, 24.0, 16.0, 13.0, 7.0, 7.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0174078941345215, -3.8919522762298584, -3.766496419906616, -3.641040802001953, -3.515584945678711, -3.390129327774048, -3.2646737098693848, -3.1392178535461426, -3.0137622356414795, -2.8883066177368164, -2.762850761413574, -2.637395143508911, -2.511939525604248, -2.386483669281006, -2.2610280513763428, -2.1355724334716797, -2.0101165771484375, -1.8846608400344849, -1.7592051029205322, -1.6337494850158691, -1.5082937479019165, -1.3828380107879639, -1.2573823928833008, -1.1319266557693481, -1.0064709186553955, -0.8810151815414429, -0.755559504032135, -0.6301038265228271, -0.5046480894088745, -0.3791923522949219, -0.253736674785614, -0.12828099727630615, -0.0028257369995117188, 0.12262997031211853, 0.24808567762374878, 0.37354138493537903, 0.4989970922470093, 0.6244528293609619, 0.7499085068702698, 0.8753641843795776, 1.0008199214935303, 1.126275658607483, 1.2517313957214355, 1.3771870136260986, 1.5026427507400513, 1.628098487854004, 1.753554105758667, 1.8790098428726196, 2.0044655799865723, 2.1299211978912354, 2.2553770542144775, 2.3808326721191406, 2.506288528442383, 2.631744146347046, 2.757199764251709, 2.882655620574951, 3.0081112384796143, 3.1335668563842773, 3.2590227127075195, 3.3844783306121826, 3.5099339485168457, 3.635389804840088, 3.760845422744751, 3.886301040649414, 4.011756896972656]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 8.0, 7.0, 7.0, 11.0, 12.0, 12.0, 13.0, 10.0, 17.0, 21.0, 20.0, 30.0, 32.0, 33.0, 23.0, 26.0, 36.0, 37.0, 42.0, 40.0, 42.0, 54.0, 51.0, 35.0, 35.0, 28.0, 40.0, 37.0, 29.0, 29.0, 34.0, 21.0, 27.0, 16.0, 16.0, 10.0, 15.0, 10.0, 11.0, 5.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.1854891777038574, -3.0970325469970703, -3.008575677871704, -2.920119047164917, -2.831662178039551, -2.7432055473327637, -2.6547489166259766, -2.5662920475006104, -2.4778354167938232, -2.389378786087036, -2.30092191696167, -2.212465286254883, -2.1240084171295166, -2.0355517864227295, -1.9470950365066528, -1.8586382865905762, -1.7701815366744995, -1.6817247867584229, -1.5932680368423462, -1.5048112869262695, -1.4163546562194824, -1.3278979063034058, -1.239441156387329, -1.150984525680542, -1.0625276565551758, -0.9740709066390991, -0.8856142163276672, -0.7971574664115906, -0.7087007761001587, -0.620244026184082, -0.5317872762680054, -0.4433305859565735, -0.3548738956451416, -0.26641717553138733, -0.17796044051647186, -0.0895037055015564, -0.001046985387802124, 0.08740973472595215, 0.1758664846420288, 0.2643231749534607, 0.35277992486953735, 0.4412366449832916, 0.5296933650970459, 0.6181501150131226, 0.7066068649291992, 0.7950635552406311, 0.8835203051567078, 0.9719769954681396, 1.0604337453842163, 1.148890495300293, 1.2373472452163696, 1.3258039951324463, 1.4142606258392334, 1.50271737575531, 1.5911741256713867, 1.6796307563781738, 1.76808762550354, 1.8565443754196167, 1.9450011253356934, 2.0334577560424805, 2.1219146251678467, 2.210371255874634, 2.298828125, 2.387284755706787, 2.475741386413574]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 4.0, 5.0, 2.0, 10.0, 17.0, 20.0, 33.0, 52.0, 71.0, 112.0, 171.0, 253.0, 417.0, 579.0, 902.0, 1329.0, 2025.0, 2983.0, 4490.0, 6780.0, 9931.0, 14543.0, 21337.0, 30058.0, 41681.0, 55459.0, 71356.0, 86762.0, 98650.0, 104133.0, 102490.0, 92008.0, 78253.0, 62602.0, 47415.0, 34409.0, 24540.0, 17068.0, 11731.0, 8074.0, 5283.0, 3470.0, 2396.0, 1598.0, 1016.0, 701.0, 457.0, 293.0, 213.0, 137.0, 95.0, 48.0, 32.0, 25.0, 25.0, 11.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.248046875, -2.177154541015625, -2.10626220703125, -2.035369873046875, -1.9644775390625, -1.893585205078125, -1.82269287109375, -1.751800537109375, -1.680908203125, -1.610015869140625, -1.53912353515625, -1.468231201171875, -1.3973388671875, -1.326446533203125, -1.25555419921875, -1.184661865234375, -1.11376953125, -1.042877197265625, -0.97198486328125, -0.901092529296875, -0.8302001953125, -0.759307861328125, -0.68841552734375, -0.617523193359375, -0.546630859375, -0.475738525390625, -0.40484619140625, -0.333953857421875, -0.2630615234375, -0.192169189453125, -0.12127685546875, -0.050384521484375, 0.0205078125, 0.091400146484375, 0.16229248046875, 0.233184814453125, 0.3040771484375, 0.374969482421875, 0.44586181640625, 0.516754150390625, 0.587646484375, 0.658538818359375, 0.72943115234375, 0.800323486328125, 0.8712158203125, 0.942108154296875, 1.01300048828125, 1.083892822265625, 1.15478515625, 1.225677490234375, 1.29656982421875, 1.367462158203125, 1.4383544921875, 1.509246826171875, 1.58013916015625, 1.651031494140625, 1.721923828125, 1.792816162109375, 1.86370849609375, 1.934600830078125, 2.0054931640625, 2.076385498046875, 2.14727783203125, 2.218170166015625, 2.2890625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 7.0, 5.0, 11.0, 9.0, 17.0, 14.0, 9.0, 9.0, 20.0, 22.0, 22.0, 27.0, 29.0, 30.0, 42.0, 34.0, 38.0, 40.0, 52.0, 53.0, 45.0, 50.0, 43.0, 52.0, 30.0, 32.0, 36.0, 37.0, 32.0, 26.0, 16.0, 22.0, 20.0, 12.0, 8.0, 11.0, 11.0, 6.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.1875, -3.087493896484375, -2.98748779296875, -2.887481689453125, -2.7874755859375, -2.687469482421875, -2.58746337890625, -2.487457275390625, -2.387451171875, -2.287445068359375, -2.18743896484375, -2.087432861328125, -1.9874267578125, -1.887420654296875, -1.78741455078125, -1.687408447265625, -1.58740234375, -1.487396240234375, -1.38739013671875, -1.287384033203125, -1.1873779296875, -1.087371826171875, -0.98736572265625, -0.887359619140625, -0.787353515625, -0.687347412109375, -0.58734130859375, -0.487335205078125, -0.3873291015625, -0.287322998046875, -0.18731689453125, -0.087310791015625, 0.0126953125, 0.112701416015625, 0.21270751953125, 0.312713623046875, 0.4127197265625, 0.512725830078125, 0.61273193359375, 0.712738037109375, 0.812744140625, 0.912750244140625, 1.01275634765625, 1.112762451171875, 1.2127685546875, 1.312774658203125, 1.41278076171875, 1.512786865234375, 1.61279296875, 1.712799072265625, 1.81280517578125, 1.912811279296875, 2.0128173828125, 2.112823486328125, 2.21282958984375, 2.312835693359375, 2.412841796875, 2.512847900390625, 2.61285400390625, 2.712860107421875, 2.8128662109375, 2.912872314453125, 3.01287841796875, 3.112884521484375, 3.212890625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 10.0, 13.0, 28.0, 44.0, 66.0, 88.0, 114.0, 204.0, 341.0, 525.0, 736.0, 1185.0, 1803.0, 2787.0, 3978.0, 6079.0, 9057.0, 13352.0, 18985.0, 27308.0, 37077.0, 50164.0, 63826.0, 78422.0, 90148.0, 98106.0, 99523.0, 94283.0, 83167.0, 69323.0, 55266.0, 42123.0, 30880.0, 22134.0, 15705.0, 10626.0, 7079.0, 4780.0, 3104.0, 2100.0, 1396.0, 954.0, 588.0, 385.0, 235.0, 182.0, 113.0, 57.0, 44.0, 32.0, 16.0, 11.0, 8.0, 4.0, 1.0, 2.0, 1.0], "bins": [-2.271484375, -2.20306396484375, -2.1346435546875, -2.06622314453125, -1.997802734375, -1.92938232421875, -1.8609619140625, -1.79254150390625, -1.72412109375, -1.65570068359375, -1.5872802734375, -1.51885986328125, -1.450439453125, -1.38201904296875, -1.3135986328125, -1.24517822265625, -1.1767578125, -1.10833740234375, -1.0399169921875, -0.97149658203125, -0.903076171875, -0.83465576171875, -0.7662353515625, -0.69781494140625, -0.62939453125, -0.56097412109375, -0.4925537109375, -0.42413330078125, -0.355712890625, -0.28729248046875, -0.2188720703125, -0.15045166015625, -0.08203125, -0.01361083984375, 0.0548095703125, 0.12322998046875, 0.191650390625, 0.26007080078125, 0.3284912109375, 0.39691162109375, 0.46533203125, 0.53375244140625, 0.6021728515625, 0.67059326171875, 0.739013671875, 0.80743408203125, 0.8758544921875, 0.94427490234375, 1.0126953125, 1.08111572265625, 1.1495361328125, 1.21795654296875, 1.286376953125, 1.35479736328125, 1.4232177734375, 1.49163818359375, 1.56005859375, 1.62847900390625, 1.6968994140625, 1.76531982421875, 1.833740234375, 1.90216064453125, 1.9705810546875, 2.03900146484375, 2.107421875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 5.0, 4.0, 8.0, 6.0, 17.0, 5.0, 14.0, 15.0, 11.0, 18.0, 21.0, 22.0, 27.0, 33.0, 32.0, 29.0, 34.0, 47.0, 52.0, 47.0, 40.0, 36.0, 52.0, 32.0, 45.0, 34.0, 35.0, 25.0, 35.0, 19.0, 29.0, 22.0, 14.0, 16.0, 21.0, 19.0, 20.0, 12.0, 5.0, 7.0, 9.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.705078125, -1.6501922607421875, -1.595306396484375, -1.5404205322265625, -1.48553466796875, -1.4306488037109375, -1.375762939453125, -1.3208770751953125, -1.2659912109375, -1.2111053466796875, -1.156219482421875, -1.1013336181640625, -1.04644775390625, -0.9915618896484375, -0.936676025390625, -0.8817901611328125, -0.826904296875, -0.7720184326171875, -0.717132568359375, -0.6622467041015625, -0.60736083984375, -0.5524749755859375, -0.497589111328125, -0.4427032470703125, -0.3878173828125, -0.3329315185546875, -0.278045654296875, -0.2231597900390625, -0.16827392578125, -0.1133880615234375, -0.058502197265625, -0.0036163330078125, 0.05126953125, 0.1061553955078125, 0.161041259765625, 0.2159271240234375, 0.27081298828125, 0.3256988525390625, 0.380584716796875, 0.4354705810546875, 0.4903564453125, 0.5452423095703125, 0.600128173828125, 0.6550140380859375, 0.70989990234375, 0.7647857666015625, 0.819671630859375, 0.8745574951171875, 0.929443359375, 0.9843292236328125, 1.039215087890625, 1.0941009521484375, 1.14898681640625, 1.2038726806640625, 1.258758544921875, 1.3136444091796875, 1.3685302734375, 1.4234161376953125, 1.478302001953125, 1.5331878662109375, 1.58807373046875, 1.6429595947265625, 1.697845458984375, 1.7527313232421875, 1.8076171875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 9.0, 8.0, 13.0, 24.0, 17.0, 37.0, 50.0, 65.0, 93.0, 129.0, 208.0, 320.0, 496.0, 772.0, 1264.0, 2071.0, 3521.0, 5983.0, 10646.0, 18753.0, 34074.0, 59799.0, 100256.0, 146736.0, 178615.0, 168635.0, 126735.0, 81250.0, 46950.0, 26175.0, 14636.0, 8289.0, 4689.0, 2660.0, 1613.0, 1063.0, 686.0, 389.0, 246.0, 167.0, 113.0, 78.0, 55.0, 54.0, 31.0, 29.0, 21.0, 12.0, 6.0, 1.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0], "bins": [-1.7626953125, -1.70892333984375, -1.6551513671875, -1.60137939453125, -1.547607421875, -1.49383544921875, -1.4400634765625, -1.38629150390625, -1.33251953125, -1.27874755859375, -1.2249755859375, -1.17120361328125, -1.117431640625, -1.06365966796875, -1.0098876953125, -0.95611572265625, -0.90234375, -0.84857177734375, -0.7947998046875, -0.74102783203125, -0.687255859375, -0.63348388671875, -0.5797119140625, -0.52593994140625, -0.47216796875, -0.41839599609375, -0.3646240234375, -0.31085205078125, -0.257080078125, -0.20330810546875, -0.1495361328125, -0.09576416015625, -0.0419921875, 0.01177978515625, 0.0655517578125, 0.11932373046875, 0.173095703125, 0.22686767578125, 0.2806396484375, 0.33441162109375, 0.38818359375, 0.44195556640625, 0.4957275390625, 0.54949951171875, 0.603271484375, 0.65704345703125, 0.7108154296875, 0.76458740234375, 0.818359375, 0.87213134765625, 0.9259033203125, 0.97967529296875, 1.033447265625, 1.08721923828125, 1.1409912109375, 1.19476318359375, 1.24853515625, 1.30230712890625, 1.3560791015625, 1.40985107421875, 1.463623046875, 1.51739501953125, 1.5711669921875, 1.62493896484375, 1.6787109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 11.0, 6.0, 12.0, 7.0, 11.0, 15.0, 13.0, 24.0, 35.0, 25.0, 34.0, 38.0, 57.0, 59.0, 61.0, 44.0, 52.0, 60.0, 63.0, 40.0, 51.0, 46.0, 39.0, 40.0, 26.0, 14.0, 22.0, 15.0, 21.0, 6.0, 11.0, 7.0, 6.0, 4.0, 7.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011092424392700195, -0.00010638032108545303, -0.00010183639824390411, -9.72924754023552e-05, -9.274855256080627e-05, -8.820462971925735e-05, -8.366070687770844e-05, -7.911678403615952e-05, -7.45728611946106e-05, -7.002893835306168e-05, -6.548501551151276e-05, -6.094109266996384e-05, -5.639716982841492e-05, -5.1853246986866e-05, -4.730932414531708e-05, -4.276540130376816e-05, -3.822147846221924e-05, -3.367755562067032e-05, -2.91336327791214e-05, -2.458970993757248e-05, -2.004578709602356e-05, -1.550186425447464e-05, -1.095794141292572e-05, -6.4140185713768005e-06, -1.8700957298278809e-06, 2.673827111721039e-06, 7.2177499532699585e-06, 1.1761672794818878e-05, 1.6305595636367798e-05, 2.0849518477916718e-05, 2.5393441319465637e-05, 2.9937364161014557e-05, 3.4481287002563477e-05, 3.9025209844112396e-05, 4.3569132685661316e-05, 4.8113055527210236e-05, 5.2656978368759155e-05, 5.7200901210308075e-05, 6.1744824051857e-05, 6.628874689340591e-05, 7.083266973495483e-05, 7.537659257650375e-05, 7.992051541805267e-05, 8.446443825960159e-05, 8.900836110115051e-05, 9.355228394269943e-05, 9.809620678424835e-05, 0.00010264012962579727, 0.00010718405246734619, 0.00011172797530889511, 0.00011627189815044403, 0.00012081582099199295, 0.00012535974383354187, 0.0001299036666750908, 0.0001344475895166397, 0.00013899151235818863, 0.00014353543519973755, 0.00014807935804128647, 0.0001526232808828354, 0.0001571672037243843, 0.00016171112656593323, 0.00016625504940748215, 0.00017079897224903107, 0.00017534289509058, 0.0001798868179321289]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 10.0, 10.0, 21.0, 17.0, 42.0, 54.0, 108.0, 122.0, 208.0, 347.0, 640.0, 1035.0, 1724.0, 2798.0, 4778.0, 8286.0, 14186.0, 24058.0, 40897.0, 66468.0, 99868.0, 134715.0, 155307.0, 149412.0, 121652.0, 85654.0, 55439.0, 33354.0, 19723.0, 11356.0, 6668.0, 3914.0, 2271.0, 1388.0, 798.0, 473.0, 277.0, 189.0, 99.0, 71.0, 45.0, 37.0, 14.0, 13.0, 9.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4169921875, -1.3709869384765625, -1.324981689453125, -1.2789764404296875, -1.23297119140625, -1.1869659423828125, -1.140960693359375, -1.0949554443359375, -1.0489501953125, -1.0029449462890625, -0.956939697265625, -0.9109344482421875, -0.86492919921875, -0.8189239501953125, -0.772918701171875, -0.7269134521484375, -0.680908203125, -0.6349029541015625, -0.588897705078125, -0.5428924560546875, -0.49688720703125, -0.4508819580078125, -0.404876708984375, -0.3588714599609375, -0.3128662109375, -0.2668609619140625, -0.220855712890625, -0.1748504638671875, -0.12884521484375, -0.0828399658203125, -0.036834716796875, 0.0091705322265625, 0.05517578125, 0.1011810302734375, 0.147186279296875, 0.1931915283203125, 0.23919677734375, 0.2852020263671875, 0.331207275390625, 0.3772125244140625, 0.4232177734375, 0.4692230224609375, 0.515228271484375, 0.5612335205078125, 0.60723876953125, 0.6532440185546875, 0.699249267578125, 0.7452545166015625, 0.791259765625, 0.8372650146484375, 0.883270263671875, 0.9292755126953125, 0.97528076171875, 1.0212860107421875, 1.067291259765625, 1.1132965087890625, 1.1593017578125, 1.2053070068359375, 1.251312255859375, 1.2973175048828125, 1.34332275390625, 1.3893280029296875, 1.435333251953125, 1.4813385009765625, 1.52734375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 8.0, 10.0, 4.0, 17.0, 16.0, 10.0, 26.0, 23.0, 25.0, 27.0, 49.0, 35.0, 48.0, 46.0, 31.0, 42.0, 27.0, 50.0, 44.0, 36.0, 35.0, 36.0, 49.0, 37.0, 30.0, 28.0, 37.0, 24.0, 26.0, 22.0, 18.0, 15.0, 5.0, 7.0, 4.0, 10.0, 10.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4052734375, -0.39263916015625, -0.3800048828125, -0.36737060546875, -0.354736328125, -0.34210205078125, -0.3294677734375, -0.31683349609375, -0.30419921875, -0.29156494140625, -0.2789306640625, -0.26629638671875, -0.253662109375, -0.24102783203125, -0.2283935546875, -0.21575927734375, -0.203125, -0.19049072265625, -0.1778564453125, -0.16522216796875, -0.152587890625, -0.13995361328125, -0.1273193359375, -0.11468505859375, -0.10205078125, -0.08941650390625, -0.0767822265625, -0.06414794921875, -0.051513671875, -0.03887939453125, -0.0262451171875, -0.01361083984375, -0.0009765625, 0.01165771484375, 0.0242919921875, 0.03692626953125, 0.049560546875, 0.06219482421875, 0.0748291015625, 0.08746337890625, 0.10009765625, 0.11273193359375, 0.1253662109375, 0.13800048828125, 0.150634765625, 0.16326904296875, 0.1759033203125, 0.18853759765625, 0.201171875, 0.21380615234375, 0.2264404296875, 0.23907470703125, 0.251708984375, 0.26434326171875, 0.2769775390625, 0.28961181640625, 0.30224609375, 0.31488037109375, 0.3275146484375, 0.34014892578125, 0.352783203125, 0.36541748046875, 0.3780517578125, 0.39068603515625, 0.4033203125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 2.0, 7.0, 2.0, 7.0, 5.0, 3.0, 7.0, 12.0, 12.0, 16.0, 19.0, 23.0, 21.0, 29.0, 34.0, 39.0, 32.0, 41.0, 59.0, 55.0, 47.0, 45.0, 48.0, 50.0, 41.0, 47.0, 39.0, 42.0, 39.0, 31.0, 21.0, 15.0, 22.0, 20.0, 14.0, 11.0, 7.0, 7.0, 2.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 0.0, 0.0, 1.0], "bins": [-4.134402275085449, -4.014522075653076, -3.894641876220703, -3.77476167678833, -3.654881477355957, -3.535001277923584, -3.415121078491211, -3.295240640640259, -3.1753604412078857, -3.0554802417755127, -2.9356000423431396, -2.8157198429107666, -2.6958396434783936, -2.5759592056274414, -2.4560790061950684, -2.3361988067626953, -2.2163186073303223, -2.096438407897949, -1.9765582084655762, -1.8566780090332031, -1.7367976903915405, -1.6169174909591675, -1.4970372915267944, -1.3771569728851318, -1.257277011871338, -1.1373968124389648, -1.0175166130065918, -0.897636353969574, -0.7777560949325562, -0.6578758955001831, -0.5379956960678101, -0.41811543703079224, -0.2982351779937744, -0.17835494875907898, -0.05847473442554474, 0.0614054799079895, 0.18128570914268494, 0.30116593837738037, 0.4210461378097534, 0.5409263968467712, 0.6608065962791443, 0.7806867957115173, 0.9005670547485352, 1.0204472541809082, 1.1403274536132812, 1.2602076530456543, 1.3800878524780273, 1.49996817111969, 1.619848370552063, 1.739728569984436, 1.859608769416809, 1.9794890880584717, 2.0993692874908447, 2.2192494869232178, 2.339129686355591, 2.459009885787964, 2.578890085220337, 2.69877028465271, 2.818650484085083, 2.938530683517456, 3.058410882949829, 3.1782913208007812, 3.2981715202331543, 3.4180517196655273, 3.5379319190979004]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 9.0, 7.0, 3.0, 8.0, 9.0, 9.0, 16.0, 14.0, 13.0, 17.0, 20.0, 18.0, 19.0, 32.0, 34.0, 41.0, 42.0, 39.0, 28.0, 48.0, 29.0, 51.0, 36.0, 45.0, 26.0, 45.0, 50.0, 36.0, 38.0, 28.0, 31.0, 28.0, 29.0, 24.0, 11.0, 18.0, 11.0, 10.0, 5.0, 9.0, 6.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2428908348083496, -3.148726463317871, -3.0545620918273926, -2.960397720336914, -2.8662331104278564, -2.772068738937378, -2.6779043674468994, -2.583739995956421, -2.4895753860473633, -2.3954110145568848, -2.3012466430664062, -2.2070822715759277, -2.11291766166687, -2.0187532901763916, -1.924588918685913, -1.8304245471954346, -1.736260175704956, -1.6420958042144775, -1.5479313135147095, -1.453766942024231, -1.359602451324463, -1.2654380798339844, -1.1712737083435059, -1.0771093368530273, -0.9829448461532593, -0.888780415058136, -0.7946159839630127, -0.7004516124725342, -0.6062871813774109, -0.5121227502822876, -0.4179583787918091, -0.3237939476966858, -0.2296295166015625, -0.1354651004076004, -0.041300684213638306, 0.0528637170791626, 0.1470281481742859, 0.24119257926940918, 0.3353569507598877, 0.429521381855011, 0.5236858129501343, 0.6178502440452576, 0.7120146751403809, 0.8061790466308594, 0.9003434777259827, 0.994507908821106, 1.0886722803115845, 1.1828367710113525, 1.277001142501831, 1.3711655139923096, 1.4653300046920776, 1.5594943761825562, 1.6536588668823242, 1.7478232383728027, 1.8419876098632812, 1.9361519813537598, 2.0303163528442383, 2.124480724334717, 2.2186450958251953, 2.312809467315674, 2.4069740772247314, 2.50113844871521, 2.5953028202056885, 2.689467191696167, 2.7836318016052246]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 12.0, 30.0, 43.0, 55.0, 124.0, 183.0, 285.0, 480.0, 764.0, 1326.0, 2155.0, 3604.0, 6109.0, 10251.0, 17533.0, 29326.0, 50116.0, 86583.0, 144864.0, 236852.0, 367205.0, 518691.0, 629472.0, 626982.0, 514060.0, 364241.0, 234053.0, 142353.0, 85612.0, 49954.0, 29615.0, 17098.0, 9867.0, 5800.0, 3540.0, 2050.0, 1229.0, 684.0, 422.0, 247.0, 183.0, 93.0, 54.0, 34.0, 21.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3046875, -3.201385498046875, -3.09808349609375, -2.994781494140625, -2.8914794921875, -2.788177490234375, -2.68487548828125, -2.581573486328125, -2.478271484375, -2.374969482421875, -2.27166748046875, -2.168365478515625, -2.0650634765625, -1.961761474609375, -1.85845947265625, -1.755157470703125, -1.65185546875, -1.548553466796875, -1.44525146484375, -1.341949462890625, -1.2386474609375, -1.135345458984375, -1.03204345703125, -0.928741455078125, -0.825439453125, -0.722137451171875, -0.61883544921875, -0.515533447265625, -0.4122314453125, -0.308929443359375, -0.20562744140625, -0.102325439453125, 0.0009765625, 0.104278564453125, 0.20758056640625, 0.310882568359375, 0.4141845703125, 0.517486572265625, 0.62078857421875, 0.724090576171875, 0.827392578125, 0.930694580078125, 1.03399658203125, 1.137298583984375, 1.2406005859375, 1.343902587890625, 1.44720458984375, 1.550506591796875, 1.65380859375, 1.757110595703125, 1.86041259765625, 1.963714599609375, 2.0670166015625, 2.170318603515625, 2.27362060546875, 2.376922607421875, 2.480224609375, 2.583526611328125, 2.68682861328125, 2.790130615234375, 2.8934326171875, 2.996734619140625, 3.10003662109375, 3.203338623046875, 3.306640625]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 4.0, 4.0, 9.0, 6.0, 16.0, 14.0, 14.0, 27.0, 21.0, 26.0, 22.0, 25.0, 36.0, 47.0, 37.0, 33.0, 42.0, 60.0, 50.0, 49.0, 35.0, 45.0, 48.0, 40.0, 37.0, 49.0, 35.0, 23.0, 27.0, 23.0, 19.0, 19.0, 19.0, 13.0, 6.0, 2.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.6231689453125, -2.541259765625, -2.4593505859375, -2.37744140625, -2.2955322265625, -2.213623046875, -2.1317138671875, -2.0498046875, -1.9678955078125, -1.885986328125, -1.8040771484375, -1.72216796875, -1.6402587890625, -1.558349609375, -1.4764404296875, -1.39453125, -1.3126220703125, -1.230712890625, -1.1488037109375, -1.06689453125, -0.9849853515625, -0.903076171875, -0.8211669921875, -0.7392578125, -0.6573486328125, -0.575439453125, -0.4935302734375, -0.41162109375, -0.3297119140625, -0.247802734375, -0.1658935546875, -0.083984375, -0.0020751953125, 0.079833984375, 0.1617431640625, 0.24365234375, 0.3255615234375, 0.407470703125, 0.4893798828125, 0.5712890625, 0.6531982421875, 0.735107421875, 0.8170166015625, 0.89892578125, 0.9808349609375, 1.062744140625, 1.1446533203125, 1.2265625, 1.3084716796875, 1.390380859375, 1.4722900390625, 1.55419921875, 1.6361083984375, 1.718017578125, 1.7999267578125, 1.8818359375, 1.9637451171875, 2.045654296875, 2.1275634765625, 2.20947265625, 2.2913818359375, 2.373291015625, 2.4552001953125, 2.537109375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 15.0, 18.0, 41.0, 46.0, 84.0, 130.0, 224.0, 353.0, 613.0, 1011.0, 1530.0, 2672.0, 4457.0, 7281.0, 12239.0, 20119.0, 33550.0, 54489.0, 88542.0, 141156.0, 215643.0, 311992.0, 419339.0, 507780.0, 542952.0, 508952.0, 420335.0, 313574.0, 215700.0, 140765.0, 88695.0, 55306.0, 33450.0, 20268.0, 12223.0, 7485.0, 4400.0, 2642.0, 1688.0, 1000.0, 602.0, 358.0, 227.0, 122.0, 80.0, 47.0, 37.0, 17.0, 11.0, 10.0, 1.0, 3.0, 2.0, 2.0], "bins": [-3.365234375, -3.2677001953125, -3.170166015625, -3.0726318359375, -2.97509765625, -2.8775634765625, -2.780029296875, -2.6824951171875, -2.5849609375, -2.4874267578125, -2.389892578125, -2.2923583984375, -2.19482421875, -2.0972900390625, -1.999755859375, -1.9022216796875, -1.8046875, -1.7071533203125, -1.609619140625, -1.5120849609375, -1.41455078125, -1.3170166015625, -1.219482421875, -1.1219482421875, -1.0244140625, -0.9268798828125, -0.829345703125, -0.7318115234375, -0.63427734375, -0.5367431640625, -0.439208984375, -0.3416748046875, -0.244140625, -0.1466064453125, -0.049072265625, 0.0484619140625, 0.14599609375, 0.2435302734375, 0.341064453125, 0.4385986328125, 0.5361328125, 0.6336669921875, 0.731201171875, 0.8287353515625, 0.92626953125, 1.0238037109375, 1.121337890625, 1.2188720703125, 1.31640625, 1.4139404296875, 1.511474609375, 1.6090087890625, 1.70654296875, 1.8040771484375, 1.901611328125, 1.9991455078125, 2.0966796875, 2.1942138671875, 2.291748046875, 2.3892822265625, 2.48681640625, 2.5843505859375, 2.681884765625, 2.7794189453125, 2.876953125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 12.0, 7.0, 15.0, 14.0, 16.0, 52.0, 37.0, 39.0, 51.0, 81.0, 70.0, 107.0, 122.0, 150.0, 172.0, 206.0, 201.0, 210.0, 212.0, 200.0, 244.0, 217.0, 219.0, 219.0, 162.0, 180.0, 134.0, 138.0, 99.0, 107.0, 72.0, 75.0, 43.0, 48.0, 38.0, 35.0, 16.0, 14.0, 11.0, 6.0, 6.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.0839691162109375, -1.043914794921875, -1.0038604736328125, -0.96380615234375, -0.9237518310546875, -0.883697509765625, -0.8436431884765625, -0.8035888671875, -0.7635345458984375, -0.723480224609375, -0.6834259033203125, -0.64337158203125, -0.6033172607421875, -0.563262939453125, -0.5232086181640625, -0.483154296875, -0.4430999755859375, -0.403045654296875, -0.3629913330078125, -0.32293701171875, -0.2828826904296875, -0.242828369140625, -0.2027740478515625, -0.1627197265625, -0.1226654052734375, -0.082611083984375, -0.0425567626953125, -0.00250244140625, 0.0375518798828125, 0.077606201171875, 0.1176605224609375, 0.15771484375, 0.1977691650390625, 0.237823486328125, 0.2778778076171875, 0.31793212890625, 0.3579864501953125, 0.398040771484375, 0.4380950927734375, 0.4781494140625, 0.5182037353515625, 0.558258056640625, 0.5983123779296875, 0.63836669921875, 0.6784210205078125, 0.718475341796875, 0.7585296630859375, 0.798583984375, 0.8386383056640625, 0.878692626953125, 0.9187469482421875, 0.95880126953125, 0.9988555908203125, 1.038909912109375, 1.0789642333984375, 1.1190185546875, 1.1590728759765625, 1.199127197265625, 1.2391815185546875, 1.27923583984375, 1.3192901611328125, 1.359344482421875, 1.3993988037109375, 1.439453125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 4.0, 6.0, 9.0, 9.0, 18.0, 13.0, 22.0, 16.0, 37.0, 28.0, 37.0, 46.0, 51.0, 44.0, 70.0, 57.0, 56.0, 59.0, 61.0, 51.0, 57.0, 38.0, 35.0, 32.0, 26.0, 17.0, 16.0, 18.0, 12.0, 11.0, 7.0, 7.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.254247665405273, -4.113621234893799, -3.972994804382324, -3.8323686122894287, -3.691742181777954, -3.5511157512664795, -3.410489559173584, -3.2698631286621094, -3.1292366981506348, -2.98861026763916, -2.8479838371276855, -2.70735764503479, -2.5667312145233154, -2.426104784011841, -2.2854785919189453, -2.1448521614074707, -2.004225730895996, -1.8635993003845215, -1.7229729890823364, -1.5823466777801514, -1.4417202472686768, -1.3010938167572021, -1.160467505455017, -1.019841194152832, -0.8792147636413574, -0.7385883927345276, -0.5979620218276978, -0.4573356509208679, -0.3167092800140381, -0.17608290910720825, -0.03545653820037842, 0.10516983270645142, 0.24579668045043945, 0.3864230513572693, 0.5270494222640991, 0.667675793170929, 0.8083021640777588, 0.9489285349845886, 1.0895549058914185, 1.2301812171936035, 1.3708076477050781, 1.5114340782165527, 1.6520603895187378, 1.7926867008209229, 1.9333131313323975, 2.073939561843872, 2.2145657539367676, 2.355192184448242, 2.495818614959717, 2.6364450454711914, 2.777071475982666, 2.9176976680755615, 3.058324098587036, 3.1989505290985107, 3.3395767211914062, 3.480203151702881, 3.6208295822143555, 3.76145601272583, 3.9020824432373047, 4.042708873748779, 4.183335304260254, 4.32396125793457, 4.464587688446045, 4.6052141189575195, 4.745840549468994]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 1.0, 7.0, 4.0, 9.0, 6.0, 15.0, 15.0, 16.0, 20.0, 20.0, 14.0, 20.0, 35.0, 30.0, 34.0, 30.0, 33.0, 38.0, 49.0, 35.0, 35.0, 36.0, 41.0, 42.0, 41.0, 51.0, 28.0, 43.0, 37.0, 29.0, 22.0, 18.0, 19.0, 23.0, 28.0, 13.0, 10.0, 12.0, 9.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.814690589904785, -2.7282521724700928, -2.6418139934539795, -2.555375576019287, -2.468937397003174, -2.3824989795684814, -2.296060562133789, -2.209622383117676, -2.1231839656829834, -2.036745548248291, -1.9503073692321777, -1.8638689517974854, -1.7774306535720825, -1.6909923553466797, -1.6045539379119873, -1.5181156396865845, -1.4316773414611816, -1.3452390432357788, -1.258800745010376, -1.1723623275756836, -1.0859240293502808, -0.9994857311248779, -0.9130473732948303, -0.8266090154647827, -0.7401707172393799, -0.653732419013977, -0.5672940611839294, -0.4808557331562042, -0.394417405128479, -0.3079790771007538, -0.22154074907302856, -0.13510239124298096, -0.04866385459899902, 0.037774473428726196, 0.12421280145645142, 0.21065112948417664, 0.29708945751190186, 0.3835277855396271, 0.4699661135673523, 0.5564044713973999, 0.6428427696228027, 0.7292810678482056, 0.8157194256782532, 0.9021577835083008, 0.9885960817337036, 1.0750343799591064, 1.1614727973937988, 1.2479110956192017, 1.3343493938446045, 1.4207876920700073, 1.5072259902954102, 1.5936644077301025, 1.6801027059555054, 1.7665410041809082, 1.8529794216156006, 1.9394177198410034, 2.0258560180664062, 2.1122944355010986, 2.198732614517212, 2.2851710319519043, 2.3716092109680176, 2.45804762840271, 2.5444860458374023, 2.6309242248535156, 2.717362642288208]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 13.0, 12.0, 14.0, 23.0, 31.0, 42.0, 69.0, 101.0, 137.0, 237.0, 334.0, 526.0, 744.0, 1139.0, 1749.0, 2639.0, 4118.0, 6563.0, 10584.0, 16937.0, 28604.0, 47994.0, 82984.0, 136823.0, 193717.0, 188652.0, 129172.0, 78523.0, 45457.0, 26958.0, 16175.0, 9990.0, 6196.0, 3919.0, 2487.0, 1585.0, 1089.0, 715.0, 468.0, 318.0, 224.0, 134.0, 99.0, 82.0, 68.0, 31.0, 33.0, 14.0, 10.0, 14.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.9287109375, -0.9005203247070312, -0.8723297119140625, -0.8441390991210938, -0.815948486328125, -0.7877578735351562, -0.7595672607421875, -0.7313766479492188, -0.70318603515625, -0.6749954223632812, -0.6468048095703125, -0.6186141967773438, -0.590423583984375, -0.5622329711914062, -0.5340423583984375, -0.5058517456054688, -0.4776611328125, -0.44947052001953125, -0.4212799072265625, -0.39308929443359375, -0.364898681640625, -0.33670806884765625, -0.3085174560546875, -0.28032684326171875, -0.25213623046875, -0.22394561767578125, -0.1957550048828125, -0.16756439208984375, -0.139373779296875, -0.11118316650390625, -0.0829925537109375, -0.05480194091796875, -0.026611328125, 0.00157928466796875, 0.0297698974609375, 0.05796051025390625, 0.086151123046875, 0.11434173583984375, 0.1425323486328125, 0.17072296142578125, 0.19891357421875, 0.22710418701171875, 0.2552947998046875, 0.28348541259765625, 0.311676025390625, 0.33986663818359375, 0.3680572509765625, 0.39624786376953125, 0.4244384765625, 0.45262908935546875, 0.4808197021484375, 0.5090103149414062, 0.537200927734375, 0.5653915405273438, 0.5935821533203125, 0.6217727661132812, 0.64996337890625, 0.6781539916992188, 0.7063446044921875, 0.7345352172851562, 0.762725830078125, 0.7909164428710938, 0.8191070556640625, 0.8472976684570312, 0.87548828125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 1.0, 7.0, 4.0, 8.0, 19.0, 22.0, 15.0, 13.0, 27.0, 26.0, 27.0, 29.0, 41.0, 34.0, 36.0, 40.0, 39.0, 49.0, 46.0, 44.0, 53.0, 39.0, 39.0, 39.0, 38.0, 46.0, 29.0, 32.0, 31.0, 20.0, 18.0, 17.0, 17.0, 17.0, 13.0, 8.0, 5.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.771484375, -3.664276123046875, -3.55706787109375, -3.449859619140625, -3.3426513671875, -3.235443115234375, -3.12823486328125, -3.021026611328125, -2.913818359375, -2.806610107421875, -2.69940185546875, -2.592193603515625, -2.4849853515625, -2.377777099609375, -2.27056884765625, -2.163360595703125, -2.05615234375, -1.948944091796875, -1.84173583984375, -1.734527587890625, -1.6273193359375, -1.520111083984375, -1.41290283203125, -1.305694580078125, -1.198486328125, -1.091278076171875, -0.98406982421875, -0.876861572265625, -0.7696533203125, -0.662445068359375, -0.55523681640625, -0.448028564453125, -0.3408203125, -0.233612060546875, -0.12640380859375, -0.019195556640625, 0.0880126953125, 0.195220947265625, 0.30242919921875, 0.409637451171875, 0.516845703125, 0.624053955078125, 0.73126220703125, 0.838470458984375, 0.9456787109375, 1.052886962890625, 1.16009521484375, 1.267303466796875, 1.37451171875, 1.481719970703125, 1.58892822265625, 1.696136474609375, 1.8033447265625, 1.910552978515625, 2.01776123046875, 2.124969482421875, 2.232177734375, 2.339385986328125, 2.44659423828125, 2.553802490234375, 2.6610107421875, 2.768218994140625, 2.87542724609375, 2.982635498046875, 3.08984375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 15.0, 17.0, 20.0, 36.0, 51.0, 85.0, 115.0, 175.0, 210.0, 373.0, 609.0, 846.0, 1422.0, 2220.0, 3816.0, 6257.0, 11048.0, 20017.0, 36539.0, 69416.0, 131711.0, 226963.0, 233670.0, 140113.0, 73722.0, 38873.0, 21187.0, 11679.0, 6770.0, 4122.0, 2343.0, 1472.0, 919.0, 558.0, 366.0, 252.0, 181.0, 121.0, 70.0, 52.0, 32.0, 30.0, 23.0, 15.0, 7.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1533203125, -1.1184234619140625, -1.083526611328125, -1.0486297607421875, -1.01373291015625, -0.9788360595703125, -0.943939208984375, -0.9090423583984375, -0.8741455078125, -0.8392486572265625, -0.804351806640625, -0.7694549560546875, -0.73455810546875, -0.6996612548828125, -0.664764404296875, -0.6298675537109375, -0.594970703125, -0.5600738525390625, -0.525177001953125, -0.4902801513671875, -0.45538330078125, -0.4204864501953125, -0.385589599609375, -0.3506927490234375, -0.3157958984375, -0.2808990478515625, -0.246002197265625, -0.2111053466796875, -0.17620849609375, -0.1413116455078125, -0.106414794921875, -0.0715179443359375, -0.03662109375, -0.0017242431640625, 0.033172607421875, 0.0680694580078125, 0.10296630859375, 0.1378631591796875, 0.172760009765625, 0.2076568603515625, 0.2425537109375, 0.2774505615234375, 0.312347412109375, 0.3472442626953125, 0.38214111328125, 0.4170379638671875, 0.451934814453125, 0.4868316650390625, 0.521728515625, 0.5566253662109375, 0.591522216796875, 0.6264190673828125, 0.66131591796875, 0.6962127685546875, 0.731109619140625, 0.7660064697265625, 0.8009033203125, 0.8358001708984375, 0.870697021484375, 0.9055938720703125, 0.94049072265625, 0.9753875732421875, 1.010284423828125, 1.0451812744140625, 1.080078125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 15.0, 12.0, 13.0, 11.0, 19.0, 27.0, 21.0, 21.0, 22.0, 23.0, 30.0, 24.0, 39.0, 38.0, 34.0, 30.0, 34.0, 31.0, 34.0, 37.0, 46.0, 42.0, 31.0, 40.0, 30.0, 28.0, 28.0, 25.0, 21.0, 20.0, 17.0, 15.0, 17.0, 18.0, 13.0, 13.0, 13.0, 12.0, 8.0, 8.0, 4.0, 7.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5185546875, -1.4637451171875, -1.408935546875, -1.3541259765625, -1.29931640625, -1.2445068359375, -1.189697265625, -1.1348876953125, -1.080078125, -1.0252685546875, -0.970458984375, -0.9156494140625, -0.86083984375, -0.8060302734375, -0.751220703125, -0.6964111328125, -0.6416015625, -0.5867919921875, -0.531982421875, -0.4771728515625, -0.42236328125, -0.3675537109375, -0.312744140625, -0.2579345703125, -0.203125, -0.1483154296875, -0.093505859375, -0.0386962890625, 0.01611328125, 0.0709228515625, 0.125732421875, 0.1805419921875, 0.2353515625, 0.2901611328125, 0.344970703125, 0.3997802734375, 0.45458984375, 0.5093994140625, 0.564208984375, 0.6190185546875, 0.673828125, 0.7286376953125, 0.783447265625, 0.8382568359375, 0.89306640625, 0.9478759765625, 1.002685546875, 1.0574951171875, 1.1123046875, 1.1671142578125, 1.221923828125, 1.2767333984375, 1.33154296875, 1.3863525390625, 1.441162109375, 1.4959716796875, 1.55078125, 1.6055908203125, 1.660400390625, 1.7152099609375, 1.77001953125, 1.8248291015625, 1.879638671875, 1.9344482421875, 1.9892578125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 4.0, 5.0, 7.0, 15.0, 19.0, 22.0, 27.0, 41.0, 78.0, 94.0, 141.0, 188.0, 329.0, 474.0, 700.0, 1020.0, 1510.0, 2294.0, 3959.0, 7071.0, 15241.0, 44948.0, 270291.0, 571558.0, 83607.0, 22421.0, 9322.0, 4916.0, 2857.0, 1795.0, 1147.0, 827.0, 525.0, 363.0, 222.0, 167.0, 127.0, 64.0, 40.0, 36.0, 25.0, 21.0, 11.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71923828125, -0.6954269409179688, -0.6716156005859375, -0.6478042602539062, -0.623992919921875, -0.6001815795898438, -0.5763702392578125, -0.5525588989257812, -0.52874755859375, -0.5049362182617188, -0.4811248779296875, -0.45731353759765625, -0.433502197265625, -0.40969085693359375, -0.3858795166015625, -0.36206817626953125, -0.3382568359375, -0.31444549560546875, -0.2906341552734375, -0.26682281494140625, -0.243011474609375, -0.21920013427734375, -0.1953887939453125, -0.17157745361328125, -0.14776611328125, -0.12395477294921875, -0.1001434326171875, -0.07633209228515625, -0.052520751953125, -0.02870941162109375, -0.0048980712890625, 0.01891326904296875, 0.042724609375, 0.06653594970703125, 0.0903472900390625, 0.11415863037109375, 0.137969970703125, 0.16178131103515625, 0.1855926513671875, 0.20940399169921875, 0.23321533203125, 0.25702667236328125, 0.2808380126953125, 0.30464935302734375, 0.328460693359375, 0.35227203369140625, 0.3760833740234375, 0.39989471435546875, 0.4237060546875, 0.44751739501953125, 0.4713287353515625, 0.49514007568359375, 0.518951416015625, 0.5427627563476562, 0.5665740966796875, 0.5903854370117188, 0.61419677734375, 0.6380081176757812, 0.6618194580078125, 0.6856307983398438, 0.709442138671875, 0.7332534790039062, 0.7570648193359375, 0.7808761596679688, 0.8046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 3.0, 5.0, 5.0, 6.0, 5.0, 7.0, 23.0, 26.0, 42.0, 70.0, 127.0, 148.0, 178.0, 124.0, 90.0, 54.0, 37.0, 11.0, 9.0, 7.0, 5.0, 6.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.276369094848633e-05, -6.073899567127228e-05, -5.871430039405823e-05, -5.668960511684418e-05, -5.466490983963013e-05, -5.264021456241608e-05, -5.0615519285202026e-05, -4.8590824007987976e-05, -4.6566128730773926e-05, -4.4541433453559875e-05, -4.2516738176345825e-05, -4.0492042899131775e-05, -3.8467347621917725e-05, -3.6442652344703674e-05, -3.4417957067489624e-05, -3.2393261790275574e-05, -3.0368566513061523e-05, -2.8343871235847473e-05, -2.6319175958633423e-05, -2.4294480681419373e-05, -2.2269785404205322e-05, -2.0245090126991272e-05, -1.822039484977722e-05, -1.619569957256317e-05, -1.4171004295349121e-05, -1.214630901813507e-05, -1.012161374092102e-05, -8.09691846370697e-06, -6.07222318649292e-06, -4.04752790927887e-06, -2.0228326320648193e-06, 1.862645149230957e-09, 2.0265579223632812e-06, 4.0512531995773315e-06, 6.075948476791382e-06, 8.100643754005432e-06, 1.0125339031219482e-05, 1.2150034308433533e-05, 1.4174729585647583e-05, 1.6199424862861633e-05, 1.8224120140075684e-05, 2.0248815417289734e-05, 2.2273510694503784e-05, 2.4298205971717834e-05, 2.6322901248931885e-05, 2.8347596526145935e-05, 3.0372291803359985e-05, 3.2396987080574036e-05, 3.4421682357788086e-05, 3.6446377635002136e-05, 3.8471072912216187e-05, 4.049576818943024e-05, 4.252046346664429e-05, 4.454515874385834e-05, 4.656985402107239e-05, 4.859454929828644e-05, 5.061924457550049e-05, 5.264393985271454e-05, 5.466863512992859e-05, 5.669333040714264e-05, 5.871802568435669e-05, 6.074272096157074e-05, 6.276741623878479e-05, 6.479211151599884e-05, 6.681680679321289e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 6.0, 9.0, 21.0, 34.0, 34.0, 57.0, 89.0, 148.0, 199.0, 347.0, 461.0, 834.0, 1226.0, 2114.0, 3411.0, 6201.0, 12830.0, 30231.0, 100382.0, 469233.0, 308659.0, 66560.0, 22436.0, 10074.0, 5123.0, 3019.0, 1803.0, 1076.0, 685.0, 409.0, 273.0, 202.0, 126.0, 75.0, 53.0, 28.0, 20.0, 22.0, 18.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8681640625, -0.8425140380859375, -0.816864013671875, -0.7912139892578125, -0.76556396484375, -0.7399139404296875, -0.714263916015625, -0.6886138916015625, -0.6629638671875, -0.6373138427734375, -0.611663818359375, -0.5860137939453125, -0.56036376953125, -0.5347137451171875, -0.509063720703125, -0.4834136962890625, -0.457763671875, -0.4321136474609375, -0.406463623046875, -0.3808135986328125, -0.35516357421875, -0.3295135498046875, -0.303863525390625, -0.2782135009765625, -0.2525634765625, -0.2269134521484375, -0.201263427734375, -0.1756134033203125, -0.14996337890625, -0.1243133544921875, -0.098663330078125, -0.0730133056640625, -0.04736328125, -0.0217132568359375, 0.003936767578125, 0.0295867919921875, 0.05523681640625, 0.0808868408203125, 0.106536865234375, 0.1321868896484375, 0.1578369140625, 0.1834869384765625, 0.209136962890625, 0.2347869873046875, 0.26043701171875, 0.2860870361328125, 0.311737060546875, 0.3373870849609375, 0.363037109375, 0.3886871337890625, 0.414337158203125, 0.4399871826171875, 0.46563720703125, 0.4912872314453125, 0.516937255859375, 0.5425872802734375, 0.5682373046875, 0.5938873291015625, 0.619537353515625, 0.6451873779296875, 0.67083740234375, 0.6964874267578125, 0.722137451171875, 0.7477874755859375, 0.7734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 14.0, 15.0, 7.0, 25.0, 23.0, 36.0, 53.0, 65.0, 91.0, 82.0, 91.0, 80.0, 66.0, 70.0, 46.0, 49.0, 32.0, 26.0, 28.0, 13.0, 12.0, 8.0, 10.0, 6.0, 8.0, 3.0, 3.0, 4.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.10693359375, -0.10385799407958984, -0.10078239440917969, -0.09770679473876953, -0.09463119506835938, -0.09155559539794922, -0.08847999572753906, -0.0854043960571289, -0.08232879638671875, -0.0792531967163086, -0.07617759704589844, -0.07310199737548828, -0.07002639770507812, -0.06695079803466797, -0.06387519836425781, -0.060799598693847656, -0.0577239990234375, -0.054648399353027344, -0.05157279968261719, -0.04849720001220703, -0.045421600341796875, -0.04234600067138672, -0.03927040100097656, -0.036194801330566406, -0.03311920166015625, -0.030043601989746094, -0.026968002319335938, -0.02389240264892578, -0.020816802978515625, -0.01774120330810547, -0.014665603637695312, -0.011590003967285156, -0.008514404296875, -0.005438804626464844, -0.0023632049560546875, 0.0007123947143554688, 0.003787994384765625, 0.006863594055175781, 0.009939193725585938, 0.013014793395996094, 0.01609039306640625, 0.019165992736816406, 0.022241592407226562, 0.02531719207763672, 0.028392791748046875, 0.03146839141845703, 0.03454399108886719, 0.037619590759277344, 0.0406951904296875, 0.043770790100097656, 0.04684638977050781, 0.04992198944091797, 0.052997589111328125, 0.05607318878173828, 0.05914878845214844, 0.062224388122558594, 0.06529998779296875, 0.0683755874633789, 0.07145118713378906, 0.07452678680419922, 0.07760238647460938, 0.08067798614501953, 0.08375358581542969, 0.08682918548583984, 0.08990478515625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 5.0, 6.0, 8.0, 8.0, 19.0, 17.0, 17.0, 21.0, 28.0, 30.0, 46.0, 35.0, 60.0, 46.0, 62.0, 64.0, 56.0, 63.0, 57.0, 50.0, 62.0, 35.0, 35.0, 31.0, 24.0, 21.0, 17.0, 17.0, 11.0, 8.0, 8.0, 6.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.44452428817749, -4.301990509033203, -4.159457206726074, -4.016923427581787, -3.874390125274658, -3.731856346130371, -3.589322805404663, -3.446789264678955, -3.304255723953247, -3.161722183227539, -3.019188642501831, -2.876655101776123, -2.734121322631836, -2.591588020324707, -2.44905424118042, -2.306520700454712, -2.163987159729004, -2.021453619003296, -1.878920078277588, -1.7363864183425903, -1.5938528776168823, -1.4513193368911743, -1.3087856769561768, -1.1662521362304688, -1.0237185955047607, -0.8811850547790527, -0.7386514544487, -0.5961178541183472, -0.45358431339263916, -0.31105077266693115, -0.16851717233657837, -0.025983572006225586, 0.11654996871948242, 0.2590835392475128, 0.4016171097755432, 0.544150710105896, 0.686684250831604, 0.829217791557312, 0.9717513918876648, 1.1142849922180176, 1.2568185329437256, 1.3993520736694336, 1.5418856143951416, 1.6844192743301392, 1.8269528150558472, 1.9694863557815552, 2.1120200157165527, 2.2545535564422607, 2.3970870971679688, 2.5396206378936768, 2.6821541786193848, 2.8246877193450928, 2.967221260070801, 3.109755039215088, 3.252288579940796, 3.394822120666504, 3.537355661392212, 3.67988920211792, 3.822422742843628, 3.964956283569336, 4.107490062713623, 4.250023365020752, 4.392557144165039, 4.535090446472168, 4.677624225616455]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 1.0, 9.0, 3.0, 10.0, 5.0, 16.0, 16.0, 17.0, 17.0, 23.0, 12.0, 24.0, 31.0, 33.0, 34.0, 27.0, 36.0, 38.0, 49.0, 38.0, 27.0, 42.0, 40.0, 41.0, 44.0, 44.0, 32.0, 41.0, 33.0, 33.0, 19.0, 20.0, 17.0, 23.0, 30.0, 14.0, 10.0, 10.0, 9.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.78905987739563, -2.7029528617858887, -2.6168456077575684, -2.530738353729248, -2.444631338119507, -2.3585243225097656, -2.2724170684814453, -2.186309814453125, -2.100202798843384, -2.0140957832336426, -1.9279885292053223, -1.8418813943862915, -1.7557742595672607, -1.66966712474823, -1.5835599899291992, -1.4974528551101685, -1.4113457202911377, -1.325238585472107, -1.2391314506530762, -1.1530243158340454, -1.0669171810150146, -0.9808100461959839, -0.8947029113769531, -0.8085957765579224, -0.7224886417388916, -0.6363815069198608, -0.5502743721008301, -0.4641672372817993, -0.37806010246276855, -0.2919529676437378, -0.20584583282470703, -0.11973869800567627, -0.03363156318664551, 0.052475571632385254, 0.13858270645141602, 0.22468984127044678, 0.31079697608947754, 0.3969041109085083, 0.48301124572753906, 0.5691183805465698, 0.6552255153656006, 0.7413326501846313, 0.8274397850036621, 0.9135469198226929, 0.9996540546417236, 1.0857611894607544, 1.1718683242797852, 1.257975459098816, 1.3440825939178467, 1.4301897287368774, 1.5162968635559082, 1.602403998374939, 1.6885111331939697, 1.7746182680130005, 1.8607254028320312, 1.946832537651062, 2.0329396724700928, 2.119046688079834, 2.2051539421081543, 2.2912611961364746, 2.377368211746216, 2.463475227355957, 2.5495824813842773, 2.6356897354125977, 2.721796751022339]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 15.0, 15.0, 27.0, 40.0, 64.0, 131.0, 168.0, 241.0, 441.0, 708.0, 1248.0, 1922.0, 3189.0, 5057.0, 8391.0, 13058.0, 20762.0, 31171.0, 45839.0, 63643.0, 83686.0, 102604.0, 115369.0, 117934.0, 109834.0, 92174.0, 72503.0, 53432.0, 37276.0, 24973.0, 16186.0, 9843.0, 6343.0, 3862.0, 2505.0, 1506.0, 892.0, 578.0, 344.0, 204.0, 126.0, 91.0, 60.0, 40.0, 30.0, 11.0, 12.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.57818603515625, -2.4981689453125, -2.41815185546875, -2.338134765625, -2.25811767578125, -2.1781005859375, -2.09808349609375, -2.01806640625, -1.93804931640625, -1.8580322265625, -1.77801513671875, -1.697998046875, -1.61798095703125, -1.5379638671875, -1.45794677734375, -1.3779296875, -1.29791259765625, -1.2178955078125, -1.13787841796875, -1.057861328125, -0.97784423828125, -0.8978271484375, -0.81781005859375, -0.73779296875, -0.65777587890625, -0.5777587890625, -0.49774169921875, -0.417724609375, -0.33770751953125, -0.2576904296875, -0.17767333984375, -0.09765625, -0.01763916015625, 0.0623779296875, 0.14239501953125, 0.222412109375, 0.30242919921875, 0.3824462890625, 0.46246337890625, 0.54248046875, 0.62249755859375, 0.7025146484375, 0.78253173828125, 0.862548828125, 0.94256591796875, 1.0225830078125, 1.10260009765625, 1.1826171875, 1.26263427734375, 1.3426513671875, 1.42266845703125, 1.502685546875, 1.58270263671875, 1.6627197265625, 1.74273681640625, 1.82275390625, 1.90277099609375, 1.9827880859375, 2.06280517578125, 2.142822265625, 2.22283935546875, 2.3028564453125, 2.38287353515625, 2.462890625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 6.0, 11.0, 9.0, 15.0, 15.0, 14.0, 25.0, 23.0, 28.0, 29.0, 30.0, 42.0, 32.0, 33.0, 37.0, 40.0, 41.0, 48.0, 48.0, 38.0, 38.0, 38.0, 51.0, 45.0, 32.0, 32.0, 26.0, 30.0, 26.0, 17.0, 20.0, 12.0, 17.0, 9.0, 2.0, 6.0, 7.0, 3.0, 2.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.982421875, -2.883697509765625, -2.78497314453125, -2.686248779296875, -2.5875244140625, -2.488800048828125, -2.39007568359375, -2.291351318359375, -2.192626953125, -2.093902587890625, -1.99517822265625, -1.896453857421875, -1.7977294921875, -1.699005126953125, -1.60028076171875, -1.501556396484375, -1.40283203125, -1.304107666015625, -1.20538330078125, -1.106658935546875, -1.0079345703125, -0.909210205078125, -0.81048583984375, -0.711761474609375, -0.613037109375, -0.514312744140625, -0.41558837890625, -0.316864013671875, -0.2181396484375, -0.119415283203125, -0.02069091796875, 0.078033447265625, 0.1767578125, 0.275482177734375, 0.37420654296875, 0.472930908203125, 0.5716552734375, 0.670379638671875, 0.76910400390625, 0.867828369140625, 0.966552734375, 1.065277099609375, 1.16400146484375, 1.262725830078125, 1.3614501953125, 1.460174560546875, 1.55889892578125, 1.657623291015625, 1.75634765625, 1.855072021484375, 1.95379638671875, 2.052520751953125, 2.1512451171875, 2.249969482421875, 2.34869384765625, 2.447418212890625, 2.546142578125, 2.644866943359375, 2.74359130859375, 2.842315673828125, 2.9410400390625, 3.039764404296875, 3.13848876953125, 3.237213134765625, 3.3359375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 6.0, 9.0, 14.0, 11.0, 21.0, 45.0, 61.0, 77.0, 143.0, 226.0, 330.0, 513.0, 715.0, 1060.0, 1598.0, 2423.0, 3472.0, 5164.0, 7610.0, 10867.0, 15640.0, 22311.0, 30624.0, 41152.0, 53250.0, 67055.0, 79780.0, 89589.0, 95357.0, 94993.0, 88242.0, 78742.0, 64828.0, 52317.0, 39697.0, 30055.0, 21617.0, 15523.0, 10763.0, 7482.0, 4978.0, 3318.0, 2271.0, 1470.0, 1099.0, 680.0, 445.0, 286.0, 232.0, 158.0, 99.0, 64.0, 34.0, 19.0, 10.0, 9.0, 7.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0], "bins": [-1.9814453125, -1.9152984619140625, -1.849151611328125, -1.7830047607421875, -1.71685791015625, -1.6507110595703125, -1.584564208984375, -1.5184173583984375, -1.4522705078125, -1.3861236572265625, -1.319976806640625, -1.2538299560546875, -1.18768310546875, -1.1215362548828125, -1.055389404296875, -0.9892425537109375, -0.923095703125, -0.8569488525390625, -0.790802001953125, -0.7246551513671875, -0.65850830078125, -0.5923614501953125, -0.526214599609375, -0.4600677490234375, -0.3939208984375, -0.3277740478515625, -0.261627197265625, -0.1954803466796875, -0.12933349609375, -0.0631866455078125, 0.002960205078125, 0.0691070556640625, 0.13525390625, 0.2014007568359375, 0.267547607421875, 0.3336944580078125, 0.39984130859375, 0.4659881591796875, 0.532135009765625, 0.5982818603515625, 0.6644287109375, 0.7305755615234375, 0.796722412109375, 0.8628692626953125, 0.92901611328125, 0.9951629638671875, 1.061309814453125, 1.1274566650390625, 1.193603515625, 1.2597503662109375, 1.325897216796875, 1.3920440673828125, 1.45819091796875, 1.5243377685546875, 1.590484619140625, 1.6566314697265625, 1.7227783203125, 1.7889251708984375, 1.855072021484375, 1.9212188720703125, 1.98736572265625, 2.0535125732421875, 2.119659423828125, 2.1858062744140625, 2.251953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 12.0, 7.0, 14.0, 7.0, 17.0, 19.0, 16.0, 24.0, 24.0, 33.0, 24.0, 28.0, 25.0, 47.0, 41.0, 30.0, 35.0, 35.0, 34.0, 42.0, 37.0, 46.0, 36.0, 32.0, 34.0, 27.0, 30.0, 28.0, 26.0, 27.0, 18.0, 21.0, 18.0, 18.0, 10.0, 14.0, 7.0, 8.0, 10.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.90234375, -1.8460235595703125, -1.789703369140625, -1.7333831787109375, -1.67706298828125, -1.6207427978515625, -1.564422607421875, -1.5081024169921875, -1.4517822265625, -1.3954620361328125, -1.339141845703125, -1.2828216552734375, -1.22650146484375, -1.1701812744140625, -1.113861083984375, -1.0575408935546875, -1.001220703125, -0.9449005126953125, -0.888580322265625, -0.8322601318359375, -0.77593994140625, -0.7196197509765625, -0.663299560546875, -0.6069793701171875, -0.5506591796875, -0.4943389892578125, -0.438018798828125, -0.3816986083984375, -0.32537841796875, -0.2690582275390625, -0.212738037109375, -0.1564178466796875, -0.10009765625, -0.0437774658203125, 0.012542724609375, 0.0688629150390625, 0.12518310546875, 0.1815032958984375, 0.237823486328125, 0.2941436767578125, 0.3504638671875, 0.4067840576171875, 0.463104248046875, 0.5194244384765625, 0.57574462890625, 0.6320648193359375, 0.688385009765625, 0.7447052001953125, 0.801025390625, 0.8573455810546875, 0.913665771484375, 0.9699859619140625, 1.02630615234375, 1.0826263427734375, 1.138946533203125, 1.1952667236328125, 1.2515869140625, 1.3079071044921875, 1.364227294921875, 1.4205474853515625, 1.47686767578125, 1.5331878662109375, 1.589508056640625, 1.6458282470703125, 1.7021484375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 9.0, 8.0, 18.0, 29.0, 36.0, 67.0, 93.0, 148.0, 236.0, 373.0, 573.0, 913.0, 1477.0, 2421.0, 3950.0, 6473.0, 11325.0, 19188.0, 32403.0, 54763.0, 87199.0, 127363.0, 159422.0, 162760.0, 134494.0, 94665.0, 59837.0, 35780.0, 21419.0, 12441.0, 7361.0, 4414.0, 2629.0, 1542.0, 986.0, 616.0, 406.0, 238.0, 171.0, 95.0, 77.0, 48.0, 32.0, 13.0, 19.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.7646484375, -1.712890625, -1.6611328125, -1.609375, -1.5576171875, -1.505859375, -1.4541015625, -1.40234375, -1.3505859375, -1.298828125, -1.2470703125, -1.1953125, -1.1435546875, -1.091796875, -1.0400390625, -0.98828125, -0.9365234375, -0.884765625, -0.8330078125, -0.78125, -0.7294921875, -0.677734375, -0.6259765625, -0.57421875, -0.5224609375, -0.470703125, -0.4189453125, -0.3671875, -0.3154296875, -0.263671875, -0.2119140625, -0.16015625, -0.1083984375, -0.056640625, -0.0048828125, 0.046875, 0.0986328125, 0.150390625, 0.2021484375, 0.25390625, 0.3056640625, 0.357421875, 0.4091796875, 0.4609375, 0.5126953125, 0.564453125, 0.6162109375, 0.66796875, 0.7197265625, 0.771484375, 0.8232421875, 0.875, 0.9267578125, 0.978515625, 1.0302734375, 1.08203125, 1.1337890625, 1.185546875, 1.2373046875, 1.2890625, 1.3408203125, 1.392578125, 1.4443359375, 1.49609375, 1.5478515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 10.0, 12.0, 17.0, 27.0, 25.0, 42.0, 38.0, 66.0, 67.0, 59.0, 53.0, 70.0, 74.0, 74.0, 66.0, 49.0, 52.0, 37.0, 31.0, 18.0, 25.0, 13.0, 14.0, 7.0, 6.0, 8.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015473365783691406, -0.00014875270426273346, -0.00014277175068855286, -0.00013679079711437225, -0.00013080984354019165, -0.00012482888996601105, -0.00011884793639183044, -0.00011286698281764984, -0.00010688602924346924, -0.00010090507566928864, -9.492412209510803e-05, -8.894316852092743e-05, -8.296221494674683e-05, -7.698126137256622e-05, -7.100030779838562e-05, -6.501935422420502e-05, -5.9038400650024414e-05, -5.305744707584381e-05, -4.707649350166321e-05, -4.1095539927482605e-05, -3.5114586353302e-05, -2.91336327791214e-05, -2.3152679204940796e-05, -1.7171725630760193e-05, -1.119077205657959e-05, -5.209818482398987e-06, 7.711350917816162e-07, 6.752088665962219e-06, 1.2733042240142822e-05, 1.8713995814323425e-05, 2.469494938850403e-05, 3.067590296268463e-05, 3.6656856536865234e-05, 4.263781011104584e-05, 4.861876368522644e-05, 5.4599717259407043e-05, 6.0580670833587646e-05, 6.656162440776825e-05, 7.254257798194885e-05, 7.852353155612946e-05, 8.450448513031006e-05, 9.048543870449066e-05, 9.646639227867126e-05, 0.00010244734585285187, 0.00010842829942703247, 0.00011440925300121307, 0.00012039020657539368, 0.00012637116014957428, 0.00013235211372375488, 0.00013833306729793549, 0.0001443140208721161, 0.0001502949744462967, 0.0001562759280204773, 0.0001622568815946579, 0.0001682378351688385, 0.0001742187887430191, 0.0001801997423171997, 0.0001861806958913803, 0.0001921616494655609, 0.00019814260303974152, 0.00020412355661392212, 0.00021010451018810272, 0.00021608546376228333, 0.00022206641733646393, 0.00022804737091064453]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 15.0, 14.0, 22.0, 29.0, 39.0, 60.0, 82.0, 145.0, 215.0, 351.0, 512.0, 816.0, 1408.0, 2394.0, 4039.0, 6845.0, 12147.0, 20977.0, 36727.0, 62131.0, 98969.0, 141735.0, 169786.0, 162185.0, 124425.0, 82532.0, 50333.0, 29670.0, 16773.0, 9534.0, 5445.0, 3239.0, 1915.0, 1136.0, 666.0, 434.0, 264.0, 186.0, 88.0, 72.0, 47.0, 36.0, 35.0, 20.0, 14.0, 11.0, 13.0, 4.0, 1.0, 4.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6357421875, -1.5826263427734375, -1.529510498046875, -1.4763946533203125, -1.42327880859375, -1.3701629638671875, -1.317047119140625, -1.2639312744140625, -1.2108154296875, -1.1576995849609375, -1.104583740234375, -1.0514678955078125, -0.99835205078125, -0.9452362060546875, -0.892120361328125, -0.8390045166015625, -0.785888671875, -0.7327728271484375, -0.679656982421875, -0.6265411376953125, -0.57342529296875, -0.5203094482421875, -0.467193603515625, -0.4140777587890625, -0.3609619140625, -0.3078460693359375, -0.254730224609375, -0.2016143798828125, -0.14849853515625, -0.0953826904296875, -0.042266845703125, 0.0108489990234375, 0.06396484375, 0.1170806884765625, 0.170196533203125, 0.2233123779296875, 0.27642822265625, 0.3295440673828125, 0.382659912109375, 0.4357757568359375, 0.4888916015625, 0.5420074462890625, 0.595123291015625, 0.6482391357421875, 0.70135498046875, 0.7544708251953125, 0.807586669921875, 0.8607025146484375, 0.913818359375, 0.9669342041015625, 1.020050048828125, 1.0731658935546875, 1.12628173828125, 1.1793975830078125, 1.232513427734375, 1.2856292724609375, 1.3387451171875, 1.3918609619140625, 1.444976806640625, 1.4980926513671875, 1.55120849609375, 1.6043243408203125, 1.657440185546875, 1.7105560302734375, 1.763671875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 3.0, 5.0, 4.0, 10.0, 5.0, 14.0, 8.0, 18.0, 27.0, 30.0, 51.0, 53.0, 53.0, 48.0, 57.0, 66.0, 67.0, 60.0, 70.0, 49.0, 54.0, 56.0, 36.0, 38.0, 20.0, 25.0, 11.0, 14.0, 12.0, 14.0, 9.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54541015625, -0.528717041015625, -0.51202392578125, -0.495330810546875, -0.4786376953125, -0.461944580078125, -0.44525146484375, -0.428558349609375, -0.411865234375, -0.395172119140625, -0.37847900390625, -0.361785888671875, -0.3450927734375, -0.328399658203125, -0.31170654296875, -0.295013427734375, -0.2783203125, -0.261627197265625, -0.24493408203125, -0.228240966796875, -0.2115478515625, -0.194854736328125, -0.17816162109375, -0.161468505859375, -0.144775390625, -0.128082275390625, -0.11138916015625, -0.094696044921875, -0.0780029296875, -0.061309814453125, -0.04461669921875, -0.027923583984375, -0.01123046875, 0.005462646484375, 0.02215576171875, 0.038848876953125, 0.0555419921875, 0.072235107421875, 0.08892822265625, 0.105621337890625, 0.122314453125, 0.139007568359375, 0.15570068359375, 0.172393798828125, 0.1890869140625, 0.205780029296875, 0.22247314453125, 0.239166259765625, 0.255859375, 0.272552490234375, 0.28924560546875, 0.305938720703125, 0.3226318359375, 0.339324951171875, 0.35601806640625, 0.372711181640625, 0.389404296875, 0.406097412109375, 0.42279052734375, 0.439483642578125, 0.4561767578125, 0.472869873046875, 0.48956298828125, 0.506256103515625, 0.52294921875]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 3.0, 14.0, 8.0, 13.0, 19.0, 17.0, 24.0, 28.0, 32.0, 37.0, 50.0, 35.0, 53.0, 64.0, 63.0, 67.0, 61.0, 61.0, 48.0, 47.0, 38.0, 39.0, 27.0, 20.0, 37.0, 12.0, 11.0, 15.0, 12.0, 6.0, 6.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.602250576019287, -4.4600019454956055, -4.317753314971924, -4.175504207611084, -4.033255577087402, -3.8910069465637207, -3.748758316040039, -3.6065096855163574, -3.4642608165740967, -3.322012186050415, -3.1797633171081543, -3.0375146865844727, -2.895266056060791, -2.7530171871185303, -2.6107685565948486, -2.468519687652588, -2.3262710571289062, -2.1840224266052246, -2.041773557662964, -1.8995249271392822, -1.757276177406311, -1.6150274276733398, -1.4727787971496582, -1.330530047416687, -1.1882812976837158, -1.0460325479507446, -0.9037838578224182, -0.7615351676940918, -0.6192864179611206, -0.4770376682281494, -0.334788978099823, -0.19254028797149658, -0.05029106140136719, 0.09195765852928162, 0.23420637845993042, 0.3764550983905792, 0.518703818321228, 0.6609525680541992, 0.8032012581825256, 0.945449948310852, 1.0876986980438232, 1.2299474477767944, 1.3721961975097656, 1.5144448280334473, 1.6566935777664185, 1.7989423274993896, 1.9411909580230713, 2.083439826965332, 2.2256884574890137, 2.3679370880126953, 2.510185956954956, 2.6524345874786377, 2.7946834564208984, 2.93693208694458, 3.0791807174682617, 3.2214293479919434, 3.363678216934204, 3.5059268474578857, 3.6481757164001465, 3.790424346923828, 3.9326729774475098, 4.074921607971191, 4.217170715332031, 4.359419345855713, 4.5016679763793945]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 7.0, 8.0, 9.0, 10.0, 8.0, 9.0, 19.0, 22.0, 23.0, 24.0, 35.0, 36.0, 34.0, 33.0, 30.0, 54.0, 33.0, 44.0, 44.0, 39.0, 38.0, 49.0, 49.0, 40.0, 38.0, 41.0, 28.0, 21.0, 30.0, 23.0, 19.0, 23.0, 17.0, 16.0, 9.0, 10.0, 7.0, 4.0, 7.0, 5.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-3.2402915954589844, -3.1429500579833984, -3.0456082820892334, -2.9482667446136475, -2.8509249687194824, -2.7535834312438965, -2.6562418937683105, -2.5589001178741455, -2.4615583419799805, -2.3642168045043945, -2.2668750286102295, -2.1695334911346436, -2.0721917152404785, -1.9748501777648926, -1.877508521080017, -1.7801668643951416, -1.6828253269195557, -1.5854836702346802, -1.4881420135498047, -1.3908004760742188, -1.2934587001800537, -1.1961171627044678, -1.0987755060195923, -1.0014338493347168, -0.9040921926498413, -0.8067505359649658, -0.7094088792800903, -0.6120672821998596, -0.5147256255149841, -0.41738396883010864, -0.32004237174987793, -0.22270071506500244, -0.12535929679870605, -0.02801765501499176, 0.06932398676872253, 0.16666561365127563, 0.2640072703361511, 0.3613489270210266, 0.4586905241012573, 0.5560321807861328, 0.6533738374710083, 0.7507154941558838, 0.8480571508407593, 0.94539874792099, 1.0427403450012207, 1.1400821208953857, 1.2374236583709717, 1.3347653150558472, 1.4321069717407227, 1.5294486284255981, 1.6267902851104736, 1.7241318225860596, 1.8214735984802246, 1.9188151359558105, 2.0161566734313965, 2.1134984493255615, 2.2108402252197266, 2.3081817626953125, 2.4055235385894775, 2.5028650760650635, 2.6002068519592285, 2.6975483894348145, 2.7948899269104004, 2.8922317028045654, 2.9895732402801514]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 7.0, 15.0, 19.0, 40.0, 48.0, 74.0, 102.0, 182.0, 331.0, 493.0, 761.0, 1375.0, 2111.0, 3449.0, 5702.0, 9340.0, 15359.0, 25382.0, 41998.0, 69262.0, 112762.0, 179877.0, 276179.0, 399155.0, 522208.0, 593112.0, 564776.0, 458088.0, 329637.0, 220458.0, 139650.0, 87252.0, 52713.0, 32166.0, 19525.0, 11861.0, 7247.0, 4392.0, 2688.0, 1718.0, 1020.0, 611.0, 420.0, 267.0, 164.0, 110.0, 80.0, 28.0, 24.0, 15.0, 15.0, 9.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.234375, -3.135528564453125, -3.03668212890625, -2.937835693359375, -2.8389892578125, -2.740142822265625, -2.64129638671875, -2.542449951171875, -2.443603515625, -2.344757080078125, -2.24591064453125, -2.147064208984375, -2.0482177734375, -1.949371337890625, -1.85052490234375, -1.751678466796875, -1.65283203125, -1.553985595703125, -1.45513916015625, -1.356292724609375, -1.2574462890625, -1.158599853515625, -1.05975341796875, -0.960906982421875, -0.862060546875, -0.763214111328125, -0.66436767578125, -0.565521240234375, -0.4666748046875, -0.367828369140625, -0.26898193359375, -0.170135498046875, -0.0712890625, 0.027557373046875, 0.12640380859375, 0.225250244140625, 0.3240966796875, 0.422943115234375, 0.52178955078125, 0.620635986328125, 0.719482421875, 0.818328857421875, 0.91717529296875, 1.016021728515625, 1.1148681640625, 1.213714599609375, 1.31256103515625, 1.411407470703125, 1.51025390625, 1.609100341796875, 1.70794677734375, 1.806793212890625, 1.9056396484375, 2.004486083984375, 2.10333251953125, 2.202178955078125, 2.301025390625, 2.399871826171875, 2.49871826171875, 2.597564697265625, 2.6964111328125, 2.795257568359375, 2.89410400390625, 2.992950439453125, 3.091796875]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 4.0, 7.0, 13.0, 9.0, 13.0, 11.0, 15.0, 14.0, 24.0, 31.0, 22.0, 36.0, 29.0, 33.0, 34.0, 34.0, 37.0, 52.0, 39.0, 39.0, 47.0, 36.0, 40.0, 36.0, 24.0, 33.0, 36.0, 25.0, 33.0, 27.0, 30.0, 23.0, 16.0, 13.0, 20.0, 8.0, 20.0, 9.0, 4.0, 7.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.39453125, -2.32366943359375, -2.2528076171875, -2.18194580078125, -2.111083984375, -2.04022216796875, -1.9693603515625, -1.89849853515625, -1.82763671875, -1.75677490234375, -1.6859130859375, -1.61505126953125, -1.544189453125, -1.47332763671875, -1.4024658203125, -1.33160400390625, -1.2607421875, -1.18988037109375, -1.1190185546875, -1.04815673828125, -0.977294921875, -0.90643310546875, -0.8355712890625, -0.76470947265625, -0.69384765625, -0.62298583984375, -0.5521240234375, -0.48126220703125, -0.410400390625, -0.33953857421875, -0.2686767578125, -0.19781494140625, -0.126953125, -0.05609130859375, 0.0147705078125, 0.08563232421875, 0.156494140625, 0.22735595703125, 0.2982177734375, 0.36907958984375, 0.43994140625, 0.51080322265625, 0.5816650390625, 0.65252685546875, 0.723388671875, 0.79425048828125, 0.8651123046875, 0.93597412109375, 1.0068359375, 1.07769775390625, 1.1485595703125, 1.21942138671875, 1.290283203125, 1.36114501953125, 1.4320068359375, 1.50286865234375, 1.57373046875, 1.64459228515625, 1.7154541015625, 1.78631591796875, 1.857177734375, 1.92803955078125, 1.9989013671875, 2.06976318359375, 2.140625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 2.0, 21.0, 29.0, 53.0, 78.0, 133.0, 207.0, 340.0, 490.0, 844.0, 1301.0, 2139.0, 3585.0, 5574.0, 8947.0, 14636.0, 23172.0, 36909.0, 58131.0, 90574.0, 137095.0, 202046.0, 284615.0, 373691.0, 454253.0, 497568.0, 486850.0, 425758.0, 337690.0, 250671.0, 173795.0, 116466.0, 75841.0, 48778.0, 31011.0, 19198.0, 12051.0, 7337.0, 4710.0, 2908.0, 1790.0, 1138.0, 694.0, 445.0, 287.0, 162.0, 114.0, 54.0, 41.0, 23.0, 13.0, 9.0, 4.0, 8.0, 2.0, 0.0, 2.0], "bins": [-3.037109375, -2.94451904296875, -2.8519287109375, -2.75933837890625, -2.666748046875, -2.57415771484375, -2.4815673828125, -2.38897705078125, -2.29638671875, -2.20379638671875, -2.1112060546875, -2.01861572265625, -1.926025390625, -1.83343505859375, -1.7408447265625, -1.64825439453125, -1.5556640625, -1.46307373046875, -1.3704833984375, -1.27789306640625, -1.185302734375, -1.09271240234375, -1.0001220703125, -0.90753173828125, -0.81494140625, -0.72235107421875, -0.6297607421875, -0.53717041015625, -0.444580078125, -0.35198974609375, -0.2593994140625, -0.16680908203125, -0.07421875, 0.01837158203125, 0.1109619140625, 0.20355224609375, 0.296142578125, 0.38873291015625, 0.4813232421875, 0.57391357421875, 0.66650390625, 0.75909423828125, 0.8516845703125, 0.94427490234375, 1.036865234375, 1.12945556640625, 1.2220458984375, 1.31463623046875, 1.4072265625, 1.49981689453125, 1.5924072265625, 1.68499755859375, 1.777587890625, 1.87017822265625, 1.9627685546875, 2.05535888671875, 2.14794921875, 2.24053955078125, 2.3331298828125, 2.42572021484375, 2.518310546875, 2.61090087890625, 2.7034912109375, 2.79608154296875, 2.888671875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 10.0, 8.0, 13.0, 15.0, 25.0, 24.0, 38.0, 48.0, 38.0, 68.0, 76.0, 105.0, 105.0, 136.0, 132.0, 145.0, 152.0, 189.0, 183.0, 179.0, 180.0, 221.0, 211.0, 215.0, 183.0, 181.0, 171.0, 165.0, 153.0, 98.0, 105.0, 75.0, 95.0, 64.0, 50.0, 47.0, 39.0, 24.0, 24.0, 22.0, 22.0, 9.0, 9.0, 8.0, 8.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0], "bins": [-1.2646484375, -1.2282867431640625, -1.191925048828125, -1.1555633544921875, -1.11920166015625, -1.0828399658203125, -1.046478271484375, -1.0101165771484375, -0.9737548828125, -0.9373931884765625, -0.901031494140625, -0.8646697998046875, -0.82830810546875, -0.7919464111328125, -0.755584716796875, -0.7192230224609375, -0.682861328125, -0.6464996337890625, -0.610137939453125, -0.5737762451171875, -0.53741455078125, -0.5010528564453125, -0.464691162109375, -0.4283294677734375, -0.3919677734375, -0.3556060791015625, -0.319244384765625, -0.2828826904296875, -0.24652099609375, -0.2101593017578125, -0.173797607421875, -0.1374359130859375, -0.10107421875, -0.0647125244140625, -0.028350830078125, 0.0080108642578125, 0.04437255859375, 0.0807342529296875, 0.117095947265625, 0.1534576416015625, 0.1898193359375, 0.2261810302734375, 0.262542724609375, 0.2989044189453125, 0.33526611328125, 0.3716278076171875, 0.407989501953125, 0.4443511962890625, 0.480712890625, 0.5170745849609375, 0.553436279296875, 0.5897979736328125, 0.62615966796875, 0.6625213623046875, 0.698883056640625, 0.7352447509765625, 0.7716064453125, 0.8079681396484375, 0.844329833984375, 0.8806915283203125, 0.91705322265625, 0.9534149169921875, 0.989776611328125, 1.0261383056640625, 1.0625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 9.0, 6.0, 7.0, 11.0, 11.0, 17.0, 18.0, 19.0, 25.0, 31.0, 38.0, 53.0, 41.0, 49.0, 68.0, 54.0, 52.0, 59.0, 56.0, 51.0, 53.0, 51.0, 47.0, 45.0, 21.0, 23.0, 17.0, 13.0, 16.0, 5.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.395505428314209, -4.2524871826171875, -4.109468936920166, -3.9664504528045654, -3.823431968688965, -3.6804137229919434, -3.537395477294922, -3.3943772315979004, -3.2513587474823, -3.1083405017852783, -2.9653220176696777, -2.8223037719726562, -2.6792855262756348, -2.536267042160034, -2.3932487964630127, -2.250230312347412, -2.1072120666503906, -1.9641937017440796, -1.8211753368377686, -1.678157091140747, -1.535138726234436, -1.392120361328125, -1.2491021156311035, -1.1060837507247925, -0.9630653858184814, -0.8200470209121704, -0.6770287156105042, -0.5340104103088379, -0.39099204540252686, -0.24797368049621582, -0.10495537519454956, 0.0380629301071167, 0.18108177185058594, 0.3241001069545746, 0.46711844205856323, 0.6101367473602295, 0.7531551122665405, 0.8961734771728516, 1.039191722869873, 1.182210087776184, 1.3252284526824951, 1.4682468175888062, 1.6112651824951172, 1.7542834281921387, 1.8973017930984497, 2.0403201580047607, 2.1833384037017822, 2.326356887817383, 2.4693751335144043, 2.612393379211426, 2.7554118633270264, 2.898430109024048, 3.0414485931396484, 3.18446683883667, 3.3274850845336914, 3.470503330230713, 3.6135218143463135, 3.756540060043335, 3.8995585441589355, 4.042576789855957, 4.1855950355529785, 4.32861328125, 4.47163200378418, 4.614650249481201, 4.757668495178223]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 10.0, 4.0, 4.0, 11.0, 7.0, 11.0, 5.0, 8.0, 22.0, 18.0, 15.0, 26.0, 26.0, 33.0, 15.0, 22.0, 40.0, 35.0, 57.0, 50.0, 51.0, 47.0, 37.0, 43.0, 50.0, 32.0, 47.0, 30.0, 35.0, 32.0, 30.0, 23.0, 25.0, 18.0, 14.0, 13.0, 17.0, 8.0, 12.0, 3.0, 5.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.967454671859741, -2.875128984451294, -2.7828030586242676, -2.6904773712158203, -2.598151683807373, -2.5058257579803467, -2.4135000705718994, -2.321174144744873, -2.228848457336426, -2.1365227699279785, -2.044196844100952, -1.9518711566925049, -1.859545350074768, -1.7672195434570312, -1.674893856048584, -1.5825680494308472, -1.4902422428131104, -1.3979164361953735, -1.3055906295776367, -1.2132649421691895, -1.1209391355514526, -1.0286133289337158, -0.9362875819206238, -0.8439618349075317, -0.7516360282897949, -0.6593102216720581, -0.5669844746589661, -0.47465869784355164, -0.3823329210281372, -0.2900071442127228, -0.19768136739730835, -0.10535562038421631, -0.013030052185058594, 0.07929572463035583, 0.17162150144577026, 0.2639472782611847, 0.3562730550765991, 0.44859883189201355, 0.540924608707428, 0.63325035572052, 0.7255761623382568, 0.8179019689559937, 0.9102277159690857, 1.0025534629821777, 1.0948792695999146, 1.1872050762176514, 1.2795307636260986, 1.3718565702438354, 1.4641823768615723, 1.556508183479309, 1.648833990097046, 1.7411596775054932, 1.83348548412323, 1.9258112907409668, 2.018136978149414, 2.1104626655578613, 2.2027885913848877, 2.295114278793335, 2.3874402046203613, 2.4797658920288086, 2.572091579437256, 2.6644175052642822, 2.7567431926727295, 2.849069118499756, 2.941394805908203]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 4.0, 9.0, 9.0, 11.0, 22.0, 35.0, 49.0, 71.0, 84.0, 136.0, 187.0, 235.0, 339.0, 480.0, 661.0, 931.0, 1414.0, 1967.0, 2780.0, 3986.0, 6015.0, 8927.0, 13188.0, 19878.0, 30765.0, 47792.0, 74411.0, 113177.0, 155134.0, 167705.0, 133905.0, 91975.0, 59415.0, 38361.0, 24661.0, 15911.0, 10622.0, 7230.0, 4917.0, 3311.0, 2312.0, 1555.0, 1188.0, 824.0, 552.0, 403.0, 289.0, 211.0, 161.0, 130.0, 62.0, 67.0, 27.0, 18.0, 18.0, 10.0, 16.0, 6.0, 3.0, 1.0, 4.0], "bins": [-0.6787109375, -0.6576614379882812, -0.6366119384765625, -0.6155624389648438, -0.594512939453125, -0.5734634399414062, -0.5524139404296875, -0.5313644409179688, -0.51031494140625, -0.48926544189453125, -0.4682159423828125, -0.44716644287109375, -0.426116943359375, -0.40506744384765625, -0.3840179443359375, -0.36296844482421875, -0.3419189453125, -0.32086944580078125, -0.2998199462890625, -0.27877044677734375, -0.257720947265625, -0.23667144775390625, -0.2156219482421875, -0.19457244873046875, -0.17352294921875, -0.15247344970703125, -0.1314239501953125, -0.11037445068359375, -0.089324951171875, -0.06827545166015625, -0.0472259521484375, -0.02617645263671875, -0.005126953125, 0.01592254638671875, 0.0369720458984375, 0.05802154541015625, 0.079071044921875, 0.10012054443359375, 0.1211700439453125, 0.14221954345703125, 0.16326904296875, 0.18431854248046875, 0.2053680419921875, 0.22641754150390625, 0.247467041015625, 0.26851654052734375, 0.2895660400390625, 0.31061553955078125, 0.3316650390625, 0.35271453857421875, 0.3737640380859375, 0.39481353759765625, 0.415863037109375, 0.43691253662109375, 0.4579620361328125, 0.47901153564453125, 0.50006103515625, 0.5211105346679688, 0.5421600341796875, 0.5632095336914062, 0.584259033203125, 0.6053085327148438, 0.6263580322265625, 0.6474075317382812, 0.66845703125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 5.0, 9.0, 9.0, 4.0, 3.0, 12.0, 7.0, 19.0, 9.0, 12.0, 15.0, 18.0, 27.0, 25.0, 27.0, 26.0, 37.0, 36.0, 37.0, 44.0, 48.0, 37.0, 45.0, 54.0, 46.0, 40.0, 37.0, 33.0, 36.0, 28.0, 28.0, 24.0, 18.0, 18.0, 22.0, 15.0, 18.0, 16.0, 11.0, 10.0, 4.0, 8.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-3.326171875, -3.22991943359375, -3.1336669921875, -3.03741455078125, -2.941162109375, -2.84490966796875, -2.7486572265625, -2.65240478515625, -2.55615234375, -2.45989990234375, -2.3636474609375, -2.26739501953125, -2.171142578125, -2.07489013671875, -1.9786376953125, -1.88238525390625, -1.7861328125, -1.68988037109375, -1.5936279296875, -1.49737548828125, -1.401123046875, -1.30487060546875, -1.2086181640625, -1.11236572265625, -1.01611328125, -0.91986083984375, -0.8236083984375, -0.72735595703125, -0.631103515625, -0.53485107421875, -0.4385986328125, -0.34234619140625, -0.24609375, -0.14984130859375, -0.0535888671875, 0.04266357421875, 0.138916015625, 0.23516845703125, 0.3314208984375, 0.42767333984375, 0.52392578125, 0.62017822265625, 0.7164306640625, 0.81268310546875, 0.908935546875, 1.00518798828125, 1.1014404296875, 1.19769287109375, 1.2939453125, 1.39019775390625, 1.4864501953125, 1.58270263671875, 1.678955078125, 1.77520751953125, 1.8714599609375, 1.96771240234375, 2.06396484375, 2.16021728515625, 2.2564697265625, 2.35272216796875, 2.448974609375, 2.54522705078125, 2.6414794921875, 2.73773193359375, 2.833984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 7.0, 6.0, 11.0, 16.0, 34.0, 45.0, 70.0, 96.0, 149.0, 238.0, 368.0, 615.0, 961.0, 1610.0, 2580.0, 4504.0, 7761.0, 13897.0, 25396.0, 46193.0, 86130.0, 158063.0, 240689.0, 203303.0, 116039.0, 62715.0, 33678.0, 18539.0, 10263.0, 5873.0, 3359.0, 2011.0, 1315.0, 734.0, 431.0, 318.0, 186.0, 119.0, 87.0, 52.0, 29.0, 22.0, 21.0, 10.0, 8.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8720703125, -0.84063720703125, -0.8092041015625, -0.77777099609375, -0.746337890625, -0.71490478515625, -0.6834716796875, -0.65203857421875, -0.62060546875, -0.58917236328125, -0.5577392578125, -0.52630615234375, -0.494873046875, -0.46343994140625, -0.4320068359375, -0.40057373046875, -0.369140625, -0.33770751953125, -0.3062744140625, -0.27484130859375, -0.243408203125, -0.21197509765625, -0.1805419921875, -0.14910888671875, -0.11767578125, -0.08624267578125, -0.0548095703125, -0.02337646484375, 0.008056640625, 0.03948974609375, 0.0709228515625, 0.10235595703125, 0.1337890625, 0.16522216796875, 0.1966552734375, 0.22808837890625, 0.259521484375, 0.29095458984375, 0.3223876953125, 0.35382080078125, 0.38525390625, 0.41668701171875, 0.4481201171875, 0.47955322265625, 0.510986328125, 0.54241943359375, 0.5738525390625, 0.60528564453125, 0.63671875, 0.66815185546875, 0.6995849609375, 0.73101806640625, 0.762451171875, 0.79388427734375, 0.8253173828125, 0.85675048828125, 0.88818359375, 0.91961669921875, 0.9510498046875, 0.98248291015625, 1.013916015625, 1.04534912109375, 1.0767822265625, 1.10821533203125, 1.1396484375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 3.0, 14.0, 8.0, 15.0, 4.0, 11.0, 21.0, 18.0, 18.0, 23.0, 32.0, 30.0, 34.0, 41.0, 37.0, 50.0, 47.0, 50.0, 38.0, 44.0, 31.0, 39.0, 28.0, 52.0, 29.0, 32.0, 30.0, 33.0, 17.0, 23.0, 35.0, 17.0, 15.0, 11.0, 24.0, 11.0, 11.0, 6.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.419921875, -2.355987548828125, -2.29205322265625, -2.228118896484375, -2.1641845703125, -2.100250244140625, -2.03631591796875, -1.972381591796875, -1.908447265625, -1.844512939453125, -1.78057861328125, -1.716644287109375, -1.6527099609375, -1.588775634765625, -1.52484130859375, -1.460906982421875, -1.39697265625, -1.333038330078125, -1.26910400390625, -1.205169677734375, -1.1412353515625, -1.077301025390625, -1.01336669921875, -0.949432373046875, -0.885498046875, -0.821563720703125, -0.75762939453125, -0.693695068359375, -0.6297607421875, -0.565826416015625, -0.50189208984375, -0.437957763671875, -0.3740234375, -0.310089111328125, -0.24615478515625, -0.182220458984375, -0.1182861328125, -0.054351806640625, 0.00958251953125, 0.073516845703125, 0.137451171875, 0.201385498046875, 0.26531982421875, 0.329254150390625, 0.3931884765625, 0.457122802734375, 0.52105712890625, 0.584991455078125, 0.64892578125, 0.712860107421875, 0.77679443359375, 0.840728759765625, 0.9046630859375, 0.968597412109375, 1.03253173828125, 1.096466064453125, 1.160400390625, 1.224334716796875, 1.28826904296875, 1.352203369140625, 1.4161376953125, 1.480072021484375, 1.54400634765625, 1.607940673828125, 1.671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 11.0, 6.0, 17.0, 26.0, 50.0, 67.0, 78.0, 99.0, 174.0, 252.0, 395.0, 625.0, 1030.0, 1763.0, 3788.0, 9807.0, 53503.0, 850065.0, 104034.0, 12724.0, 4547.0, 2248.0, 1209.0, 729.0, 421.0, 266.0, 209.0, 141.0, 78.0, 54.0, 44.0, 16.0, 23.0, 12.0, 10.0, 9.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.291015625, -1.24884033203125, -1.2066650390625, -1.16448974609375, -1.122314453125, -1.08013916015625, -1.0379638671875, -0.99578857421875, -0.95361328125, -0.91143798828125, -0.8692626953125, -0.82708740234375, -0.784912109375, -0.74273681640625, -0.7005615234375, -0.65838623046875, -0.6162109375, -0.57403564453125, -0.5318603515625, -0.48968505859375, -0.447509765625, -0.40533447265625, -0.3631591796875, -0.32098388671875, -0.27880859375, -0.23663330078125, -0.1944580078125, -0.15228271484375, -0.110107421875, -0.06793212890625, -0.0257568359375, 0.01641845703125, 0.05859375, 0.10076904296875, 0.1429443359375, 0.18511962890625, 0.227294921875, 0.26947021484375, 0.3116455078125, 0.35382080078125, 0.39599609375, 0.43817138671875, 0.4803466796875, 0.52252197265625, 0.564697265625, 0.60687255859375, 0.6490478515625, 0.69122314453125, 0.7333984375, 0.77557373046875, 0.8177490234375, 0.85992431640625, 0.902099609375, 0.94427490234375, 0.9864501953125, 1.02862548828125, 1.07080078125, 1.11297607421875, 1.1551513671875, 1.19732666015625, 1.239501953125, 1.28167724609375, 1.3238525390625, 1.36602783203125, 1.408203125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 7.0, 18.0, 47.0, 250.0, 418.0, 174.0, 38.0, 10.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001690387725830078, -0.0001646401360630989, -0.00016024149954319, -0.0001558428630232811, -0.0001514442265033722, -0.0001470455899834633, -0.00014264695346355438, -0.00013824831694364548, -0.00013384968042373657, -0.00012945104390382767, -0.00012505240738391876, -0.00012065377086400986, -0.00011625513434410095, -0.00011185649782419205, -0.00010745786130428314, -0.00010305922478437424, -9.866058826446533e-05, -9.426195174455643e-05, -8.986331522464752e-05, -8.546467870473862e-05, -8.106604218482971e-05, -7.666740566492081e-05, -7.22687691450119e-05, -6.7870132625103e-05, -6.347149610519409e-05, -5.907285958528519e-05, -5.467422306537628e-05, -5.027558654546738e-05, -4.587695002555847e-05, -4.147831350564957e-05, -3.707967698574066e-05, -3.2681040465831757e-05, -2.828240394592285e-05, -2.3883767426013947e-05, -1.948513090610504e-05, -1.5086494386196136e-05, -1.0687857866287231e-05, -6.289221346378326e-06, -1.8905848264694214e-06, 2.5080516934394836e-06, 6.906688213348389e-06, 1.1305324733257294e-05, 1.57039612531662e-05, 2.0102597773075104e-05, 2.450123429298401e-05, 2.8899870812892914e-05, 3.329850733280182e-05, 3.7697143852710724e-05, 4.209578037261963e-05, 4.6494416892528534e-05, 5.089305341243744e-05, 5.5291689932346344e-05, 5.969032645225525e-05, 6.408896297216415e-05, 6.848759949207306e-05, 7.288623601198196e-05, 7.728487253189087e-05, 8.168350905179977e-05, 8.608214557170868e-05, 9.048078209161758e-05, 9.487941861152649e-05, 9.92780551314354e-05, 0.0001036766916513443, 0.0001080753281712532, 0.00011247396469116211]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 8.0, 13.0, 19.0, 28.0, 25.0, 36.0, 71.0, 108.0, 160.0, 231.0, 401.0, 559.0, 935.0, 1537.0, 2492.0, 4404.0, 8678.0, 19091.0, 61170.0, 335306.0, 477921.0, 87978.0, 24531.0, 10263.0, 5122.0, 2828.0, 1755.0, 1002.0, 675.0, 370.0, 242.0, 181.0, 145.0, 65.0, 44.0, 51.0, 23.0, 26.0, 14.0, 15.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77734375, -0.753143310546875, -0.72894287109375, -0.704742431640625, -0.6805419921875, -0.656341552734375, -0.63214111328125, -0.607940673828125, -0.583740234375, -0.559539794921875, -0.53533935546875, -0.511138916015625, -0.4869384765625, -0.462738037109375, -0.43853759765625, -0.414337158203125, -0.39013671875, -0.365936279296875, -0.34173583984375, -0.317535400390625, -0.2933349609375, -0.269134521484375, -0.24493408203125, -0.220733642578125, -0.196533203125, -0.172332763671875, -0.14813232421875, -0.123931884765625, -0.0997314453125, -0.075531005859375, -0.05133056640625, -0.027130126953125, -0.0029296875, 0.021270751953125, 0.04547119140625, 0.069671630859375, 0.0938720703125, 0.118072509765625, 0.14227294921875, 0.166473388671875, 0.190673828125, 0.214874267578125, 0.23907470703125, 0.263275146484375, 0.2874755859375, 0.311676025390625, 0.33587646484375, 0.360076904296875, 0.38427734375, 0.408477783203125, 0.43267822265625, 0.456878662109375, 0.4810791015625, 0.505279541015625, 0.52947998046875, 0.553680419921875, 0.577880859375, 0.602081298828125, 0.62628173828125, 0.650482177734375, 0.6746826171875, 0.698883056640625, 0.72308349609375, 0.747283935546875, 0.771484375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 1.0, 6.0, 7.0, 5.0, 15.0, 15.0, 18.0, 19.0, 20.0, 41.0, 61.0, 60.0, 71.0, 81.0, 83.0, 83.0, 69.0, 62.0, 59.0, 53.0, 38.0, 23.0, 23.0, 17.0, 12.0, 7.0, 6.0, 6.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087890625, -0.08528614044189453, -0.08268165588378906, -0.0800771713256836, -0.07747268676757812, -0.07486820220947266, -0.07226371765136719, -0.06965923309326172, -0.06705474853515625, -0.06445026397705078, -0.06184577941894531, -0.059241294860839844, -0.056636810302734375, -0.054032325744628906, -0.05142784118652344, -0.04882335662841797, -0.0462188720703125, -0.04361438751220703, -0.04100990295410156, -0.038405418395996094, -0.035800933837890625, -0.033196449279785156, -0.030591964721679688, -0.02798748016357422, -0.02538299560546875, -0.02277851104736328, -0.020174026489257812, -0.017569541931152344, -0.014965057373046875, -0.012360572814941406, -0.009756088256835938, -0.007151603698730469, -0.004547119140625, -0.0019426345825195312, 0.0006618499755859375, 0.0032663345336914062, 0.005870819091796875, 0.008475303649902344, 0.011079788208007812, 0.013684272766113281, 0.01628875732421875, 0.01889324188232422, 0.021497726440429688, 0.024102210998535156, 0.026706695556640625, 0.029311180114746094, 0.03191566467285156, 0.03452014923095703, 0.0371246337890625, 0.03972911834716797, 0.04233360290527344, 0.044938087463378906, 0.047542572021484375, 0.050147056579589844, 0.05275154113769531, 0.05535602569580078, 0.05796051025390625, 0.06056499481201172, 0.06316947937011719, 0.06577396392822266, 0.06837844848632812, 0.0709829330444336, 0.07358741760253906, 0.07619190216064453, 0.07879638671875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 5.0, 5.0, 11.0, 13.0, 17.0, 15.0, 16.0, 24.0, 29.0, 49.0, 37.0, 47.0, 38.0, 66.0, 54.0, 53.0, 52.0, 66.0, 56.0, 48.0, 45.0, 62.0, 45.0, 27.0, 23.0, 22.0, 11.0, 14.0, 10.0, 5.0, 9.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2968430519104, -4.153965950012207, -4.011088848114014, -3.8682117462158203, -3.725334644317627, -3.5824575424194336, -3.4395806789398193, -3.296703577041626, -3.1538264751434326, -3.0109493732452393, -2.868072271347046, -2.7251951694488525, -2.5823183059692383, -2.439441204071045, -2.2965641021728516, -2.153687000274658, -2.010809898376465, -1.8679327964782715, -1.7250556945800781, -1.5821787118911743, -1.439301609992981, -1.2964245080947876, -1.1535475254058838, -1.0106704235076904, -0.8677933216094971, -0.7249162197113037, -0.5820391774177551, -0.43916210532188416, -0.2962850332260132, -0.15340793132781982, -0.01053088903427124, 0.13234615325927734, 0.2752237319946289, 0.4181008040904999, 0.5609778761863708, 0.7038549184799194, 0.8467320203781128, 0.9896091222763062, 1.13248610496521, 1.2753632068634033, 1.4182403087615967, 1.56111741065979, 1.7039945125579834, 1.8468714952468872, 1.9897485971450806, 2.1326255798339844, 2.2755026817321777, 2.418379783630371, 2.5612568855285645, 2.704133987426758, 2.847011089324951, 2.9898881912231445, 3.132765293121338, 3.2756423950195312, 3.4185192584991455, 3.561396360397339, 3.7042734622955322, 3.8471505641937256, 3.990027666091919, 4.132904529571533, 4.275781631469727, 4.41865873336792, 4.561535835266113, 4.704412937164307, 4.8472900390625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 7.0, 5.0, 9.0, 8.0, 11.0, 6.0, 7.0, 21.0, 17.0, 16.0, 28.0, 24.0, 33.0, 15.0, 23.0, 38.0, 40.0, 56.0, 49.0, 49.0, 46.0, 41.0, 42.0, 44.0, 38.0, 43.0, 32.0, 35.0, 33.0, 29.0, 22.0, 25.0, 20.0, 15.0, 13.0, 17.0, 9.0, 11.0, 4.0, 4.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.9570462703704834, -2.8646326065063477, -2.772218942642212, -2.6798055171966553, -2.5873918533325195, -2.494978189468384, -2.402564525604248, -2.3101511001586914, -2.2177374362945557, -2.12532377243042, -2.032910108566284, -1.940496563911438, -1.8480830192565918, -1.755669355392456, -1.6632556915283203, -1.5708421468734741, -1.4784284830093384, -1.3860148191452026, -1.2936012744903564, -1.2011876106262207, -1.1087740659713745, -1.0163604021072388, -0.9239467978477478, -0.8315331935882568, -0.7391195893287659, -0.6467059850692749, -0.5542923808097839, -0.4618787467479706, -0.3694651424884796, -0.27705153822898865, -0.1846379041671753, -0.09222429990768433, 0.00018930435180664062, 0.0926029160618782, 0.18501652777194977, 0.27743014693260193, 0.3698437511920929, 0.46225735545158386, 0.5546709895133972, 0.6470845937728882, 0.7394981980323792, 0.8319118022918701, 0.9243254065513611, 1.016739010810852, 1.1091526746749878, 1.201566219329834, 1.2939798831939697, 1.3863935470581055, 1.4788070917129517, 1.5712207555770874, 1.6636343002319336, 1.7560479640960693, 1.8484615087509155, 1.9408751726150513, 2.0332887172698975, 2.125702381134033, 2.218116044998169, 2.3105297088623047, 2.4029433727264404, 2.495356798171997, 2.587770462036133, 2.6801841259002686, 2.7725977897644043, 2.865011215209961, 2.9574248790740967]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 10.0, 8.0, 15.0, 16.0, 32.0, 39.0, 44.0, 100.0, 145.0, 225.0, 414.0, 734.0, 1417.0, 2824.0, 5746.0, 12144.0, 24562.0, 47944.0, 85840.0, 136037.0, 177560.0, 184203.0, 150329.0, 100599.0, 57474.0, 30132.0, 14930.0, 7364.0, 3704.0, 1868.0, 930.0, 464.0, 258.0, 146.0, 86.0, 70.0, 27.0, 42.0, 19.0, 15.0, 14.0, 3.0, 7.0, 8.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.15234375, -4.023193359375, -3.89404296875, -3.764892578125, -3.6357421875, -3.506591796875, -3.37744140625, -3.248291015625, -3.119140625, -2.989990234375, -2.86083984375, -2.731689453125, -2.6025390625, -2.473388671875, -2.34423828125, -2.215087890625, -2.0859375, -1.956787109375, -1.82763671875, -1.698486328125, -1.5693359375, -1.440185546875, -1.31103515625, -1.181884765625, -1.052734375, -0.923583984375, -0.79443359375, -0.665283203125, -0.5361328125, -0.406982421875, -0.27783203125, -0.148681640625, -0.01953125, 0.109619140625, 0.23876953125, 0.367919921875, 0.4970703125, 0.626220703125, 0.75537109375, 0.884521484375, 1.013671875, 1.142822265625, 1.27197265625, 1.401123046875, 1.5302734375, 1.659423828125, 1.78857421875, 1.917724609375, 2.046875, 2.176025390625, 2.30517578125, 2.434326171875, 2.5634765625, 2.692626953125, 2.82177734375, 2.950927734375, 3.080078125, 3.209228515625, 3.33837890625, 3.467529296875, 3.5966796875, 3.725830078125, 3.85498046875, 3.984130859375, 4.11328125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 10.0, 12.0, 11.0, 12.0, 12.0, 17.0, 22.0, 21.0, 25.0, 18.0, 33.0, 44.0, 34.0, 33.0, 44.0, 36.0, 52.0, 44.0, 42.0, 50.0, 36.0, 30.0, 34.0, 36.0, 38.0, 38.0, 24.0, 21.0, 27.0, 19.0, 14.0, 28.0, 24.0, 5.0, 9.0, 9.0, 4.0, 5.0, 1.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-3.291015625, -3.19171142578125, -3.0924072265625, -2.99310302734375, -2.893798828125, -2.79449462890625, -2.6951904296875, -2.59588623046875, -2.49658203125, -2.39727783203125, -2.2979736328125, -2.19866943359375, -2.099365234375, -2.00006103515625, -1.9007568359375, -1.80145263671875, -1.7021484375, -1.60284423828125, -1.5035400390625, -1.40423583984375, -1.304931640625, -1.20562744140625, -1.1063232421875, -1.00701904296875, -0.90771484375, -0.80841064453125, -0.7091064453125, -0.60980224609375, -0.510498046875, -0.41119384765625, -0.3118896484375, -0.21258544921875, -0.11328125, -0.01397705078125, 0.0853271484375, 0.18463134765625, 0.283935546875, 0.38323974609375, 0.4825439453125, 0.58184814453125, 0.68115234375, 0.78045654296875, 0.8797607421875, 0.97906494140625, 1.078369140625, 1.17767333984375, 1.2769775390625, 1.37628173828125, 1.4755859375, 1.57489013671875, 1.6741943359375, 1.77349853515625, 1.872802734375, 1.97210693359375, 2.0714111328125, 2.17071533203125, 2.27001953125, 2.36932373046875, 2.4686279296875, 2.56793212890625, 2.667236328125, 2.76654052734375, 2.8658447265625, 2.96514892578125, 3.064453125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 10.0, 15.0, 24.0, 23.0, 38.0, 66.0, 123.0, 170.0, 293.0, 532.0, 990.0, 1619.0, 2808.0, 5080.0, 8509.0, 14451.0, 23588.0, 37186.0, 55677.0, 79467.0, 103598.0, 122421.0, 130999.0, 123390.0, 104262.0, 80251.0, 57032.0, 37468.0, 23663.0, 14468.0, 8504.0, 4983.0, 2950.0, 1615.0, 916.0, 500.0, 333.0, 206.0, 132.0, 65.0, 50.0, 23.0, 25.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.80078125, -2.708984375, -2.6171875, -2.525390625, -2.43359375, -2.341796875, -2.25, -2.158203125, -2.06640625, -1.974609375, -1.8828125, -1.791015625, -1.69921875, -1.607421875, -1.515625, -1.423828125, -1.33203125, -1.240234375, -1.1484375, -1.056640625, -0.96484375, -0.873046875, -0.78125, -0.689453125, -0.59765625, -0.505859375, -0.4140625, -0.322265625, -0.23046875, -0.138671875, -0.046875, 0.044921875, 0.13671875, 0.228515625, 0.3203125, 0.412109375, 0.50390625, 0.595703125, 0.6875, 0.779296875, 0.87109375, 0.962890625, 1.0546875, 1.146484375, 1.23828125, 1.330078125, 1.421875, 1.513671875, 1.60546875, 1.697265625, 1.7890625, 1.880859375, 1.97265625, 2.064453125, 2.15625, 2.248046875, 2.33984375, 2.431640625, 2.5234375, 2.615234375, 2.70703125, 2.798828125, 2.890625, 2.982421875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 8.0, 6.0, 9.0, 8.0, 13.0, 18.0, 13.0, 23.0, 23.0, 23.0, 24.0, 30.0, 38.0, 17.0, 46.0, 37.0, 33.0, 42.0, 33.0, 37.0, 43.0, 45.0, 32.0, 41.0, 31.0, 34.0, 32.0, 23.0, 26.0, 19.0, 30.0, 33.0, 15.0, 24.0, 16.0, 11.0, 9.0, 13.0, 11.0, 10.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.9267578125, -1.8705291748046875, -1.814300537109375, -1.7580718994140625, -1.70184326171875, -1.6456146240234375, -1.589385986328125, -1.5331573486328125, -1.4769287109375, -1.4207000732421875, -1.364471435546875, -1.3082427978515625, -1.25201416015625, -1.1957855224609375, -1.139556884765625, -1.0833282470703125, -1.027099609375, -0.9708709716796875, -0.914642333984375, -0.8584136962890625, -0.80218505859375, -0.7459564208984375, -0.689727783203125, -0.6334991455078125, -0.5772705078125, -0.5210418701171875, -0.464813232421875, -0.4085845947265625, -0.35235595703125, -0.2961273193359375, -0.239898681640625, -0.1836700439453125, -0.12744140625, -0.0712127685546875, -0.014984130859375, 0.0412445068359375, 0.09747314453125, 0.1537017822265625, 0.209930419921875, 0.2661590576171875, 0.3223876953125, 0.3786163330078125, 0.434844970703125, 0.4910736083984375, 0.54730224609375, 0.6035308837890625, 0.659759521484375, 0.7159881591796875, 0.772216796875, 0.8284454345703125, 0.884674072265625, 0.9409027099609375, 0.99713134765625, 1.0533599853515625, 1.109588623046875, 1.1658172607421875, 1.2220458984375, 1.2782745361328125, 1.334503173828125, 1.3907318115234375, 1.44696044921875, 1.5031890869140625, 1.559417724609375, 1.6156463623046875, 1.671875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 8.0, 8.0, 11.0, 15.0, 19.0, 37.0, 55.0, 74.0, 92.0, 160.0, 204.0, 309.0, 421.0, 670.0, 933.0, 1515.0, 2273.0, 4034.0, 7944.0, 22940.0, 102758.0, 376157.0, 380093.0, 105667.0, 23298.0, 7906.0, 3976.0, 2368.0, 1457.0, 976.0, 733.0, 430.0, 306.0, 195.0, 145.0, 107.0, 64.0, 61.0, 39.0, 24.0, 17.0, 12.0, 9.0, 6.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.56640625, -5.39776611328125, -5.2291259765625, -5.06048583984375, -4.891845703125, -4.72320556640625, -4.5545654296875, -4.38592529296875, -4.21728515625, -4.04864501953125, -3.8800048828125, -3.71136474609375, -3.542724609375, -3.37408447265625, -3.2054443359375, -3.03680419921875, -2.8681640625, -2.69952392578125, -2.5308837890625, -2.36224365234375, -2.193603515625, -2.02496337890625, -1.8563232421875, -1.68768310546875, -1.51904296875, -1.35040283203125, -1.1817626953125, -1.01312255859375, -0.844482421875, -0.67584228515625, -0.5072021484375, -0.33856201171875, -0.169921875, -0.00128173828125, 0.1673583984375, 0.33599853515625, 0.504638671875, 0.67327880859375, 0.8419189453125, 1.01055908203125, 1.17919921875, 1.34783935546875, 1.5164794921875, 1.68511962890625, 1.853759765625, 2.02239990234375, 2.1910400390625, 2.35968017578125, 2.5283203125, 2.69696044921875, 2.8656005859375, 3.03424072265625, 3.202880859375, 3.37152099609375, 3.5401611328125, 3.70880126953125, 3.87744140625, 4.04608154296875, 4.2147216796875, 4.38336181640625, 4.552001953125, 4.72064208984375, 4.8892822265625, 5.05792236328125, 5.2265625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 3.0, 4.0, 7.0, 6.0, 16.0, 27.0, 71.0, 112.0, 131.0, 172.0, 158.0, 121.0, 79.0, 34.0, 17.0, 16.0, 7.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004525184631347656, -0.00043723732233047485, -0.0004219561815261841, -0.0004066750407218933, -0.00039139389991760254, -0.00037611275911331177, -0.000360831618309021, -0.0003455504775047302, -0.00033026933670043945, -0.0003149881958961487, -0.0002997070550918579, -0.00028442591428756714, -0.00026914477348327637, -0.0002538636326789856, -0.00023858249187469482, -0.00022330135107040405, -0.00020802021026611328, -0.0001927390694618225, -0.00017745792865753174, -0.00016217678785324097, -0.0001468956470489502, -0.00013161450624465942, -0.00011633336544036865, -0.00010105222463607788, -8.577108383178711e-05, -7.048994302749634e-05, -5.5208802223205566e-05, -3.9927661418914795e-05, -2.4646520614624023e-05, -9.365379810333252e-06, 5.9157609939575195e-06, 2.119690179824829e-05, 3.647804260253906e-05, 5.1759183406829834e-05, 6.70403242111206e-05, 8.232146501541138e-05, 9.760260581970215e-05, 0.00011288374662399292, 0.0001281648874282837, 0.00014344602823257446, 0.00015872716903686523, 0.000174008309841156, 0.00018928945064544678, 0.00020457059144973755, 0.00021985173225402832, 0.0002351328730583191, 0.00025041401386260986, 0.00026569515466690063, 0.0002809762954711914, 0.0002962574362754822, 0.00031153857707977295, 0.0003268197178840637, 0.0003421008586883545, 0.00035738199949264526, 0.00037266314029693604, 0.0003879442811012268, 0.0004032254219055176, 0.00041850656270980835, 0.0004337877035140991, 0.0004490688443183899, 0.00046434998512268066, 0.00047963112592697144, 0.0004949122667312622, 0.000510193407535553, 0.0005254745483398438]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 9.0, 16.0, 12.0, 18.0, 33.0, 47.0, 43.0, 75.0, 102.0, 132.0, 171.0, 227.0, 302.0, 457.0, 617.0, 918.0, 1364.0, 2358.0, 4660.0, 11594.0, 37540.0, 131100.0, 327285.0, 331323.0, 134993.0, 39105.0, 12257.0, 4752.0, 2367.0, 1456.0, 921.0, 591.0, 434.0, 335.0, 223.0, 156.0, 142.0, 91.0, 80.0, 46.0, 35.0, 41.0, 42.0, 18.0, 13.0, 10.0, 10.0, 5.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.1640625, -4.03399658203125, -3.9039306640625, -3.77386474609375, -3.643798828125, -3.51373291015625, -3.3836669921875, -3.25360107421875, -3.12353515625, -2.99346923828125, -2.8634033203125, -2.73333740234375, -2.603271484375, -2.47320556640625, -2.3431396484375, -2.21307373046875, -2.0830078125, -1.95294189453125, -1.8228759765625, -1.69281005859375, -1.562744140625, -1.43267822265625, -1.3026123046875, -1.17254638671875, -1.04248046875, -0.91241455078125, -0.7823486328125, -0.65228271484375, -0.522216796875, -0.39215087890625, -0.2620849609375, -0.13201904296875, -0.001953125, 0.12811279296875, 0.2581787109375, 0.38824462890625, 0.518310546875, 0.64837646484375, 0.7784423828125, 0.90850830078125, 1.03857421875, 1.16864013671875, 1.2987060546875, 1.42877197265625, 1.558837890625, 1.68890380859375, 1.8189697265625, 1.94903564453125, 2.0791015625, 2.20916748046875, 2.3392333984375, 2.46929931640625, 2.599365234375, 2.72943115234375, 2.8594970703125, 2.98956298828125, 3.11962890625, 3.24969482421875, 3.3797607421875, 3.50982666015625, 3.639892578125, 3.76995849609375, 3.9000244140625, 4.03009033203125, 4.16015625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 11.0, 21.0, 19.0, 19.0, 33.0, 37.0, 63.0, 45.0, 72.0, 70.0, 80.0, 83.0, 64.0, 81.0, 49.0, 37.0, 55.0, 28.0, 29.0, 16.0, 16.0, 10.0, 12.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.56298828125, -0.54302978515625, -0.5230712890625, -0.50311279296875, -0.483154296875, -0.46319580078125, -0.4432373046875, -0.42327880859375, -0.4033203125, -0.38336181640625, -0.3634033203125, -0.34344482421875, -0.323486328125, -0.30352783203125, -0.2835693359375, -0.26361083984375, -0.24365234375, -0.22369384765625, -0.2037353515625, -0.18377685546875, -0.163818359375, -0.14385986328125, -0.1239013671875, -0.10394287109375, -0.083984375, -0.06402587890625, -0.0440673828125, -0.02410888671875, -0.004150390625, 0.01580810546875, 0.0357666015625, 0.05572509765625, 0.07568359375, 0.09564208984375, 0.1156005859375, 0.13555908203125, 0.155517578125, 0.17547607421875, 0.1954345703125, 0.21539306640625, 0.2353515625, 0.25531005859375, 0.2752685546875, 0.29522705078125, 0.315185546875, 0.33514404296875, 0.3551025390625, 0.37506103515625, 0.39501953125, 0.41497802734375, 0.4349365234375, 0.45489501953125, 0.474853515625, 0.49481201171875, 0.5147705078125, 0.53472900390625, 0.5546875, 0.57464599609375, 0.5946044921875, 0.61456298828125, 0.634521484375, 0.65447998046875, 0.6744384765625, 0.69439697265625, 0.71435546875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 11.0, 6.0, 8.0, 12.0, 14.0, 13.0, 18.0, 17.0, 21.0, 19.0, 24.0, 45.0, 36.0, 62.0, 41.0, 50.0, 57.0, 37.0, 42.0, 52.0, 39.0, 56.0, 50.0, 46.0, 33.0, 45.0, 23.0, 20.0, 16.0, 18.0, 7.0, 12.0, 9.0, 9.0, 5.0, 7.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8454155921936035, -3.7189691066741943, -3.5925228595733643, -3.466076374053955, -3.339630126953125, -3.213183641433716, -3.0867371559143066, -2.9602909088134766, -2.8338444232940674, -2.707397937774658, -2.580951690673828, -2.454505205154419, -2.3280587196350098, -2.2016124725341797, -2.0751659870147705, -1.9487196207046509, -1.8222732543945312, -1.6958268880844116, -1.569380521774292, -1.4429340362548828, -1.3164876699447632, -1.1900413036346436, -1.0635948181152344, -0.9371484518051147, -0.8107020854949951, -0.6842557191848755, -0.5578092932701111, -0.43136289715766907, -0.30491650104522705, -0.17847013473510742, -0.05202370882034302, 0.07442271709442139, 0.20086908340454102, 0.32731547951698303, 0.45376187562942505, 0.5802083015441895, 0.7066546678543091, 0.8331010341644287, 0.9595474600791931, 1.0859938859939575, 1.2124402523040771, 1.3388866186141968, 1.4653329849243164, 1.5917794704437256, 1.7182258367538452, 1.8446722030639648, 1.971118688583374, 2.097565174102783, 2.2240114212036133, 2.3504579067230225, 2.4769041538238525, 2.6033506393432617, 2.729796886444092, 2.856243371963501, 2.98268985748291, 3.1091361045837402, 3.2355825901031494, 3.3620290756225586, 3.4884753227233887, 3.614921808242798, 3.741368293762207, 3.867814540863037, 3.9942610263824463, 4.1207075119018555, 4.2471537590026855]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 11.0, 6.0, 12.0, 19.0, 15.0, 20.0, 24.0, 31.0, 28.0, 23.0, 32.0, 36.0, 43.0, 54.0, 57.0, 46.0, 46.0, 45.0, 64.0, 39.0, 43.0, 40.0, 38.0, 22.0, 35.0, 28.0, 24.0, 20.0, 11.0, 17.0, 12.0, 9.0, 6.0, 8.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2916483879089355, -3.1906661987304688, -3.089684247970581, -2.9887020587921143, -2.8877198696136475, -2.7867379188537598, -2.685755729675293, -2.584773540496826, -2.4837913513183594, -2.3828091621398926, -2.281827211380005, -2.180845022201538, -2.0798628330230713, -1.978880763053894, -1.8778986930847168, -1.77691650390625, -1.6759345531463623, -1.574952483177185, -1.4739702939987183, -1.372988224029541, -1.2720060348510742, -1.171023964881897, -1.0700418949127197, -0.9690597653388977, -0.8680776357650757, -0.7670955061912537, -0.6661133766174316, -0.5651313066482544, -0.4641491770744324, -0.36316704750061035, -0.2621849775314331, -0.16120284795761108, -0.06022047996520996, 0.04076163470745087, 0.1417437493801117, 0.24272584915161133, 0.34370797872543335, 0.44469010829925537, 0.5456721782684326, 0.6466543078422546, 0.7476364374160767, 0.8486185669898987, 0.9496006965637207, 1.050582766532898, 1.1515648365020752, 1.252547025680542, 1.3535290956497192, 1.4545111656188965, 1.5554933547973633, 1.6564754247665405, 1.7574576139450073, 1.8584396839141846, 1.9594218730926514, 2.060403823852539, 2.161386013031006, 2.2623682022094727, 2.3633503913879395, 2.4643325805664062, 2.565314531326294, 2.6662967205047607, 2.7672789096832275, 2.8682608604431152, 2.969243049621582, 3.070225238800049, 3.1712071895599365]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 19.0, 13.0, 36.0, 31.0, 62.0, 107.0, 183.0, 283.0, 440.0, 683.0, 1182.0, 2040.0, 3413.0, 5704.0, 9587.0, 15854.0, 26763.0, 44545.0, 74366.0, 121954.0, 197219.0, 301775.0, 429485.0, 548062.0, 597511.0, 550348.0, 434219.0, 305813.0, 200657.0, 125436.0, 77562.0, 47008.0, 28580.0, 17248.0, 10254.0, 6346.0, 3780.0, 2249.0, 1361.0, 788.0, 520.0, 310.0, 182.0, 121.0, 75.0, 38.0, 22.0, 15.0, 14.0, 10.0, 5.0, 5.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.423828125, -3.31854248046875, -3.2132568359375, -3.10797119140625, -3.002685546875, -2.89739990234375, -2.7921142578125, -2.68682861328125, -2.58154296875, -2.47625732421875, -2.3709716796875, -2.26568603515625, -2.160400390625, -2.05511474609375, -1.9498291015625, -1.84454345703125, -1.7392578125, -1.63397216796875, -1.5286865234375, -1.42340087890625, -1.318115234375, -1.21282958984375, -1.1075439453125, -1.00225830078125, -0.89697265625, -0.79168701171875, -0.6864013671875, -0.58111572265625, -0.475830078125, -0.37054443359375, -0.2652587890625, -0.15997314453125, -0.0546875, 0.05059814453125, 0.1558837890625, 0.26116943359375, 0.366455078125, 0.47174072265625, 0.5770263671875, 0.68231201171875, 0.78759765625, 0.89288330078125, 0.9981689453125, 1.10345458984375, 1.208740234375, 1.31402587890625, 1.4193115234375, 1.52459716796875, 1.6298828125, 1.73516845703125, 1.8404541015625, 1.94573974609375, 2.051025390625, 2.15631103515625, 2.2615966796875, 2.36688232421875, 2.47216796875, 2.57745361328125, 2.6827392578125, 2.78802490234375, 2.893310546875, 2.99859619140625, 3.1038818359375, 3.20916748046875, 3.314453125]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 5.0, 10.0, 6.0, 6.0, 8.0, 6.0, 14.0, 12.0, 19.0, 16.0, 20.0, 29.0, 30.0, 26.0, 36.0, 31.0, 35.0, 44.0, 53.0, 38.0, 45.0, 43.0, 33.0, 54.0, 45.0, 29.0, 42.0, 34.0, 27.0, 26.0, 28.0, 17.0, 26.0, 13.0, 17.0, 12.0, 13.0, 9.0, 9.0, 7.0, 5.0, 4.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.28125, -2.2098388671875, -2.138427734375, -2.0670166015625, -1.99560546875, -1.9241943359375, -1.852783203125, -1.7813720703125, -1.7099609375, -1.6385498046875, -1.567138671875, -1.4957275390625, -1.42431640625, -1.3529052734375, -1.281494140625, -1.2100830078125, -1.138671875, -1.0672607421875, -0.995849609375, -0.9244384765625, -0.85302734375, -0.7816162109375, -0.710205078125, -0.6387939453125, -0.5673828125, -0.4959716796875, -0.424560546875, -0.3531494140625, -0.28173828125, -0.2103271484375, -0.138916015625, -0.0675048828125, 0.00390625, 0.0753173828125, 0.146728515625, 0.2181396484375, 0.28955078125, 0.3609619140625, 0.432373046875, 0.5037841796875, 0.5751953125, 0.6466064453125, 0.718017578125, 0.7894287109375, 0.86083984375, 0.9322509765625, 1.003662109375, 1.0750732421875, 1.146484375, 1.2178955078125, 1.289306640625, 1.3607177734375, 1.43212890625, 1.5035400390625, 1.574951171875, 1.6463623046875, 1.7177734375, 1.7891845703125, 1.860595703125, 1.9320068359375, 2.00341796875, 2.0748291015625, 2.146240234375, 2.2176513671875, 2.2890625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 8.0, 6.0, 13.0, 19.0, 31.0, 63.0, 108.0, 134.0, 276.0, 428.0, 698.0, 1121.0, 1786.0, 3013.0, 4918.0, 7938.0, 13110.0, 21803.0, 35888.0, 57604.0, 93371.0, 144190.0, 217192.0, 312096.0, 415964.0, 500261.0, 533648.0, 498947.0, 414077.0, 312067.0, 217753.0, 145025.0, 92590.0, 57363.0, 35863.0, 21577.0, 13085.0, 7823.0, 4862.0, 2882.0, 1828.0, 1115.0, 658.0, 414.0, 257.0, 147.0, 100.0, 57.0, 38.0, 30.0, 15.0, 11.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.208984375, -3.103759765625, -2.99853515625, -2.893310546875, -2.7880859375, -2.682861328125, -2.57763671875, -2.472412109375, -2.3671875, -2.261962890625, -2.15673828125, -2.051513671875, -1.9462890625, -1.841064453125, -1.73583984375, -1.630615234375, -1.525390625, -1.420166015625, -1.31494140625, -1.209716796875, -1.1044921875, -0.999267578125, -0.89404296875, -0.788818359375, -0.68359375, -0.578369140625, -0.47314453125, -0.367919921875, -0.2626953125, -0.157470703125, -0.05224609375, 0.052978515625, 0.158203125, 0.263427734375, 0.36865234375, 0.473876953125, 0.5791015625, 0.684326171875, 0.78955078125, 0.894775390625, 1.0, 1.105224609375, 1.21044921875, 1.315673828125, 1.4208984375, 1.526123046875, 1.63134765625, 1.736572265625, 1.841796875, 1.947021484375, 2.05224609375, 2.157470703125, 2.2626953125, 2.367919921875, 2.47314453125, 2.578369140625, 2.68359375, 2.788818359375, 2.89404296875, 2.999267578125, 3.1044921875, 3.209716796875, 3.31494140625, 3.420166015625, 3.525390625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 7.0, 8.0, 16.0, 32.0, 33.0, 48.0, 51.0, 76.0, 95.0, 107.0, 131.0, 162.0, 190.0, 229.0, 246.0, 244.0, 225.0, 267.0, 279.0, 256.0, 225.0, 219.0, 175.0, 167.0, 125.0, 121.0, 87.0, 59.0, 59.0, 36.0, 30.0, 21.0, 17.0, 11.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4619140625, -1.412109375, -1.3623046875, -1.3125, -1.2626953125, -1.212890625, -1.1630859375, -1.11328125, -1.0634765625, -1.013671875, -0.9638671875, -0.9140625, -0.8642578125, -0.814453125, -0.7646484375, -0.71484375, -0.6650390625, -0.615234375, -0.5654296875, -0.515625, -0.4658203125, -0.416015625, -0.3662109375, -0.31640625, -0.2666015625, -0.216796875, -0.1669921875, -0.1171875, -0.0673828125, -0.017578125, 0.0322265625, 0.08203125, 0.1318359375, 0.181640625, 0.2314453125, 0.28125, 0.3310546875, 0.380859375, 0.4306640625, 0.48046875, 0.5302734375, 0.580078125, 0.6298828125, 0.6796875, 0.7294921875, 0.779296875, 0.8291015625, 0.87890625, 0.9287109375, 0.978515625, 1.0283203125, 1.078125, 1.1279296875, 1.177734375, 1.2275390625, 1.27734375, 1.3271484375, 1.376953125, 1.4267578125, 1.4765625, 1.5263671875, 1.576171875, 1.6259765625, 1.67578125, 1.7255859375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 6.0, 3.0, 13.0, 17.0, 13.0, 18.0, 26.0, 28.0, 36.0, 44.0, 56.0, 52.0, 64.0, 69.0, 70.0, 70.0, 56.0, 47.0, 62.0, 43.0, 40.0, 35.0, 25.0, 18.0, 22.0, 16.0, 15.0, 6.0, 12.0, 6.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.872900009155273, -5.699295520782471, -5.525691032409668, -5.352086544036865, -5.1784820556640625, -5.00487756729126, -4.831273078918457, -4.657668590545654, -4.484064102172852, -4.310459613800049, -4.136855125427246, -3.9632506370544434, -3.7896461486816406, -3.616041660308838, -3.442437171936035, -3.2688326835632324, -3.0952281951904297, -2.921623706817627, -2.748019218444824, -2.5744147300720215, -2.4008102416992188, -2.227205753326416, -2.0536012649536133, -1.8799967765808105, -1.7063922882080078, -1.532787799835205, -1.3591833114624023, -1.1855788230895996, -1.0119743347167969, -0.8383698463439941, -0.6647653579711914, -0.49116086959838867, -0.31755685806274414, -0.1439523696899414, 0.029652118682861328, 0.20325660705566406, 0.3768610954284668, 0.5504655838012695, 0.7240700721740723, 0.897674560546875, 1.0712790489196777, 1.2448835372924805, 1.4184880256652832, 1.592092514038086, 1.7656970024108887, 1.9393014907836914, 2.112905979156494, 2.286510467529297, 2.4601149559020996, 2.6337194442749023, 2.807323932647705, 2.980928421020508, 3.1545329093933105, 3.3281373977661133, 3.501741886138916, 3.6753463745117188, 3.8489508628845215, 4.022555351257324, 4.196159839630127, 4.36976432800293, 4.543368816375732, 4.716973304748535, 4.890577793121338, 5.064182281494141, 5.237786769866943]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 4.0, 6.0, 7.0, 9.0, 9.0, 18.0, 10.0, 11.0, 22.0, 17.0, 42.0, 32.0, 37.0, 44.0, 46.0, 42.0, 43.0, 50.0, 40.0, 45.0, 55.0, 38.0, 47.0, 30.0, 42.0, 42.0, 37.0, 26.0, 30.0, 16.0, 21.0, 14.0, 13.0, 11.0, 8.0, 10.0, 9.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.1771504878997803, -3.077770471572876, -2.9783902168273926, -2.8790102005004883, -2.779629945755005, -2.6802499294281006, -2.580869674682617, -2.481489658355713, -2.3821096420288086, -2.2827296257019043, -2.183349370956421, -2.0839693546295166, -1.9845890998840332, -1.885209083557129, -1.785828948020935, -1.6864488124847412, -1.5870685577392578, -1.487688422203064, -1.3883082866668701, -1.2889282703399658, -1.1895480155944824, -1.0901679992675781, -0.9907878637313843, -0.8914077281951904, -0.7920275926589966, -0.6926474571228027, -0.5932673215866089, -0.4938872456550598, -0.39450711011886597, -0.2951269745826721, -0.19574689865112305, -0.0963667631149292, 0.003013134002685547, 0.1023932546377182, 0.20177337527275085, 0.3011534810066223, 0.40053361654281616, 0.49991375207901, 0.5992938280105591, 0.6986739635467529, 0.7980540990829468, 0.8974342346191406, 0.9968143701553345, 1.0961945056915283, 1.1955745220184326, 1.294954776763916, 1.3943347930908203, 1.4937149286270142, 1.593095064163208, 1.6924751996994019, 1.7918553352355957, 1.8912353515625, 1.9906156063079834, 2.0899956226348877, 2.189375877380371, 2.2887558937072754, 2.3881359100341797, 2.487515926361084, 2.5868961811065674, 2.6862761974334717, 2.785656452178955, 2.8850364685058594, 2.9844164848327637, 3.083796739578247, 3.1831769943237305]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 17.0, 17.0, 24.0, 27.0, 28.0, 50.0, 89.0, 139.0, 175.0, 320.0, 562.0, 870.0, 1446.0, 2525.0, 4301.0, 7769.0, 14146.0, 26378.0, 50343.0, 99360.0, 185241.0, 253280.0, 188546.0, 100929.0, 52298.0, 26690.0, 14214.0, 7864.0, 4444.0, 2526.0, 1579.0, 880.0, 539.0, 315.0, 199.0, 154.0, 92.0, 59.0, 38.0, 27.0, 22.0, 13.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0478515625, -1.0146026611328125, -0.981353759765625, -0.9481048583984375, -0.91485595703125, -0.8816070556640625, -0.848358154296875, -0.8151092529296875, -0.7818603515625, -0.7486114501953125, -0.715362548828125, -0.6821136474609375, -0.64886474609375, -0.6156158447265625, -0.582366943359375, -0.5491180419921875, -0.515869140625, -0.4826202392578125, -0.449371337890625, -0.4161224365234375, -0.38287353515625, -0.3496246337890625, -0.316375732421875, -0.2831268310546875, -0.2498779296875, -0.2166290283203125, -0.183380126953125, -0.1501312255859375, -0.11688232421875, -0.0836334228515625, -0.050384521484375, -0.0171356201171875, 0.01611328125, 0.0493621826171875, 0.082611083984375, 0.1158599853515625, 0.14910888671875, 0.1823577880859375, 0.215606689453125, 0.2488555908203125, 0.2821044921875, 0.3153533935546875, 0.348602294921875, 0.3818511962890625, 0.41510009765625, 0.4483489990234375, 0.481597900390625, 0.5148468017578125, 0.548095703125, 0.5813446044921875, 0.614593505859375, 0.6478424072265625, 0.68109130859375, 0.7143402099609375, 0.747589111328125, 0.7808380126953125, 0.8140869140625, 0.8473358154296875, 0.880584716796875, 0.9138336181640625, 0.94708251953125, 0.9803314208984375, 1.013580322265625, 1.0468292236328125, 1.080078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 7.0, 3.0, 7.0, 10.0, 10.0, 19.0, 20.0, 31.0, 29.0, 38.0, 29.0, 51.0, 43.0, 51.0, 53.0, 49.0, 45.0, 57.0, 46.0, 51.0, 58.0, 49.0, 30.0, 37.0, 30.0, 27.0, 25.0, 14.0, 21.0, 19.0, 13.0, 13.0, 6.0, 3.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.821533203125, -3.69384765625, -3.566162109375, -3.4384765625, -3.310791015625, -3.18310546875, -3.055419921875, -2.927734375, -2.800048828125, -2.67236328125, -2.544677734375, -2.4169921875, -2.289306640625, -2.16162109375, -2.033935546875, -1.90625, -1.778564453125, -1.65087890625, -1.523193359375, -1.3955078125, -1.267822265625, -1.14013671875, -1.012451171875, -0.884765625, -0.757080078125, -0.62939453125, -0.501708984375, -0.3740234375, -0.246337890625, -0.11865234375, 0.009033203125, 0.13671875, 0.264404296875, 0.39208984375, 0.519775390625, 0.6474609375, 0.775146484375, 0.90283203125, 1.030517578125, 1.158203125, 1.285888671875, 1.41357421875, 1.541259765625, 1.6689453125, 1.796630859375, 1.92431640625, 2.052001953125, 2.1796875, 2.307373046875, 2.43505859375, 2.562744140625, 2.6904296875, 2.818115234375, 2.94580078125, 3.073486328125, 3.201171875, 3.328857421875, 3.45654296875, 3.584228515625, 3.7119140625, 3.839599609375, 3.96728515625, 4.094970703125, 4.22265625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 7.0, 18.0, 26.0, 44.0, 63.0, 78.0, 131.0, 231.0, 357.0, 532.0, 925.0, 1624.0, 2933.0, 5552.0, 11175.0, 22774.0, 48199.0, 106543.0, 231689.0, 302963.0, 168476.0, 74929.0, 34806.0, 16557.0, 8148.0, 4291.0, 2221.0, 1274.0, 746.0, 447.0, 299.0, 173.0, 113.0, 69.0, 42.0, 32.0, 24.0, 19.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.181640625, -1.139862060546875, -1.09808349609375, -1.056304931640625, -1.0145263671875, -0.972747802734375, -0.93096923828125, -0.889190673828125, -0.847412109375, -0.805633544921875, -0.76385498046875, -0.722076416015625, -0.6802978515625, -0.638519287109375, -0.59674072265625, -0.554962158203125, -0.51318359375, -0.471405029296875, -0.42962646484375, -0.387847900390625, -0.3460693359375, -0.304290771484375, -0.26251220703125, -0.220733642578125, -0.178955078125, -0.137176513671875, -0.09539794921875, -0.053619384765625, -0.0118408203125, 0.029937744140625, 0.07171630859375, 0.113494873046875, 0.1552734375, 0.197052001953125, 0.23883056640625, 0.280609130859375, 0.3223876953125, 0.364166259765625, 0.40594482421875, 0.447723388671875, 0.489501953125, 0.531280517578125, 0.57305908203125, 0.614837646484375, 0.6566162109375, 0.698394775390625, 0.74017333984375, 0.781951904296875, 0.82373046875, 0.865509033203125, 0.90728759765625, 0.949066162109375, 0.9908447265625, 1.032623291015625, 1.07440185546875, 1.116180419921875, 1.157958984375, 1.199737548828125, 1.24151611328125, 1.283294677734375, 1.3250732421875, 1.366851806640625, 1.40863037109375, 1.450408935546875, 1.4921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 11.0, 9.0, 9.0, 20.0, 13.0, 20.0, 19.0, 25.0, 24.0, 24.0, 32.0, 31.0, 41.0, 42.0, 43.0, 45.0, 53.0, 42.0, 47.0, 39.0, 41.0, 42.0, 41.0, 30.0, 33.0, 32.0, 26.0, 17.0, 31.0, 16.0, 17.0, 21.0, 16.0, 10.0, 13.0, 6.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.017578125, -1.951141357421875, -1.88470458984375, -1.818267822265625, -1.7518310546875, -1.685394287109375, -1.61895751953125, -1.552520751953125, -1.486083984375, -1.419647216796875, -1.35321044921875, -1.286773681640625, -1.2203369140625, -1.153900146484375, -1.08746337890625, -1.021026611328125, -0.95458984375, -0.888153076171875, -0.82171630859375, -0.755279541015625, -0.6888427734375, -0.622406005859375, -0.55596923828125, -0.489532470703125, -0.423095703125, -0.356658935546875, -0.29022216796875, -0.223785400390625, -0.1573486328125, -0.090911865234375, -0.02447509765625, 0.041961669921875, 0.1083984375, 0.174835205078125, 0.24127197265625, 0.307708740234375, 0.3741455078125, 0.440582275390625, 0.50701904296875, 0.573455810546875, 0.639892578125, 0.706329345703125, 0.77276611328125, 0.839202880859375, 0.9056396484375, 0.972076416015625, 1.03851318359375, 1.104949951171875, 1.17138671875, 1.237823486328125, 1.30426025390625, 1.370697021484375, 1.4371337890625, 1.503570556640625, 1.57000732421875, 1.636444091796875, 1.702880859375, 1.769317626953125, 1.83575439453125, 1.902191162109375, 1.9686279296875, 2.035064697265625, 2.10150146484375, 2.167938232421875, 2.234375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 12.0, 16.0, 15.0, 32.0, 31.0, 40.0, 71.0, 102.0, 167.0, 258.0, 329.0, 533.0, 849.0, 1521.0, 3647.0, 14729.0, 338748.0, 656650.0, 22036.0, 4382.0, 1751.0, 907.0, 547.0, 387.0, 264.0, 158.0, 93.0, 83.0, 62.0, 51.0, 22.0, 17.0, 12.0, 4.0, 4.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.16082763671875, -1.1195068359375, -1.07818603515625, -1.036865234375, -0.99554443359375, -0.9542236328125, -0.91290283203125, -0.87158203125, -0.83026123046875, -0.7889404296875, -0.74761962890625, -0.706298828125, -0.66497802734375, -0.6236572265625, -0.58233642578125, -0.541015625, -0.49969482421875, -0.4583740234375, -0.41705322265625, -0.375732421875, -0.33441162109375, -0.2930908203125, -0.25177001953125, -0.21044921875, -0.16912841796875, -0.1278076171875, -0.08648681640625, -0.045166015625, -0.00384521484375, 0.0374755859375, 0.07879638671875, 0.1201171875, 0.16143798828125, 0.2027587890625, 0.24407958984375, 0.285400390625, 0.32672119140625, 0.3680419921875, 0.40936279296875, 0.45068359375, 0.49200439453125, 0.5333251953125, 0.57464599609375, 0.615966796875, 0.65728759765625, 0.6986083984375, 0.73992919921875, 0.78125, 0.82257080078125, 0.8638916015625, 0.90521240234375, 0.946533203125, 0.98785400390625, 1.0291748046875, 1.07049560546875, 1.11181640625, 1.15313720703125, 1.1944580078125, 1.23577880859375, 1.277099609375, 1.31842041015625, 1.3597412109375, 1.40106201171875, 1.4423828125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 9.0, 5.0, 18.0, 47.0, 102.0, 146.0, 177.0, 199.0, 125.0, 82.0, 33.0, 19.0, 6.0, 7.0, 3.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22868537902832e-05, -6.032641977071762e-05, -5.836598575115204e-05, -5.6405551731586456e-05, -5.4445117712020874e-05, -5.248468369245529e-05, -5.052424967288971e-05, -4.856381565332413e-05, -4.6603381633758545e-05, -4.464294761419296e-05, -4.268251359462738e-05, -4.07220795750618e-05, -3.8761645555496216e-05, -3.6801211535930634e-05, -3.484077751636505e-05, -3.288034349679947e-05, -3.091990947723389e-05, -2.8959475457668304e-05, -2.6999041438102722e-05, -2.503860741853714e-05, -2.3078173398971558e-05, -2.1117739379405975e-05, -1.9157305359840393e-05, -1.719687134027481e-05, -1.5236437320709229e-05, -1.3276003301143646e-05, -1.1315569281578064e-05, -9.355135262012482e-06, -7.394701242446899e-06, -5.434267222881317e-06, -3.473833203315735e-06, -1.5133991837501526e-06, 4.470348358154297e-07, 2.407468855381012e-06, 4.367902874946594e-06, 6.3283368945121765e-06, 8.288770914077759e-06, 1.0249204933643341e-05, 1.2209638953208923e-05, 1.4170072972774506e-05, 1.6130506992340088e-05, 1.809094101190567e-05, 2.0051375031471252e-05, 2.2011809051036835e-05, 2.3972243070602417e-05, 2.5932677090168e-05, 2.789311110973358e-05, 2.9853545129299164e-05, 3.1813979148864746e-05, 3.377441316843033e-05, 3.573484718799591e-05, 3.769528120756149e-05, 3.9655715227127075e-05, 4.161614924669266e-05, 4.357658326625824e-05, 4.553701728582382e-05, 4.7497451305389404e-05, 4.9457885324954987e-05, 5.141831934452057e-05, 5.337875336408615e-05, 5.5339187383651733e-05, 5.7299621403217316e-05, 5.92600554227829e-05, 6.122048944234848e-05, 6.318092346191406e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 14.0, 20.0, 18.0, 19.0, 35.0, 45.0, 59.0, 108.0, 111.0, 169.0, 216.0, 279.0, 399.0, 499.0, 654.0, 870.0, 1177.0, 1676.0, 2637.0, 5276.0, 14765.0, 62911.0, 399818.0, 452940.0, 72632.0, 16119.0, 5785.0, 2818.0, 1683.0, 1189.0, 850.0, 707.0, 538.0, 384.0, 318.0, 203.0, 170.0, 121.0, 93.0, 67.0, 42.0, 30.0, 27.0, 20.0, 12.0, 9.0, 7.0, 7.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7431640625, -0.7192230224609375, -0.695281982421875, -0.6713409423828125, -0.64739990234375, -0.6234588623046875, -0.599517822265625, -0.5755767822265625, -0.5516357421875, -0.5276947021484375, -0.503753662109375, -0.4798126220703125, -0.45587158203125, -0.4319305419921875, -0.407989501953125, -0.3840484619140625, -0.360107421875, -0.3361663818359375, -0.312225341796875, -0.2882843017578125, -0.26434326171875, -0.2404022216796875, -0.216461181640625, -0.1925201416015625, -0.1685791015625, -0.1446380615234375, -0.120697021484375, -0.0967559814453125, -0.07281494140625, -0.0488739013671875, -0.024932861328125, -0.0009918212890625, 0.02294921875, 0.0468902587890625, 0.070831298828125, 0.0947723388671875, 0.11871337890625, 0.1426544189453125, 0.166595458984375, 0.1905364990234375, 0.2144775390625, 0.2384185791015625, 0.262359619140625, 0.2863006591796875, 0.31024169921875, 0.3341827392578125, 0.358123779296875, 0.3820648193359375, 0.406005859375, 0.4299468994140625, 0.453887939453125, 0.4778289794921875, 0.50177001953125, 0.5257110595703125, 0.549652099609375, 0.5735931396484375, 0.5975341796875, 0.6214752197265625, 0.645416259765625, 0.6693572998046875, 0.69329833984375, 0.7172393798828125, 0.741180419921875, 0.7651214599609375, 0.7890625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 12.0, 11.0, 9.0, 21.0, 41.0, 45.0, 55.0, 94.0, 81.0, 107.0, 106.0, 110.0, 71.0, 52.0, 53.0, 31.0, 30.0, 14.0, 18.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10638427734375, -0.10317611694335938, -0.09996795654296875, -0.09675979614257812, -0.0935516357421875, -0.09034347534179688, -0.08713531494140625, -0.08392715454101562, -0.080718994140625, -0.07751083374023438, -0.07430267333984375, -0.07109451293945312, -0.0678863525390625, -0.06467819213867188, -0.06147003173828125, -0.058261871337890625, -0.0550537109375, -0.051845550537109375, -0.04863739013671875, -0.045429229736328125, -0.0422210693359375, -0.039012908935546875, -0.03580474853515625, -0.032596588134765625, -0.029388427734375, -0.026180267333984375, -0.02297210693359375, -0.019763946533203125, -0.0165557861328125, -0.013347625732421875, -0.01013946533203125, -0.006931304931640625, -0.00372314453125, -0.000514984130859375, 0.00269317626953125, 0.005901336669921875, 0.0091094970703125, 0.012317657470703125, 0.01552581787109375, 0.018733978271484375, 0.021942138671875, 0.025150299072265625, 0.02835845947265625, 0.031566619873046875, 0.0347747802734375, 0.037982940673828125, 0.04119110107421875, 0.044399261474609375, 0.047607421875, 0.050815582275390625, 0.05402374267578125, 0.057231903076171875, 0.0604400634765625, 0.06364822387695312, 0.06685638427734375, 0.07006454467773438, 0.073272705078125, 0.07648086547851562, 0.07968902587890625, 0.08289718627929688, 0.0861053466796875, 0.08931350708007812, 0.09252166748046875, 0.09572982788085938, 0.09893798828125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 4.0, 10.0, 14.0, 11.0, 20.0, 22.0, 27.0, 28.0, 43.0, 50.0, 64.0, 55.0, 64.0, 73.0, 70.0, 69.0, 40.0, 55.0, 54.0, 49.0, 35.0, 22.0, 20.0, 23.0, 20.0, 14.0, 11.0, 9.0, 9.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.993171215057373, -5.8181610107421875, -5.643150806427002, -5.468140602111816, -5.293130874633789, -5.1181206703186035, -4.943110466003418, -4.768100261688232, -4.593090057373047, -4.418079853057861, -4.243069648742676, -4.068059921264648, -3.893049716949463, -3.7180395126342773, -3.543029308319092, -3.3680191040039062, -3.193009376525879, -3.0179991722106934, -2.842989206314087, -2.6679790019989014, -2.492969036102295, -2.3179588317871094, -2.142948627471924, -1.9679385423660278, -1.7929284572601318, -1.6179183721542358, -1.4429082870483398, -1.2678980827331543, -1.0928879976272583, -0.9178779125213623, -0.7428677082061768, -0.5678576231002808, -0.39284753799438477, -0.21783742308616638, -0.042827308177948, 0.13218283653259277, 0.30719292163848877, 0.48220300674438477, 0.6572132110595703, 0.8322232961654663, 1.0072333812713623, 1.1822434663772583, 1.3572535514831543, 1.5322637557983398, 1.7072738409042358, 1.8822839260101318, 2.0572941303253174, 2.232304096221924, 2.4073143005371094, 2.582324504852295, 2.7573344707489014, 2.932344675064087, 3.1073546409606934, 3.282364845275879, 3.4573750495910645, 3.63238525390625, 3.8073952198028564, 3.982405424118042, 4.157415390014648, 4.332425594329834, 4.5074357986450195, 4.682445526123047, 4.857456207275391, 5.032465934753418, 5.2074761390686035]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 4.0, 6.0, 7.0, 10.0, 6.0, 19.0, 11.0, 13.0, 19.0, 18.0, 44.0, 28.0, 37.0, 38.0, 51.0, 48.0, 45.0, 41.0, 37.0, 52.0, 53.0, 35.0, 46.0, 32.0, 46.0, 39.0, 38.0, 28.0, 28.0, 17.0, 20.0, 15.0, 12.0, 12.0, 7.0, 11.0, 8.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.171905517578125, -3.072941541671753, -2.973977565765381, -2.875013589859009, -2.7760496139526367, -2.6770856380462646, -2.5781216621398926, -2.4791576862335205, -2.3801937103271484, -2.2812297344207764, -2.1822657585144043, -2.0833017826080322, -1.9843378067016602, -1.885373830795288, -1.786409854888916, -1.687445878982544, -1.5884819030761719, -1.4895179271697998, -1.3905539512634277, -1.2915899753570557, -1.1926259994506836, -1.0936620235443115, -0.9946980476379395, -0.8957340717315674, -0.7967700958251953, -0.6978061199188232, -0.5988421440124512, -0.4998781681060791, -0.40091419219970703, -0.30195021629333496, -0.2029862403869629, -0.10402226448059082, -0.00505828857421875, 0.09390568733215332, 0.1928696632385254, 0.29183363914489746, 0.39079761505126953, 0.4897615909576416, 0.5887255668640137, 0.6876895427703857, 0.7866535186767578, 0.8856174945831299, 0.984581470489502, 1.083545446395874, 1.182509422302246, 1.2814733982086182, 1.3804373741149902, 1.4794013500213623, 1.5783653259277344, 1.6773293018341064, 1.7762932777404785, 1.8752572536468506, 1.9742212295532227, 2.0731852054595947, 2.172149181365967, 2.271113157272339, 2.370077133178711, 2.469041109085083, 2.568005084991455, 2.666969060897827, 2.765933036804199, 2.8648970127105713, 2.9638609886169434, 3.0628249645233154, 3.1617889404296875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 6.0, 10.0, 8.0, 15.0, 27.0, 38.0, 72.0, 79.0, 162.0, 230.0, 355.0, 577.0, 972.0, 1601.0, 2543.0, 3983.0, 6116.0, 9717.0, 15160.0, 22698.0, 33610.0, 47386.0, 65360.0, 83558.0, 100869.0, 111329.0, 112994.0, 104971.0, 89232.0, 70890.0, 52769.0, 37841.0, 25624.0, 17287.0, 11236.0, 7096.0, 4422.0, 2934.0, 1845.0, 1152.0, 659.0, 420.0, 244.0, 166.0, 117.0, 66.0, 44.0, 27.0, 17.0, 11.0, 9.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.490234375, -2.40765380859375, -2.3250732421875, -2.24249267578125, -2.159912109375, -2.07733154296875, -1.9947509765625, -1.91217041015625, -1.82958984375, -1.74700927734375, -1.6644287109375, -1.58184814453125, -1.499267578125, -1.41668701171875, -1.3341064453125, -1.25152587890625, -1.1689453125, -1.08636474609375, -1.0037841796875, -0.92120361328125, -0.838623046875, -0.75604248046875, -0.6734619140625, -0.59088134765625, -0.50830078125, -0.42572021484375, -0.3431396484375, -0.26055908203125, -0.177978515625, -0.09539794921875, -0.0128173828125, 0.06976318359375, 0.15234375, 0.23492431640625, 0.3175048828125, 0.40008544921875, 0.482666015625, 0.56524658203125, 0.6478271484375, 0.73040771484375, 0.81298828125, 0.89556884765625, 0.9781494140625, 1.06072998046875, 1.143310546875, 1.22589111328125, 1.3084716796875, 1.39105224609375, 1.4736328125, 1.55621337890625, 1.6387939453125, 1.72137451171875, 1.803955078125, 1.88653564453125, 1.9691162109375, 2.05169677734375, 2.13427734375, 2.21685791015625, 2.2994384765625, 2.38201904296875, 2.464599609375, 2.54718017578125, 2.6297607421875, 2.71234130859375, 2.794921875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 11.0, 11.0, 10.0, 12.0, 14.0, 12.0, 12.0, 23.0, 22.0, 23.0, 28.0, 36.0, 33.0, 38.0, 50.0, 40.0, 51.0, 50.0, 37.0, 54.0, 52.0, 34.0, 46.0, 36.0, 33.0, 37.0, 25.0, 24.0, 16.0, 18.0, 16.0, 24.0, 13.0, 7.0, 9.0, 6.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0], "bins": [-3.287109375, -3.184783935546875, -3.08245849609375, -2.980133056640625, -2.8778076171875, -2.775482177734375, -2.67315673828125, -2.570831298828125, -2.468505859375, -2.366180419921875, -2.26385498046875, -2.161529541015625, -2.0592041015625, -1.956878662109375, -1.85455322265625, -1.752227783203125, -1.64990234375, -1.547576904296875, -1.44525146484375, -1.342926025390625, -1.2406005859375, -1.138275146484375, -1.03594970703125, -0.933624267578125, -0.831298828125, -0.728973388671875, -0.62664794921875, -0.524322509765625, -0.4219970703125, -0.319671630859375, -0.21734619140625, -0.115020751953125, -0.0126953125, 0.089630126953125, 0.19195556640625, 0.294281005859375, 0.3966064453125, 0.498931884765625, 0.60125732421875, 0.703582763671875, 0.805908203125, 0.908233642578125, 1.01055908203125, 1.112884521484375, 1.2152099609375, 1.317535400390625, 1.41986083984375, 1.522186279296875, 1.62451171875, 1.726837158203125, 1.82916259765625, 1.931488037109375, 2.0338134765625, 2.136138916015625, 2.23846435546875, 2.340789794921875, 2.443115234375, 2.545440673828125, 2.64776611328125, 2.750091552734375, 2.8524169921875, 2.954742431640625, 3.05706787109375, 3.159393310546875, 3.26171875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 11.0, 13.0, 18.0, 32.0, 51.0, 74.0, 105.0, 153.0, 189.0, 360.0, 560.0, 851.0, 1213.0, 1909.0, 3029.0, 4485.0, 6851.0, 10217.0, 15458.0, 22137.0, 31060.0, 43168.0, 56863.0, 71685.0, 85855.0, 96503.0, 101787.0, 99482.0, 90795.0, 77732.0, 63184.0, 48439.0, 35676.0, 25554.0, 17723.0, 12099.0, 8049.0, 5340.0, 3383.0, 2231.0, 1481.0, 977.0, 624.0, 411.0, 253.0, 172.0, 104.0, 63.0, 51.0, 33.0, 22.0, 21.0, 7.0, 7.0, 11.0, 3.0, 0.0, 1.0], "bins": [-2.46875, -2.39324951171875, -2.3177490234375, -2.24224853515625, -2.166748046875, -2.09124755859375, -2.0157470703125, -1.94024658203125, -1.86474609375, -1.78924560546875, -1.7137451171875, -1.63824462890625, -1.562744140625, -1.48724365234375, -1.4117431640625, -1.33624267578125, -1.2607421875, -1.18524169921875, -1.1097412109375, -1.03424072265625, -0.958740234375, -0.88323974609375, -0.8077392578125, -0.73223876953125, -0.65673828125, -0.58123779296875, -0.5057373046875, -0.43023681640625, -0.354736328125, -0.27923583984375, -0.2037353515625, -0.12823486328125, -0.052734375, 0.02276611328125, 0.0982666015625, 0.17376708984375, 0.249267578125, 0.32476806640625, 0.4002685546875, 0.47576904296875, 0.55126953125, 0.62677001953125, 0.7022705078125, 0.77777099609375, 0.853271484375, 0.92877197265625, 1.0042724609375, 1.07977294921875, 1.1552734375, 1.23077392578125, 1.3062744140625, 1.38177490234375, 1.457275390625, 1.53277587890625, 1.6082763671875, 1.68377685546875, 1.75927734375, 1.83477783203125, 1.9102783203125, 1.98577880859375, 2.061279296875, 2.13677978515625, 2.2122802734375, 2.28778076171875, 2.36328125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 7.0, 5.0, 6.0, 13.0, 16.0, 18.0, 21.0, 25.0, 25.0, 31.0, 34.0, 33.0, 36.0, 43.0, 41.0, 30.0, 35.0, 42.0, 44.0, 49.0, 43.0, 37.0, 43.0, 35.0, 35.0, 32.0, 29.0, 24.0, 20.0, 31.0, 16.0, 16.0, 15.0, 13.0, 13.0, 14.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.318359375, -2.2542877197265625, -2.190216064453125, -2.1261444091796875, -2.06207275390625, -1.9980010986328125, -1.933929443359375, -1.8698577880859375, -1.8057861328125, -1.7417144775390625, -1.677642822265625, -1.6135711669921875, -1.54949951171875, -1.4854278564453125, -1.421356201171875, -1.3572845458984375, -1.293212890625, -1.2291412353515625, -1.165069580078125, -1.1009979248046875, -1.03692626953125, -0.9728546142578125, -0.908782958984375, -0.8447113037109375, -0.7806396484375, -0.7165679931640625, -0.652496337890625, -0.5884246826171875, -0.52435302734375, -0.4602813720703125, -0.396209716796875, -0.3321380615234375, -0.26806640625, -0.2039947509765625, -0.139923095703125, -0.0758514404296875, -0.01177978515625, 0.0522918701171875, 0.116363525390625, 0.1804351806640625, 0.2445068359375, 0.3085784912109375, 0.372650146484375, 0.4367218017578125, 0.50079345703125, 0.5648651123046875, 0.628936767578125, 0.6930084228515625, 0.757080078125, 0.8211517333984375, 0.885223388671875, 0.9492950439453125, 1.01336669921875, 1.0774383544921875, 1.141510009765625, 1.2055816650390625, 1.2696533203125, 1.3337249755859375, 1.397796630859375, 1.4618682861328125, 1.52593994140625, 1.5900115966796875, 1.654083251953125, 1.7181549072265625, 1.7822265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 7.0, 12.0, 15.0, 31.0, 19.0, 51.0, 68.0, 92.0, 154.0, 217.0, 306.0, 513.0, 729.0, 1277.0, 2295.0, 4773.0, 13172.0, 98671.0, 673302.0, 218689.0, 21133.0, 6112.0, 2825.0, 1552.0, 889.0, 561.0, 318.0, 255.0, 167.0, 109.0, 87.0, 45.0, 36.0, 16.0, 15.0, 12.0, 2.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.390625, -12.0430908203125, -11.695556640625, -11.3480224609375, -11.00048828125, -10.6529541015625, -10.305419921875, -9.9578857421875, -9.6103515625, -9.2628173828125, -8.915283203125, -8.5677490234375, -8.22021484375, -7.8726806640625, -7.525146484375, -7.1776123046875, -6.830078125, -6.4825439453125, -6.135009765625, -5.7874755859375, -5.43994140625, -5.0924072265625, -4.744873046875, -4.3973388671875, -4.0498046875, -3.7022705078125, -3.354736328125, -3.0072021484375, -2.65966796875, -2.3121337890625, -1.964599609375, -1.6170654296875, -1.26953125, -0.9219970703125, -0.574462890625, -0.2269287109375, 0.12060546875, 0.4681396484375, 0.815673828125, 1.1632080078125, 1.5107421875, 1.8582763671875, 2.205810546875, 2.5533447265625, 2.90087890625, 3.2484130859375, 3.595947265625, 3.9434814453125, 4.291015625, 4.6385498046875, 4.986083984375, 5.3336181640625, 5.68115234375, 6.0286865234375, 6.376220703125, 6.7237548828125, 7.0712890625, 7.4188232421875, 7.766357421875, 8.1138916015625, 8.46142578125, 8.8089599609375, 9.156494140625, 9.5040283203125, 9.8515625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 10.0, 14.0, 55.0, 120.0, 288.0, 283.0, 132.0, 56.0, 16.0, 7.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0012788772583007812, -0.0012461021542549133, -0.0012133270502090454, -0.0011805519461631775, -0.0011477768421173096, -0.0011150017380714417, -0.0010822266340255737, -0.0010494515299797058, -0.0010166764259338379, -0.00098390132188797, -0.000951126217842102, -0.0009183511137962341, -0.0008855760097503662, -0.0008528009057044983, -0.0008200258016586304, -0.0007872506976127625, -0.0007544755935668945, -0.0007217004895210266, -0.0006889253854751587, -0.0006561502814292908, -0.0006233751773834229, -0.0005906000733375549, -0.000557824969291687, -0.0005250498652458191, -0.0004922747611999512, -0.00045949965715408325, -0.00042672455310821533, -0.0003939494490623474, -0.0003611743450164795, -0.00032839924097061157, -0.00029562413692474365, -0.00026284903287887573, -0.0002300739288330078, -0.0001972988247871399, -0.00016452372074127197, -0.00013174861669540405, -9.897351264953613e-05, -6.619840860366821e-05, -3.342330455780029e-05, -6.48200511932373e-07, 3.212690353393555e-05, 6.490200757980347e-05, 9.767711162567139e-05, 0.0001304522156715393, 0.00016322731971740723, 0.00019600242376327515, 0.00022877752780914307, 0.000261552631855011, 0.0002943277359008789, 0.0003271028399467468, 0.00035987794399261475, 0.00039265304803848267, 0.0004254281520843506, 0.0004582032561302185, 0.0004909783601760864, 0.0005237534642219543, 0.0005565285682678223, 0.0005893036723136902, 0.0006220787763595581, 0.000654853880405426, 0.0006876289844512939, 0.0007204040884971619, 0.0007531791925430298, 0.0007859542965888977, 0.0008187294006347656]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 13.0, 20.0, 20.0, 25.0, 23.0, 47.0, 54.0, 82.0, 124.0, 142.0, 174.0, 241.0, 327.0, 435.0, 615.0, 841.0, 1410.0, 2494.0, 4890.0, 11833.0, 36137.0, 129352.0, 353612.0, 335242.0, 115736.0, 32376.0, 10911.0, 4522.0, 2370.0, 1331.0, 870.0, 584.0, 460.0, 312.0, 254.0, 176.0, 117.0, 110.0, 65.0, 54.0, 34.0, 37.0, 30.0, 14.0, 10.0, 7.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-5.09765625, -4.9329833984375, -4.768310546875, -4.6036376953125, -4.43896484375, -4.2742919921875, -4.109619140625, -3.9449462890625, -3.7802734375, -3.6156005859375, -3.450927734375, -3.2862548828125, -3.12158203125, -2.9569091796875, -2.792236328125, -2.6275634765625, -2.462890625, -2.2982177734375, -2.133544921875, -1.9688720703125, -1.80419921875, -1.6395263671875, -1.474853515625, -1.3101806640625, -1.1455078125, -0.9808349609375, -0.816162109375, -0.6514892578125, -0.48681640625, -0.3221435546875, -0.157470703125, 0.0072021484375, 0.171875, 0.3365478515625, 0.501220703125, 0.6658935546875, 0.83056640625, 0.9952392578125, 1.159912109375, 1.3245849609375, 1.4892578125, 1.6539306640625, 1.818603515625, 1.9832763671875, 2.14794921875, 2.3126220703125, 2.477294921875, 2.6419677734375, 2.806640625, 2.9713134765625, 3.135986328125, 3.3006591796875, 3.46533203125, 3.6300048828125, 3.794677734375, 3.9593505859375, 4.1240234375, 4.2886962890625, 4.453369140625, 4.6180419921875, 4.78271484375, 4.9473876953125, 5.112060546875, 5.2767333984375, 5.44140625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 10.0, 24.0, 28.0, 66.0, 67.0, 110.0, 132.0, 133.0, 137.0, 106.0, 63.0, 51.0, 19.0, 17.0, 11.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4072265625, -1.362335205078125, -1.31744384765625, -1.272552490234375, -1.2276611328125, -1.182769775390625, -1.13787841796875, -1.092987060546875, -1.048095703125, -1.003204345703125, -0.95831298828125, -0.913421630859375, -0.8685302734375, -0.823638916015625, -0.77874755859375, -0.733856201171875, -0.68896484375, -0.644073486328125, -0.59918212890625, -0.554290771484375, -0.5093994140625, -0.464508056640625, -0.41961669921875, -0.374725341796875, -0.329833984375, -0.284942626953125, -0.24005126953125, -0.195159912109375, -0.1502685546875, -0.105377197265625, -0.06048583984375, -0.015594482421875, 0.029296875, 0.074188232421875, 0.11907958984375, 0.163970947265625, 0.2088623046875, 0.253753662109375, 0.29864501953125, 0.343536376953125, 0.388427734375, 0.433319091796875, 0.47821044921875, 0.523101806640625, 0.5679931640625, 0.612884521484375, 0.65777587890625, 0.702667236328125, 0.74755859375, 0.792449951171875, 0.83734130859375, 0.882232666015625, 0.9271240234375, 0.972015380859375, 1.01690673828125, 1.061798095703125, 1.106689453125, 1.151580810546875, 1.19647216796875, 1.241363525390625, 1.2862548828125, 1.331146240234375, 1.37603759765625, 1.420928955078125, 1.4658203125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 3.0, 6.0, 13.0, 20.0, 11.0, 22.0, 26.0, 35.0, 38.0, 41.0, 59.0, 67.0, 64.0, 71.0, 59.0, 44.0, 55.0, 50.0, 47.0, 36.0, 34.0, 36.0, 37.0, 29.0, 22.0, 16.0, 8.0, 12.0, 12.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.142786979675293, -4.9751691818237305, -4.80755090713501, -4.639933109283447, -4.472314834594727, -4.304697036743164, -4.137079238891602, -3.96946120262146, -3.8018431663513184, -3.6342251300811768, -3.466607093811035, -3.2989892959594727, -3.131371259689331, -2.9637532234191895, -2.796135425567627, -2.6285173892974854, -2.4608993530273438, -2.293281316757202, -2.1256632804870605, -1.958045482635498, -1.7904274463653564, -1.6228094100952148, -1.4551914930343628, -1.2875735759735107, -1.1199555397033691, -0.9523375630378723, -0.7847195863723755, -0.6171016097068787, -0.44948363304138184, -0.281865656375885, -0.11424767971038818, 0.05337023735046387, 0.22098779678344727, 0.3886057734489441, 0.5562237501144409, 0.7238417267799377, 0.8914597034454346, 1.0590777397155762, 1.2266956567764282, 1.3943135738372803, 1.5619316101074219, 1.7295496463775635, 1.8971675634384155, 2.0647854804992676, 2.232403516769409, 2.400021553039551, 2.5676393508911133, 2.735257387161255, 2.9028754234313965, 3.070493459701538, 3.2381114959716797, 3.405729293823242, 3.573347330093384, 3.7409653663635254, 3.908583164215088, 4.076201438903809, 4.243819236755371, 4.411437034606934, 4.579055309295654, 4.746673107147217, 4.9142913818359375, 5.0819091796875, 5.2495269775390625, 5.417144775390625, 5.584763050079346]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 4.0, 7.0, 9.0, 13.0, 17.0, 22.0, 29.0, 15.0, 19.0, 40.0, 26.0, 34.0, 33.0, 38.0, 49.0, 42.0, 50.0, 57.0, 36.0, 38.0, 48.0, 38.0, 36.0, 34.0, 35.0, 21.0, 37.0, 24.0, 25.0, 15.0, 10.0, 21.0, 13.0, 10.0, 14.0, 6.0, 3.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0523900985717773, -2.949246644973755, -2.8461031913757324, -2.74295973777771, -2.6398162841796875, -2.536672592163086, -2.4335291385650635, -2.330385684967041, -2.2272422313690186, -2.124098777770996, -2.0209553241729736, -1.9178117513656616, -1.8146682977676392, -1.7115248441696167, -1.6083812713623047, -1.5052378177642822, -1.4020943641662598, -1.2989509105682373, -1.1958074569702148, -1.0926638841629028, -0.9895204305648804, -0.8863769769668579, -0.7832334637641907, -0.6800899505615234, -0.576946496963501, -0.47380301356315613, -0.3706595301628113, -0.26751604676246643, -0.16437256336212158, -0.06122910976409912, 0.041914403438568115, 0.14505791664123535, 0.2482011318206787, 0.35134461522102356, 0.4544880986213684, 0.5576316118240356, 0.6607750654220581, 0.7639185190200806, 0.8670620322227478, 0.970205545425415, 1.0733489990234375, 1.17649245262146, 1.2796359062194824, 1.3827794790267944, 1.485922932624817, 1.5890663862228394, 1.6922099590301514, 1.7953534126281738, 1.8984968662261963, 2.0016403198242188, 2.104783773422241, 2.2079272270202637, 2.3110709190368652, 2.4142141342163086, 2.51735782623291, 2.6205012798309326, 2.723644733428955, 2.8267881870269775, 2.929931640625, 3.0330750942230225, 3.136218547821045, 3.2393622398376465, 3.342505693435669, 3.4456491470336914, 3.548792600631714]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 4.0, 6.0, 11.0, 26.0, 35.0, 46.0, 78.0, 114.0, 174.0, 217.0, 365.0, 579.0, 895.0, 1361.0, 2157.0, 3221.0, 5187.0, 7735.0, 12113.0, 19011.0, 29648.0, 46281.0, 71845.0, 109018.0, 163782.0, 237105.0, 325675.0, 417489.0, 486264.0, 504710.0, 465274.0, 382428.0, 290207.0, 205350.0, 140016.0, 92804.0, 61508.0, 39507.0, 25836.0, 16107.0, 10777.0, 6709.0, 4565.0, 2849.0, 1828.0, 1217.0, 775.0, 493.0, 319.0, 203.0, 148.0, 90.0, 56.0, 36.0, 17.0, 8.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.05859375, -2.9609375, -2.86328125, -2.765625, -2.66796875, -2.5703125, -2.47265625, -2.375, -2.27734375, -2.1796875, -2.08203125, -1.984375, -1.88671875, -1.7890625, -1.69140625, -1.59375, -1.49609375, -1.3984375, -1.30078125, -1.203125, -1.10546875, -1.0078125, -0.91015625, -0.8125, -0.71484375, -0.6171875, -0.51953125, -0.421875, -0.32421875, -0.2265625, -0.12890625, -0.03125, 0.06640625, 0.1640625, 0.26171875, 0.359375, 0.45703125, 0.5546875, 0.65234375, 0.75, 0.84765625, 0.9453125, 1.04296875, 1.140625, 1.23828125, 1.3359375, 1.43359375, 1.53125, 1.62890625, 1.7265625, 1.82421875, 1.921875, 2.01953125, 2.1171875, 2.21484375, 2.3125, 2.41015625, 2.5078125, 2.60546875, 2.703125, 2.80078125, 2.8984375, 2.99609375, 3.09375, 3.19140625]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 4.0, 8.0, 11.0, 9.0, 4.0, 17.0, 16.0, 20.0, 11.0, 22.0, 26.0, 27.0, 29.0, 37.0, 38.0, 44.0, 36.0, 42.0, 50.0, 44.0, 43.0, 41.0, 49.0, 43.0, 36.0, 43.0, 22.0, 26.0, 22.0, 26.0, 21.0, 21.0, 18.0, 15.0, 14.0, 18.0, 10.0, 6.0, 7.0, 5.0, 7.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5, -2.419586181640625, -2.33917236328125, -2.258758544921875, -2.1783447265625, -2.097930908203125, -2.01751708984375, -1.937103271484375, -1.856689453125, -1.776275634765625, -1.69586181640625, -1.615447998046875, -1.5350341796875, -1.454620361328125, -1.37420654296875, -1.293792724609375, -1.21337890625, -1.132965087890625, -1.05255126953125, -0.972137451171875, -0.8917236328125, -0.811309814453125, -0.73089599609375, -0.650482177734375, -0.570068359375, -0.489654541015625, -0.40924072265625, -0.328826904296875, -0.2484130859375, -0.167999267578125, -0.08758544921875, -0.007171630859375, 0.0732421875, 0.153656005859375, 0.23406982421875, 0.314483642578125, 0.3948974609375, 0.475311279296875, 0.55572509765625, 0.636138916015625, 0.716552734375, 0.796966552734375, 0.87738037109375, 0.957794189453125, 1.0382080078125, 1.118621826171875, 1.19903564453125, 1.279449462890625, 1.35986328125, 1.440277099609375, 1.52069091796875, 1.601104736328125, 1.6815185546875, 1.761932373046875, 1.84234619140625, 1.922760009765625, 2.003173828125, 2.083587646484375, 2.16400146484375, 2.244415283203125, 2.3248291015625, 2.405242919921875, 2.48565673828125, 2.566070556640625, 2.646484375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 12.0, 20.0, 40.0, 44.0, 96.0, 132.0, 212.0, 338.0, 608.0, 1026.0, 1726.0, 2824.0, 4894.0, 8549.0, 14135.0, 24165.0, 40011.0, 65188.0, 106080.0, 166551.0, 247782.0, 352160.0, 455305.0, 529764.0, 536511.0, 479883.0, 381719.0, 276432.0, 186215.0, 121328.0, 75923.0, 46214.0, 27814.0, 16523.0, 9864.0, 5965.0, 3417.0, 1939.0, 1150.0, 723.0, 388.0, 264.0, 144.0, 71.0, 47.0, 31.0, 25.0, 15.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.9375, -3.818695068359375, -3.69989013671875, -3.581085205078125, -3.4622802734375, -3.343475341796875, -3.22467041015625, -3.105865478515625, -2.987060546875, -2.868255615234375, -2.74945068359375, -2.630645751953125, -2.5118408203125, -2.393035888671875, -2.27423095703125, -2.155426025390625, -2.03662109375, -1.917816162109375, -1.79901123046875, -1.680206298828125, -1.5614013671875, -1.442596435546875, -1.32379150390625, -1.204986572265625, -1.086181640625, -0.967376708984375, -0.84857177734375, -0.729766845703125, -0.6109619140625, -0.492156982421875, -0.37335205078125, -0.254547119140625, -0.1357421875, -0.016937255859375, 0.10186767578125, 0.220672607421875, 0.3394775390625, 0.458282470703125, 0.57708740234375, 0.695892333984375, 0.814697265625, 0.933502197265625, 1.05230712890625, 1.171112060546875, 1.2899169921875, 1.408721923828125, 1.52752685546875, 1.646331787109375, 1.76513671875, 1.883941650390625, 2.00274658203125, 2.121551513671875, 2.2403564453125, 2.359161376953125, 2.47796630859375, 2.596771240234375, 2.715576171875, 2.834381103515625, 2.95318603515625, 3.071990966796875, 3.1907958984375, 3.309600830078125, 3.42840576171875, 3.547210693359375, 3.666015625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 13.0, 9.0, 13.0, 15.0, 17.0, 18.0, 35.0, 55.0, 50.0, 55.0, 63.0, 88.0, 95.0, 111.0, 111.0, 136.0, 138.0, 158.0, 159.0, 206.0, 185.0, 185.0, 176.0, 180.0, 171.0, 191.0, 173.0, 163.0, 142.0, 109.0, 122.0, 110.0, 103.0, 86.0, 70.0, 66.0, 52.0, 46.0, 36.0, 26.0, 24.0, 25.0, 16.0, 15.0, 11.0, 11.0, 7.0, 2.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0], "bins": [-1.2724609375, -1.2333831787109375, -1.194305419921875, -1.1552276611328125, -1.11614990234375, -1.0770721435546875, -1.037994384765625, -0.9989166259765625, -0.9598388671875, -0.9207611083984375, -0.881683349609375, -0.8426055908203125, -0.80352783203125, -0.7644500732421875, -0.725372314453125, -0.6862945556640625, -0.647216796875, -0.6081390380859375, -0.569061279296875, -0.5299835205078125, -0.49090576171875, -0.4518280029296875, -0.412750244140625, -0.3736724853515625, -0.3345947265625, -0.2955169677734375, -0.256439208984375, -0.2173614501953125, -0.17828369140625, -0.1392059326171875, -0.100128173828125, -0.0610504150390625, -0.02197265625, 0.0171051025390625, 0.056182861328125, 0.0952606201171875, 0.13433837890625, 0.1734161376953125, 0.212493896484375, 0.2515716552734375, 0.2906494140625, 0.3297271728515625, 0.368804931640625, 0.4078826904296875, 0.44696044921875, 0.4860382080078125, 0.525115966796875, 0.5641937255859375, 0.603271484375, 0.6423492431640625, 0.681427001953125, 0.7205047607421875, 0.75958251953125, 0.7986602783203125, 0.837738037109375, 0.8768157958984375, 0.9158935546875, 0.9549713134765625, 0.994049072265625, 1.0331268310546875, 1.07220458984375, 1.1112823486328125, 1.150360107421875, 1.1894378662109375, 1.228515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 4.0, 9.0, 9.0, 13.0, 17.0, 14.0, 20.0, 23.0, 39.0, 34.0, 38.0, 43.0, 51.0, 66.0, 69.0, 54.0, 62.0, 47.0, 54.0, 47.0, 46.0, 37.0, 34.0, 24.0, 35.0, 31.0, 16.0, 10.0, 12.0, 10.0, 5.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.268990993499756, -5.099306106567383, -4.92962121963501, -4.759936332702637, -4.590251445770264, -4.420566558837891, -4.250881195068359, -4.081196308135986, -3.9115114212036133, -3.7418265342712402, -3.572141647338867, -3.402456760406494, -3.232771635055542, -3.063086748123169, -2.893401861190796, -2.7237167358398438, -2.55403208732605, -2.3843472003936768, -2.2146623134613037, -2.0449771881103516, -1.8752923011779785, -1.7056074142456055, -1.5359225273132324, -1.3662375211715698, -1.1965526342391968, -1.0268677473068237, -0.8571827411651611, -0.6874978542327881, -0.5178129076957703, -0.34812796115875244, -0.1784430742263794, -0.008758068084716797, 0.16092681884765625, 0.3306117653846741, 0.5002967119216919, 0.6699815988540649, 0.8396665453910828, 1.0093514919281006, 1.1790363788604736, 1.3487213850021362, 1.5184062719345093, 1.6880911588668823, 1.857776165008545, 2.027461051940918, 2.197145938873291, 2.366830825805664, 2.536515712738037, 2.7062008380889893, 2.8758857250213623, 3.0455706119537354, 3.2152554988861084, 3.3849406242370605, 3.5546255111694336, 3.7243103981018066, 3.8939952850341797, 4.063680171966553, 4.233365058898926, 4.403049945831299, 4.572734832763672, 4.742419719696045, 4.912104606628418, 5.081789970397949, 5.251474380493164, 5.421159744262695, 5.590844631195068]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 7.0, 21.0, 16.0, 12.0, 21.0, 23.0, 18.0, 21.0, 33.0, 18.0, 33.0, 34.0, 47.0, 40.0, 42.0, 57.0, 46.0, 39.0, 53.0, 43.0, 30.0, 42.0, 24.0, 40.0, 30.0, 23.0, 23.0, 24.0, 13.0, 19.0, 11.0, 13.0, 10.0, 9.0, 11.0, 7.0, 3.0, 9.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.0982367992401123, -3.000528335571289, -2.902820110321045, -2.8051116466522217, -2.7074031829833984, -2.6096949577331543, -2.511986494064331, -2.414278030395508, -2.3165698051452637, -2.2188613414764404, -2.1211531162261963, -2.023444652557373, -1.9257363080978394, -1.8280279636383057, -1.7303194999694824, -1.6326111555099487, -1.534902811050415, -1.4371944665908813, -1.3394861221313477, -1.2417776584625244, -1.1440693140029907, -1.046360969543457, -0.9486525654792786, -0.8509441614151001, -0.7532358169555664, -0.6555274724960327, -0.5578190684318542, -0.46011069416999817, -0.3624023199081421, -0.264693945646286, -0.16698557138442993, -0.06927716732025146, 0.028431177139282227, 0.1261395514011383, 0.22384792566299438, 0.32155629992485046, 0.41926467418670654, 0.5169730186462402, 0.6146814227104187, 0.7123898267745972, 0.8100981712341309, 0.9078065156936646, 1.0055148601531982, 1.1032233238220215, 1.2009316682815552, 1.2986400127410889, 1.396348476409912, 1.4940568208694458, 1.5917651653289795, 1.6894735097885132, 1.7871818542480469, 1.8848903179168701, 1.9825986623764038, 2.0803070068359375, 2.1780154705047607, 2.275723934173584, 2.373432159423828, 2.4711406230926514, 2.5688488483428955, 2.6665573120117188, 2.764265537261963, 2.861974000930786, 2.9596824645996094, 3.0573906898498535, 3.1550991535186768]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 19.0, 17.0, 39.0, 54.0, 78.0, 118.0, 198.0, 284.0, 416.0, 716.0, 1084.0, 1630.0, 2610.0, 4132.0, 6619.0, 10849.0, 18657.0, 31099.0, 53521.0, 88905.0, 139664.0, 189259.0, 179470.0, 125443.0, 77962.0, 46478.0, 27393.0, 16076.0, 9600.0, 5869.0, 3647.0, 2364.0, 1512.0, 988.0, 628.0, 406.0, 259.0, 155.0, 102.0, 73.0, 54.0, 25.0, 20.0, 16.0, 16.0, 7.0, 2.0, 6.0, 1.0, 2.0], "bins": [-0.884765625, -0.8600997924804688, -0.8354339599609375, -0.8107681274414062, -0.786102294921875, -0.7614364624023438, -0.7367706298828125, -0.7121047973632812, -0.68743896484375, -0.6627731323242188, -0.6381072998046875, -0.6134414672851562, -0.588775634765625, -0.5641098022460938, -0.5394439697265625, -0.5147781372070312, -0.4901123046875, -0.46544647216796875, -0.4407806396484375, -0.41611480712890625, -0.391448974609375, -0.36678314208984375, -0.3421173095703125, -0.31745147705078125, -0.29278564453125, -0.26811981201171875, -0.2434539794921875, -0.21878814697265625, -0.194122314453125, -0.16945648193359375, -0.1447906494140625, -0.12012481689453125, -0.095458984375, -0.07079315185546875, -0.0461273193359375, -0.02146148681640625, 0.003204345703125, 0.02787017822265625, 0.0525360107421875, 0.07720184326171875, 0.10186767578125, 0.12653350830078125, 0.1511993408203125, 0.17586517333984375, 0.200531005859375, 0.22519683837890625, 0.2498626708984375, 0.27452850341796875, 0.2991943359375, 0.32386016845703125, 0.3485260009765625, 0.37319183349609375, 0.397857666015625, 0.42252349853515625, 0.4471893310546875, 0.47185516357421875, 0.49652099609375, 0.5211868286132812, 0.5458526611328125, 0.5705184936523438, 0.595184326171875, 0.6198501586914062, 0.6445159912109375, 0.6691818237304688, 0.69384765625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 1.0, 6.0, 3.0, 10.0, 6.0, 9.0, 15.0, 16.0, 24.0, 21.0, 28.0, 20.0, 21.0, 22.0, 40.0, 20.0, 43.0, 33.0, 45.0, 49.0, 43.0, 48.0, 50.0, 36.0, 45.0, 37.0, 42.0, 31.0, 26.0, 26.0, 21.0, 28.0, 22.0, 20.0, 14.0, 11.0, 11.0, 8.0, 8.0, 15.0, 6.0, 2.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.35546875, -3.248626708984375, -3.14178466796875, -3.034942626953125, -2.9281005859375, -2.821258544921875, -2.71441650390625, -2.607574462890625, -2.500732421875, -2.393890380859375, -2.28704833984375, -2.180206298828125, -2.0733642578125, -1.966522216796875, -1.85968017578125, -1.752838134765625, -1.64599609375, -1.539154052734375, -1.43231201171875, -1.325469970703125, -1.2186279296875, -1.111785888671875, -1.00494384765625, -0.898101806640625, -0.791259765625, -0.684417724609375, -0.57757568359375, -0.470733642578125, -0.3638916015625, -0.257049560546875, -0.15020751953125, -0.043365478515625, 0.0634765625, 0.170318603515625, 0.27716064453125, 0.384002685546875, 0.4908447265625, 0.597686767578125, 0.70452880859375, 0.811370849609375, 0.918212890625, 1.025054931640625, 1.13189697265625, 1.238739013671875, 1.3455810546875, 1.452423095703125, 1.55926513671875, 1.666107177734375, 1.77294921875, 1.879791259765625, 1.98663330078125, 2.093475341796875, 2.2003173828125, 2.307159423828125, 2.41400146484375, 2.520843505859375, 2.627685546875, 2.734527587890625, 2.84136962890625, 2.948211669921875, 3.0550537109375, 3.161895751953125, 3.26873779296875, 3.375579833984375, 3.482421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 9.0, 14.0, 12.0, 35.0, 30.0, 37.0, 72.0, 93.0, 170.0, 205.0, 352.0, 523.0, 784.0, 1302.0, 2037.0, 3383.0, 5833.0, 9861.0, 17194.0, 30213.0, 53718.0, 97455.0, 172228.0, 233083.0, 181301.0, 104395.0, 57727.0, 32189.0, 18083.0, 10454.0, 6169.0, 3569.0, 2170.0, 1391.0, 815.0, 541.0, 383.0, 241.0, 150.0, 120.0, 61.0, 37.0, 37.0, 23.0, 14.0, 16.0, 13.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8864364624023438, -0.8553924560546875, -0.8243484497070312, -0.793304443359375, -0.7622604370117188, -0.7312164306640625, -0.7001724243164062, -0.66912841796875, -0.6380844116210938, -0.6070404052734375, -0.5759963989257812, -0.544952392578125, -0.5139083862304688, -0.4828643798828125, -0.45182037353515625, -0.4207763671875, -0.38973236083984375, -0.3586883544921875, -0.32764434814453125, -0.296600341796875, -0.26555633544921875, -0.2345123291015625, -0.20346832275390625, -0.17242431640625, -0.14138031005859375, -0.1103363037109375, -0.07929229736328125, -0.048248291015625, -0.01720428466796875, 0.0138397216796875, 0.04488372802734375, 0.075927734375, 0.10697174072265625, 0.1380157470703125, 0.16905975341796875, 0.200103759765625, 0.23114776611328125, 0.2621917724609375, 0.29323577880859375, 0.32427978515625, 0.35532379150390625, 0.3863677978515625, 0.41741180419921875, 0.448455810546875, 0.47949981689453125, 0.5105438232421875, 0.5415878295898438, 0.5726318359375, 0.6036758422851562, 0.6347198486328125, 0.6657638549804688, 0.696807861328125, 0.7278518676757812, 0.7588958740234375, 0.7899398803710938, 0.82098388671875, 0.8520278930664062, 0.8830718994140625, 0.9141159057617188, 0.945159912109375, 0.9762039184570312, 1.0072479248046875, 1.0382919311523438, 1.0693359375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 9.0, 6.0, 10.0, 13.0, 20.0, 16.0, 22.0, 15.0, 29.0, 26.0, 33.0, 33.0, 35.0, 38.0, 33.0, 45.0, 43.0, 39.0, 46.0, 38.0, 34.0, 38.0, 39.0, 34.0, 38.0, 45.0, 35.0, 25.0, 27.0, 29.0, 19.0, 18.0, 9.0, 13.0, 16.0, 7.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.048828125, -1.981170654296875, -1.91351318359375, -1.845855712890625, -1.7781982421875, -1.710540771484375, -1.64288330078125, -1.575225830078125, -1.507568359375, -1.439910888671875, -1.37225341796875, -1.304595947265625, -1.2369384765625, -1.169281005859375, -1.10162353515625, -1.033966064453125, -0.96630859375, -0.898651123046875, -0.83099365234375, -0.763336181640625, -0.6956787109375, -0.628021240234375, -0.56036376953125, -0.492706298828125, -0.425048828125, -0.357391357421875, -0.28973388671875, -0.222076416015625, -0.1544189453125, -0.086761474609375, -0.01910400390625, 0.048553466796875, 0.1162109375, 0.183868408203125, 0.25152587890625, 0.319183349609375, 0.3868408203125, 0.454498291015625, 0.52215576171875, 0.589813232421875, 0.657470703125, 0.725128173828125, 0.79278564453125, 0.860443115234375, 0.9281005859375, 0.995758056640625, 1.06341552734375, 1.131072998046875, 1.19873046875, 1.266387939453125, 1.33404541015625, 1.401702880859375, 1.4693603515625, 1.537017822265625, 1.60467529296875, 1.672332763671875, 1.739990234375, 1.807647705078125, 1.87530517578125, 1.942962646484375, 2.0106201171875, 2.078277587890625, 2.14593505859375, 2.213592529296875, 2.28125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 11.0, 8.0, 6.0, 18.0, 25.0, 26.0, 49.0, 69.0, 90.0, 121.0, 225.0, 314.0, 556.0, 867.0, 1633.0, 3287.0, 7422.0, 19661.0, 63392.0, 271157.0, 484072.0, 136508.0, 35875.0, 12399.0, 5160.0, 2430.0, 1213.0, 718.0, 432.0, 260.0, 183.0, 110.0, 79.0, 49.0, 31.0, 36.0, 19.0, 15.0, 10.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420166015625, -0.4058113098144531, -0.39145660400390625, -0.3771018981933594, -0.3627471923828125, -0.3483924865722656, -0.33403778076171875, -0.3196830749511719, -0.305328369140625, -0.2909736633300781, -0.27661895751953125, -0.2622642517089844, -0.2479095458984375, -0.23355484008789062, -0.21920013427734375, -0.20484542846679688, -0.19049072265625, -0.17613601684570312, -0.16178131103515625, -0.14742660522460938, -0.1330718994140625, -0.11871719360351562, -0.10436248779296875, -0.09000778198242188, -0.075653076171875, -0.061298370361328125, -0.04694366455078125, -0.032588958740234375, -0.0182342529296875, -0.003879547119140625, 0.01047515869140625, 0.024829864501953125, 0.0391845703125, 0.053539276123046875, 0.06789398193359375, 0.08224868774414062, 0.0966033935546875, 0.11095809936523438, 0.12531280517578125, 0.13966751098632812, 0.154022216796875, 0.16837692260742188, 0.18273162841796875, 0.19708633422851562, 0.2114410400390625, 0.22579574584960938, 0.24015045166015625, 0.2545051574707031, 0.26885986328125, 0.2832145690917969, 0.29756927490234375, 0.3119239807128906, 0.3262786865234375, 0.3406333923339844, 0.35498809814453125, 0.3693428039550781, 0.383697509765625, 0.3980522155761719, 0.41240692138671875, 0.4267616271972656, 0.4411163330078125, 0.4554710388183594, 0.46982574462890625, 0.4841804504394531, 0.49853515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 9.0, 10.0, 11.0, 12.0, 17.0, 21.0, 26.0, 30.0, 38.0, 31.0, 55.0, 59.0, 60.0, 55.0, 62.0, 58.0, 48.0, 56.0, 67.0, 53.0, 40.0, 26.0, 27.0, 28.0, 23.0, 16.0, 13.0, 10.0, 10.0, 6.0, 4.0, 1.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.2232532501220703e-05, -2.1634623408317566e-05, -2.103671431541443e-05, -2.043880522251129e-05, -1.9840896129608154e-05, -1.9242987036705017e-05, -1.864507794380188e-05, -1.8047168850898743e-05, -1.7449259757995605e-05, -1.6851350665092468e-05, -1.625344157218933e-05, -1.5655532479286194e-05, -1.5057623386383057e-05, -1.445971429347992e-05, -1.3861805200576782e-05, -1.3263896107673645e-05, -1.2665987014770508e-05, -1.206807792186737e-05, -1.1470168828964233e-05, -1.0872259736061096e-05, -1.0274350643157959e-05, -9.676441550254822e-06, -9.078532457351685e-06, -8.480623364448547e-06, -7.88271427154541e-06, -7.284805178642273e-06, -6.686896085739136e-06, -6.0889869928359985e-06, -5.491077899932861e-06, -4.893168807029724e-06, -4.295259714126587e-06, -3.6973506212234497e-06, -3.0994415283203125e-06, -2.5015324354171753e-06, -1.903623342514038e-06, -1.3057142496109009e-06, -7.078051567077637e-07, -1.0989606380462646e-07, 4.880130290985107e-07, 1.085922122001648e-06, 1.6838312149047852e-06, 2.2817403078079224e-06, 2.8796494007110596e-06, 3.4775584936141968e-06, 4.075467586517334e-06, 4.673376679420471e-06, 5.271285772323608e-06, 5.869194865226746e-06, 6.467103958129883e-06, 7.06501305103302e-06, 7.662922143936157e-06, 8.260831236839294e-06, 8.858740329742432e-06, 9.456649422645569e-06, 1.0054558515548706e-05, 1.0652467608451843e-05, 1.125037670135498e-05, 1.1848285794258118e-05, 1.2446194887161255e-05, 1.3044103980064392e-05, 1.364201307296753e-05, 1.4239922165870667e-05, 1.4837831258773804e-05, 1.543574035167694e-05, 1.6033649444580078e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 9.0, 9.0, 11.0, 13.0, 23.0, 23.0, 54.0, 48.0, 77.0, 99.0, 131.0, 193.0, 307.0, 397.0, 558.0, 897.0, 1461.0, 2404.0, 4021.0, 7346.0, 14602.0, 31018.0, 70164.0, 166401.0, 310645.0, 241078.0, 106153.0, 45567.0, 20829.0, 10325.0, 5572.0, 2989.0, 1751.0, 1063.0, 683.0, 487.0, 331.0, 220.0, 156.0, 103.0, 85.0, 72.0, 44.0, 33.0, 21.0, 21.0, 18.0, 11.0, 4.0, 4.0, 8.0, 7.0, 4.0, 0.0, 0.0, 4.0], "bins": [-0.34033203125, -0.3299369812011719, -0.31954193115234375, -0.3091468811035156, -0.2987518310546875, -0.2883567810058594, -0.27796173095703125, -0.2675666809082031, -0.257171630859375, -0.24677658081054688, -0.23638153076171875, -0.22598648071289062, -0.2155914306640625, -0.20519638061523438, -0.19480133056640625, -0.18440628051757812, -0.17401123046875, -0.16361618041992188, -0.15322113037109375, -0.14282608032226562, -0.1324310302734375, -0.12203598022460938, -0.11164093017578125, -0.10124588012695312, -0.090850830078125, -0.08045578002929688, -0.07006072998046875, -0.059665679931640625, -0.0492706298828125, -0.038875579833984375, -0.02848052978515625, -0.018085479736328125, -0.0076904296875, 0.002704620361328125, 0.01309967041015625, 0.023494720458984375, 0.0338897705078125, 0.044284820556640625, 0.05467987060546875, 0.06507492065429688, 0.075469970703125, 0.08586502075195312, 0.09626007080078125, 0.10665512084960938, 0.1170501708984375, 0.12744522094726562, 0.13784027099609375, 0.14823532104492188, 0.15863037109375, 0.16902542114257812, 0.17942047119140625, 0.18981552124023438, 0.2002105712890625, 0.21060562133789062, 0.22100067138671875, 0.23139572143554688, 0.241790771484375, 0.2521858215332031, 0.26258087158203125, 0.2729759216308594, 0.2833709716796875, 0.2937660217285156, 0.30416107177734375, 0.3145561218261719, 0.324951171875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 3.0, 6.0, 5.0, 4.0, 4.0, 14.0, 14.0, 9.0, 19.0, 26.0, 44.0, 29.0, 42.0, 62.0, 73.0, 75.0, 86.0, 90.0, 90.0, 56.0, 49.0, 48.0, 39.0, 26.0, 27.0, 17.0, 12.0, 6.0, 10.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08319091796875, -0.08057880401611328, -0.07796669006347656, -0.07535457611083984, -0.07274246215820312, -0.0701303482055664, -0.06751823425292969, -0.06490612030029297, -0.06229400634765625, -0.05968189239501953, -0.05706977844238281, -0.054457664489746094, -0.051845550537109375, -0.049233436584472656, -0.04662132263183594, -0.04400920867919922, -0.0413970947265625, -0.03878498077392578, -0.03617286682128906, -0.033560752868652344, -0.030948638916015625, -0.028336524963378906, -0.025724411010742188, -0.02311229705810547, -0.02050018310546875, -0.01788806915283203, -0.015275955200195312, -0.012663841247558594, -0.010051727294921875, -0.007439613342285156, -0.0048274993896484375, -0.0022153854370117188, 0.000396728515625, 0.0030088424682617188, 0.0056209564208984375, 0.008233070373535156, 0.010845184326171875, 0.013457298278808594, 0.016069412231445312, 0.01868152618408203, 0.02129364013671875, 0.02390575408935547, 0.026517868041992188, 0.029129981994628906, 0.031742095947265625, 0.034354209899902344, 0.03696632385253906, 0.03957843780517578, 0.0421905517578125, 0.04480266571044922, 0.04741477966308594, 0.050026893615722656, 0.052639007568359375, 0.055251121520996094, 0.05786323547363281, 0.06047534942626953, 0.06308746337890625, 0.06569957733154297, 0.06831169128417969, 0.0709238052368164, 0.07353591918945312, 0.07614803314208984, 0.07876014709472656, 0.08137226104736328, 0.083984375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 2.0, 5.0, 6.0, 8.0, 10.0, 17.0, 17.0, 18.0, 26.0, 30.0, 38.0, 33.0, 43.0, 49.0, 71.0, 68.0, 49.0, 63.0, 57.0, 48.0, 47.0, 46.0, 37.0, 33.0, 37.0, 27.0, 33.0, 19.0, 12.0, 11.0, 12.0, 2.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.330752372741699, -5.160385608673096, -4.990018844604492, -4.819652557373047, -4.649285793304443, -4.47891902923584, -4.3085527420043945, -4.138185977935791, -3.9678192138671875, -3.797452449798584, -3.6270859241485596, -3.456719398498535, -3.2863526344299316, -3.115985870361328, -2.9456193447113037, -2.7752528190612793, -2.604886054992676, -2.4345192909240723, -2.264152765274048, -2.0937862396240234, -1.92341947555542, -1.753052830696106, -1.582686185836792, -1.412319540977478, -1.241952896118164, -1.07158625125885, -0.9012196063995361, -0.7308529615402222, -0.5604863166809082, -0.39011967182159424, -0.21975302696228027, -0.04938638210296631, 0.12098073959350586, 0.2913473844528198, 0.4617140293121338, 0.6320806741714478, 0.8024473190307617, 0.9728139638900757, 1.1431806087493896, 1.3135472536087036, 1.4839138984680176, 1.6542805433273315, 1.8246471881866455, 1.9950138330459595, 2.1653804779052734, 2.335747241973877, 2.5061137676239014, 2.676480293273926, 2.8468470573425293, 3.017213821411133, 3.1875803470611572, 3.3579468727111816, 3.528313636779785, 3.6986804008483887, 3.869046926498413, 4.0394134521484375, 4.209780216217041, 4.3801469802856445, 4.55051326751709, 4.720880031585693, 4.891246795654297, 5.0616135597229, 5.231980323791504, 5.402346611022949, 5.572713375091553]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 7.0, 10.0, 7.0, 22.0, 17.0, 10.0, 23.0, 21.0, 20.0, 23.0, 29.0, 19.0, 33.0, 38.0, 44.0, 45.0, 35.0, 57.0, 50.0, 40.0, 51.0, 40.0, 33.0, 42.0, 30.0, 32.0, 29.0, 25.0, 22.0, 22.0, 18.0, 14.0, 13.0, 11.0, 13.0, 10.0, 8.0, 7.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.089804172515869, -2.992260456085205, -2.894716501235962, -2.797172784805298, -2.6996288299560547, -2.6020851135253906, -2.5045413970947266, -2.4069976806640625, -2.3094537258148193, -2.2119100093841553, -2.114366054534912, -2.016822338104248, -1.9192785024642944, -1.8217346668243408, -1.7241909503936768, -1.6266471147537231, -1.5291032791137695, -1.431559443473816, -1.3340156078338623, -1.2364718914031982, -1.1389280557632446, -1.041384220123291, -0.9438404440879822, -0.8462966680526733, -0.7487528324127197, -0.6512089967727661, -0.5536652207374573, -0.45612141489982605, -0.3585776090621948, -0.2610338032245636, -0.16348999738693237, -0.06594622135162354, 0.03159785270690918, 0.1291416585445404, 0.22668546438217163, 0.32422927021980286, 0.4217730760574341, 0.5193169116973877, 0.6168606877326965, 0.7144044637680054, 0.811948299407959, 0.9094921350479126, 1.0070359706878662, 1.1045796871185303, 1.2021235227584839, 1.2996673583984375, 1.3972110748291016, 1.4947549104690552, 1.5922987461090088, 1.6898425817489624, 1.787386417388916, 1.88493013381958, 1.9824739694595337, 2.0800178050994873, 2.1775615215301514, 2.2751054763793945, 2.3726491928100586, 2.4701929092407227, 2.567736864089966, 2.66528058052063, 2.762824535369873, 2.860368251800537, 2.957911968231201, 3.0554556846618652, 3.1529996395111084]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 18.0, 20.0, 28.0, 55.0, 85.0, 168.0, 216.0, 332.0, 572.0, 930.0, 1376.0, 2182.0, 3214.0, 4942.0, 7574.0, 11268.0, 16327.0, 23747.0, 33529.0, 45465.0, 59499.0, 74893.0, 88611.0, 98137.0, 101838.0, 98368.0, 88146.0, 74656.0, 60033.0, 45784.0, 33563.0, 23700.0, 16756.0, 11044.0, 7386.0, 4883.0, 3348.0, 2131.0, 1338.0, 862.0, 559.0, 375.0, 238.0, 146.0, 88.0, 51.0, 42.0, 15.0, 13.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.474609375, -2.398468017578125, -2.32232666015625, -2.246185302734375, -2.1700439453125, -2.093902587890625, -2.01776123046875, -1.941619873046875, -1.865478515625, -1.789337158203125, -1.71319580078125, -1.637054443359375, -1.5609130859375, -1.484771728515625, -1.40863037109375, -1.332489013671875, -1.25634765625, -1.180206298828125, -1.10406494140625, -1.027923583984375, -0.9517822265625, -0.875640869140625, -0.79949951171875, -0.723358154296875, -0.647216796875, -0.571075439453125, -0.49493408203125, -0.418792724609375, -0.3426513671875, -0.266510009765625, -0.19036865234375, -0.114227294921875, -0.0380859375, 0.038055419921875, 0.11419677734375, 0.190338134765625, 0.2664794921875, 0.342620849609375, 0.41876220703125, 0.494903564453125, 0.571044921875, 0.647186279296875, 0.72332763671875, 0.799468994140625, 0.8756103515625, 0.951751708984375, 1.02789306640625, 1.104034423828125, 1.18017578125, 1.256317138671875, 1.33245849609375, 1.408599853515625, 1.4847412109375, 1.560882568359375, 1.63702392578125, 1.713165283203125, 1.789306640625, 1.865447998046875, 1.94158935546875, 2.017730712890625, 2.0938720703125, 2.170013427734375, 2.24615478515625, 2.322296142578125, 2.3984375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 10.0, 10.0, 16.0, 17.0, 16.0, 21.0, 12.0, 24.0, 26.0, 24.0, 27.0, 33.0, 32.0, 27.0, 44.0, 44.0, 42.0, 47.0, 32.0, 39.0, 47.0, 39.0, 45.0, 32.0, 37.0, 32.0, 31.0, 20.0, 22.0, 26.0, 18.0, 10.0, 15.0, 14.0, 9.0, 9.0, 10.0, 3.0, 4.0, 5.0, 3.0, 0.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-3.318359375, -3.21575927734375, -3.1131591796875, -3.01055908203125, -2.907958984375, -2.80535888671875, -2.7027587890625, -2.60015869140625, -2.49755859375, -2.39495849609375, -2.2923583984375, -2.18975830078125, -2.087158203125, -1.98455810546875, -1.8819580078125, -1.77935791015625, -1.6767578125, -1.57415771484375, -1.4715576171875, -1.36895751953125, -1.266357421875, -1.16375732421875, -1.0611572265625, -0.95855712890625, -0.85595703125, -0.75335693359375, -0.6507568359375, -0.54815673828125, -0.445556640625, -0.34295654296875, -0.2403564453125, -0.13775634765625, -0.03515625, 0.06744384765625, 0.1700439453125, 0.27264404296875, 0.375244140625, 0.47784423828125, 0.5804443359375, 0.68304443359375, 0.78564453125, 0.88824462890625, 0.9908447265625, 1.09344482421875, 1.196044921875, 1.29864501953125, 1.4012451171875, 1.50384521484375, 1.6064453125, 1.70904541015625, 1.8116455078125, 1.91424560546875, 2.016845703125, 2.11944580078125, 2.2220458984375, 2.32464599609375, 2.42724609375, 2.52984619140625, 2.6324462890625, 2.73504638671875, 2.837646484375, 2.94024658203125, 3.0428466796875, 3.14544677734375, 3.248046875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 5.0, 10.0, 13.0, 25.0, 31.0, 48.0, 95.0, 152.0, 220.0, 371.0, 584.0, 866.0, 1332.0, 2166.0, 3173.0, 4915.0, 7479.0, 10950.0, 15995.0, 22623.0, 31877.0, 43151.0, 56358.0, 70091.0, 83086.0, 92072.0, 97181.0, 96285.0, 89152.0, 77697.0, 63662.0, 50476.0, 37991.0, 27717.0, 20005.0, 13585.0, 9230.0, 6222.0, 4124.0, 2670.0, 1679.0, 1175.0, 739.0, 451.0, 325.0, 173.0, 122.0, 77.0, 55.0, 30.0, 23.0, 15.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.279296875, -2.20526123046875, -2.1312255859375, -2.05718994140625, -1.983154296875, -1.90911865234375, -1.8350830078125, -1.76104736328125, -1.68701171875, -1.61297607421875, -1.5389404296875, -1.46490478515625, -1.390869140625, -1.31683349609375, -1.2427978515625, -1.16876220703125, -1.0947265625, -1.02069091796875, -0.9466552734375, -0.87261962890625, -0.798583984375, -0.72454833984375, -0.6505126953125, -0.57647705078125, -0.50244140625, -0.42840576171875, -0.3543701171875, -0.28033447265625, -0.206298828125, -0.13226318359375, -0.0582275390625, 0.01580810546875, 0.08984375, 0.16387939453125, 0.2379150390625, 0.31195068359375, 0.385986328125, 0.46002197265625, 0.5340576171875, 0.60809326171875, 0.68212890625, 0.75616455078125, 0.8302001953125, 0.90423583984375, 0.978271484375, 1.05230712890625, 1.1263427734375, 1.20037841796875, 1.2744140625, 1.34844970703125, 1.4224853515625, 1.49652099609375, 1.570556640625, 1.64459228515625, 1.7186279296875, 1.79266357421875, 1.86669921875, 1.94073486328125, 2.0147705078125, 2.08880615234375, 2.162841796875, 2.23687744140625, 2.3109130859375, 2.38494873046875, 2.458984375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 2.0, 4.0, 4.0, 6.0, 5.0, 6.0, 12.0, 7.0, 10.0, 13.0, 17.0, 16.0, 23.0, 23.0, 31.0, 24.0, 27.0, 33.0, 35.0, 27.0, 40.0, 39.0, 42.0, 58.0, 29.0, 39.0, 46.0, 42.0, 31.0, 40.0, 31.0, 20.0, 26.0, 13.0, 30.0, 25.0, 17.0, 16.0, 17.0, 15.0, 16.0, 13.0, 11.0, 9.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8165130615234375, -1.755096435546875, -1.6936798095703125, -1.63226318359375, -1.5708465576171875, -1.509429931640625, -1.4480133056640625, -1.3865966796875, -1.3251800537109375, -1.263763427734375, -1.2023468017578125, -1.14093017578125, -1.0795135498046875, -1.018096923828125, -0.9566802978515625, -0.895263671875, -0.8338470458984375, -0.772430419921875, -0.7110137939453125, -0.64959716796875, -0.5881805419921875, -0.526763916015625, -0.4653472900390625, -0.4039306640625, -0.3425140380859375, -0.281097412109375, -0.2196807861328125, -0.15826416015625, -0.0968475341796875, -0.035430908203125, 0.0259857177734375, 0.08740234375, 0.1488189697265625, 0.210235595703125, 0.2716522216796875, 0.33306884765625, 0.3944854736328125, 0.455902099609375, 0.5173187255859375, 0.5787353515625, 0.6401519775390625, 0.701568603515625, 0.7629852294921875, 0.82440185546875, 0.8858184814453125, 0.947235107421875, 1.0086517333984375, 1.070068359375, 1.1314849853515625, 1.192901611328125, 1.2543182373046875, 1.31573486328125, 1.3771514892578125, 1.438568115234375, 1.4999847412109375, 1.5614013671875, 1.6228179931640625, 1.684234619140625, 1.7456512451171875, 1.80706787109375, 1.8684844970703125, 1.929901123046875, 1.9913177490234375, 2.052734375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 9.0, 9.0, 17.0, 20.0, 39.0, 65.0, 88.0, 150.0, 187.0, 278.0, 417.0, 578.0, 783.0, 1173.0, 1901.0, 3058.0, 5386.0, 9922.0, 20376.0, 45243.0, 100451.0, 197949.0, 262723.0, 200754.0, 104435.0, 46629.0, 21186.0, 10260.0, 5434.0, 3182.0, 1969.0, 1201.0, 835.0, 542.0, 417.0, 262.0, 192.0, 120.0, 110.0, 62.0, 44.0, 30.0, 18.0, 19.0, 4.0, 7.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.59765625, -3.487030029296875, -3.37640380859375, -3.265777587890625, -3.1551513671875, -3.044525146484375, -2.93389892578125, -2.823272705078125, -2.712646484375, -2.602020263671875, -2.49139404296875, -2.380767822265625, -2.2701416015625, -2.159515380859375, -2.04888916015625, -1.938262939453125, -1.82763671875, -1.717010498046875, -1.60638427734375, -1.495758056640625, -1.3851318359375, -1.274505615234375, -1.16387939453125, -1.053253173828125, -0.942626953125, -0.832000732421875, -0.72137451171875, -0.610748291015625, -0.5001220703125, -0.389495849609375, -0.27886962890625, -0.168243408203125, -0.0576171875, 0.053009033203125, 0.16363525390625, 0.274261474609375, 0.3848876953125, 0.495513916015625, 0.60614013671875, 0.716766357421875, 0.827392578125, 0.938018798828125, 1.04864501953125, 1.159271240234375, 1.2698974609375, 1.380523681640625, 1.49114990234375, 1.601776123046875, 1.71240234375, 1.823028564453125, 1.93365478515625, 2.044281005859375, 2.1549072265625, 2.265533447265625, 2.37615966796875, 2.486785888671875, 2.597412109375, 2.708038330078125, 2.81866455078125, 2.929290771484375, 3.0399169921875, 3.150543212890625, 3.26116943359375, 3.371795654296875, 3.482421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 8.0, 5.0, 8.0, 9.0, 15.0, 8.0, 18.0, 16.0, 23.0, 33.0, 29.0, 40.0, 48.0, 60.0, 86.0, 65.0, 79.0, 85.0, 67.0, 61.0, 46.0, 41.0, 35.0, 26.0, 22.0, 10.0, 17.0, 12.0, 5.0, 4.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00026988983154296875, -0.0002614222466945648, -0.0002529546618461609, -0.00024448707699775696, -0.00023601949214935303, -0.0002275519073009491, -0.00021908432245254517, -0.00021061673760414124, -0.0002021491527557373, -0.00019368156790733337, -0.00018521398305892944, -0.0001767463982105255, -0.00016827881336212158, -0.00015981122851371765, -0.00015134364366531372, -0.0001428760588169098, -0.00013440847396850586, -0.00012594088912010193, -0.000117473304271698, -0.00010900571942329407, -0.00010053813457489014, -9.20705497264862e-05, -8.360296487808228e-05, -7.513538002967834e-05, -6.666779518127441e-05, -5.8200210332870483e-05, -4.973262548446655e-05, -4.126504063606262e-05, -3.279745578765869e-05, -2.432987093925476e-05, -1.586228609085083e-05, -7.394701242446899e-06, 1.0728836059570312e-06, 9.540468454360962e-06, 1.8008053302764893e-05, 2.6475638151168823e-05, 3.4943222999572754e-05, 4.3410807847976685e-05, 5.1878392696380615e-05, 6.0345977544784546e-05, 6.881356239318848e-05, 7.728114724159241e-05, 8.574873208999634e-05, 9.421631693840027e-05, 0.0001026839017868042, 0.00011115148663520813, 0.00011961907148361206, 0.000128086656332016, 0.00013655424118041992, 0.00014502182602882385, 0.00015348941087722778, 0.00016195699572563171, 0.00017042458057403564, 0.00017889216542243958, 0.0001873597502708435, 0.00019582733511924744, 0.00020429491996765137, 0.0002127625048160553, 0.00022123008966445923, 0.00022969767451286316, 0.0002381652593612671, 0.000246632844209671, 0.00025510042905807495, 0.0002635680139064789, 0.0002720355987548828]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 17.0, 6.0, 23.0, 22.0, 31.0, 31.0, 67.0, 91.0, 102.0, 160.0, 254.0, 327.0, 535.0, 976.0, 1826.0, 3761.0, 8185.0, 19237.0, 49832.0, 126038.0, 254522.0, 290630.0, 171486.0, 71264.0, 27510.0, 11101.0, 4927.0, 2381.0, 1199.0, 696.0, 419.0, 249.0, 211.0, 131.0, 69.0, 63.0, 45.0, 31.0, 33.0, 10.0, 12.0, 18.0, 5.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.87109375, -3.74285888671875, -3.6146240234375, -3.48638916015625, -3.358154296875, -3.22991943359375, -3.1016845703125, -2.97344970703125, -2.84521484375, -2.71697998046875, -2.5887451171875, -2.46051025390625, -2.332275390625, -2.20404052734375, -2.0758056640625, -1.94757080078125, -1.8193359375, -1.69110107421875, -1.5628662109375, -1.43463134765625, -1.306396484375, -1.17816162109375, -1.0499267578125, -0.92169189453125, -0.79345703125, -0.66522216796875, -0.5369873046875, -0.40875244140625, -0.280517578125, -0.15228271484375, -0.0240478515625, 0.10418701171875, 0.232421875, 0.36065673828125, 0.4888916015625, 0.61712646484375, 0.745361328125, 0.87359619140625, 1.0018310546875, 1.13006591796875, 1.25830078125, 1.38653564453125, 1.5147705078125, 1.64300537109375, 1.771240234375, 1.89947509765625, 2.0277099609375, 2.15594482421875, 2.2841796875, 2.41241455078125, 2.5406494140625, 2.66888427734375, 2.797119140625, 2.92535400390625, 3.0535888671875, 3.18182373046875, 3.31005859375, 3.43829345703125, 3.5665283203125, 3.69476318359375, 3.822998046875, 3.95123291015625, 4.0794677734375, 4.20770263671875, 4.3359375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 10.0, 10.0, 17.0, 17.0, 15.0, 17.0, 23.0, 24.0, 21.0, 37.0, 46.0, 37.0, 38.0, 36.0, 39.0, 29.0, 44.0, 45.0, 44.0, 49.0, 40.0, 53.0, 36.0, 39.0, 45.0, 32.0, 37.0, 18.0, 23.0, 20.0, 12.0, 4.0, 10.0, 4.0, 8.0, 5.0, 5.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.4500579833984375, -0.434295654296875, -0.4185333251953125, -0.40277099609375, -0.3870086669921875, -0.371246337890625, -0.3554840087890625, -0.3397216796875, -0.3239593505859375, -0.308197021484375, -0.2924346923828125, -0.27667236328125, -0.2609100341796875, -0.245147705078125, -0.2293853759765625, -0.213623046875, -0.1978607177734375, -0.182098388671875, -0.1663360595703125, -0.15057373046875, -0.1348114013671875, -0.119049072265625, -0.1032867431640625, -0.0875244140625, -0.0717620849609375, -0.055999755859375, -0.0402374267578125, -0.02447509765625, -0.0087127685546875, 0.007049560546875, 0.0228118896484375, 0.03857421875, 0.0543365478515625, 0.070098876953125, 0.0858612060546875, 0.10162353515625, 0.1173858642578125, 0.133148193359375, 0.1489105224609375, 0.1646728515625, 0.1804351806640625, 0.196197509765625, 0.2119598388671875, 0.22772216796875, 0.2434844970703125, 0.259246826171875, 0.2750091552734375, 0.290771484375, 0.3065338134765625, 0.322296142578125, 0.3380584716796875, 0.35382080078125, 0.3695831298828125, 0.385345458984375, 0.4011077880859375, 0.4168701171875, 0.4326324462890625, 0.448394775390625, 0.4641571044921875, 0.47991943359375, 0.4956817626953125, 0.511444091796875, 0.5272064208984375, 0.54296875]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 2.0, 4.0, 8.0, 12.0, 11.0, 14.0, 19.0, 16.0, 29.0, 36.0, 37.0, 32.0, 49.0, 50.0, 68.0, 49.0, 54.0, 40.0, 55.0, 49.0, 44.0, 45.0, 35.0, 40.0, 29.0, 29.0, 29.0, 22.0, 18.0, 17.0, 12.0, 4.0, 10.0, 3.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.364747524261475, -5.204495429992676, -5.044243335723877, -4.883991241455078, -4.723739147186279, -4.5634870529174805, -4.403234481811523, -4.242982387542725, -4.082730293273926, -3.922478199005127, -3.762226104736328, -3.6019740104675293, -3.4417216777801514, -3.2814695835113525, -3.1212174892425537, -2.960965156555176, -2.800713300704956, -2.6404612064361572, -2.4802091121673584, -2.3199567794799805, -2.1597046852111816, -1.9994525909423828, -1.839200496673584, -1.6789482831954956, -1.5186961889266968, -1.358444094657898, -1.1981918811798096, -1.0379397869110107, -0.8776876330375671, -0.7174354791641235, -0.5571833848953247, -0.39693117141723633, -0.2366790771484375, -0.07642693817615509, 0.08382520079612732, 0.24407732486724854, 0.40432947874069214, 0.5645816326141357, 0.7248337268829346, 0.885085940361023, 1.0453380346298218, 1.2055901288986206, 1.365842342376709, 1.5260944366455078, 1.6863465309143066, 1.846598744392395, 2.0068507194519043, 2.1671030521392822, 2.327355146408081, 2.48760724067688, 2.6478593349456787, 2.8081116676330566, 2.9683637619018555, 3.1286158561706543, 3.288867950439453, 3.449120044708252, 3.609372138977051, 3.7696242332458496, 3.9298763275146484, 4.090128421783447, 4.250380516052246, 4.410633087158203, 4.570884704589844, 4.731137275695801, 4.8913893699646]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 3.0, 11.0, 13.0, 8.0, 13.0, 14.0, 26.0, 25.0, 30.0, 31.0, 30.0, 30.0, 37.0, 43.0, 48.0, 36.0, 47.0, 46.0, 61.0, 51.0, 40.0, 39.0, 51.0, 31.0, 44.0, 20.0, 27.0, 25.0, 13.0, 13.0, 19.0, 14.0, 9.0, 13.0, 14.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5147292613983154, -3.401359796524048, -3.2879905700683594, -3.174621105194092, -3.0612518787384033, -2.9478824138641357, -2.8345131874084473, -2.7211437225341797, -2.607774257659912, -2.4944047927856445, -2.381035566329956, -2.2676661014556885, -2.154296875, -2.0409274101257324, -1.9275580644607544, -1.8141887187957764, -1.700819492340088, -1.5874501466751099, -1.4740808010101318, -1.3607113361358643, -1.2473421096801758, -1.1339726448059082, -1.0206032991409302, -0.9072339534759521, -0.7938646078109741, -0.6804952621459961, -0.5671259164810181, -0.45375651121139526, -0.34038716554641724, -0.2270178198814392, -0.1136484146118164, -0.0002790689468383789, 0.11309003829956055, 0.22645939886569977, 0.339828759431839, 0.4531981348991394, 0.5665674805641174, 0.6799368262290955, 0.7933062314987183, 0.9066755771636963, 1.0200449228286743, 1.1334142684936523, 1.2467836141586304, 1.3601529598236084, 1.473522424697876, 1.5868916511535645, 1.700261116027832, 1.81363046169281, 1.926999807357788, 2.0403692722320557, 2.153738498687744, 2.2671079635620117, 2.3804771900177, 2.4938466548919678, 2.6072158813476562, 2.720585346221924, 2.8339548110961914, 2.947324275970459, 3.0606935024261475, 3.174062967300415, 3.2874321937561035, 3.400801658630371, 3.5141711235046387, 3.627540349960327, 3.7409095764160156]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 13.0, 16.0, 26.0, 52.0, 79.0, 85.0, 124.0, 201.0, 317.0, 464.0, 754.0, 1184.0, 1850.0, 2997.0, 4794.0, 7923.0, 12779.0, 21323.0, 34659.0, 57155.0, 93672.0, 149813.0, 231958.0, 339193.0, 458066.0, 547988.0, 567445.0, 504838.0, 391515.0, 277574.0, 182473.0, 116575.0, 72702.0, 44290.0, 27150.0, 16497.0, 9989.0, 6122.0, 3756.0, 2181.0, 1439.0, 877.0, 512.0, 331.0, 195.0, 133.0, 88.0, 41.0, 28.0, 15.0, 13.0, 10.0, 4.0, 1.0, 5.0, 0.0, 2.0], "bins": [-3.9609375, -3.84173583984375, -3.7225341796875, -3.60333251953125, -3.484130859375, -3.36492919921875, -3.2457275390625, -3.12652587890625, -3.00732421875, -2.88812255859375, -2.7689208984375, -2.64971923828125, -2.530517578125, -2.41131591796875, -2.2921142578125, -2.17291259765625, -2.0537109375, -1.93450927734375, -1.8153076171875, -1.69610595703125, -1.576904296875, -1.45770263671875, -1.3385009765625, -1.21929931640625, -1.10009765625, -0.98089599609375, -0.8616943359375, -0.74249267578125, -0.623291015625, -0.50408935546875, -0.3848876953125, -0.26568603515625, -0.146484375, -0.02728271484375, 0.0919189453125, 0.21112060546875, 0.330322265625, 0.44952392578125, 0.5687255859375, 0.68792724609375, 0.80712890625, 0.92633056640625, 1.0455322265625, 1.16473388671875, 1.283935546875, 1.40313720703125, 1.5223388671875, 1.64154052734375, 1.7607421875, 1.87994384765625, 1.9991455078125, 2.11834716796875, 2.237548828125, 2.35675048828125, 2.4759521484375, 2.59515380859375, 2.71435546875, 2.83355712890625, 2.9527587890625, 3.07196044921875, 3.191162109375, 3.31036376953125, 3.4295654296875, 3.54876708984375, 3.66796875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 6.0, 8.0, 20.0, 8.0, 17.0, 17.0, 19.0, 17.0, 22.0, 35.0, 34.0, 30.0, 28.0, 27.0, 45.0, 41.0, 38.0, 42.0, 46.0, 47.0, 46.0, 48.0, 37.0, 35.0, 33.0, 30.0, 25.0, 26.0, 25.0, 15.0, 14.0, 25.0, 12.0, 11.0, 15.0, 8.0, 6.0, 10.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-3.001953125, -2.917144775390625, -2.83233642578125, -2.747528076171875, -2.6627197265625, -2.577911376953125, -2.49310302734375, -2.408294677734375, -2.323486328125, -2.238677978515625, -2.15386962890625, -2.069061279296875, -1.9842529296875, -1.899444580078125, -1.81463623046875, -1.729827880859375, -1.64501953125, -1.560211181640625, -1.47540283203125, -1.390594482421875, -1.3057861328125, -1.220977783203125, -1.13616943359375, -1.051361083984375, -0.966552734375, -0.881744384765625, -0.79693603515625, -0.712127685546875, -0.6273193359375, -0.542510986328125, -0.45770263671875, -0.372894287109375, -0.2880859375, -0.203277587890625, -0.11846923828125, -0.033660888671875, 0.0511474609375, 0.135955810546875, 0.22076416015625, 0.305572509765625, 0.390380859375, 0.475189208984375, 0.55999755859375, 0.644805908203125, 0.7296142578125, 0.814422607421875, 0.89923095703125, 0.984039306640625, 1.06884765625, 1.153656005859375, 1.23846435546875, 1.323272705078125, 1.4080810546875, 1.492889404296875, 1.57769775390625, 1.662506103515625, 1.747314453125, 1.832122802734375, 1.91693115234375, 2.001739501953125, 2.0865478515625, 2.171356201171875, 2.25616455078125, 2.340972900390625, 2.42578125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 8.0, 9.0, 10.0, 14.0, 22.0, 37.0, 59.0, 95.0, 156.0, 229.0, 368.0, 632.0, 1048.0, 1678.0, 2989.0, 4879.0, 8361.0, 14414.0, 24605.0, 41530.0, 70503.0, 114969.0, 182533.0, 276418.0, 388676.0, 493568.0, 556288.0, 543229.0, 465485.0, 352585.0, 244396.0, 159170.0, 98947.0, 59869.0, 35533.0, 21016.0, 12207.0, 7221.0, 4212.0, 2483.0, 1440.0, 931.0, 565.0, 346.0, 203.0, 139.0, 82.0, 49.0, 34.0, 19.0, 12.0, 15.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.125, -3.99127197265625, -3.8575439453125, -3.72381591796875, -3.590087890625, -3.45635986328125, -3.3226318359375, -3.18890380859375, -3.05517578125, -2.92144775390625, -2.7877197265625, -2.65399169921875, -2.520263671875, -2.38653564453125, -2.2528076171875, -2.11907958984375, -1.9853515625, -1.85162353515625, -1.7178955078125, -1.58416748046875, -1.450439453125, -1.31671142578125, -1.1829833984375, -1.04925537109375, -0.91552734375, -0.78179931640625, -0.6480712890625, -0.51434326171875, -0.380615234375, -0.24688720703125, -0.1131591796875, 0.02056884765625, 0.154296875, 0.28802490234375, 0.4217529296875, 0.55548095703125, 0.689208984375, 0.82293701171875, 0.9566650390625, 1.09039306640625, 1.22412109375, 1.35784912109375, 1.4915771484375, 1.62530517578125, 1.759033203125, 1.89276123046875, 2.0264892578125, 2.16021728515625, 2.2939453125, 2.42767333984375, 2.5614013671875, 2.69512939453125, 2.828857421875, 2.96258544921875, 3.0963134765625, 3.23004150390625, 3.36376953125, 3.49749755859375, 3.6312255859375, 3.76495361328125, 3.898681640625, 4.03240966796875, 4.1661376953125, 4.29986572265625, 4.43359375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 8.0, 14.0, 30.0, 27.0, 43.0, 43.0, 54.0, 75.0, 67.0, 101.0, 124.0, 117.0, 126.0, 167.0, 202.0, 200.0, 221.0, 210.0, 197.0, 238.0, 218.0, 224.0, 192.0, 184.0, 140.0, 140.0, 149.0, 91.0, 84.0, 81.0, 70.0, 50.0, 49.0, 26.0, 27.0, 19.0, 23.0, 6.0, 13.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2783203125, -1.2288970947265625, -1.179473876953125, -1.1300506591796875, -1.08062744140625, -1.0312042236328125, -0.981781005859375, -0.9323577880859375, -0.8829345703125, -0.8335113525390625, -0.784088134765625, -0.7346649169921875, -0.68524169921875, -0.6358184814453125, -0.586395263671875, -0.5369720458984375, -0.487548828125, -0.4381256103515625, -0.388702392578125, -0.3392791748046875, -0.28985595703125, -0.2404327392578125, -0.191009521484375, -0.1415863037109375, -0.0921630859375, -0.0427398681640625, 0.006683349609375, 0.0561065673828125, 0.10552978515625, 0.1549530029296875, 0.204376220703125, 0.2537994384765625, 0.30322265625, 0.3526458740234375, 0.402069091796875, 0.4514923095703125, 0.50091552734375, 0.5503387451171875, 0.599761962890625, 0.6491851806640625, 0.6986083984375, 0.7480316162109375, 0.797454833984375, 0.8468780517578125, 0.89630126953125, 0.9457244873046875, 0.995147705078125, 1.0445709228515625, 1.093994140625, 1.1434173583984375, 1.192840576171875, 1.2422637939453125, 1.29168701171875, 1.3411102294921875, 1.390533447265625, 1.4399566650390625, 1.4893798828125, 1.5388031005859375, 1.588226318359375, 1.6376495361328125, 1.68707275390625, 1.7364959716796875, 1.785919189453125, 1.8353424072265625, 1.884765625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 8.0, 11.0, 16.0, 25.0, 28.0, 35.0, 43.0, 56.0, 52.0, 45.0, 76.0, 69.0, 52.0, 81.0, 70.0, 64.0, 46.0, 50.0, 38.0, 35.0, 18.0, 18.0, 16.0, 11.0, 14.0, 6.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.525041103363037, -7.306530475616455, -7.088019847869873, -6.869509696960449, -6.650999069213867, -6.432488441467285, -6.213977813720703, -5.995467185974121, -5.776956558227539, -5.558445930480957, -5.339935302734375, -5.121424674987793, -4.902914524078369, -4.684403896331787, -4.465893268585205, -4.247382640838623, -4.028872489929199, -3.810361862182617, -3.5918514728546143, -3.3733408451080322, -3.1548304557800293, -2.9363198280334473, -2.7178092002868652, -2.499298572540283, -2.2807881832122803, -2.0622775554656982, -1.8437671661376953, -1.6252565383911133, -1.4067460298538208, -1.1882355213165283, -0.9697248935699463, -0.7512143850326538, -0.5327038764953613, -0.31419333815574646, -0.09568279981613159, 0.12282776832580566, 0.34133827686309814, 0.5598487854003906, 0.7783594131469727, 0.9968699216842651, 1.2153804302215576, 1.43389093875885, 1.6524014472961426, 1.8709120750427246, 2.0894227027893066, 2.3079330921173096, 2.5264437198638916, 2.7449541091918945, 2.9634647369384766, 3.1819753646850586, 3.4004857540130615, 3.6189963817596436, 3.8375067710876465, 4.0560173988342285, 4.2745280265808105, 4.493038654327393, 4.711548805236816, 4.930059432983398, 5.1485700607299805, 5.3670806884765625, 5.585590839385986, 5.804101467132568, 6.02261209487915, 6.241122722625732, 6.4596333503723145]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 2.0, 4.0, 9.0, 17.0, 21.0, 15.0, 17.0, 25.0, 18.0, 33.0, 28.0, 41.0, 36.0, 47.0, 36.0, 31.0, 52.0, 44.0, 40.0, 31.0, 38.0, 39.0, 49.0, 30.0, 33.0, 37.0, 36.0, 30.0, 25.0, 27.0, 19.0, 11.0, 7.0, 10.0, 15.0, 10.0, 4.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.2437453269958496, -3.1337249279022217, -3.0237045288085938, -2.913684129714966, -2.803663730621338, -2.693643569946289, -2.583623170852661, -2.473602771759033, -2.3635823726654053, -2.2535619735717773, -2.1435415744781494, -2.0335211753845215, -1.923500895500183, -1.8134804964065552, -1.7034602165222168, -1.5934398174285889, -1.483419418334961, -1.373399019241333, -1.263378620147705, -1.1533583402633667, -1.0433379411697388, -0.9333175420761108, -0.8232972025871277, -0.7132768630981445, -0.6032564640045166, -0.49323609471321106, -0.3832157254219055, -0.2731953561306, -0.16317498683929443, -0.053154587745666504, 0.05686575174331665, 0.1668860912322998, 0.27690625190734863, 0.3869266211986542, 0.4969469904899597, 0.6069673299789429, 0.7169877290725708, 0.8270081281661987, 0.9370284676551819, 1.047048807144165, 1.157069206237793, 1.267089605331421, 1.3771100044250488, 1.4871302843093872, 1.5971506834030151, 1.707171082496643, 1.8171913623809814, 1.9272117614746094, 2.0372321605682373, 2.1472525596618652, 2.257272958755493, 2.367293357849121, 2.47731351852417, 2.587334156036377, 2.697354316711426, 2.8073747158050537, 2.9173951148986816, 3.0274155139923096, 3.1374359130859375, 3.2474563121795654, 3.3574767112731934, 3.467496871948242, 3.57751727104187, 3.687537670135498, 3.797558069229126]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 14.0, 19.0, 19.0, 42.0, 59.0, 89.0, 134.0, 195.0, 316.0, 476.0, 790.0, 1198.0, 1976.0, 3092.0, 4945.0, 8095.0, 13430.0, 22004.0, 37261.0, 63627.0, 107084.0, 161663.0, 192177.0, 162352.0, 107838.0, 64436.0, 37737.0, 22365.0, 13381.0, 8121.0, 4981.0, 3191.0, 2054.0, 1238.0, 820.0, 485.0, 303.0, 200.0, 141.0, 81.0, 58.0, 26.0, 24.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.96044921875, -0.9326171875, -0.90478515625, -0.876953125, -0.84912109375, -0.8212890625, -0.79345703125, -0.765625, -0.73779296875, -0.7099609375, -0.68212890625, -0.654296875, -0.62646484375, -0.5986328125, -0.57080078125, -0.54296875, -0.51513671875, -0.4873046875, -0.45947265625, -0.431640625, -0.40380859375, -0.3759765625, -0.34814453125, -0.3203125, -0.29248046875, -0.2646484375, -0.23681640625, -0.208984375, -0.18115234375, -0.1533203125, -0.12548828125, -0.09765625, -0.06982421875, -0.0419921875, -0.01416015625, 0.013671875, 0.04150390625, 0.0693359375, 0.09716796875, 0.125, 0.15283203125, 0.1806640625, 0.20849609375, 0.236328125, 0.26416015625, 0.2919921875, 0.31982421875, 0.34765625, 0.37548828125, 0.4033203125, 0.43115234375, 0.458984375, 0.48681640625, 0.5146484375, 0.54248046875, 0.5703125, 0.59814453125, 0.6259765625, 0.65380859375, 0.681640625, 0.70947265625, 0.7373046875, 0.76513671875, 0.79296875, 0.82080078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 11.0, 13.0, 15.0, 15.0, 26.0, 25.0, 33.0, 37.0, 37.0, 36.0, 47.0, 37.0, 55.0, 46.0, 55.0, 61.0, 51.0, 45.0, 44.0, 35.0, 36.0, 30.0, 41.0, 28.0, 22.0, 27.0, 14.0, 10.0, 15.0, 9.0, 7.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.26776123046875, -4.1292724609375, -3.99078369140625, -3.852294921875, -3.71380615234375, -3.5753173828125, -3.43682861328125, -3.29833984375, -3.15985107421875, -3.0213623046875, -2.88287353515625, -2.744384765625, -2.60589599609375, -2.4674072265625, -2.32891845703125, -2.1904296875, -2.05194091796875, -1.9134521484375, -1.77496337890625, -1.636474609375, -1.49798583984375, -1.3594970703125, -1.22100830078125, -1.08251953125, -0.94403076171875, -0.8055419921875, -0.66705322265625, -0.528564453125, -0.39007568359375, -0.2515869140625, -0.11309814453125, 0.025390625, 0.16387939453125, 0.3023681640625, 0.44085693359375, 0.579345703125, 0.71783447265625, 0.8563232421875, 0.99481201171875, 1.13330078125, 1.27178955078125, 1.4102783203125, 1.54876708984375, 1.687255859375, 1.82574462890625, 1.9642333984375, 2.10272216796875, 2.2412109375, 2.37969970703125, 2.5181884765625, 2.65667724609375, 2.795166015625, 2.93365478515625, 3.0721435546875, 3.21063232421875, 3.34912109375, 3.48760986328125, 3.6260986328125, 3.76458740234375, 3.903076171875, 4.04156494140625, 4.1800537109375, 4.31854248046875, 4.45703125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 10.0, 15.0, 30.0, 39.0, 82.0, 94.0, 139.0, 214.0, 281.0, 513.0, 832.0, 1341.0, 2266.0, 3840.0, 6816.0, 11946.0, 22285.0, 41508.0, 78561.0, 150119.0, 240309.0, 217979.0, 125686.0, 65902.0, 34902.0, 18575.0, 10126.0, 5818.0, 3225.0, 1913.0, 1171.0, 709.0, 443.0, 298.0, 191.0, 138.0, 77.0, 52.0, 28.0, 26.0, 13.0, 14.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1201171875, -1.0838165283203125, -1.047515869140625, -1.0112152099609375, -0.97491455078125, -0.9386138916015625, -0.902313232421875, -0.8660125732421875, -0.8297119140625, -0.7934112548828125, -0.757110595703125, -0.7208099365234375, -0.68450927734375, -0.6482086181640625, -0.611907958984375, -0.5756072998046875, -0.539306640625, -0.5030059814453125, -0.466705322265625, -0.4304046630859375, -0.39410400390625, -0.3578033447265625, -0.321502685546875, -0.2852020263671875, -0.2489013671875, -0.2126007080078125, -0.176300048828125, -0.1399993896484375, -0.10369873046875, -0.0673980712890625, -0.031097412109375, 0.0052032470703125, 0.04150390625, 0.0778045654296875, 0.114105224609375, 0.1504058837890625, 0.18670654296875, 0.2230072021484375, 0.259307861328125, 0.2956085205078125, 0.3319091796875, 0.3682098388671875, 0.404510498046875, 0.4408111572265625, 0.47711181640625, 0.5134124755859375, 0.549713134765625, 0.5860137939453125, 0.622314453125, 0.6586151123046875, 0.694915771484375, 0.7312164306640625, 0.76751708984375, 0.8038177490234375, 0.840118408203125, 0.8764190673828125, 0.9127197265625, 0.9490203857421875, 0.985321044921875, 1.0216217041015625, 1.05792236328125, 1.0942230224609375, 1.130523681640625, 1.1668243408203125, 1.203125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 5.0, 6.0, 8.0, 13.0, 9.0, 13.0, 19.0, 16.0, 15.0, 30.0, 35.0, 20.0, 32.0, 31.0, 35.0, 36.0, 28.0, 34.0, 27.0, 45.0, 47.0, 40.0, 43.0, 37.0, 39.0, 28.0, 43.0, 25.0, 22.0, 19.0, 25.0, 37.0, 28.0, 18.0, 15.0, 10.0, 9.0, 5.0, 6.0, 9.0, 6.0, 5.0, 3.0, 1.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26953125, -2.199859619140625, -2.13018798828125, -2.060516357421875, -1.9908447265625, -1.921173095703125, -1.85150146484375, -1.781829833984375, -1.712158203125, -1.642486572265625, -1.57281494140625, -1.503143310546875, -1.4334716796875, -1.363800048828125, -1.29412841796875, -1.224456787109375, -1.15478515625, -1.085113525390625, -1.01544189453125, -0.945770263671875, -0.8760986328125, -0.806427001953125, -0.73675537109375, -0.667083740234375, -0.597412109375, -0.527740478515625, -0.45806884765625, -0.388397216796875, -0.3187255859375, -0.249053955078125, -0.17938232421875, -0.109710693359375, -0.0400390625, 0.029632568359375, 0.09930419921875, 0.168975830078125, 0.2386474609375, 0.308319091796875, 0.37799072265625, 0.447662353515625, 0.517333984375, 0.587005615234375, 0.65667724609375, 0.726348876953125, 0.7960205078125, 0.865692138671875, 0.93536376953125, 1.005035400390625, 1.07470703125, 1.144378662109375, 1.21405029296875, 1.283721923828125, 1.3533935546875, 1.423065185546875, 1.49273681640625, 1.562408447265625, 1.632080078125, 1.701751708984375, 1.77142333984375, 1.841094970703125, 1.9107666015625, 1.980438232421875, 2.05010986328125, 2.119781494140625, 2.189453125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 8.0, 7.0, 10.0, 11.0, 24.0, 25.0, 31.0, 51.0, 76.0, 99.0, 134.0, 191.0, 266.0, 376.0, 558.0, 839.0, 1275.0, 2005.0, 3338.0, 5778.0, 11617.0, 28478.0, 90759.0, 351628.0, 388276.0, 102456.0, 31215.0, 12868.0, 6309.0, 3409.0, 2130.0, 1370.0, 911.0, 635.0, 402.0, 323.0, 226.0, 128.0, 114.0, 58.0, 47.0, 38.0, 28.0, 11.0, 11.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4755859375, -0.4592132568359375, -0.442840576171875, -0.4264678955078125, -0.41009521484375, -0.3937225341796875, -0.377349853515625, -0.3609771728515625, -0.3446044921875, -0.3282318115234375, -0.311859130859375, -0.2954864501953125, -0.27911376953125, -0.2627410888671875, -0.246368408203125, -0.2299957275390625, -0.213623046875, -0.1972503662109375, -0.180877685546875, -0.1645050048828125, -0.14813232421875, -0.1317596435546875, -0.115386962890625, -0.0990142822265625, -0.0826416015625, -0.0662689208984375, -0.049896240234375, -0.0335235595703125, -0.01715087890625, -0.0007781982421875, 0.015594482421875, 0.0319671630859375, 0.04833984375, 0.0647125244140625, 0.081085205078125, 0.0974578857421875, 0.11383056640625, 0.1302032470703125, 0.146575927734375, 0.1629486083984375, 0.1793212890625, 0.1956939697265625, 0.212066650390625, 0.2284393310546875, 0.24481201171875, 0.2611846923828125, 0.277557373046875, 0.2939300537109375, 0.310302734375, 0.3266754150390625, 0.343048095703125, 0.3594207763671875, 0.37579345703125, 0.3921661376953125, 0.408538818359375, 0.4249114990234375, 0.4412841796875, 0.4576568603515625, 0.474029541015625, 0.4904022216796875, 0.50677490234375, 0.5231475830078125, 0.539520263671875, 0.5558929443359375, 0.572265625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 11.0, 15.0, 9.0, 17.0, 21.0, 31.0, 31.0, 37.0, 46.0, 54.0, 60.0, 68.0, 65.0, 64.0, 66.0, 57.0, 57.0, 52.0, 45.0, 45.0, 19.0, 18.0, 22.0, 14.0, 14.0, 12.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.193450927734375e-05, -2.1202489733695984e-05, -2.0470470190048218e-05, -1.973845064640045e-05, -1.9006431102752686e-05, -1.827441155910492e-05, -1.7542392015457153e-05, -1.6810372471809387e-05, -1.607835292816162e-05, -1.5346333384513855e-05, -1.4614313840866089e-05, -1.3882294297218323e-05, -1.3150274753570557e-05, -1.241825520992279e-05, -1.1686235666275024e-05, -1.0954216122627258e-05, -1.0222196578979492e-05, -9.490177035331726e-06, -8.75815749168396e-06, -8.026137948036194e-06, -7.294118404388428e-06, -6.562098860740662e-06, -5.8300793170928955e-06, -5.098059773445129e-06, -4.366040229797363e-06, -3.634020686149597e-06, -2.902001142501831e-06, -2.169981598854065e-06, -1.4379620552062988e-06, -7.059425115585327e-07, 2.60770320892334e-08, 7.580965757369995e-07, 1.4901161193847656e-06, 2.2221356630325317e-06, 2.954155206680298e-06, 3.686174750328064e-06, 4.41819429397583e-06, 5.150213837623596e-06, 5.882233381271362e-06, 6.614252924919128e-06, 7.3462724685668945e-06, 8.07829201221466e-06, 8.810311555862427e-06, 9.542331099510193e-06, 1.0274350643157959e-05, 1.1006370186805725e-05, 1.1738389730453491e-05, 1.2470409274101257e-05, 1.3202428817749023e-05, 1.393444836139679e-05, 1.4666467905044556e-05, 1.5398487448692322e-05, 1.6130506992340088e-05, 1.6862526535987854e-05, 1.759454607963562e-05, 1.8326565623283386e-05, 1.9058585166931152e-05, 1.979060471057892e-05, 2.0522624254226685e-05, 2.125464379787445e-05, 2.1986663341522217e-05, 2.2718682885169983e-05, 2.345070242881775e-05, 2.4182721972465515e-05, 2.491474151611328e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 4.0, 10.0, 6.0, 23.0, 27.0, 36.0, 47.0, 71.0, 102.0, 135.0, 170.0, 222.0, 336.0, 443.0, 728.0, 967.0, 1485.0, 2247.0, 3610.0, 6058.0, 10621.0, 21170.0, 45270.0, 112743.0, 288730.0, 320100.0, 129034.0, 51392.0, 23140.0, 11718.0, 6487.0, 3885.0, 2497.0, 1528.0, 1038.0, 758.0, 481.0, 337.0, 251.0, 184.0, 115.0, 107.0, 65.0, 44.0, 34.0, 26.0, 24.0, 15.0, 5.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 4.0], "bins": [-0.54931640625, -0.5321884155273438, -0.5150604248046875, -0.49793243408203125, -0.480804443359375, -0.46367645263671875, -0.4465484619140625, -0.42942047119140625, -0.41229248046875, -0.39516448974609375, -0.3780364990234375, -0.36090850830078125, -0.343780517578125, -0.32665252685546875, -0.3095245361328125, -0.29239654541015625, -0.2752685546875, -0.25814056396484375, -0.2410125732421875, -0.22388458251953125, -0.206756591796875, -0.18962860107421875, -0.1725006103515625, -0.15537261962890625, -0.13824462890625, -0.12111663818359375, -0.1039886474609375, -0.08686065673828125, -0.069732666015625, -0.05260467529296875, -0.0354766845703125, -0.01834869384765625, -0.001220703125, 0.01590728759765625, 0.0330352783203125, 0.05016326904296875, 0.067291259765625, 0.08441925048828125, 0.1015472412109375, 0.11867523193359375, 0.13580322265625, 0.15293121337890625, 0.1700592041015625, 0.18718719482421875, 0.204315185546875, 0.22144317626953125, 0.2385711669921875, 0.25569915771484375, 0.2728271484375, 0.28995513916015625, 0.3070831298828125, 0.32421112060546875, 0.341339111328125, 0.35846710205078125, 0.3755950927734375, 0.39272308349609375, 0.40985107421875, 0.42697906494140625, 0.4441070556640625, 0.46123504638671875, 0.478363037109375, 0.49549102783203125, 0.5126190185546875, 0.5297470092773438, 0.546875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 7.0, 9.0, 11.0, 18.0, 17.0, 14.0, 19.0, 32.0, 41.0, 57.0, 77.0, 66.0, 87.0, 90.0, 77.0, 73.0, 50.0, 51.0, 32.0, 24.0, 31.0, 21.0, 16.0, 19.0, 15.0, 9.0, 5.0, 1.0, 5.0, 9.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.130859375, -0.1275463104248047, -0.12423324584960938, -0.12092018127441406, -0.11760711669921875, -0.11429405212402344, -0.11098098754882812, -0.10766792297363281, -0.1043548583984375, -0.10104179382324219, -0.09772872924804688, -0.09441566467285156, -0.09110260009765625, -0.08778953552246094, -0.08447647094726562, -0.08116340637207031, -0.077850341796875, -0.07453727722167969, -0.07122421264648438, -0.06791114807128906, -0.06459808349609375, -0.06128501892089844, -0.057971954345703125, -0.05465888977050781, -0.0513458251953125, -0.04803276062011719, -0.044719696044921875, -0.04140663146972656, -0.03809356689453125, -0.03478050231933594, -0.031467437744140625, -0.028154373168945312, -0.02484130859375, -0.021528244018554688, -0.018215179443359375, -0.014902114868164062, -0.01158905029296875, -0.008275985717773438, -0.004962921142578125, -0.0016498565673828125, 0.0016632080078125, 0.0049762725830078125, 0.008289337158203125, 0.011602401733398438, 0.01491546630859375, 0.018228530883789062, 0.021541595458984375, 0.024854660034179688, 0.028167724609375, 0.03148078918457031, 0.034793853759765625, 0.03810691833496094, 0.04141998291015625, 0.04473304748535156, 0.048046112060546875, 0.05135917663574219, 0.0546722412109375, 0.05798530578613281, 0.061298370361328125, 0.06461143493652344, 0.06792449951171875, 0.07123756408691406, 0.07455062866210938, 0.07786369323730469, 0.0811767578125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 5.0, 6.0, 12.0, 14.0, 20.0, 31.0, 35.0, 41.0, 50.0, 52.0, 54.0, 68.0, 69.0, 60.0, 68.0, 76.0, 65.0, 56.0, 40.0, 41.0, 37.0, 27.0, 13.0, 19.0, 9.0, 11.0, 11.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.616769790649414, -7.39704704284668, -7.177323818206787, -6.9576005935668945, -6.73787784576416, -6.518155097961426, -6.298431873321533, -6.078708648681641, -5.858985900878906, -5.639263153076172, -5.419539928436279, -5.199816703796387, -4.980093955993652, -4.760371208190918, -4.540647983551025, -4.320924758911133, -4.101202011108398, -3.881479024887085, -3.6617560386657715, -3.442033052444458, -3.2223100662231445, -3.002587080001831, -2.7828640937805176, -2.563141107559204, -2.3434181213378906, -2.123695135116577, -1.9039721488952637, -1.6842491626739502, -1.4645261764526367, -1.2448031902313232, -1.0250802040100098, -0.8053572177886963, -0.5856342315673828, -0.36591124534606934, -0.14618825912475586, 0.07353472709655762, 0.2932577133178711, 0.5129806995391846, 0.732703685760498, 0.9524266719818115, 1.172149658203125, 1.3918726444244385, 1.611595630645752, 1.8313186168670654, 2.051041603088379, 2.2707645893096924, 2.490487575531006, 2.7102105617523193, 2.929933547973633, 3.1496565341949463, 3.3693795204162598, 3.5891025066375732, 3.8088254928588867, 4.028548240661621, 4.248271465301514, 4.467994689941406, 4.687717437744141, 4.907440185546875, 5.127163410186768, 5.34688663482666, 5.5666093826293945, 5.786332130432129, 6.0060553550720215, 6.225778579711914, 6.445501327514648]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 2.0, 12.0, 14.0, 23.0, 12.0, 18.0, 26.0, 16.0, 34.0, 34.0, 39.0, 37.0, 43.0, 35.0, 34.0, 48.0, 49.0, 41.0, 25.0, 41.0, 42.0, 44.0, 32.0, 32.0, 35.0, 37.0, 29.0, 30.0, 23.0, 19.0, 11.0, 7.0, 12.0, 13.0, 9.0, 5.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.230863571166992, -3.121060609817505, -3.0112578868865967, -2.9014549255371094, -2.791652202606201, -2.681849241256714, -2.5720462799072266, -2.4622435569763184, -2.35244083404541, -2.242637872695923, -2.1328351497650146, -2.0230321884155273, -1.9132294654846191, -1.8034265041351318, -1.693623661994934, -1.5838208198547363, -1.474017858505249, -1.3642150163650513, -1.2544121742248535, -1.1446092128753662, -1.034806489944458, -0.9250035881996155, -0.815200686454773, -0.7053978443145752, -0.5955950021743774, -0.4857921600341797, -0.37598928809165955, -0.2661864161491394, -0.15638357400894165, -0.046580731868743896, 0.06322216987609863, 0.1730250120162964, 0.28282785415649414, 0.3926306962966919, 0.5024335384368896, 0.6122364401817322, 0.7220392823219299, 0.8318421244621277, 0.9416450262069702, 1.051447868347168, 1.1612507104873657, 1.2710535526275635, 1.3808563947677612, 1.490659236907959, 1.6004621982574463, 1.7102649211883545, 1.8200678825378418, 1.9298707246780396, 2.0396735668182373, 2.1494765281677246, 2.259279251098633, 2.36908221244812, 2.4788849353790283, 2.5886878967285156, 2.698490619659424, 2.808293581008911, 2.9180965423583984, 3.0278995037078857, 3.137702226638794, 3.2475051879882812, 3.3573079109191895, 3.4671108722686768, 3.576913833618164, 3.6867165565490723, 3.7965192794799805]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 11.0, 22.0, 25.0, 43.0, 69.0, 95.0, 174.0, 260.0, 445.0, 682.0, 1240.0, 2022.0, 3221.0, 5268.0, 8272.0, 12837.0, 19940.0, 29628.0, 42655.0, 59229.0, 78340.0, 96053.0, 109490.0, 113750.0, 108322.0, 95251.0, 77657.0, 59056.0, 42160.0, 29371.0, 19103.0, 12527.0, 8060.0, 5005.0, 3253.0, 1991.0, 1159.0, 727.0, 435.0, 275.0, 161.0, 107.0, 60.0, 45.0, 24.0, 18.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.775390625, -2.684326171875, -2.59326171875, -2.502197265625, -2.4111328125, -2.320068359375, -2.22900390625, -2.137939453125, -2.046875, -1.955810546875, -1.86474609375, -1.773681640625, -1.6826171875, -1.591552734375, -1.50048828125, -1.409423828125, -1.318359375, -1.227294921875, -1.13623046875, -1.045166015625, -0.9541015625, -0.863037109375, -0.77197265625, -0.680908203125, -0.58984375, -0.498779296875, -0.40771484375, -0.316650390625, -0.2255859375, -0.134521484375, -0.04345703125, 0.047607421875, 0.138671875, 0.229736328125, 0.32080078125, 0.411865234375, 0.5029296875, 0.593994140625, 0.68505859375, 0.776123046875, 0.8671875, 0.958251953125, 1.04931640625, 1.140380859375, 1.2314453125, 1.322509765625, 1.41357421875, 1.504638671875, 1.595703125, 1.686767578125, 1.77783203125, 1.868896484375, 1.9599609375, 2.051025390625, 2.14208984375, 2.233154296875, 2.32421875, 2.415283203125, 2.50634765625, 2.597412109375, 2.6884765625, 2.779541015625, 2.87060546875, 2.961669921875, 3.052734375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 6.0, 9.0, 17.0, 29.0, 16.0, 16.0, 40.0, 46.0, 44.0, 32.0, 48.0, 48.0, 51.0, 46.0, 45.0, 42.0, 50.0, 56.0, 50.0, 43.0, 22.0, 43.0, 28.0, 31.0, 23.0, 19.0, 17.0, 12.0, 12.0, 10.0, 7.0, 2.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.748046875, -3.613006591796875, -3.47796630859375, -3.342926025390625, -3.2078857421875, -3.072845458984375, -2.93780517578125, -2.802764892578125, -2.667724609375, -2.532684326171875, -2.39764404296875, -2.262603759765625, -2.1275634765625, -1.992523193359375, -1.85748291015625, -1.722442626953125, -1.58740234375, -1.452362060546875, -1.31732177734375, -1.182281494140625, -1.0472412109375, -0.912200927734375, -0.77716064453125, -0.642120361328125, -0.507080078125, -0.372039794921875, -0.23699951171875, -0.101959228515625, 0.0330810546875, 0.168121337890625, 0.30316162109375, 0.438201904296875, 0.5732421875, 0.708282470703125, 0.84332275390625, 0.978363037109375, 1.1134033203125, 1.248443603515625, 1.38348388671875, 1.518524169921875, 1.653564453125, 1.788604736328125, 1.92364501953125, 2.058685302734375, 2.1937255859375, 2.328765869140625, 2.46380615234375, 2.598846435546875, 2.73388671875, 2.868927001953125, 3.00396728515625, 3.139007568359375, 3.2740478515625, 3.409088134765625, 3.54412841796875, 3.679168701171875, 3.814208984375, 3.949249267578125, 4.08428955078125, 4.219329833984375, 4.3543701171875, 4.489410400390625, 4.62445068359375, 4.759490966796875, 4.89453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 22.0, 25.0, 44.0, 53.0, 93.0, 164.0, 272.0, 409.0, 676.0, 1026.0, 1577.0, 2641.0, 3896.0, 5932.0, 8846.0, 13207.0, 19395.0, 27378.0, 37650.0, 50450.0, 64504.0, 78451.0, 89753.0, 97555.0, 98737.0, 94237.0, 83179.0, 70206.0, 55977.0, 42787.0, 31124.0, 22390.0, 15389.0, 10543.0, 7179.0, 4590.0, 2894.0, 1930.0, 1243.0, 778.0, 503.0, 317.0, 207.0, 129.0, 67.0, 55.0, 32.0, 17.0, 14.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.55859375, -2.476593017578125, -2.39459228515625, -2.312591552734375, -2.2305908203125, -2.148590087890625, -2.06658935546875, -1.984588623046875, -1.902587890625, -1.820587158203125, -1.73858642578125, -1.656585693359375, -1.5745849609375, -1.492584228515625, -1.41058349609375, -1.328582763671875, -1.24658203125, -1.164581298828125, -1.08258056640625, -1.000579833984375, -0.9185791015625, -0.836578369140625, -0.75457763671875, -0.672576904296875, -0.590576171875, -0.508575439453125, -0.42657470703125, -0.344573974609375, -0.2625732421875, -0.180572509765625, -0.09857177734375, -0.016571044921875, 0.0654296875, 0.147430419921875, 0.22943115234375, 0.311431884765625, 0.3934326171875, 0.475433349609375, 0.55743408203125, 0.639434814453125, 0.721435546875, 0.803436279296875, 0.88543701171875, 0.967437744140625, 1.0494384765625, 1.131439208984375, 1.21343994140625, 1.295440673828125, 1.37744140625, 1.459442138671875, 1.54144287109375, 1.623443603515625, 1.7054443359375, 1.787445068359375, 1.86944580078125, 1.951446533203125, 2.033447265625, 2.115447998046875, 2.19744873046875, 2.279449462890625, 2.3614501953125, 2.443450927734375, 2.52545166015625, 2.607452392578125, 2.689453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 9.0, 6.0, 19.0, 13.0, 5.0, 15.0, 16.0, 12.0, 24.0, 33.0, 30.0, 37.0, 37.0, 40.0, 33.0, 33.0, 44.0, 42.0, 45.0, 48.0, 30.0, 32.0, 50.0, 29.0, 36.0, 30.0, 33.0, 37.0, 18.0, 24.0, 23.0, 13.0, 12.0, 12.0, 21.0, 7.0, 7.0, 2.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.369140625, -2.29925537109375, -2.2293701171875, -2.15948486328125, -2.089599609375, -2.01971435546875, -1.9498291015625, -1.87994384765625, -1.81005859375, -1.74017333984375, -1.6702880859375, -1.60040283203125, -1.530517578125, -1.46063232421875, -1.3907470703125, -1.32086181640625, -1.2509765625, -1.18109130859375, -1.1112060546875, -1.04132080078125, -0.971435546875, -0.90155029296875, -0.8316650390625, -0.76177978515625, -0.69189453125, -0.62200927734375, -0.5521240234375, -0.48223876953125, -0.412353515625, -0.34246826171875, -0.2725830078125, -0.20269775390625, -0.1328125, -0.06292724609375, 0.0069580078125, 0.07684326171875, 0.146728515625, 0.21661376953125, 0.2864990234375, 0.35638427734375, 0.42626953125, 0.49615478515625, 0.5660400390625, 0.63592529296875, 0.705810546875, 0.77569580078125, 0.8455810546875, 0.91546630859375, 0.9853515625, 1.05523681640625, 1.1251220703125, 1.19500732421875, 1.264892578125, 1.33477783203125, 1.4046630859375, 1.47454833984375, 1.54443359375, 1.61431884765625, 1.6842041015625, 1.75408935546875, 1.823974609375, 1.89385986328125, 1.9637451171875, 2.03363037109375, 2.103515625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 7.0, 13.0, 15.0, 20.0, 26.0, 28.0, 55.0, 86.0, 133.0, 174.0, 268.0, 449.0, 684.0, 1195.0, 1983.0, 3640.0, 6910.0, 14771.0, 34858.0, 82666.0, 174883.0, 262656.0, 232058.0, 128495.0, 56298.0, 23676.0, 10475.0, 5195.0, 2636.0, 1538.0, 959.0, 583.0, 396.0, 220.0, 179.0, 116.0, 77.0, 37.0, 38.0, 18.0, 14.0, 9.0, 7.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.71484375, -3.590087890625, -3.46533203125, -3.340576171875, -3.2158203125, -3.091064453125, -2.96630859375, -2.841552734375, -2.716796875, -2.592041015625, -2.46728515625, -2.342529296875, -2.2177734375, -2.093017578125, -1.96826171875, -1.843505859375, -1.71875, -1.593994140625, -1.46923828125, -1.344482421875, -1.2197265625, -1.094970703125, -0.97021484375, -0.845458984375, -0.720703125, -0.595947265625, -0.47119140625, -0.346435546875, -0.2216796875, -0.096923828125, 0.02783203125, 0.152587890625, 0.27734375, 0.402099609375, 0.52685546875, 0.651611328125, 0.7763671875, 0.901123046875, 1.02587890625, 1.150634765625, 1.275390625, 1.400146484375, 1.52490234375, 1.649658203125, 1.7744140625, 1.899169921875, 2.02392578125, 2.148681640625, 2.2734375, 2.398193359375, 2.52294921875, 2.647705078125, 2.7724609375, 2.897216796875, 3.02197265625, 3.146728515625, 3.271484375, 3.396240234375, 3.52099609375, 3.645751953125, 3.7705078125, 3.895263671875, 4.02001953125, 4.144775390625, 4.26953125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 2.0, 6.0, 8.0, 18.0, 25.0, 25.0, 41.0, 36.0, 48.0, 63.0, 92.0, 85.0, 83.0, 86.0, 76.0, 75.0, 46.0, 44.0, 31.0, 29.0, 16.0, 23.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0003840923309326172, -0.00037321075797080994, -0.0003623291850090027, -0.00035144761204719543, -0.0003405660390853882, -0.00032968446612358093, -0.0003188028931617737, -0.00030792132019996643, -0.0002970397472381592, -0.00028615817427635193, -0.0002752766013145447, -0.0002643950283527374, -0.0002535134553909302, -0.00024263188242912292, -0.00023175030946731567, -0.00022086873650550842, -0.00020998716354370117, -0.00019910559058189392, -0.00018822401762008667, -0.00017734244465827942, -0.00016646087169647217, -0.00015557929873466492, -0.00014469772577285767, -0.00013381615281105042, -0.00012293457984924316, -0.00011205300688743591, -0.00010117143392562866, -9.028986096382141e-05, -7.940828800201416e-05, -6.852671504020691e-05, -5.764514207839966e-05, -4.676356911659241e-05, -3.5881996154785156e-05, -2.5000423192977905e-05, -1.4118850231170654e-05, -3.2372772693634033e-06, 7.644295692443848e-06, 1.85258686542511e-05, 2.940744161605835e-05, 4.02890145778656e-05, 5.117058753967285e-05, 6.20521605014801e-05, 7.293373346328735e-05, 8.38153064250946e-05, 9.469687938690186e-05, 0.0001055784523487091, 0.00011646002531051636, 0.0001273415982723236, 0.00013822317123413086, 0.0001491047441959381, 0.00015998631715774536, 0.0001708678901195526, 0.00018174946308135986, 0.00019263103604316711, 0.00020351260900497437, 0.00021439418196678162, 0.00022527575492858887, 0.00023615732789039612, 0.00024703890085220337, 0.0002579204738140106, 0.00026880204677581787, 0.0002796836197376251, 0.0002905651926994324, 0.0003014467656612396, 0.0003123283386230469]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 7.0, 11.0, 10.0, 14.0, 25.0, 25.0, 45.0, 55.0, 81.0, 135.0, 163.0, 228.0, 333.0, 493.0, 893.0, 1512.0, 2795.0, 5233.0, 10672.0, 23085.0, 48944.0, 100242.0, 176747.0, 229989.0, 200991.0, 124664.0, 62886.0, 29694.0, 13782.0, 6654.0, 3373.0, 1798.0, 1043.0, 604.0, 416.0, 283.0, 186.0, 121.0, 98.0, 68.0, 43.0, 30.0, 13.0, 11.0, 22.0, 10.0, 15.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.306640625, -3.198822021484375, -3.09100341796875, -2.983184814453125, -2.8753662109375, -2.767547607421875, -2.65972900390625, -2.551910400390625, -2.444091796875, -2.336273193359375, -2.22845458984375, -2.120635986328125, -2.0128173828125, -1.904998779296875, -1.79718017578125, -1.689361572265625, -1.58154296875, -1.473724365234375, -1.36590576171875, -1.258087158203125, -1.1502685546875, -1.042449951171875, -0.93463134765625, -0.826812744140625, -0.718994140625, -0.611175537109375, -0.50335693359375, -0.395538330078125, -0.2877197265625, -0.179901123046875, -0.07208251953125, 0.035736083984375, 0.1435546875, 0.251373291015625, 0.35919189453125, 0.467010498046875, 0.5748291015625, 0.682647705078125, 0.79046630859375, 0.898284912109375, 1.006103515625, 1.113922119140625, 1.22174072265625, 1.329559326171875, 1.4373779296875, 1.545196533203125, 1.65301513671875, 1.760833740234375, 1.86865234375, 1.976470947265625, 2.08428955078125, 2.192108154296875, 2.2999267578125, 2.407745361328125, 2.51556396484375, 2.623382568359375, 2.731201171875, 2.839019775390625, 2.94683837890625, 3.054656982421875, 3.1624755859375, 3.270294189453125, 3.37811279296875, 3.485931396484375, 3.59375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 5.0, 4.0, 6.0, 17.0, 18.0, 22.0, 26.0, 45.0, 46.0, 44.0, 42.0, 43.0, 52.0, 47.0, 66.0, 59.0, 65.0, 46.0, 50.0, 44.0, 32.0, 39.0, 33.0, 32.0, 31.0, 18.0, 13.0, 17.0, 7.0, 3.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.732421875, -0.71142578125, -0.6904296875, -0.66943359375, -0.6484375, -0.62744140625, -0.6064453125, -0.58544921875, -0.564453125, -0.54345703125, -0.5224609375, -0.50146484375, -0.48046875, -0.45947265625, -0.4384765625, -0.41748046875, -0.396484375, -0.37548828125, -0.3544921875, -0.33349609375, -0.3125, -0.29150390625, -0.2705078125, -0.24951171875, -0.228515625, -0.20751953125, -0.1865234375, -0.16552734375, -0.14453125, -0.12353515625, -0.1025390625, -0.08154296875, -0.060546875, -0.03955078125, -0.0185546875, 0.00244140625, 0.0234375, 0.04443359375, 0.0654296875, 0.08642578125, 0.107421875, 0.12841796875, 0.1494140625, 0.17041015625, 0.19140625, 0.21240234375, 0.2333984375, 0.25439453125, 0.275390625, 0.29638671875, 0.3173828125, 0.33837890625, 0.359375, 0.38037109375, 0.4013671875, 0.42236328125, 0.443359375, 0.46435546875, 0.4853515625, 0.50634765625, 0.52734375, 0.54833984375, 0.5693359375, 0.59033203125, 0.611328125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 14.0, 23.0, 34.0, 39.0, 38.0, 55.0, 68.0, 65.0, 74.0, 84.0, 50.0, 70.0, 74.0, 62.0, 48.0, 43.0, 43.0, 20.0, 17.0, 18.0, 11.0, 16.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28854751586914, -8.052145957946777, -7.815743923187256, -7.579342365264893, -7.342940330505371, -7.106538772583008, -6.8701372146606445, -6.633735656738281, -6.39733362197876, -6.1609320640563965, -5.924530029296875, -5.688128471374512, -5.451726913452148, -5.215324878692627, -4.978923320770264, -4.742521286010742, -4.506119728088379, -4.269718170166016, -4.033316135406494, -3.796914577484131, -3.5605127811431885, -3.324110984802246, -3.087709426879883, -2.8513076305389404, -2.614905834197998, -2.3785040378570557, -2.1421022415161133, -1.90570068359375, -1.6692988872528076, -1.4328970909118652, -1.1964954137802124, -0.9600937366485596, -0.7236919403076172, -0.4872902035713196, -0.250888466835022, -0.014486730098724365, 0.22191500663757324, 0.4583168029785156, 0.6947184801101685, 0.9311201572418213, 1.1675219535827637, 1.403923749923706, 1.6403254270553589, 1.8767271041870117, 2.113128900527954, 2.3495306968688965, 2.5859322547912598, 2.822334051132202, 3.0587358474731445, 3.295137643814087, 3.5315394401550293, 3.7679409980773926, 4.004343032836914, 4.240744590759277, 4.477146148681641, 4.713547706604004, 4.949949741363525, 5.186351299285889, 5.42275333404541, 5.659154891967773, 5.895556449890137, 6.131958484649658, 6.3683600425720215, 6.604762077331543, 6.841163635253906]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 6.0, 10.0, 6.0, 10.0, 12.0, 9.0, 9.0, 18.0, 16.0, 16.0, 17.0, 33.0, 39.0, 34.0, 24.0, 38.0, 34.0, 44.0, 45.0, 39.0, 44.0, 31.0, 31.0, 26.0, 36.0, 38.0, 43.0, 41.0, 32.0, 23.0, 27.0, 20.0, 23.0, 28.0, 22.0, 10.0, 16.0, 10.0, 8.0, 8.0, 6.0, 5.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.3707821369171143, -3.2623131275177, -3.153844118118286, -3.045374870300293, -2.936905860900879, -2.828436851501465, -2.719967842102051, -2.6114988327026367, -2.5030298233032227, -2.3945608139038086, -2.2860918045043945, -2.1776227951049805, -2.0691535472869873, -1.9606845378875732, -1.8522155284881592, -1.7437465190887451, -1.635277271270752, -1.526808261871338, -1.4183391332626343, -1.3098701238632202, -1.2014009952545166, -1.0929319858551025, -0.9844629764556885, -0.8759939074516296, -0.7675248384475708, -0.659055769443512, -0.5505867004394531, -0.44211769104003906, -0.3336486220359802, -0.2251795530319214, -0.11671054363250732, -0.008241474628448486, 0.10022759437561035, 0.208696648478508, 0.31716570258140564, 0.4256347417831421, 0.5341038107872009, 0.6425728797912598, 0.7510418891906738, 0.8595109581947327, 0.9679800271987915, 1.0764490365982056, 1.1849181652069092, 1.2933871746063232, 1.4018561840057373, 1.510325312614441, 1.618794322013855, 1.7272634506225586, 1.8357324600219727, 1.9442014694213867, 2.052670478820801, 2.161139488220215, 2.269608736038208, 2.378077745437622, 2.486546754837036, 2.59501576423645, 2.7034850120544434, 2.8119540214538574, 2.9204230308532715, 3.0288920402526855, 3.1373612880706787, 3.2458302974700928, 3.354299306869507, 3.462768316268921, 3.571237325668335]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [6.0, 0.0, 1.0, 3.0, 0.0, 9.0, 6.0, 9.0, 25.0, 27.0, 41.0, 52.0, 99.0, 121.0, 216.0, 328.0, 474.0, 882.0, 1294.0, 2005.0, 3441.0, 5669.0, 9781.0, 16293.0, 27603.0, 47054.0, 79282.0, 131984.0, 210585.0, 318324.0, 441944.0, 545218.0, 584554.0, 532190.0, 423579.0, 300194.0, 198935.0, 125002.0, 75818.0, 45473.0, 26579.0, 15924.0, 9238.0, 5714.0, 3298.0, 1901.0, 1201.0, 707.0, 416.0, 288.0, 200.0, 109.0, 68.0, 44.0, 35.0, 21.0, 11.0, 15.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-4.5234375, -4.38397216796875, -4.2445068359375, -4.10504150390625, -3.965576171875, -3.82611083984375, -3.6866455078125, -3.54718017578125, -3.40771484375, -3.26824951171875, -3.1287841796875, -2.98931884765625, -2.849853515625, -2.71038818359375, -2.5709228515625, -2.43145751953125, -2.2919921875, -2.15252685546875, -2.0130615234375, -1.87359619140625, -1.734130859375, -1.59466552734375, -1.4552001953125, -1.31573486328125, -1.17626953125, -1.03680419921875, -0.8973388671875, -0.75787353515625, -0.618408203125, -0.47894287109375, -0.3394775390625, -0.20001220703125, -0.060546875, 0.07891845703125, 0.2183837890625, 0.35784912109375, 0.497314453125, 0.63677978515625, 0.7762451171875, 0.91571044921875, 1.05517578125, 1.19464111328125, 1.3341064453125, 1.47357177734375, 1.613037109375, 1.75250244140625, 1.8919677734375, 2.03143310546875, 2.1708984375, 2.31036376953125, 2.4498291015625, 2.58929443359375, 2.728759765625, 2.86822509765625, 3.0076904296875, 3.14715576171875, 3.28662109375, 3.42608642578125, 3.5655517578125, 3.70501708984375, 3.844482421875, 3.98394775390625, 4.1234130859375, 4.26287841796875, 4.40234375]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 8.0, 9.0, 4.0, 4.0, 6.0, 12.0, 21.0, 8.0, 18.0, 31.0, 22.0, 27.0, 31.0, 42.0, 39.0, 54.0, 34.0, 48.0, 45.0, 43.0, 43.0, 51.0, 47.0, 48.0, 47.0, 23.0, 35.0, 33.0, 28.0, 27.0, 19.0, 21.0, 14.0, 14.0, 11.0, 5.0, 3.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.392578125, -3.288726806640625, -3.18487548828125, -3.081024169921875, -2.9771728515625, -2.873321533203125, -2.76947021484375, -2.665618896484375, -2.561767578125, -2.457916259765625, -2.35406494140625, -2.250213623046875, -2.1463623046875, -2.042510986328125, -1.93865966796875, -1.834808349609375, -1.73095703125, -1.627105712890625, -1.52325439453125, -1.419403076171875, -1.3155517578125, -1.211700439453125, -1.10784912109375, -1.003997802734375, -0.900146484375, -0.796295166015625, -0.69244384765625, -0.588592529296875, -0.4847412109375, -0.380889892578125, -0.27703857421875, -0.173187255859375, -0.0693359375, 0.034515380859375, 0.13836669921875, 0.242218017578125, 0.3460693359375, 0.449920654296875, 0.55377197265625, 0.657623291015625, 0.761474609375, 0.865325927734375, 0.96917724609375, 1.073028564453125, 1.1768798828125, 1.280731201171875, 1.38458251953125, 1.488433837890625, 1.59228515625, 1.696136474609375, 1.79998779296875, 1.903839111328125, 2.0076904296875, 2.111541748046875, 2.21539306640625, 2.319244384765625, 2.423095703125, 2.526947021484375, 2.63079833984375, 2.734649658203125, 2.8385009765625, 2.942352294921875, 3.04620361328125, 3.150054931640625, 3.25390625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 15.0, 28.0, 35.0, 44.0, 71.0, 132.0, 242.0, 404.0, 631.0, 1063.0, 1805.0, 3135.0, 5428.0, 9313.0, 15919.0, 27559.0, 46356.0, 77730.0, 125361.0, 194659.0, 287766.0, 390683.0, 486410.0, 534112.0, 521570.0, 448837.0, 349057.0, 245463.0, 163810.0, 103338.0, 63193.0, 37409.0, 21834.0, 12803.0, 7622.0, 4385.0, 2514.0, 1457.0, 845.0, 483.0, 311.0, 180.0, 115.0, 61.0, 34.0, 32.0, 6.0, 8.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.04296875, -4.89373779296875, -4.7445068359375, -4.59527587890625, -4.446044921875, -4.29681396484375, -4.1475830078125, -3.99835205078125, -3.84912109375, -3.69989013671875, -3.5506591796875, -3.40142822265625, -3.252197265625, -3.10296630859375, -2.9537353515625, -2.80450439453125, -2.6552734375, -2.50604248046875, -2.3568115234375, -2.20758056640625, -2.058349609375, -1.90911865234375, -1.7598876953125, -1.61065673828125, -1.46142578125, -1.31219482421875, -1.1629638671875, -1.01373291015625, -0.864501953125, -0.71527099609375, -0.5660400390625, -0.41680908203125, -0.267578125, -0.11834716796875, 0.0308837890625, 0.18011474609375, 0.329345703125, 0.47857666015625, 0.6278076171875, 0.77703857421875, 0.92626953125, 1.07550048828125, 1.2247314453125, 1.37396240234375, 1.523193359375, 1.67242431640625, 1.8216552734375, 1.97088623046875, 2.1201171875, 2.26934814453125, 2.4185791015625, 2.56781005859375, 2.717041015625, 2.86627197265625, 3.0155029296875, 3.16473388671875, 3.31396484375, 3.46319580078125, 3.6124267578125, 3.76165771484375, 3.910888671875, 4.06011962890625, 4.2093505859375, 4.35858154296875, 4.5078125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 5.0, 11.0, 9.0, 14.0, 14.0, 21.0, 30.0, 36.0, 43.0, 66.0, 72.0, 77.0, 80.0, 92.0, 111.0, 135.0, 148.0, 157.0, 171.0, 177.0, 182.0, 200.0, 184.0, 204.0, 190.0, 191.0, 179.0, 176.0, 143.0, 138.0, 121.0, 125.0, 103.0, 94.0, 68.0, 50.0, 41.0, 47.0, 36.0, 28.0, 24.0, 20.0, 22.0, 10.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6611328125, -1.611419677734375, -1.56170654296875, -1.511993408203125, -1.4622802734375, -1.412567138671875, -1.36285400390625, -1.313140869140625, -1.263427734375, -1.213714599609375, -1.16400146484375, -1.114288330078125, -1.0645751953125, -1.014862060546875, -0.96514892578125, -0.915435791015625, -0.86572265625, -0.816009521484375, -0.76629638671875, -0.716583251953125, -0.6668701171875, -0.617156982421875, -0.56744384765625, -0.517730712890625, -0.468017578125, -0.418304443359375, -0.36859130859375, -0.318878173828125, -0.2691650390625, -0.219451904296875, -0.16973876953125, -0.120025634765625, -0.0703125, -0.020599365234375, 0.02911376953125, 0.078826904296875, 0.1285400390625, 0.178253173828125, 0.22796630859375, 0.277679443359375, 0.327392578125, 0.377105712890625, 0.42681884765625, 0.476531982421875, 0.5262451171875, 0.575958251953125, 0.62567138671875, 0.675384521484375, 0.72509765625, 0.774810791015625, 0.82452392578125, 0.874237060546875, 0.9239501953125, 0.973663330078125, 1.02337646484375, 1.073089599609375, 1.122802734375, 1.172515869140625, 1.22222900390625, 1.271942138671875, 1.3216552734375, 1.371368408203125, 1.42108154296875, 1.470794677734375, 1.5205078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 8.0, 3.0, 10.0, 10.0, 7.0, 11.0, 15.0, 22.0, 28.0, 25.0, 42.0, 44.0, 45.0, 45.0, 58.0, 65.0, 49.0, 62.0, 55.0, 58.0, 40.0, 61.0, 49.0, 40.0, 35.0, 25.0, 19.0, 14.0, 12.0, 10.0, 12.0, 3.0, 8.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.58338737487793, -7.374189853668213, -7.164992332458496, -6.955794811248779, -6.7465972900390625, -6.5373992919921875, -6.328202247619629, -6.119004249572754, -5.909806728363037, -5.70060920715332, -5.4914116859436035, -5.282214164733887, -5.07301664352417, -4.863819122314453, -4.654621124267578, -4.445423603057861, -4.2362260818481445, -4.027028560638428, -3.817831039428711, -3.608633518218994, -3.3994357585906982, -3.1902382373809814, -2.9810407161712646, -2.7718429565429688, -2.56264591217041, -2.3534483909606934, -2.1442508697509766, -1.9350532293319702, -1.7258555889129639, -1.516658067703247, -1.3074605464935303, -1.098262906074524, -0.8890652656555176, -0.679867684841156, -0.4706701338291168, -0.26147258281707764, -0.052275002002716064, 0.1569225788116455, 0.3661201000213623, 0.5753177404403687, 0.7845152616500854, 0.993712842464447, 1.2029104232788086, 1.4121079444885254, 1.6213054656982422, 1.8305031061172485, 2.039700508117676, 2.2488982677459717, 2.4580957889556885, 2.6672933101654053, 2.876490831375122, 3.085688591003418, 3.2948861122131348, 3.5040836334228516, 3.7132811546325684, 3.922478675842285, 4.131676197052002, 4.340873718261719, 4.5500712394714355, 4.759268760681152, 4.968466281890869, 5.177663803100586, 5.386861801147461, 5.596059322357178, 5.8052568435668945]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 4.0, 10.0, 4.0, 9.0, 15.0, 15.0, 12.0, 22.0, 17.0, 19.0, 29.0, 26.0, 25.0, 22.0, 33.0, 48.0, 42.0, 44.0, 34.0, 44.0, 39.0, 33.0, 33.0, 37.0, 51.0, 28.0, 37.0, 35.0, 29.0, 35.0, 32.0, 31.0, 13.0, 20.0, 13.0, 17.0, 9.0, 4.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3664894104003906, -3.2480199337005615, -3.1295502185821533, -3.011080741882324, -2.892611265182495, -2.774141788482666, -2.655672073364258, -2.5372025966644287, -2.4187331199645996, -2.3002636432647705, -2.1817939281463623, -2.063324451446533, -1.944854974746704, -1.8263853788375854, -1.7079157829284668, -1.5894463062286377, -1.4709765911102295, -1.3525069952011108, -1.2340375185012817, -1.115567922592163, -0.9970983862876892, -0.8786288499832153, -0.7601592540740967, -0.6416897177696228, -0.5232201814651489, -0.40475064516067505, -0.2862810790538788, -0.16781151294708252, -0.04934197664260864, 0.06912755966186523, 0.1875971555709839, 0.30606669187545776, 0.42453622817993164, 0.5430057644844055, 0.6614753007888794, 0.779944896697998, 0.8984144330024719, 1.0168839693069458, 1.1353535652160645, 1.2538230419158936, 1.3722926378250122, 1.4907622337341309, 1.60923171043396, 1.7277013063430786, 1.8461709022521973, 1.9646403789520264, 2.0831098556518555, 2.2015795707702637, 2.3200490474700928, 2.438518524169922, 2.55698823928833, 2.675457715988159, 2.7939271926879883, 2.9123969078063965, 3.0308663845062256, 3.1493358612060547, 3.267805576324463, 3.386275053024292, 3.5047447681427, 3.6232142448425293, 3.7416837215423584, 3.8601531982421875, 3.9786229133605957, 4.097092628479004, 4.215561866760254]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 11.0, 17.0, 21.0, 21.0, 29.0, 61.0, 92.0, 116.0, 205.0, 344.0, 479.0, 848.0, 1393.0, 2350.0, 4178.0, 7578.0, 14419.0, 27463.0, 55003.0, 112209.0, 203455.0, 253925.0, 175680.0, 92205.0, 46108.0, 23174.0, 11903.0, 6515.0, 3527.0, 2024.0, 1188.0, 753.0, 422.0, 283.0, 181.0, 128.0, 97.0, 46.0, 35.0, 26.0, 21.0, 11.0, 6.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2470703125, -1.207305908203125, -1.16754150390625, -1.127777099609375, -1.0880126953125, -1.048248291015625, -1.00848388671875, -0.968719482421875, -0.928955078125, -0.889190673828125, -0.84942626953125, -0.809661865234375, -0.7698974609375, -0.730133056640625, -0.69036865234375, -0.650604248046875, -0.61083984375, -0.571075439453125, -0.53131103515625, -0.491546630859375, -0.4517822265625, -0.412017822265625, -0.37225341796875, -0.332489013671875, -0.292724609375, -0.252960205078125, -0.21319580078125, -0.173431396484375, -0.1336669921875, -0.093902587890625, -0.05413818359375, -0.014373779296875, 0.025390625, 0.065155029296875, 0.10491943359375, 0.144683837890625, 0.1844482421875, 0.224212646484375, 0.26397705078125, 0.303741455078125, 0.343505859375, 0.383270263671875, 0.42303466796875, 0.462799072265625, 0.5025634765625, 0.542327880859375, 0.58209228515625, 0.621856689453125, 0.66162109375, 0.701385498046875, 0.74114990234375, 0.780914306640625, 0.8206787109375, 0.860443115234375, 0.90020751953125, 0.939971923828125, 0.979736328125, 1.019500732421875, 1.05926513671875, 1.099029541015625, 1.1387939453125, 1.178558349609375, 1.21832275390625, 1.258087158203125, 1.2978515625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 9.0, 1.0, 4.0, 7.0, 8.0, 14.0, 15.0, 11.0, 11.0, 18.0, 13.0, 29.0, 33.0, 25.0, 46.0, 30.0, 36.0, 35.0, 33.0, 36.0, 53.0, 43.0, 40.0, 48.0, 38.0, 42.0, 41.0, 23.0, 30.0, 35.0, 36.0, 33.0, 21.0, 30.0, 21.0, 9.0, 12.0, 5.0, 4.0, 7.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.39453125, -4.25921630859375, -4.1239013671875, -3.98858642578125, -3.853271484375, -3.71795654296875, -3.5826416015625, -3.44732666015625, -3.31201171875, -3.17669677734375, -3.0413818359375, -2.90606689453125, -2.770751953125, -2.63543701171875, -2.5001220703125, -2.36480712890625, -2.2294921875, -2.09417724609375, -1.9588623046875, -1.82354736328125, -1.688232421875, -1.55291748046875, -1.4176025390625, -1.28228759765625, -1.14697265625, -1.01165771484375, -0.8763427734375, -0.74102783203125, -0.605712890625, -0.47039794921875, -0.3350830078125, -0.19976806640625, -0.064453125, 0.07086181640625, 0.2061767578125, 0.34149169921875, 0.476806640625, 0.61212158203125, 0.7474365234375, 0.88275146484375, 1.01806640625, 1.15338134765625, 1.2886962890625, 1.42401123046875, 1.559326171875, 1.69464111328125, 1.8299560546875, 1.96527099609375, 2.1005859375, 2.23590087890625, 2.3712158203125, 2.50653076171875, 2.641845703125, 2.77716064453125, 2.9124755859375, 3.04779052734375, 3.18310546875, 3.31842041015625, 3.4537353515625, 3.58905029296875, 3.724365234375, 3.85968017578125, 3.9949951171875, 4.13031005859375, 4.265625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 9.0, 5.0, 16.0, 14.0, 19.0, 40.0, 55.0, 78.0, 99.0, 179.0, 289.0, 456.0, 733.0, 1227.0, 2230.0, 4030.0, 7687.0, 14822.0, 30142.0, 63432.0, 133244.0, 247344.0, 260006.0, 144718.0, 69755.0, 33215.0, 16274.0, 8273.0, 4253.0, 2379.0, 1342.0, 853.0, 477.0, 299.0, 202.0, 137.0, 85.0, 50.0, 38.0, 23.0, 9.0, 12.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.548828125, -1.5046539306640625, -1.460479736328125, -1.4163055419921875, -1.37213134765625, -1.3279571533203125, -1.283782958984375, -1.2396087646484375, -1.1954345703125, -1.1512603759765625, -1.107086181640625, -1.0629119873046875, -1.01873779296875, -0.9745635986328125, -0.930389404296875, -0.8862152099609375, -0.842041015625, -0.7978668212890625, -0.753692626953125, -0.7095184326171875, -0.66534423828125, -0.6211700439453125, -0.576995849609375, -0.5328216552734375, -0.4886474609375, -0.4444732666015625, -0.400299072265625, -0.3561248779296875, -0.31195068359375, -0.2677764892578125, -0.223602294921875, -0.1794281005859375, -0.13525390625, -0.0910797119140625, -0.046905517578125, -0.0027313232421875, 0.04144287109375, 0.0856170654296875, 0.129791259765625, 0.1739654541015625, 0.2181396484375, 0.2623138427734375, 0.306488037109375, 0.3506622314453125, 0.39483642578125, 0.4390106201171875, 0.483184814453125, 0.5273590087890625, 0.571533203125, 0.6157073974609375, 0.659881591796875, 0.7040557861328125, 0.74822998046875, 0.7924041748046875, 0.836578369140625, 0.8807525634765625, 0.9249267578125, 0.9691009521484375, 1.013275146484375, 1.0574493408203125, 1.10162353515625, 1.1457977294921875, 1.189971923828125, 1.2341461181640625, 1.2783203125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 7.0, 16.0, 9.0, 13.0, 18.0, 24.0, 14.0, 28.0, 34.0, 24.0, 31.0, 34.0, 36.0, 41.0, 44.0, 39.0, 34.0, 45.0, 50.0, 43.0, 42.0, 40.0, 36.0, 45.0, 31.0, 33.0, 24.0, 28.0, 30.0, 17.0, 17.0, 12.0, 6.0, 12.0, 7.0, 5.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.013671875, -2.928497314453125, -2.84332275390625, -2.758148193359375, -2.6729736328125, -2.587799072265625, -2.50262451171875, -2.417449951171875, -2.332275390625, -2.247100830078125, -2.16192626953125, -2.076751708984375, -1.9915771484375, -1.906402587890625, -1.82122802734375, -1.736053466796875, -1.65087890625, -1.565704345703125, -1.48052978515625, -1.395355224609375, -1.3101806640625, -1.225006103515625, -1.13983154296875, -1.054656982421875, -0.969482421875, -0.884307861328125, -0.79913330078125, -0.713958740234375, -0.6287841796875, -0.543609619140625, -0.45843505859375, -0.373260498046875, -0.2880859375, -0.202911376953125, -0.11773681640625, -0.032562255859375, 0.0526123046875, 0.137786865234375, 0.22296142578125, 0.308135986328125, 0.393310546875, 0.478485107421875, 0.56365966796875, 0.648834228515625, 0.7340087890625, 0.819183349609375, 0.90435791015625, 0.989532470703125, 1.07470703125, 1.159881591796875, 1.24505615234375, 1.330230712890625, 1.4154052734375, 1.500579833984375, 1.58575439453125, 1.670928955078125, 1.756103515625, 1.841278076171875, 1.92645263671875, 2.011627197265625, 2.0968017578125, 2.181976318359375, 2.26715087890625, 2.352325439453125, 2.4375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 11.0, 7.0, 9.0, 17.0, 15.0, 21.0, 45.0, 35.0, 48.0, 68.0, 84.0, 104.0, 130.0, 168.0, 226.0, 258.0, 377.0, 529.0, 766.0, 1304.0, 2660.0, 8120.0, 42002.0, 466593.0, 467792.0, 42031.0, 8117.0, 2827.0, 1313.0, 755.0, 487.0, 398.0, 277.0, 218.0, 172.0, 141.0, 108.0, 65.0, 63.0, 45.0, 37.0, 23.0, 27.0, 17.0, 14.0, 9.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.83251953125, -0.8027877807617188, -0.7730560302734375, -0.7433242797851562, -0.713592529296875, -0.6838607788085938, -0.6541290283203125, -0.6243972778320312, -0.59466552734375, -0.5649337768554688, -0.5352020263671875, -0.5054702758789062, -0.475738525390625, -0.44600677490234375, -0.4162750244140625, -0.38654327392578125, -0.3568115234375, -0.32707977294921875, -0.2973480224609375, -0.26761627197265625, -0.237884521484375, -0.20815277099609375, -0.1784210205078125, -0.14868927001953125, -0.11895751953125, -0.08922576904296875, -0.0594940185546875, -0.02976226806640625, -3.0517578125e-05, 0.02970123291015625, 0.0594329833984375, 0.08916473388671875, 0.118896484375, 0.14862823486328125, 0.1783599853515625, 0.20809173583984375, 0.237823486328125, 0.26755523681640625, 0.2972869873046875, 0.32701873779296875, 0.35675048828125, 0.38648223876953125, 0.4162139892578125, 0.44594573974609375, 0.475677490234375, 0.5054092407226562, 0.5351409912109375, 0.5648727416992188, 0.5946044921875, 0.6243362426757812, 0.6540679931640625, 0.6837997436523438, 0.713531494140625, 0.7432632446289062, 0.7729949951171875, 0.8027267456054688, 0.83245849609375, 0.8621902465820312, 0.8919219970703125, 0.9216537475585938, 0.951385498046875, 0.9811172485351562, 1.0108489990234375, 1.0405807495117188, 1.0703125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 14.0, 9.0, 36.0, 59.0, 75.0, 115.0, 155.0, 160.0, 145.0, 86.0, 64.0, 37.0, 22.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.762411117553711e-05, -4.5944005250930786e-05, -4.426389932632446e-05, -4.258379340171814e-05, -4.0903687477111816e-05, -3.922358155250549e-05, -3.754347562789917e-05, -3.586336970329285e-05, -3.4183263778686523e-05, -3.25031578540802e-05, -3.082305192947388e-05, -2.9142946004867554e-05, -2.746284008026123e-05, -2.5782734155654907e-05, -2.4102628231048584e-05, -2.242252230644226e-05, -2.0742416381835938e-05, -1.9062310457229614e-05, -1.738220453262329e-05, -1.5702098608016968e-05, -1.4021992683410645e-05, -1.2341886758804321e-05, -1.0661780834197998e-05, -8.981674909591675e-06, -7.3015689849853516e-06, -5.621463060379028e-06, -3.941357135772705e-06, -2.261251211166382e-06, -5.811452865600586e-07, 1.0989606380462646e-06, 2.779066562652588e-06, 4.459172487258911e-06, 6.139278411865234e-06, 7.819384336471558e-06, 9.499490261077881e-06, 1.1179596185684204e-05, 1.2859702110290527e-05, 1.453980803489685e-05, 1.6219913959503174e-05, 1.7900019884109497e-05, 1.958012580871582e-05, 2.1260231733322144e-05, 2.2940337657928467e-05, 2.462044358253479e-05, 2.6300549507141113e-05, 2.7980655431747437e-05, 2.966076135635376e-05, 3.134086728096008e-05, 3.3020973205566406e-05, 3.470107913017273e-05, 3.638118505477905e-05, 3.8061290979385376e-05, 3.97413969039917e-05, 4.142150282859802e-05, 4.3101608753204346e-05, 4.478171467781067e-05, 4.646182060241699e-05, 4.8141926527023315e-05, 4.982203245162964e-05, 5.150213837623596e-05, 5.3182244300842285e-05, 5.486235022544861e-05, 5.654245615005493e-05, 5.8222562074661255e-05, 5.990266799926758e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 9.0, 16.0, 28.0, 33.0, 54.0, 63.0, 99.0, 133.0, 191.0, 301.0, 369.0, 531.0, 701.0, 962.0, 1302.0, 1737.0, 2786.0, 5414.0, 22623.0, 290426.0, 647081.0, 54455.0, 8365.0, 3363.0, 2075.0, 1465.0, 1101.0, 798.0, 558.0, 422.0, 300.0, 216.0, 165.0, 117.0, 80.0, 62.0, 38.0, 28.0, 29.0, 9.0, 13.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.3011322021484375, -1.256561279296875, -1.2119903564453125, -1.16741943359375, -1.1228485107421875, -1.078277587890625, -1.0337066650390625, -0.9891357421875, -0.9445648193359375, -0.899993896484375, -0.8554229736328125, -0.81085205078125, -0.7662811279296875, -0.721710205078125, -0.6771392822265625, -0.632568359375, -0.5879974365234375, -0.543426513671875, -0.4988555908203125, -0.45428466796875, -0.4097137451171875, -0.365142822265625, -0.3205718994140625, -0.2760009765625, -0.2314300537109375, -0.186859130859375, -0.1422882080078125, -0.09771728515625, -0.0531463623046875, -0.008575439453125, 0.0359954833984375, 0.08056640625, 0.1251373291015625, 0.169708251953125, 0.2142791748046875, 0.25885009765625, 0.3034210205078125, 0.347991943359375, 0.3925628662109375, 0.4371337890625, 0.4817047119140625, 0.526275634765625, 0.5708465576171875, 0.61541748046875, 0.6599884033203125, 0.704559326171875, 0.7491302490234375, 0.793701171875, 0.8382720947265625, 0.882843017578125, 0.9274139404296875, 0.97198486328125, 1.0165557861328125, 1.061126708984375, 1.1056976318359375, 1.1502685546875, 1.1948394775390625, 1.239410400390625, 1.2839813232421875, 1.32855224609375, 1.3731231689453125, 1.417694091796875, 1.4622650146484375, 1.5068359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 5.0, 13.0, 4.0, 7.0, 12.0, 6.0, 17.0, 24.0, 27.0, 25.0, 34.0, 40.0, 65.0, 79.0, 78.0, 79.0, 96.0, 85.0, 50.0, 51.0, 32.0, 40.0, 19.0, 23.0, 19.0, 13.0, 7.0, 9.0, 11.0, 12.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0816650390625, -0.07870292663574219, -0.07574081420898438, -0.07277870178222656, -0.06981658935546875, -0.06685447692871094, -0.06389236450195312, -0.06093025207519531, -0.0579681396484375, -0.05500602722167969, -0.052043914794921875, -0.04908180236816406, -0.04611968994140625, -0.04315757751464844, -0.040195465087890625, -0.03723335266113281, -0.034271240234375, -0.03130912780761719, -0.028347015380859375, -0.025384902954101562, -0.02242279052734375, -0.019460678100585938, -0.016498565673828125, -0.013536453247070312, -0.0105743408203125, -0.0076122283935546875, -0.004650115966796875, -0.0016880035400390625, 0.00127410888671875, 0.0042362213134765625, 0.007198333740234375, 0.010160446166992188, 0.01312255859375, 0.016084671020507812, 0.019046783447265625, 0.022008895874023438, 0.02497100830078125, 0.027933120727539062, 0.030895233154296875, 0.03385734558105469, 0.0368194580078125, 0.03978157043457031, 0.042743682861328125, 0.04570579528808594, 0.04866790771484375, 0.05163002014160156, 0.054592132568359375, 0.05755424499511719, 0.060516357421875, 0.06347846984863281, 0.06644058227539062, 0.06940269470214844, 0.07236480712890625, 0.07532691955566406, 0.07828903198242188, 0.08125114440917969, 0.0842132568359375, 0.08717536926269531, 0.09013748168945312, 0.09309959411621094, 0.09606170654296875, 0.09902381896972656, 0.10198593139648438, 0.10494804382324219, 0.10791015625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 3.0, 9.0, 9.0, 13.0, 14.0, 17.0, 25.0, 26.0, 40.0, 43.0, 48.0, 37.0, 54.0, 62.0, 68.0, 48.0, 58.0, 58.0, 44.0, 60.0, 53.0, 49.0, 20.0, 32.0, 27.0, 8.0, 16.0, 13.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.657483100891113, -7.448243141174316, -7.239003658294678, -7.029763698577881, -6.820524215698242, -6.611284255981445, -6.402044296264648, -6.19280481338501, -5.983565330505371, -5.774325370788574, -5.5650858879089355, -5.355845928192139, -5.1466064453125, -4.937366485595703, -4.728126525878906, -4.518887042999268, -4.309647083282471, -4.100407123565674, -3.891167640686035, -3.6819276809692383, -3.4726881980895996, -3.2634482383728027, -3.054208517074585, -2.844968795776367, -2.6357290744781494, -2.4264893531799316, -2.217249631881714, -2.008009910583496, -1.7987700700759888, -1.589530348777771, -1.3802905082702637, -1.171050786972046, -0.9618105888366699, -0.7525708675384521, -0.5433310866355896, -0.33409130573272705, -0.12485158443450928, 0.0843881368637085, 0.2936279773712158, 0.5028676986694336, 0.7121074199676514, 0.9213471412658691, 1.130586862564087, 1.3398267030715942, 1.549066424369812, 1.7583061456680298, 1.967545986175537, 2.176785707473755, 2.3860254287719727, 2.5952651500701904, 2.804504871368408, 3.013744831085205, 3.2229843139648438, 3.4322242736816406, 3.6414639949798584, 3.850703716278076, 4.059943199157715, 4.269183158874512, 4.47842264175415, 4.687662601470947, 4.896902084350586, 5.106142044067383, 5.31538200378418, 5.524621486663818, 5.733861446380615]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 6.0, 8.0, 4.0, 10.0, 15.0, 14.0, 14.0, 24.0, 13.0, 20.0, 31.0, 23.0, 27.0, 27.0, 29.0, 47.0, 43.0, 41.0, 34.0, 45.0, 40.0, 33.0, 35.0, 38.0, 47.0, 31.0, 37.0, 33.0, 27.0, 43.0, 32.0, 25.0, 12.0, 19.0, 15.0, 16.0, 9.0, 3.0, 7.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3791987895965576, -3.2606797218322754, -3.142160415649414, -3.023641347885132, -2.9051220417022705, -2.7866029739379883, -2.668083667755127, -2.5495645999908447, -2.4310455322265625, -2.3125264644622803, -2.194007158279419, -2.0754880905151367, -1.9569687843322754, -1.8384497165679932, -1.7199305295944214, -1.6014113426208496, -1.4828920364379883, -1.3643728494644165, -1.2458536624908447, -1.1273345947265625, -1.0088152885437012, -0.8902961611747742, -0.7717770338058472, -0.6532578468322754, -0.5347386598587036, -0.41621947288513184, -0.29770031571388245, -0.17918115854263306, -0.06066197156906128, 0.0578572154045105, 0.1763763427734375, 0.2948955297470093, 0.41341495513916016, 0.5319341421127319, 0.6504533290863037, 0.7689724564552307, 0.8874916434288025, 1.0060107707977295, 1.1245299577713013, 1.243049144744873, 1.3615683317184448, 1.4800875186920166, 1.5986067056655884, 1.7171258926391602, 1.8356449604034424, 1.9541642665863037, 2.072683334350586, 2.1912026405334473, 2.3097217082977295, 2.4282407760620117, 2.546760082244873, 2.6652791500091553, 2.7837984561920166, 2.902317523956299, 3.02083683013916, 3.1393558979034424, 3.2578749656677246, 3.376394033432007, 3.494913339614868, 3.6134324073791504, 3.7319517135620117, 3.850470781326294, 3.968989849090576, 4.0875091552734375, 4.206028461456299]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 11.0, 15.0, 22.0, 25.0, 39.0, 49.0, 97.0, 179.0, 272.0, 486.0, 730.0, 1233.0, 1993.0, 3092.0, 5167.0, 8394.0, 13554.0, 20735.0, 31606.0, 45902.0, 64191.0, 84930.0, 103492.0, 115434.0, 117213.0, 108625.0, 92651.0, 71849.0, 52968.0, 36692.0, 24308.0, 15909.0, 10240.0, 6309.0, 3889.0, 2415.0, 1440.0, 914.0, 575.0, 340.0, 222.0, 141.0, 85.0, 52.0, 34.0, 19.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.46875, -3.3673095703125, -3.265869140625, -3.1644287109375, -3.06298828125, -2.9615478515625, -2.860107421875, -2.7586669921875, -2.6572265625, -2.5557861328125, -2.454345703125, -2.3529052734375, -2.25146484375, -2.1500244140625, -2.048583984375, -1.9471435546875, -1.845703125, -1.7442626953125, -1.642822265625, -1.5413818359375, -1.43994140625, -1.3385009765625, -1.237060546875, -1.1356201171875, -1.0341796875, -0.9327392578125, -0.831298828125, -0.7298583984375, -0.62841796875, -0.5269775390625, -0.425537109375, -0.3240966796875, -0.22265625, -0.1212158203125, -0.019775390625, 0.0816650390625, 0.18310546875, 0.2845458984375, 0.385986328125, 0.4874267578125, 0.5888671875, 0.6903076171875, 0.791748046875, 0.8931884765625, 0.99462890625, 1.0960693359375, 1.197509765625, 1.2989501953125, 1.400390625, 1.5018310546875, 1.603271484375, 1.7047119140625, 1.80615234375, 1.9075927734375, 2.009033203125, 2.1104736328125, 2.2119140625, 2.3133544921875, 2.414794921875, 2.5162353515625, 2.61767578125, 2.7191162109375, 2.820556640625, 2.9219970703125, 3.0234375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 4.0, 6.0, 4.0, 7.0, 8.0, 10.0, 18.0, 12.0, 13.0, 17.0, 26.0, 28.0, 27.0, 29.0, 33.0, 40.0, 33.0, 45.0, 40.0, 42.0, 35.0, 43.0, 43.0, 36.0, 48.0, 34.0, 38.0, 38.0, 38.0, 28.0, 34.0, 25.0, 24.0, 18.0, 19.0, 14.0, 9.0, 8.0, 6.0, 5.0, 1.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.53125, -4.3909912109375, -4.250732421875, -4.1104736328125, -3.97021484375, -3.8299560546875, -3.689697265625, -3.5494384765625, -3.4091796875, -3.2689208984375, -3.128662109375, -2.9884033203125, -2.84814453125, -2.7078857421875, -2.567626953125, -2.4273681640625, -2.287109375, -2.1468505859375, -2.006591796875, -1.8663330078125, -1.72607421875, -1.5858154296875, -1.445556640625, -1.3052978515625, -1.1650390625, -1.0247802734375, -0.884521484375, -0.7442626953125, -0.60400390625, -0.4637451171875, -0.323486328125, -0.1832275390625, -0.04296875, 0.0972900390625, 0.237548828125, 0.3778076171875, 0.51806640625, 0.6583251953125, 0.798583984375, 0.9388427734375, 1.0791015625, 1.2193603515625, 1.359619140625, 1.4998779296875, 1.64013671875, 1.7803955078125, 1.920654296875, 2.0609130859375, 2.201171875, 2.3414306640625, 2.481689453125, 2.6219482421875, 2.76220703125, 2.9024658203125, 3.042724609375, 3.1829833984375, 3.3232421875, 3.4635009765625, 3.603759765625, 3.7440185546875, 3.88427734375, 4.0245361328125, 4.164794921875, 4.3050537109375, 4.4453125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 9.0, 15.0, 24.0, 31.0, 61.0, 86.0, 161.0, 217.0, 368.0, 595.0, 922.0, 1372.0, 2119.0, 3247.0, 4984.0, 7193.0, 11016.0, 16070.0, 23444.0, 32271.0, 43692.0, 56253.0, 69976.0, 82315.0, 91573.0, 95506.0, 94925.0, 88063.0, 77304.0, 64428.0, 51437.0, 38871.0, 28435.0, 20146.0, 13904.0, 9571.0, 6376.0, 4141.0, 2712.0, 1691.0, 1122.0, 673.0, 453.0, 279.0, 203.0, 110.0, 74.0, 37.0, 36.0, 14.0, 11.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.755859375, -2.669189453125, -2.58251953125, -2.495849609375, -2.4091796875, -2.322509765625, -2.23583984375, -2.149169921875, -2.0625, -1.975830078125, -1.88916015625, -1.802490234375, -1.7158203125, -1.629150390625, -1.54248046875, -1.455810546875, -1.369140625, -1.282470703125, -1.19580078125, -1.109130859375, -1.0224609375, -0.935791015625, -0.84912109375, -0.762451171875, -0.67578125, -0.589111328125, -0.50244140625, -0.415771484375, -0.3291015625, -0.242431640625, -0.15576171875, -0.069091796875, 0.017578125, 0.104248046875, 0.19091796875, 0.277587890625, 0.3642578125, 0.450927734375, 0.53759765625, 0.624267578125, 0.7109375, 0.797607421875, 0.88427734375, 0.970947265625, 1.0576171875, 1.144287109375, 1.23095703125, 1.317626953125, 1.404296875, 1.490966796875, 1.57763671875, 1.664306640625, 1.7509765625, 1.837646484375, 1.92431640625, 2.010986328125, 2.09765625, 2.184326171875, 2.27099609375, 2.357666015625, 2.4443359375, 2.531005859375, 2.61767578125, 2.704345703125, 2.791015625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 8.0, 5.0, 7.0, 18.0, 12.0, 13.0, 15.0, 17.0, 28.0, 34.0, 26.0, 35.0, 28.0, 34.0, 25.0, 48.0, 39.0, 36.0, 27.0, 39.0, 30.0, 41.0, 34.0, 25.0, 24.0, 32.0, 37.0, 30.0, 27.0, 26.0, 30.0, 18.0, 21.0, 14.0, 15.0, 13.0, 9.0, 10.0, 8.0, 10.0, 7.0, 9.0, 11.0, 1.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.392578125, -2.319610595703125, -2.24664306640625, -2.173675537109375, -2.1007080078125, -2.027740478515625, -1.95477294921875, -1.881805419921875, -1.808837890625, -1.735870361328125, -1.66290283203125, -1.589935302734375, -1.5169677734375, -1.444000244140625, -1.37103271484375, -1.298065185546875, -1.22509765625, -1.152130126953125, -1.07916259765625, -1.006195068359375, -0.9332275390625, -0.860260009765625, -0.78729248046875, -0.714324951171875, -0.641357421875, -0.568389892578125, -0.49542236328125, -0.422454833984375, -0.3494873046875, -0.276519775390625, -0.20355224609375, -0.130584716796875, -0.0576171875, 0.015350341796875, 0.08831787109375, 0.161285400390625, 0.2342529296875, 0.307220458984375, 0.38018798828125, 0.453155517578125, 0.526123046875, 0.599090576171875, 0.67205810546875, 0.745025634765625, 0.8179931640625, 0.890960693359375, 0.96392822265625, 1.036895751953125, 1.10986328125, 1.182830810546875, 1.25579833984375, 1.328765869140625, 1.4017333984375, 1.474700927734375, 1.54766845703125, 1.620635986328125, 1.693603515625, 1.766571044921875, 1.83953857421875, 1.912506103515625, 1.9854736328125, 2.058441162109375, 2.13140869140625, 2.204376220703125, 2.27734375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 11.0, 13.0, 14.0, 22.0, 44.0, 62.0, 78.0, 125.0, 201.0, 334.0, 518.0, 761.0, 1201.0, 1874.0, 3044.0, 4817.0, 7758.0, 12866.0, 20754.0, 33636.0, 53231.0, 79667.0, 110211.0, 135450.0, 143120.0, 131123.0, 104180.0, 73748.0, 48773.0, 31038.0, 19231.0, 11501.0, 7188.0, 4350.0, 2737.0, 1747.0, 1106.0, 706.0, 443.0, 290.0, 205.0, 136.0, 81.0, 60.0, 36.0, 19.0, 13.0, 13.0, 2.0, 8.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.263671875, -2.19158935546875, -2.1195068359375, -2.04742431640625, -1.975341796875, -1.90325927734375, -1.8311767578125, -1.75909423828125, -1.68701171875, -1.61492919921875, -1.5428466796875, -1.47076416015625, -1.398681640625, -1.32659912109375, -1.2545166015625, -1.18243408203125, -1.1103515625, -1.03826904296875, -0.9661865234375, -0.89410400390625, -0.822021484375, -0.74993896484375, -0.6778564453125, -0.60577392578125, -0.53369140625, -0.46160888671875, -0.3895263671875, -0.31744384765625, -0.245361328125, -0.17327880859375, -0.1011962890625, -0.02911376953125, 0.04296875, 0.11505126953125, 0.1871337890625, 0.25921630859375, 0.331298828125, 0.40338134765625, 0.4754638671875, 0.54754638671875, 0.61962890625, 0.69171142578125, 0.7637939453125, 0.83587646484375, 0.907958984375, 0.98004150390625, 1.0521240234375, 1.12420654296875, 1.1962890625, 1.26837158203125, 1.3404541015625, 1.41253662109375, 1.484619140625, 1.55670166015625, 1.6287841796875, 1.70086669921875, 1.77294921875, 1.84503173828125, 1.9171142578125, 1.98919677734375, 2.061279296875, 2.13336181640625, 2.2054443359375, 2.27752685546875, 2.349609375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 4.0, 2.0, 17.0, 16.0, 13.0, 15.0, 19.0, 25.0, 30.0, 41.0, 44.0, 42.0, 50.0, 51.0, 43.0, 47.0, 56.0, 49.0, 53.0, 55.0, 52.0, 47.0, 41.0, 37.0, 23.0, 25.0, 16.0, 15.0, 14.0, 17.0, 10.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023317337036132812, -0.00022549927234649658, -0.00021782517433166504, -0.0002101510763168335, -0.00020247697830200195, -0.0001948028802871704, -0.00018712878227233887, -0.00017945468425750732, -0.00017178058624267578, -0.00016410648822784424, -0.0001564323902130127, -0.00014875829219818115, -0.0001410841941833496, -0.00013341009616851807, -0.00012573599815368652, -0.00011806190013885498, -0.00011038780212402344, -0.0001027137041091919, -9.503960609436035e-05, -8.736550807952881e-05, -7.969141006469727e-05, -7.201731204986572e-05, -6.434321403503418e-05, -5.666911602020264e-05, -4.8995018005371094e-05, -4.132091999053955e-05, -3.364682197570801e-05, -2.5972723960876465e-05, -1.8298625946044922e-05, -1.0624527931213379e-05, -2.950429916381836e-06, 4.723668098449707e-06, 1.239776611328125e-05, 2.0071864128112793e-05, 2.7745962142944336e-05, 3.542006015777588e-05, 4.309415817260742e-05, 5.0768256187438965e-05, 5.844235420227051e-05, 6.611645221710205e-05, 7.37905502319336e-05, 8.146464824676514e-05, 8.913874626159668e-05, 9.681284427642822e-05, 0.00010448694229125977, 0.00011216104030609131, 0.00011983513832092285, 0.0001275092363357544, 0.00013518333435058594, 0.00014285743236541748, 0.00015053153038024902, 0.00015820562839508057, 0.0001658797264099121, 0.00017355382442474365, 0.0001812279224395752, 0.00018890202045440674, 0.00019657611846923828, 0.00020425021648406982, 0.00021192431449890137, 0.0002195984125137329, 0.00022727251052856445, 0.000234946608543396, 0.00024262070655822754, 0.0002502948045730591, 0.0002579689025878906]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 8.0, 7.0, 7.0, 22.0, 29.0, 38.0, 46.0, 77.0, 120.0, 151.0, 251.0, 388.0, 572.0, 891.0, 1489.0, 2502.0, 4135.0, 6987.0, 12443.0, 22104.0, 38809.0, 65369.0, 103665.0, 144547.0, 167596.0, 157480.0, 121994.0, 81381.0, 48867.0, 28111.0, 15985.0, 9237.0, 5219.0, 2958.0, 1923.0, 1135.0, 659.0, 470.0, 285.0, 211.0, 126.0, 81.0, 55.0, 59.0, 31.0, 11.0, 6.0, 9.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.740234375, -2.653839111328125, -2.56744384765625, -2.481048583984375, -2.3946533203125, -2.308258056640625, -2.22186279296875, -2.135467529296875, -2.049072265625, -1.962677001953125, -1.87628173828125, -1.789886474609375, -1.7034912109375, -1.617095947265625, -1.53070068359375, -1.444305419921875, -1.35791015625, -1.271514892578125, -1.18511962890625, -1.098724365234375, -1.0123291015625, -0.925933837890625, -0.83953857421875, -0.753143310546875, -0.666748046875, -0.580352783203125, -0.49395751953125, -0.407562255859375, -0.3211669921875, -0.234771728515625, -0.14837646484375, -0.061981201171875, 0.0244140625, 0.110809326171875, 0.19720458984375, 0.283599853515625, 0.3699951171875, 0.456390380859375, 0.54278564453125, 0.629180908203125, 0.715576171875, 0.801971435546875, 0.88836669921875, 0.974761962890625, 1.0611572265625, 1.147552490234375, 1.23394775390625, 1.320343017578125, 1.40673828125, 1.493133544921875, 1.57952880859375, 1.665924072265625, 1.7523193359375, 1.838714599609375, 1.92510986328125, 2.011505126953125, 2.097900390625, 2.184295654296875, 2.27069091796875, 2.357086181640625, 2.4434814453125, 2.529876708984375, 2.61627197265625, 2.702667236328125, 2.7890625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 7.0, 13.0, 10.0, 19.0, 20.0, 29.0, 37.0, 32.0, 42.0, 27.0, 41.0, 49.0, 46.0, 51.0, 65.0, 59.0, 53.0, 41.0, 48.0, 51.0, 42.0, 50.0, 35.0, 22.0, 15.0, 19.0, 13.0, 12.0, 11.0, 6.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.72021484375, -0.6989898681640625, -0.677764892578125, -0.6565399169921875, -0.63531494140625, -0.6140899658203125, -0.592864990234375, -0.5716400146484375, -0.5504150390625, -0.5291900634765625, -0.507965087890625, -0.4867401123046875, -0.46551513671875, -0.4442901611328125, -0.423065185546875, -0.4018402099609375, -0.380615234375, -0.3593902587890625, -0.338165283203125, -0.3169403076171875, -0.29571533203125, -0.2744903564453125, -0.253265380859375, -0.2320404052734375, -0.2108154296875, -0.1895904541015625, -0.168365478515625, -0.1471405029296875, -0.12591552734375, -0.1046905517578125, -0.083465576171875, -0.0622406005859375, -0.041015625, -0.0197906494140625, 0.001434326171875, 0.0226593017578125, 0.04388427734375, 0.0651092529296875, 0.086334228515625, 0.1075592041015625, 0.1287841796875, 0.1500091552734375, 0.171234130859375, 0.1924591064453125, 0.21368408203125, 0.2349090576171875, 0.256134033203125, 0.2773590087890625, 0.298583984375, 0.3198089599609375, 0.341033935546875, 0.3622589111328125, 0.38348388671875, 0.4047088623046875, 0.425933837890625, 0.4471588134765625, 0.4683837890625, 0.4896087646484375, 0.510833740234375, 0.5320587158203125, 0.55328369140625, 0.5745086669921875, 0.595733642578125, 0.6169586181640625, 0.63818359375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 11.0, 13.0, 15.0, 17.0, 21.0, 36.0, 32.0, 41.0, 57.0, 45.0, 51.0, 69.0, 54.0, 51.0, 59.0, 60.0, 60.0, 57.0, 50.0, 34.0, 26.0, 28.0, 22.0, 15.0, 15.0, 10.0, 14.0, 5.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.845996379852295, -7.62587833404541, -7.405760288238525, -7.185642242431641, -6.965524196624756, -6.745406150817871, -6.525287628173828, -6.305170059204102, -6.085051536560059, -5.864933490753174, -5.644815444946289, -5.424697399139404, -5.2045793533325195, -4.984461307525635, -4.76434326171875, -4.544224739074707, -4.3241071701049805, -4.103989124298096, -3.883871078491211, -3.663753032684326, -3.4436349868774414, -3.2235169410705566, -3.0033986568450928, -2.783280611038208, -2.5631625652313232, -2.3430445194244385, -2.1229264736175537, -1.9028083086013794, -1.6826902627944946, -1.4625722169876099, -1.2424540519714355, -1.0223360061645508, -0.802217960357666, -0.5820999145507812, -0.3619818091392517, -0.14186370372772217, 0.0782543420791626, 0.29837238788604736, 0.5184905529022217, 0.7386085987091064, 0.9587266445159912, 1.178844690322876, 1.3989627361297607, 1.619080901145935, 1.8391989469528198, 2.059317111968994, 2.279435157775879, 2.4995532035827637, 2.7196712493896484, 2.939789295196533, 3.159907341003418, 3.3800253868103027, 3.6001434326171875, 3.8202614784240723, 4.040379524230957, 4.260498046875, 4.480615615844727, 4.700733661651611, 4.920851707458496, 5.140969753265381, 5.361087799072266, 5.58120584487915, 5.801323890686035, 6.021442413330078, 6.241560459136963]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 7.0, 5.0, 2.0, 3.0, 5.0, 7.0, 12.0, 7.0, 15.0, 12.0, 17.0, 26.0, 16.0, 21.0, 29.0, 24.0, 21.0, 28.0, 31.0, 49.0, 38.0, 33.0, 26.0, 30.0, 36.0, 41.0, 39.0, 40.0, 38.0, 27.0, 29.0, 43.0, 23.0, 33.0, 27.0, 23.0, 25.0, 21.0, 17.0, 13.0, 20.0, 13.0, 8.0, 5.0, 6.0, 6.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.8718767166137695, -3.7532548904418945, -3.6346330642700195, -3.5160112380981445, -3.3973894119262695, -3.2787675857543945, -3.1601457595825195, -3.0415239334106445, -2.9229021072387695, -2.8042802810668945, -2.6856584548950195, -2.5670366287231445, -2.4484148025512695, -2.3297929763793945, -2.2111711502075195, -2.0925493240356445, -1.9739272594451904, -1.8553054332733154, -1.7366836071014404, -1.6180617809295654, -1.4994399547576904, -1.3808181285858154, -1.2621961832046509, -1.1435743570327759, -1.0249525308609009, -0.9063307046890259, -0.7877088785171509, -0.6690869927406311, -0.5504651665687561, -0.4318433403968811, -0.31322145462036133, -0.19459962844848633, -0.07597756385803223, 0.04264427721500397, 0.16126611828804016, 0.27988797426223755, 0.39850980043411255, 0.5171316266059875, 0.6357535123825073, 0.7543753385543823, 0.8729971647262573, 0.9916189908981323, 1.1102408170700073, 1.2288627624511719, 1.3474845886230469, 1.4661064147949219, 1.5847282409667969, 1.7033500671386719, 1.8219718933105469, 1.9405937194824219, 2.059215545654297, 2.177837371826172, 2.296459197998047, 2.415081024169922, 2.533702850341797, 2.652324676513672, 2.770946502685547, 2.889568328857422, 3.008190155029297, 3.126811981201172, 3.245433807373047, 3.364055633544922, 3.482677459716797, 3.601299285888672, 3.719921350479126]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 2.0, 7.0, 11.0, 15.0, 21.0, 42.0, 56.0, 92.0, 148.0, 213.0, 324.0, 492.0, 783.0, 1241.0, 1965.0, 3073.0, 4835.0, 7514.0, 12118.0, 19012.0, 30271.0, 47643.0, 74326.0, 114921.0, 172975.0, 249186.0, 339479.0, 430866.0, 491507.0, 501987.0, 457826.0, 374543.0, 282939.0, 198749.0, 135204.0, 88146.0, 56064.0, 35555.0, 22388.0, 13807.0, 8750.0, 5561.0, 3533.0, 2206.0, 1391.0, 866.0, 593.0, 390.0, 201.0, 156.0, 94.0, 66.0, 48.0, 33.0, 17.0, 16.0, 10.0, 7.0, 6.0, 3.0, 2.0], "bins": [-4.5, -4.36016845703125, -4.2203369140625, -4.08050537109375, -3.940673828125, -3.80084228515625, -3.6610107421875, -3.52117919921875, -3.38134765625, -3.24151611328125, -3.1016845703125, -2.96185302734375, -2.822021484375, -2.68218994140625, -2.5423583984375, -2.40252685546875, -2.2626953125, -2.12286376953125, -1.9830322265625, -1.84320068359375, -1.703369140625, -1.56353759765625, -1.4237060546875, -1.28387451171875, -1.14404296875, -1.00421142578125, -0.8643798828125, -0.72454833984375, -0.584716796875, -0.44488525390625, -0.3050537109375, -0.16522216796875, -0.025390625, 0.11444091796875, 0.2542724609375, 0.39410400390625, 0.533935546875, 0.67376708984375, 0.8135986328125, 0.95343017578125, 1.09326171875, 1.23309326171875, 1.3729248046875, 1.51275634765625, 1.652587890625, 1.79241943359375, 1.9322509765625, 2.07208251953125, 2.2119140625, 2.35174560546875, 2.4915771484375, 2.63140869140625, 2.771240234375, 2.91107177734375, 3.0509033203125, 3.19073486328125, 3.33056640625, 3.47039794921875, 3.6102294921875, 3.75006103515625, 3.889892578125, 4.02972412109375, 4.1695556640625, 4.30938720703125, 4.44921875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 5.0, 13.0, 7.0, 11.0, 13.0, 9.0, 12.0, 20.0, 19.0, 24.0, 27.0, 35.0, 24.0, 35.0, 28.0, 41.0, 40.0, 38.0, 42.0, 56.0, 36.0, 47.0, 36.0, 43.0, 36.0, 25.0, 32.0, 28.0, 27.0, 35.0, 25.0, 27.0, 16.0, 17.0, 13.0, 11.0, 8.0, 9.0, 11.0, 4.0, 3.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.908203125, -3.796539306640625, -3.68487548828125, -3.573211669921875, -3.4615478515625, -3.349884033203125, -3.23822021484375, -3.126556396484375, -3.014892578125, -2.903228759765625, -2.79156494140625, -2.679901123046875, -2.5682373046875, -2.456573486328125, -2.34490966796875, -2.233245849609375, -2.12158203125, -2.009918212890625, -1.89825439453125, -1.786590576171875, -1.6749267578125, -1.563262939453125, -1.45159912109375, -1.339935302734375, -1.228271484375, -1.116607666015625, -1.00494384765625, -0.893280029296875, -0.7816162109375, -0.669952392578125, -0.55828857421875, -0.446624755859375, -0.3349609375, -0.223297119140625, -0.11163330078125, 3.0517578125e-05, 0.1116943359375, 0.223358154296875, 0.33502197265625, 0.446685791015625, 0.558349609375, 0.670013427734375, 0.78167724609375, 0.893341064453125, 1.0050048828125, 1.116668701171875, 1.22833251953125, 1.339996337890625, 1.45166015625, 1.563323974609375, 1.67498779296875, 1.786651611328125, 1.8983154296875, 2.009979248046875, 2.12164306640625, 2.233306884765625, 2.344970703125, 2.456634521484375, 2.56829833984375, 2.679962158203125, 2.7916259765625, 2.903289794921875, 3.01495361328125, 3.126617431640625, 3.23828125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 12.0, 17.0, 37.0, 60.0, 99.0, 166.0, 279.0, 570.0, 1065.0, 2032.0, 3925.0, 7419.0, 14070.0, 27283.0, 51441.0, 94944.0, 166571.0, 275278.0, 415958.0, 553248.0, 632454.0, 606452.0, 494096.0, 347670.0, 219182.0, 128340.0, 71284.0, 38019.0, 20249.0, 10570.0, 5440.0, 2823.0, 1540.0, 741.0, 438.0, 218.0, 123.0, 66.0, 51.0, 22.0, 15.0, 10.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-7.1953125, -6.98834228515625, -6.7813720703125, -6.57440185546875, -6.367431640625, -6.16046142578125, -5.9534912109375, -5.74652099609375, -5.53955078125, -5.33258056640625, -5.1256103515625, -4.91864013671875, -4.711669921875, -4.50469970703125, -4.2977294921875, -4.09075927734375, -3.8837890625, -3.67681884765625, -3.4698486328125, -3.26287841796875, -3.055908203125, -2.84893798828125, -2.6419677734375, -2.43499755859375, -2.22802734375, -2.02105712890625, -1.8140869140625, -1.60711669921875, -1.400146484375, -1.19317626953125, -0.9862060546875, -0.77923583984375, -0.572265625, -0.36529541015625, -0.1583251953125, 0.04864501953125, 0.255615234375, 0.46258544921875, 0.6695556640625, 0.87652587890625, 1.08349609375, 1.29046630859375, 1.4974365234375, 1.70440673828125, 1.911376953125, 2.11834716796875, 2.3253173828125, 2.53228759765625, 2.7392578125, 2.94622802734375, 3.1531982421875, 3.36016845703125, 3.567138671875, 3.77410888671875, 3.9810791015625, 4.18804931640625, 4.39501953125, 4.60198974609375, 4.8089599609375, 5.01593017578125, 5.222900390625, 5.42987060546875, 5.6368408203125, 5.84381103515625, 6.05078125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 5.0, 9.0, 8.0, 12.0, 17.0, 16.0, 29.0, 31.0, 43.0, 42.0, 54.0, 62.0, 80.0, 73.0, 124.0, 140.0, 143.0, 165.0, 164.0, 197.0, 176.0, 189.0, 229.0, 221.0, 218.0, 205.0, 196.0, 195.0, 159.0, 134.0, 120.0, 105.0, 95.0, 70.0, 60.0, 56.0, 48.0, 36.0, 39.0, 28.0, 22.0, 17.0, 10.0, 10.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9384765625, -1.8755340576171875, -1.812591552734375, -1.7496490478515625, -1.68670654296875, -1.6237640380859375, -1.560821533203125, -1.4978790283203125, -1.4349365234375, -1.3719940185546875, -1.309051513671875, -1.2461090087890625, -1.18316650390625, -1.1202239990234375, -1.057281494140625, -0.9943389892578125, -0.931396484375, -0.8684539794921875, -0.805511474609375, -0.7425689697265625, -0.67962646484375, -0.6166839599609375, -0.553741455078125, -0.4907989501953125, -0.4278564453125, -0.3649139404296875, -0.301971435546875, -0.2390289306640625, -0.17608642578125, -0.1131439208984375, -0.050201416015625, 0.0127410888671875, 0.07568359375, 0.1386260986328125, 0.201568603515625, 0.2645111083984375, 0.32745361328125, 0.3903961181640625, 0.453338623046875, 0.5162811279296875, 0.5792236328125, 0.6421661376953125, 0.705108642578125, 0.7680511474609375, 0.83099365234375, 0.8939361572265625, 0.956878662109375, 1.0198211669921875, 1.082763671875, 1.1457061767578125, 1.208648681640625, 1.2715911865234375, 1.33453369140625, 1.3974761962890625, 1.460418701171875, 1.5233612060546875, 1.5863037109375, 1.6492462158203125, 1.712188720703125, 1.7751312255859375, 1.83807373046875, 1.9010162353515625, 1.963958740234375, 2.0269012451171875, 2.08984375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 8.0, 10.0, 10.0, 13.0, 11.0, 14.0, 20.0, 18.0, 18.0, 25.0, 44.0, 37.0, 52.0, 40.0, 56.0, 45.0, 44.0, 62.0, 44.0, 36.0, 46.0, 38.0, 43.0, 34.0, 37.0, 30.0, 38.0, 25.0, 22.0, 15.0, 16.0, 9.0, 4.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.672953128814697, -6.461115837097168, -6.249279022216797, -6.037441730499268, -5.825604438781738, -5.613767147064209, -5.40192985534668, -5.190093040466309, -4.978255748748779, -4.76641845703125, -4.554581642150879, -4.34274435043335, -4.13090705871582, -3.919069766998291, -3.707232713699341, -3.4953956604003906, -3.2835583686828613, -3.071721076965332, -2.859884023666382, -2.6480469703674316, -2.4362096786499023, -2.224372386932373, -2.012535333633423, -1.800698161125183, -1.5888609886169434, -1.3770238161087036, -1.1651866436004639, -0.9533494710922241, -0.7415122985839844, -0.5296751260757446, -0.3178379535675049, -0.10600078105926514, 0.1058359146118164, 0.31767308712005615, 0.5295102596282959, 0.7413474321365356, 0.9531846046447754, 1.1650217771530151, 1.3768589496612549, 1.5886961221694946, 1.8005332946777344, 2.0123705863952637, 2.224207639694214, 2.436044692993164, 2.6478819847106934, 2.8597192764282227, 3.071556329727173, 3.283393383026123, 3.4952306747436523, 3.7070679664611816, 3.918905019760132, 4.130742073059082, 4.342579364776611, 4.554416656494141, 4.766253471374512, 4.978090763092041, 5.18992805480957, 5.4017653465271, 5.613602638244629, 5.825439453125, 6.037276744842529, 6.249114036560059, 6.46095085144043, 6.672788143157959, 6.884625434875488]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 6.0, 5.0, 5.0, 10.0, 12.0, 9.0, 12.0, 13.0, 22.0, 25.0, 18.0, 29.0, 32.0, 35.0, 41.0, 25.0, 33.0, 46.0, 47.0, 33.0, 27.0, 35.0, 39.0, 41.0, 34.0, 35.0, 47.0, 41.0, 34.0, 34.0, 22.0, 30.0, 14.0, 16.0, 22.0, 9.0, 15.0, 4.0, 4.0, 7.0, 9.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.070306777954102, -3.9342706203460693, -3.798234462738037, -3.662198543548584, -3.5261623859405518, -3.3901262283325195, -3.2540903091430664, -3.118054151535034, -2.982017993927002, -2.8459818363189697, -2.7099456787109375, -2.5739097595214844, -2.437873601913452, -2.30183744430542, -2.165801525115967, -2.0297653675079346, -1.8937292098999023, -1.7576930522918701, -1.6216570138931274, -1.4856209754943848, -1.3495848178863525, -1.2135486602783203, -1.0775126218795776, -0.9414765238761902, -0.8054404258728027, -0.6694043278694153, -0.5333682298660278, -0.3973321318626404, -0.26129603385925293, -0.12525993585586548, 0.010776162147521973, 0.14681226015090942, 0.28284788131713867, 0.4188839793205261, 0.5549200773239136, 0.690956175327301, 0.8269922733306885, 0.9630283713340759, 1.0990644693374634, 1.235100507736206, 1.3711366653442383, 1.5071728229522705, 1.6432088613510132, 1.7792448997497559, 1.915281057357788, 2.0513172149658203, 2.1873531341552734, 2.3233892917633057, 2.459425449371338, 2.59546160697937, 2.7314977645874023, 2.8675336837768555, 3.0035698413848877, 3.13960599899292, 3.275641918182373, 3.4116780757904053, 3.5477142333984375, 3.6837503910064697, 3.819786548614502, 3.955822467803955, 4.091858863830566, 4.2278947830200195, 4.363930702209473, 4.499967098236084, 4.636003017425537]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 8.0, 7.0, 12.0, 14.0, 17.0, 35.0, 56.0, 58.0, 119.0, 154.0, 249.0, 410.0, 584.0, 941.0, 1490.0, 2422.0, 3849.0, 6336.0, 10686.0, 18690.0, 32219.0, 56169.0, 98285.0, 161943.0, 212304.0, 177622.0, 110933.0, 64872.0, 36242.0, 20869.0, 12149.0, 7206.0, 4291.0, 2687.0, 1676.0, 1027.0, 668.0, 433.0, 288.0, 190.0, 114.0, 77.0, 42.0, 34.0, 28.0, 17.0, 11.0, 10.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0], "bins": [-1.2607421875, -1.223236083984375, -1.18572998046875, -1.148223876953125, -1.1107177734375, -1.073211669921875, -1.03570556640625, -0.998199462890625, -0.960693359375, -0.923187255859375, -0.88568115234375, -0.848175048828125, -0.8106689453125, -0.773162841796875, -0.73565673828125, -0.698150634765625, -0.66064453125, -0.623138427734375, -0.58563232421875, -0.548126220703125, -0.5106201171875, -0.473114013671875, -0.43560791015625, -0.398101806640625, -0.360595703125, -0.323089599609375, -0.28558349609375, -0.248077392578125, -0.2105712890625, -0.173065185546875, -0.13555908203125, -0.098052978515625, -0.060546875, -0.023040771484375, 0.01446533203125, 0.051971435546875, 0.0894775390625, 0.126983642578125, 0.16448974609375, 0.201995849609375, 0.239501953125, 0.277008056640625, 0.31451416015625, 0.352020263671875, 0.3895263671875, 0.427032470703125, 0.46453857421875, 0.502044677734375, 0.53955078125, 0.577056884765625, 0.61456298828125, 0.652069091796875, 0.6895751953125, 0.727081298828125, 0.76458740234375, 0.802093505859375, 0.839599609375, 0.877105712890625, 0.91461181640625, 0.952117919921875, 0.9896240234375, 1.027130126953125, 1.06463623046875, 1.102142333984375, 1.1396484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 3.0, 4.0, 12.0, 6.0, 8.0, 9.0, 11.0, 19.0, 17.0, 26.0, 23.0, 24.0, 18.0, 28.0, 22.0, 41.0, 33.0, 27.0, 45.0, 33.0, 46.0, 31.0, 43.0, 36.0, 41.0, 49.0, 35.0, 31.0, 31.0, 28.0, 27.0, 28.0, 26.0, 21.0, 22.0, 16.0, 20.0, 16.0, 2.0, 6.0, 6.0, 5.0, 7.0, 5.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.76171875, -4.61328125, -4.46484375, -4.31640625, -4.16796875, -4.01953125, -3.87109375, -3.72265625, -3.57421875, -3.42578125, -3.27734375, -3.12890625, -2.98046875, -2.83203125, -2.68359375, -2.53515625, -2.38671875, -2.23828125, -2.08984375, -1.94140625, -1.79296875, -1.64453125, -1.49609375, -1.34765625, -1.19921875, -1.05078125, -0.90234375, -0.75390625, -0.60546875, -0.45703125, -0.30859375, -0.16015625, -0.01171875, 0.13671875, 0.28515625, 0.43359375, 0.58203125, 0.73046875, 0.87890625, 1.02734375, 1.17578125, 1.32421875, 1.47265625, 1.62109375, 1.76953125, 1.91796875, 2.06640625, 2.21484375, 2.36328125, 2.51171875, 2.66015625, 2.80859375, 2.95703125, 3.10546875, 3.25390625, 3.40234375, 3.55078125, 3.69921875, 3.84765625, 3.99609375, 4.14453125, 4.29296875, 4.44140625, 4.58984375, 4.73828125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 6.0, 12.0, 15.0, 16.0, 34.0, 46.0, 68.0, 113.0, 166.0, 246.0, 386.0, 627.0, 1026.0, 1786.0, 3042.0, 5568.0, 10422.0, 19843.0, 39376.0, 80896.0, 161851.0, 263762.0, 222235.0, 118117.0, 57356.0, 28695.0, 14736.0, 7776.0, 4269.0, 2440.0, 1360.0, 856.0, 490.0, 339.0, 167.0, 143.0, 80.0, 70.0, 43.0, 24.0, 18.0, 8.0, 11.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7236328125, -1.6740570068359375, -1.624481201171875, -1.5749053955078125, -1.52532958984375, -1.4757537841796875, -1.426177978515625, -1.3766021728515625, -1.3270263671875, -1.2774505615234375, -1.227874755859375, -1.1782989501953125, -1.12872314453125, -1.0791473388671875, -1.029571533203125, -0.9799957275390625, -0.930419921875, -0.8808441162109375, -0.831268310546875, -0.7816925048828125, -0.73211669921875, -0.6825408935546875, -0.632965087890625, -0.5833892822265625, -0.5338134765625, -0.4842376708984375, -0.434661865234375, -0.3850860595703125, -0.33551025390625, -0.2859344482421875, -0.236358642578125, -0.1867828369140625, -0.13720703125, -0.0876312255859375, -0.038055419921875, 0.0115203857421875, 0.06109619140625, 0.1106719970703125, 0.160247802734375, 0.2098236083984375, 0.2593994140625, 0.3089752197265625, 0.358551025390625, 0.4081268310546875, 0.45770263671875, 0.5072784423828125, 0.556854248046875, 0.6064300537109375, 0.656005859375, 0.7055816650390625, 0.755157470703125, 0.8047332763671875, 0.85430908203125, 0.9038848876953125, 0.953460693359375, 1.0030364990234375, 1.0526123046875, 1.1021881103515625, 1.151763916015625, 1.2013397216796875, 1.25091552734375, 1.3004913330078125, 1.350067138671875, 1.3996429443359375, 1.44921875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 2.0, 7.0, 7.0, 11.0, 13.0, 8.0, 17.0, 18.0, 20.0, 20.0, 24.0, 29.0, 32.0, 34.0, 34.0, 33.0, 40.0, 51.0, 51.0, 43.0, 44.0, 41.0, 44.0, 44.0, 49.0, 39.0, 27.0, 31.0, 26.0, 23.0, 22.0, 24.0, 22.0, 19.0, 13.0, 10.0, 6.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.2890625, -3.187744140625, -3.08642578125, -2.985107421875, -2.8837890625, -2.782470703125, -2.68115234375, -2.579833984375, -2.478515625, -2.377197265625, -2.27587890625, -2.174560546875, -2.0732421875, -1.971923828125, -1.87060546875, -1.769287109375, -1.66796875, -1.566650390625, -1.46533203125, -1.364013671875, -1.2626953125, -1.161376953125, -1.06005859375, -0.958740234375, -0.857421875, -0.756103515625, -0.65478515625, -0.553466796875, -0.4521484375, -0.350830078125, -0.24951171875, -0.148193359375, -0.046875, 0.054443359375, 0.15576171875, 0.257080078125, 0.3583984375, 0.459716796875, 0.56103515625, 0.662353515625, 0.763671875, 0.864990234375, 0.96630859375, 1.067626953125, 1.1689453125, 1.270263671875, 1.37158203125, 1.472900390625, 1.57421875, 1.675537109375, 1.77685546875, 1.878173828125, 1.9794921875, 2.080810546875, 2.18212890625, 2.283447265625, 2.384765625, 2.486083984375, 2.58740234375, 2.688720703125, 2.7900390625, 2.891357421875, 2.99267578125, 3.093994140625, 3.1953125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 8.0, 8.0, 15.0, 21.0, 24.0, 31.0, 41.0, 67.0, 74.0, 92.0, 164.0, 198.0, 264.0, 436.0, 778.0, 1555.0, 4101.0, 14184.0, 74503.0, 557705.0, 335413.0, 43144.0, 9690.0, 2931.0, 1190.0, 636.0, 364.0, 246.0, 179.0, 119.0, 92.0, 79.0, 44.0, 43.0, 26.0, 27.0, 20.0, 10.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1669921875, -1.1314697265625, -1.095947265625, -1.0604248046875, -1.02490234375, -0.9893798828125, -0.953857421875, -0.9183349609375, -0.8828125, -0.8472900390625, -0.811767578125, -0.7762451171875, -0.74072265625, -0.7052001953125, -0.669677734375, -0.6341552734375, -0.5986328125, -0.5631103515625, -0.527587890625, -0.4920654296875, -0.45654296875, -0.4210205078125, -0.385498046875, -0.3499755859375, -0.314453125, -0.2789306640625, -0.243408203125, -0.2078857421875, -0.17236328125, -0.1368408203125, -0.101318359375, -0.0657958984375, -0.0302734375, 0.0052490234375, 0.040771484375, 0.0762939453125, 0.11181640625, 0.1473388671875, 0.182861328125, 0.2183837890625, 0.25390625, 0.2894287109375, 0.324951171875, 0.3604736328125, 0.39599609375, 0.4315185546875, 0.467041015625, 0.5025634765625, 0.5380859375, 0.5736083984375, 0.609130859375, 0.6446533203125, 0.68017578125, 0.7156982421875, 0.751220703125, 0.7867431640625, 0.822265625, 0.8577880859375, 0.893310546875, 0.9288330078125, 0.96435546875, 0.9998779296875, 1.035400390625, 1.0709228515625, 1.1064453125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 2.0, 8.0, 11.0, 17.0, 29.0, 43.0, 70.0, 91.0, 94.0, 127.0, 115.0, 104.0, 95.0, 63.0, 53.0, 26.0, 17.0, 15.0, 9.0, 8.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.947185516357422e-05, -4.78280708193779e-05, -4.618428647518158e-05, -4.454050213098526e-05, -4.289671778678894e-05, -4.125293344259262e-05, -3.96091490983963e-05, -3.796536475419998e-05, -3.632158041000366e-05, -3.467779606580734e-05, -3.303401172161102e-05, -3.13902273774147e-05, -2.9746443033218384e-05, -2.8102658689022064e-05, -2.6458874344825745e-05, -2.4815090000629425e-05, -2.3171305656433105e-05, -2.1527521312236786e-05, -1.9883736968040466e-05, -1.8239952623844147e-05, -1.6596168279647827e-05, -1.4952383935451508e-05, -1.3308599591255188e-05, -1.1664815247058868e-05, -1.0021030902862549e-05, -8.37724655866623e-06, -6.73346221446991e-06, -5.08967787027359e-06, -3.4458935260772705e-06, -1.802109181880951e-06, -1.5832483768463135e-07, 1.4854595065116882e-06, 3.129243850708008e-06, 4.773028194904327e-06, 6.416812539100647e-06, 8.060596883296967e-06, 9.704381227493286e-06, 1.1348165571689606e-05, 1.2991949915885925e-05, 1.4635734260082245e-05, 1.6279518604278564e-05, 1.7923302948474884e-05, 1.9567087292671204e-05, 2.1210871636867523e-05, 2.2854655981063843e-05, 2.4498440325260162e-05, 2.6142224669456482e-05, 2.77860090136528e-05, 2.942979335784912e-05, 3.107357770204544e-05, 3.271736204624176e-05, 3.436114639043808e-05, 3.60049307346344e-05, 3.764871507883072e-05, 3.929249942302704e-05, 4.093628376722336e-05, 4.258006811141968e-05, 4.4223852455616e-05, 4.586763679981232e-05, 4.7511421144008636e-05, 4.9155205488204956e-05, 5.0798989832401276e-05, 5.2442774176597595e-05, 5.4086558520793915e-05, 5.5730342864990234e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 11.0, 19.0, 26.0, 21.0, 33.0, 53.0, 92.0, 102.0, 143.0, 200.0, 261.0, 370.0, 466.0, 673.0, 958.0, 1314.0, 1919.0, 3436.0, 7729.0, 23780.0, 102146.0, 446180.0, 351039.0, 73680.0, 18277.0, 6415.0, 3020.0, 1783.0, 1178.0, 862.0, 620.0, 471.0, 324.0, 263.0, 186.0, 137.0, 107.0, 84.0, 47.0, 31.0, 21.0, 15.0, 16.0, 13.0, 9.0, 4.0, 7.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.189453125, -1.15216064453125, -1.1148681640625, -1.07757568359375, -1.040283203125, -1.00299072265625, -0.9656982421875, -0.92840576171875, -0.89111328125, -0.85382080078125, -0.8165283203125, -0.77923583984375, -0.741943359375, -0.70465087890625, -0.6673583984375, -0.63006591796875, -0.5927734375, -0.55548095703125, -0.5181884765625, -0.48089599609375, -0.443603515625, -0.40631103515625, -0.3690185546875, -0.33172607421875, -0.29443359375, -0.25714111328125, -0.2198486328125, -0.18255615234375, -0.145263671875, -0.10797119140625, -0.0706787109375, -0.03338623046875, 0.00390625, 0.04119873046875, 0.0784912109375, 0.11578369140625, 0.153076171875, 0.19036865234375, 0.2276611328125, 0.26495361328125, 0.30224609375, 0.33953857421875, 0.3768310546875, 0.41412353515625, 0.451416015625, 0.48870849609375, 0.5260009765625, 0.56329345703125, 0.6005859375, 0.63787841796875, 0.6751708984375, 0.71246337890625, 0.749755859375, 0.78704833984375, 0.8243408203125, 0.86163330078125, 0.89892578125, 0.93621826171875, 0.9735107421875, 1.01080322265625, 1.048095703125, 1.08538818359375, 1.1226806640625, 1.15997314453125, 1.197265625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 5.0, 21.0, 18.0, 20.0, 47.0, 61.0, 76.0, 122.0, 136.0, 115.0, 113.0, 86.0, 48.0, 37.0, 25.0, 17.0, 11.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.265869140625, -0.2577476501464844, -0.24962615966796875, -0.24150466918945312, -0.2333831787109375, -0.22526168823242188, -0.21714019775390625, -0.20901870727539062, -0.200897216796875, -0.19277572631835938, -0.18465423583984375, -0.17653274536132812, -0.1684112548828125, -0.16028976440429688, -0.15216827392578125, -0.14404678344726562, -0.13592529296875, -0.12780380249023438, -0.11968231201171875, -0.11156082153320312, -0.1034393310546875, -0.09531784057617188, -0.08719635009765625, -0.07907485961914062, -0.070953369140625, -0.06283187866210938, -0.05471038818359375, -0.046588897705078125, -0.0384674072265625, -0.030345916748046875, -0.02222442626953125, -0.014102935791015625, -0.0059814453125, 0.002140045166015625, 0.01026153564453125, 0.018383026123046875, 0.0265045166015625, 0.034626007080078125, 0.04274749755859375, 0.050868988037109375, 0.058990478515625, 0.06711196899414062, 0.07523345947265625, 0.08335494995117188, 0.0914764404296875, 0.09959793090820312, 0.10771942138671875, 0.11584091186523438, 0.12396240234375, 0.13208389282226562, 0.14020538330078125, 0.14832687377929688, 0.1564483642578125, 0.16456985473632812, 0.17269134521484375, 0.18081283569335938, 0.188934326171875, 0.19705581665039062, 0.20517730712890625, 0.21329879760742188, 0.2214202880859375, 0.22954177856445312, 0.23766326904296875, 0.24578475952148438, 0.25390625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 7.0, 13.0, 11.0, 13.0, 14.0, 11.0, 23.0, 18.0, 21.0, 39.0, 37.0, 56.0, 34.0, 58.0, 51.0, 41.0, 54.0, 50.0, 38.0, 43.0, 44.0, 45.0, 41.0, 33.0, 28.0, 38.0, 35.0, 16.0, 16.0, 19.0, 9.0, 10.0, 3.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80856466293335, -6.594701290130615, -6.380838394165039, -6.166975021362305, -5.9531121253967285, -5.739248752593994, -5.525385856628418, -5.311522483825684, -5.097659111022949, -4.883795738220215, -4.669932842254639, -4.456069469451904, -4.242206573486328, -4.028343200683594, -3.8144800662994385, -3.600616931915283, -3.386754035949707, -3.1728909015655518, -2.9590277671813965, -2.745164394378662, -2.531301498413086, -2.3174381256103516, -2.1035749912261963, -1.889711856842041, -1.6758487224578857, -1.4619855880737305, -1.2481224536895752, -1.0342592000961304, -0.8203960657119751, -0.6065329313278198, -0.392669677734375, -0.17880654335021973, 0.03505706787109375, 0.2489202320575714, 0.4627833962440491, 0.6766465902328491, 0.8905097246170044, 1.1043728590011597, 1.3182361125946045, 1.5320992469787598, 1.745962381362915, 1.9598255157470703, 2.1736886501312256, 2.387551784515381, 2.6014151573181152, 2.8152780532836914, 3.029141426086426, 3.243004560470581, 3.4568676948547363, 3.6707308292388916, 3.884593963623047, 4.098457336425781, 4.312320232391357, 4.526183605194092, 4.740046501159668, 4.953909873962402, 5.167773246765137, 5.381636619567871, 5.595499515533447, 5.809362888336182, 6.023225784301758, 6.237089157104492, 6.450952529907227, 6.664815425872803, 6.878678321838379]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 7.0, 3.0, 7.0, 7.0, 12.0, 13.0, 9.0, 13.0, 21.0, 30.0, 14.0, 29.0, 32.0, 33.0, 40.0, 31.0, 27.0, 54.0, 42.0, 34.0, 32.0, 29.0, 43.0, 41.0, 32.0, 34.0, 47.0, 44.0, 32.0, 35.0, 26.0, 25.0, 14.0, 17.0, 23.0, 9.0, 12.0, 5.0, 5.0, 9.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.087047100067139, -3.9503676891326904, -3.813688278198242, -3.677008867263794, -3.5403294563293457, -3.4036502838134766, -3.2669708728790283, -3.13029146194458, -2.993612051010132, -2.8569326400756836, -2.7202532291412354, -2.583573818206787, -2.446894645690918, -2.3102149963378906, -2.1735358238220215, -2.0368564128875732, -1.900177001953125, -1.7634975910186768, -1.6268181800842285, -1.4901388883590698, -1.3534594774246216, -1.2167800664901733, -1.0801007747650146, -0.9434213638305664, -0.8067419528961182, -0.6700625419616699, -0.5333831906318665, -0.3967038094997406, -0.26002442836761475, -0.1233450174331665, 0.013334333896636963, 0.15001368522644043, 0.28669309616088867, 0.4233724772930145, 0.5600518584251404, 0.6967312097549438, 0.8334106206893921, 0.9700900316238403, 1.106769323348999, 1.2434487342834473, 1.3801281452178955, 1.5168075561523438, 1.653486967086792, 1.7901662588119507, 1.926845669746399, 2.0635251998901367, 2.200204372406006, 2.336883783340454, 2.4735631942749023, 2.6102426052093506, 2.746922016143799, 2.883601427078247, 3.0202808380126953, 3.1569600105285645, 3.2936394214630127, 3.430318832397461, 3.566998243331909, 3.7036776542663574, 3.8403570652008057, 3.977036476135254, 4.113715648651123, 4.25039529800415, 4.3870744705200195, 4.523754119873047, 4.660433292388916]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 12.0, 22.0, 44.0, 72.0, 92.0, 147.0, 260.0, 421.0, 648.0, 994.0, 1729.0, 2607.0, 4146.0, 6347.0, 9787.0, 14983.0, 21961.0, 32579.0, 45299.0, 60023.0, 76395.0, 92095.0, 102728.0, 106200.0, 102489.0, 91035.0, 75790.0, 60251.0, 44454.0, 31356.0, 21979.0, 14740.0, 9577.0, 6387.0, 4034.0, 2558.0, 1627.0, 975.0, 611.0, 409.0, 268.0, 156.0, 113.0, 72.0, 39.0, 18.0, 11.0, 8.0, 8.0, 2.0, 1.0], "bins": [-3.697265625, -3.595916748046875, -3.49456787109375, -3.393218994140625, -3.2918701171875, -3.190521240234375, -3.08917236328125, -2.987823486328125, -2.886474609375, -2.785125732421875, -2.68377685546875, -2.582427978515625, -2.4810791015625, -2.379730224609375, -2.27838134765625, -2.177032470703125, -2.07568359375, -1.974334716796875, -1.87298583984375, -1.771636962890625, -1.6702880859375, -1.568939208984375, -1.46759033203125, -1.366241455078125, -1.264892578125, -1.163543701171875, -1.06219482421875, -0.960845947265625, -0.8594970703125, -0.758148193359375, -0.65679931640625, -0.555450439453125, -0.4541015625, -0.352752685546875, -0.25140380859375, -0.150054931640625, -0.0487060546875, 0.052642822265625, 0.15399169921875, 0.255340576171875, 0.356689453125, 0.458038330078125, 0.55938720703125, 0.660736083984375, 0.7620849609375, 0.863433837890625, 0.96478271484375, 1.066131591796875, 1.16748046875, 1.268829345703125, 1.37017822265625, 1.471527099609375, 1.5728759765625, 1.674224853515625, 1.77557373046875, 1.876922607421875, 1.978271484375, 2.079620361328125, 2.18096923828125, 2.282318115234375, 2.3836669921875, 2.485015869140625, 2.58636474609375, 2.687713623046875, 2.7890625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 4.0, 6.0, 10.0, 4.0, 9.0, 15.0, 13.0, 16.0, 19.0, 10.0, 29.0, 20.0, 25.0, 30.0, 48.0, 29.0, 30.0, 32.0, 39.0, 29.0, 42.0, 36.0, 41.0, 25.0, 45.0, 43.0, 43.0, 34.0, 30.0, 26.0, 26.0, 30.0, 22.0, 18.0, 19.0, 24.0, 11.0, 7.0, 4.0, 7.0, 12.0, 6.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.390625, -4.249755859375, -4.10888671875, -3.968017578125, -3.8271484375, -3.686279296875, -3.54541015625, -3.404541015625, -3.263671875, -3.122802734375, -2.98193359375, -2.841064453125, -2.7001953125, -2.559326171875, -2.41845703125, -2.277587890625, -2.13671875, -1.995849609375, -1.85498046875, -1.714111328125, -1.5732421875, -1.432373046875, -1.29150390625, -1.150634765625, -1.009765625, -0.868896484375, -0.72802734375, -0.587158203125, -0.4462890625, -0.305419921875, -0.16455078125, -0.023681640625, 0.1171875, 0.258056640625, 0.39892578125, 0.539794921875, 0.6806640625, 0.821533203125, 0.96240234375, 1.103271484375, 1.244140625, 1.385009765625, 1.52587890625, 1.666748046875, 1.8076171875, 1.948486328125, 2.08935546875, 2.230224609375, 2.37109375, 2.511962890625, 2.65283203125, 2.793701171875, 2.9345703125, 3.075439453125, 3.21630859375, 3.357177734375, 3.498046875, 3.638916015625, 3.77978515625, 3.920654296875, 4.0615234375, 4.202392578125, 4.34326171875, 4.484130859375, 4.625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 12.0, 14.0, 26.0, 31.0, 55.0, 88.0, 154.0, 217.0, 368.0, 626.0, 966.0, 1495.0, 2320.0, 3785.0, 6088.0, 9419.0, 14274.0, 21329.0, 31038.0, 43358.0, 58821.0, 74916.0, 90323.0, 101422.0, 105980.0, 102832.0, 92913.0, 77749.0, 61642.0, 46410.0, 33296.0, 22822.0, 15634.0, 10032.0, 6672.0, 4098.0, 2742.0, 1690.0, 1057.0, 697.0, 437.0, 270.0, 164.0, 104.0, 51.0, 52.0, 31.0, 19.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0], "bins": [-3.640625, -3.535400390625, -3.43017578125, -3.324951171875, -3.2197265625, -3.114501953125, -3.00927734375, -2.904052734375, -2.798828125, -2.693603515625, -2.58837890625, -2.483154296875, -2.3779296875, -2.272705078125, -2.16748046875, -2.062255859375, -1.95703125, -1.851806640625, -1.74658203125, -1.641357421875, -1.5361328125, -1.430908203125, -1.32568359375, -1.220458984375, -1.115234375, -1.010009765625, -0.90478515625, -0.799560546875, -0.6943359375, -0.589111328125, -0.48388671875, -0.378662109375, -0.2734375, -0.168212890625, -0.06298828125, 0.042236328125, 0.1474609375, 0.252685546875, 0.35791015625, 0.463134765625, 0.568359375, 0.673583984375, 0.77880859375, 0.884033203125, 0.9892578125, 1.094482421875, 1.19970703125, 1.304931640625, 1.41015625, 1.515380859375, 1.62060546875, 1.725830078125, 1.8310546875, 1.936279296875, 2.04150390625, 2.146728515625, 2.251953125, 2.357177734375, 2.46240234375, 2.567626953125, 2.6728515625, 2.778076171875, 2.88330078125, 2.988525390625, 3.09375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 5.0, 5.0, 6.0, 7.0, 11.0, 11.0, 8.0, 15.0, 17.0, 29.0, 30.0, 30.0, 29.0, 37.0, 39.0, 48.0, 32.0, 33.0, 42.0, 31.0, 39.0, 33.0, 46.0, 38.0, 53.0, 45.0, 31.0, 40.0, 29.0, 33.0, 20.0, 29.0, 20.0, 16.0, 12.0, 16.0, 9.0, 10.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.329864501953125, -3.22808837890625, -3.126312255859375, -3.0245361328125, -2.922760009765625, -2.82098388671875, -2.719207763671875, -2.617431640625, -2.515655517578125, -2.41387939453125, -2.312103271484375, -2.2103271484375, -2.108551025390625, -2.00677490234375, -1.904998779296875, -1.80322265625, -1.701446533203125, -1.59967041015625, -1.497894287109375, -1.3961181640625, -1.294342041015625, -1.19256591796875, -1.090789794921875, -0.989013671875, -0.887237548828125, -0.78546142578125, -0.683685302734375, -0.5819091796875, -0.480133056640625, -0.37835693359375, -0.276580810546875, -0.1748046875, -0.073028564453125, 0.02874755859375, 0.130523681640625, 0.2322998046875, 0.334075927734375, 0.43585205078125, 0.537628173828125, 0.639404296875, 0.741180419921875, 0.84295654296875, 0.944732666015625, 1.0465087890625, 1.148284912109375, 1.25006103515625, 1.351837158203125, 1.45361328125, 1.555389404296875, 1.65716552734375, 1.758941650390625, 1.8607177734375, 1.962493896484375, 2.06427001953125, 2.166046142578125, 2.267822265625, 2.369598388671875, 2.47137451171875, 2.573150634765625, 2.6749267578125, 2.776702880859375, 2.87847900390625, 2.980255126953125, 3.08203125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 9.0, 15.0, 27.0, 32.0, 50.0, 68.0, 100.0, 153.0, 243.0, 382.0, 595.0, 859.0, 1418.0, 2275.0, 3684.0, 6418.0, 11098.0, 19823.0, 35511.0, 62922.0, 106483.0, 156357.0, 184896.0, 167479.0, 119578.0, 72642.0, 41170.0, 22738.0, 12793.0, 7429.0, 4306.0, 2540.0, 1629.0, 986.0, 621.0, 400.0, 287.0, 188.0, 118.0, 79.0, 52.0, 37.0, 14.0, 14.0, 18.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.1484375, -3.05194091796875, -2.9554443359375, -2.85894775390625, -2.762451171875, -2.66595458984375, -2.5694580078125, -2.47296142578125, -2.37646484375, -2.27996826171875, -2.1834716796875, -2.08697509765625, -1.990478515625, -1.89398193359375, -1.7974853515625, -1.70098876953125, -1.6044921875, -1.50799560546875, -1.4114990234375, -1.31500244140625, -1.218505859375, -1.12200927734375, -1.0255126953125, -0.92901611328125, -0.83251953125, -0.73602294921875, -0.6395263671875, -0.54302978515625, -0.446533203125, -0.35003662109375, -0.2535400390625, -0.15704345703125, -0.060546875, 0.03594970703125, 0.1324462890625, 0.22894287109375, 0.325439453125, 0.42193603515625, 0.5184326171875, 0.61492919921875, 0.71142578125, 0.80792236328125, 0.9044189453125, 1.00091552734375, 1.097412109375, 1.19390869140625, 1.2904052734375, 1.38690185546875, 1.4833984375, 1.57989501953125, 1.6763916015625, 1.77288818359375, 1.869384765625, 1.96588134765625, 2.0623779296875, 2.15887451171875, 2.25537109375, 2.35186767578125, 2.4483642578125, 2.54486083984375, 2.641357421875, 2.73785400390625, 2.8343505859375, 2.93084716796875, 3.02734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 7.0, 9.0, 18.0, 16.0, 15.0, 27.0, 37.0, 36.0, 58.0, 78.0, 67.0, 69.0, 76.0, 81.0, 63.0, 72.0, 49.0, 52.0, 35.0, 37.0, 22.0, 25.0, 10.0, 13.0, 8.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003075599670410156, -0.0002962350845336914, -0.0002849102020263672, -0.00027358531951904297, -0.00026226043701171875, -0.00025093555450439453, -0.0002396106719970703, -0.0002282857894897461, -0.00021696090698242188, -0.00020563602447509766, -0.00019431114196777344, -0.00018298625946044922, -0.000171661376953125, -0.00016033649444580078, -0.00014901161193847656, -0.00013768672943115234, -0.00012636184692382812, -0.0001150369644165039, -0.00010371208190917969, -9.238719940185547e-05, -8.106231689453125e-05, -6.973743438720703e-05, -5.841255187988281e-05, -4.7087669372558594e-05, -3.5762786865234375e-05, -2.4437904357910156e-05, -1.3113021850585938e-05, -1.7881393432617188e-06, 9.5367431640625e-06, 2.086162567138672e-05, 3.218650817871094e-05, 4.3511390686035156e-05, 5.4836273193359375e-05, 6.61611557006836e-05, 7.748603820800781e-05, 8.881092071533203e-05, 0.00010013580322265625, 0.00011146068572998047, 0.0001227855682373047, 0.0001341104507446289, 0.00014543533325195312, 0.00015676021575927734, 0.00016808509826660156, 0.00017940998077392578, 0.00019073486328125, 0.00020205974578857422, 0.00021338462829589844, 0.00022470951080322266, 0.00023603439331054688, 0.0002473592758178711, 0.0002586841583251953, 0.00027000904083251953, 0.00028133392333984375, 0.00029265880584716797, 0.0003039836883544922, 0.0003153085708618164, 0.0003266334533691406, 0.00033795833587646484, 0.00034928321838378906, 0.0003606081008911133, 0.0003719329833984375, 0.0003832578659057617, 0.00039458274841308594, 0.00040590763092041016, 0.0004172325134277344]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 7.0, 8.0, 5.0, 11.0, 5.0, 12.0, 31.0, 24.0, 41.0, 70.0, 101.0, 120.0, 172.0, 287.0, 379.0, 622.0, 1043.0, 1698.0, 3106.0, 5529.0, 10473.0, 20655.0, 42530.0, 86704.0, 159193.0, 222504.0, 210720.0, 137900.0, 72274.0, 34840.0, 17120.0, 8773.0, 4814.0, 2657.0, 1563.0, 869.0, 559.0, 354.0, 251.0, 165.0, 95.0, 87.0, 62.0, 37.0, 27.0, 19.0, 8.0, 15.0, 10.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.71875, -3.59423828125, -3.4697265625, -3.34521484375, -3.220703125, -3.09619140625, -2.9716796875, -2.84716796875, -2.72265625, -2.59814453125, -2.4736328125, -2.34912109375, -2.224609375, -2.10009765625, -1.9755859375, -1.85107421875, -1.7265625, -1.60205078125, -1.4775390625, -1.35302734375, -1.228515625, -1.10400390625, -0.9794921875, -0.85498046875, -0.73046875, -0.60595703125, -0.4814453125, -0.35693359375, -0.232421875, -0.10791015625, 0.0166015625, 0.14111328125, 0.265625, 0.39013671875, 0.5146484375, 0.63916015625, 0.763671875, 0.88818359375, 1.0126953125, 1.13720703125, 1.26171875, 1.38623046875, 1.5107421875, 1.63525390625, 1.759765625, 1.88427734375, 2.0087890625, 2.13330078125, 2.2578125, 2.38232421875, 2.5068359375, 2.63134765625, 2.755859375, 2.88037109375, 3.0048828125, 3.12939453125, 3.25390625, 3.37841796875, 3.5029296875, 3.62744140625, 3.751953125, 3.87646484375, 4.0009765625, 4.12548828125, 4.25]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 5.0, 7.0, 4.0, 2.0, 10.0, 8.0, 7.0, 14.0, 12.0, 17.0, 28.0, 22.0, 29.0, 42.0, 46.0, 44.0, 56.0, 49.0, 46.0, 44.0, 63.0, 49.0, 52.0, 59.0, 44.0, 29.0, 39.0, 28.0, 27.0, 22.0, 15.0, 9.0, 16.0, 11.0, 7.0, 4.0, 6.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.740234375, -0.7150726318359375, -0.689910888671875, -0.6647491455078125, -0.63958740234375, -0.6144256591796875, -0.589263916015625, -0.5641021728515625, -0.5389404296875, -0.5137786865234375, -0.488616943359375, -0.4634552001953125, -0.43829345703125, -0.4131317138671875, -0.387969970703125, -0.3628082275390625, -0.337646484375, -0.3124847412109375, -0.287322998046875, -0.2621612548828125, -0.23699951171875, -0.2118377685546875, -0.186676025390625, -0.1615142822265625, -0.1363525390625, -0.1111907958984375, -0.086029052734375, -0.0608673095703125, -0.03570556640625, -0.0105438232421875, 0.014617919921875, 0.0397796630859375, 0.06494140625, 0.0901031494140625, 0.115264892578125, 0.1404266357421875, 0.16558837890625, 0.1907501220703125, 0.215911865234375, 0.2410736083984375, 0.2662353515625, 0.2913970947265625, 0.316558837890625, 0.3417205810546875, 0.36688232421875, 0.3920440673828125, 0.417205810546875, 0.4423675537109375, 0.467529296875, 0.4926910400390625, 0.517852783203125, 0.5430145263671875, 0.56817626953125, 0.5933380126953125, 0.618499755859375, 0.6436614990234375, 0.6688232421875, 0.6939849853515625, 0.719146728515625, 0.7443084716796875, 0.76947021484375, 0.7946319580078125, 0.819793701171875, 0.8449554443359375, 0.8701171875]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 9.0, 7.0, 12.0, 15.0, 14.0, 18.0, 14.0, 27.0, 26.0, 32.0, 35.0, 39.0, 61.0, 46.0, 44.0, 52.0, 43.0, 48.0, 55.0, 46.0, 36.0, 41.0, 37.0, 35.0, 32.0, 27.0, 25.0, 17.0, 19.0, 16.0, 13.0, 9.0, 9.0, 8.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.20192813873291, -5.988082408905029, -5.774236679077148, -5.560390949249268, -5.346545219421387, -5.132699012756348, -4.918853282928467, -4.705007553100586, -4.491161823272705, -4.277316093444824, -4.063470363616943, -3.8496243953704834, -3.6357786655426025, -3.4219329357147217, -3.2080869674682617, -2.994241237640381, -2.7803955078125, -2.566549777984619, -2.3527040481567383, -2.1388580799102783, -1.9250123500823975, -1.7111666202545166, -1.4973207712173462, -1.2834749221801758, -1.069629192352295, -0.8557834029197693, -0.6419376134872437, -0.428091824054718, -0.21424603462219238, -0.00040030479431152344, 0.2134455442428589, 0.4272913932800293, 0.6411375999450684, 0.854983389377594, 1.0688291788101196, 1.28267502784729, 1.496520757675171, 1.7103664875030518, 1.9242123365402222, 2.1380581855773926, 2.3519039154052734, 2.5657496452331543, 2.779595375061035, 2.993441343307495, 3.207287073135376, 3.421132802963257, 3.634978771209717, 3.8488245010375977, 4.0626702308654785, 4.276515960693359, 4.49036169052124, 4.704207420349121, 4.91805362701416, 5.131898880004883, 5.345745086669922, 5.559590816497803, 5.773436546325684, 5.9872822761535645, 6.201128005981445, 6.414973735809326, 6.628819465637207, 6.842665672302246, 7.056511402130127, 7.270357131958008, 7.484202861785889]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 1.0, 4.0, 1.0, 12.0, 10.0, 5.0, 10.0, 10.0, 17.0, 16.0, 22.0, 13.0, 20.0, 31.0, 28.0, 33.0, 35.0, 30.0, 35.0, 37.0, 34.0, 42.0, 32.0, 30.0, 35.0, 32.0, 46.0, 40.0, 44.0, 39.0, 21.0, 28.0, 36.0, 26.0, 20.0, 29.0, 20.0, 18.0, 10.0, 9.0, 8.0, 4.0, 6.0, 1.0, 7.0, 5.0, 4.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-4.300610065460205, -4.158552646636963, -4.016495227813721, -3.8744378089904785, -3.7323803901672363, -3.590322971343994, -3.448265314102173, -3.3062078952789307, -3.1641504764556885, -3.0220930576324463, -2.880035638809204, -2.737978219985962, -2.5959205627441406, -2.4538631439208984, -2.3118057250976562, -2.169748306274414, -2.027690887451172, -1.8856334686279297, -1.7435760498046875, -1.6015185117721558, -1.4594610929489136, -1.3174036741256714, -1.1753461360931396, -1.0332887172698975, -0.8912312984466553, -0.7491738796234131, -0.6071164011955261, -0.46505895256996155, -0.323001503944397, -0.18094408512115479, -0.03888660669326782, 0.10317087173461914, 0.24522829055786133, 0.3872857391834259, 0.5293431878089905, 0.6714006662368774, 0.8134580850601196, 0.9555155038833618, 1.0975730419158936, 1.2396304607391357, 1.381687879562378, 1.5237452983856201, 1.6658027172088623, 1.807860255241394, 1.9499176740646362, 2.091975212097168, 2.23403263092041, 2.3760900497436523, 2.5181474685668945, 2.6602048873901367, 2.802262306213379, 2.944319725036621, 3.0863771438598633, 3.2284345626831055, 3.3704922199249268, 3.512549638748169, 3.654607057571411, 3.7966644763946533, 3.9387218952178955, 4.080779552459717, 4.222836971282959, 4.364894390106201, 4.506951808929443, 4.6490092277526855, 4.791066646575928]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 11.0, 10.0, 13.0, 25.0, 43.0, 60.0, 86.0, 126.0, 235.0, 348.0, 550.0, 910.0, 1515.0, 2313.0, 4028.0, 6474.0, 11123.0, 18035.0, 29741.0, 48626.0, 78718.0, 122931.0, 185814.0, 266971.0, 360308.0, 446100.0, 499045.0, 500238.0, 448195.0, 363659.0, 271364.0, 189824.0, 126348.0, 81271.0, 50983.0, 31070.0, 18857.0, 11261.0, 6836.0, 4096.0, 2381.0, 1482.0, 918.0, 530.0, 320.0, 213.0, 114.0, 61.0, 48.0, 29.0, 12.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-5.74609375, -5.57720947265625, -5.4083251953125, -5.23944091796875, -5.070556640625, -4.90167236328125, -4.7327880859375, -4.56390380859375, -4.39501953125, -4.22613525390625, -4.0572509765625, -3.88836669921875, -3.719482421875, -3.55059814453125, -3.3817138671875, -3.21282958984375, -3.0439453125, -2.87506103515625, -2.7061767578125, -2.53729248046875, -2.368408203125, -2.19952392578125, -2.0306396484375, -1.86175537109375, -1.69287109375, -1.52398681640625, -1.3551025390625, -1.18621826171875, -1.017333984375, -0.84844970703125, -0.6795654296875, -0.51068115234375, -0.341796875, -0.17291259765625, -0.0040283203125, 0.16485595703125, 0.333740234375, 0.50262451171875, 0.6715087890625, 0.84039306640625, 1.00927734375, 1.17816162109375, 1.3470458984375, 1.51593017578125, 1.684814453125, 1.85369873046875, 2.0225830078125, 2.19146728515625, 2.3603515625, 2.52923583984375, 2.6981201171875, 2.86700439453125, 3.035888671875, 3.20477294921875, 3.3736572265625, 3.54254150390625, 3.71142578125, 3.88031005859375, 4.0491943359375, 4.21807861328125, 4.386962890625, 4.55584716796875, 4.7247314453125, 4.89361572265625, 5.0625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 9.0, 7.0, 5.0, 7.0, 11.0, 21.0, 18.0, 14.0, 15.0, 33.0, 26.0, 24.0, 24.0, 35.0, 32.0, 37.0, 32.0, 42.0, 33.0, 43.0, 46.0, 43.0, 37.0, 37.0, 37.0, 47.0, 36.0, 32.0, 30.0, 22.0, 25.0, 24.0, 22.0, 16.0, 15.0, 14.0, 11.0, 10.0, 9.0, 4.0, 8.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.3671875, -4.236724853515625, -4.10626220703125, -3.975799560546875, -3.8453369140625, -3.714874267578125, -3.58441162109375, -3.453948974609375, -3.323486328125, -3.193023681640625, -3.06256103515625, -2.932098388671875, -2.8016357421875, -2.671173095703125, -2.54071044921875, -2.410247802734375, -2.27978515625, -2.149322509765625, -2.01885986328125, -1.888397216796875, -1.7579345703125, -1.627471923828125, -1.49700927734375, -1.366546630859375, -1.236083984375, -1.105621337890625, -0.97515869140625, -0.844696044921875, -0.7142333984375, -0.583770751953125, -0.45330810546875, -0.322845458984375, -0.1923828125, -0.061920166015625, 0.06854248046875, 0.199005126953125, 0.3294677734375, 0.459930419921875, 0.59039306640625, 0.720855712890625, 0.851318359375, 0.981781005859375, 1.11224365234375, 1.242706298828125, 1.3731689453125, 1.503631591796875, 1.63409423828125, 1.764556884765625, 1.89501953125, 2.025482177734375, 2.15594482421875, 2.286407470703125, 2.4168701171875, 2.547332763671875, 2.67779541015625, 2.808258056640625, 2.938720703125, 3.069183349609375, 3.19964599609375, 3.330108642578125, 3.4605712890625, 3.591033935546875, 3.72149658203125, 3.851959228515625, 3.982421875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 5.0, 6.0, 4.0, 14.0, 18.0, 14.0, 38.0, 59.0, 101.0, 142.0, 293.0, 423.0, 809.0, 1297.0, 2145.0, 4052.0, 7195.0, 12196.0, 21671.0, 37520.0, 62789.0, 104134.0, 165269.0, 248552.0, 345872.0, 442942.0, 510550.0, 525875.0, 483457.0, 396573.0, 293819.0, 202399.0, 130567.0, 80536.0, 47978.0, 27742.0, 15926.0, 9147.0, 5253.0, 2931.0, 1666.0, 970.0, 568.0, 327.0, 188.0, 97.0, 63.0, 35.0, 18.0, 18.0, 10.0, 7.0, 10.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.6292724609375, -5.422607421875, -5.2159423828125, -5.00927734375, -4.8026123046875, -4.595947265625, -4.3892822265625, -4.1826171875, -3.9759521484375, -3.769287109375, -3.5626220703125, -3.35595703125, -3.1492919921875, -2.942626953125, -2.7359619140625, -2.529296875, -2.3226318359375, -2.115966796875, -1.9093017578125, -1.70263671875, -1.4959716796875, -1.289306640625, -1.0826416015625, -0.8759765625, -0.6693115234375, -0.462646484375, -0.2559814453125, -0.04931640625, 0.1573486328125, 0.364013671875, 0.5706787109375, 0.77734375, 0.9840087890625, 1.190673828125, 1.3973388671875, 1.60400390625, 1.8106689453125, 2.017333984375, 2.2239990234375, 2.4306640625, 2.6373291015625, 2.843994140625, 3.0506591796875, 3.25732421875, 3.4639892578125, 3.670654296875, 3.8773193359375, 4.083984375, 4.2906494140625, 4.497314453125, 4.7039794921875, 4.91064453125, 5.1173095703125, 5.323974609375, 5.5306396484375, 5.7373046875, 5.9439697265625, 6.150634765625, 6.3572998046875, 6.56396484375, 6.7706298828125, 6.977294921875, 7.1839599609375, 7.390625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 5.0, 4.0, 9.0, 12.0, 15.0, 21.0, 16.0, 16.0, 36.0, 33.0, 36.0, 51.0, 58.0, 80.0, 87.0, 108.0, 128.0, 137.0, 148.0, 164.0, 183.0, 193.0, 170.0, 207.0, 203.0, 190.0, 188.0, 174.0, 156.0, 174.0, 149.0, 139.0, 130.0, 99.0, 91.0, 89.0, 76.0, 61.0, 39.0, 44.0, 39.0, 25.0, 25.0, 12.0, 16.0, 8.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.20703125, -2.136993408203125, -2.06695556640625, -1.996917724609375, -1.9268798828125, -1.856842041015625, -1.78680419921875, -1.716766357421875, -1.646728515625, -1.576690673828125, -1.50665283203125, -1.436614990234375, -1.3665771484375, -1.296539306640625, -1.22650146484375, -1.156463623046875, -1.08642578125, -1.016387939453125, -0.94635009765625, -0.876312255859375, -0.8062744140625, -0.736236572265625, -0.66619873046875, -0.596160888671875, -0.526123046875, -0.456085205078125, -0.38604736328125, -0.316009521484375, -0.2459716796875, -0.175933837890625, -0.10589599609375, -0.035858154296875, 0.0341796875, 0.104217529296875, 0.17425537109375, 0.244293212890625, 0.3143310546875, 0.384368896484375, 0.45440673828125, 0.524444580078125, 0.594482421875, 0.664520263671875, 0.73455810546875, 0.804595947265625, 0.8746337890625, 0.944671630859375, 1.01470947265625, 1.084747314453125, 1.15478515625, 1.224822998046875, 1.29486083984375, 1.364898681640625, 1.4349365234375, 1.504974365234375, 1.57501220703125, 1.645050048828125, 1.715087890625, 1.785125732421875, 1.85516357421875, 1.925201416015625, 1.9952392578125, 2.065277099609375, 2.13531494140625, 2.205352783203125, 2.275390625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 8.0, 8.0, 9.0, 24.0, 18.0, 34.0, 35.0, 40.0, 42.0, 39.0, 47.0, 46.0, 37.0, 53.0, 44.0, 35.0, 53.0, 54.0, 38.0, 47.0, 33.0, 58.0, 32.0, 19.0, 27.0, 23.0, 18.0, 6.0, 19.0, 8.0, 8.0, 11.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.741555213928223, -8.470038414001465, -8.198522567749023, -7.927005767822266, -7.655489444732666, -7.383973121643066, -7.112456321716309, -6.840939998626709, -6.569423675537109, -6.29790735244751, -6.02639102935791, -5.754874229431152, -5.483357906341553, -5.211841583251953, -4.940324783325195, -4.668808460235596, -4.397292137145996, -4.1257758140563965, -3.8542592525482178, -3.582742691040039, -3.3112263679504395, -3.03971004486084, -2.768193483352661, -2.4966769218444824, -2.225160598754883, -1.9536441564559937, -1.6821277141571045, -1.4106112718582153, -1.1390948295593262, -0.867578387260437, -0.5960619449615479, -0.3245455026626587, -0.053028106689453125, 0.21848833560943604, 0.4900047779083252, 0.7615212202072144, 1.0330376625061035, 1.3045541048049927, 1.5760705471038818, 1.847586989402771, 2.11910343170166, 2.3906197547912598, 2.6621363162994385, 2.933652877807617, 3.205169200897217, 3.4766855239868164, 3.748202085494995, 4.019718647003174, 4.291234970092773, 4.562751293182373, 4.834267616271973, 5.1057844161987305, 5.37730073928833, 5.64881706237793, 5.9203338623046875, 6.191850185394287, 6.463366508483887, 6.734882831573486, 7.006399154663086, 7.277915954589844, 7.549432277679443, 7.820948600769043, 8.0924654006958, 8.363981246948242, 8.635498046875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 7.0, 11.0, 12.0, 16.0, 17.0, 20.0, 28.0, 29.0, 30.0, 32.0, 36.0, 43.0, 48.0, 33.0, 52.0, 52.0, 45.0, 63.0, 47.0, 42.0, 42.0, 40.0, 33.0, 36.0, 35.0, 30.0, 21.0, 15.0, 17.0, 18.0, 7.0, 8.0, 6.0, 4.0, 7.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.577807426452637, -6.385506629943848, -6.193205833435059, -6.0009050369262695, -5.8086042404174805, -5.61630392074585, -5.4240031242370605, -5.2317023277282715, -5.039401531219482, -4.847100734710693, -4.654799938201904, -4.462499141693115, -4.270198822021484, -4.077898025512695, -3.8855972290039062, -3.693296432495117, -3.500995635986328, -3.308694839477539, -3.11639404296875, -2.92409348487854, -2.731792688369751, -2.539491891860962, -2.347191333770752, -2.154890537261963, -1.9625897407531738, -1.7702889442443848, -1.5779882669448853, -1.3856875896453857, -1.1933867931365967, -1.0010859966278076, -0.8087853193283081, -0.6164846420288086, -0.42418384552001953, -0.23188310861587524, -0.03958237171173096, 0.15271836519241333, 0.3450191020965576, 0.5373198390007019, 0.7296205759048462, 0.9219212532043457, 1.1142220497131348, 1.3065228462219238, 1.4988235235214233, 1.6911242008209229, 1.883424997329712, 2.075725793838501, 2.268026351928711, 2.4603271484375, 2.652627944946289, 2.844928741455078, 3.037229537963867, 3.229530096054077, 3.421830892562866, 3.6141316890716553, 3.8064322471618652, 3.9987330436706543, 4.191033840179443, 4.383334636688232, 4.5756354331970215, 4.7679362297058105, 4.960236549377441, 5.1525373458862305, 5.3448381423950195, 5.537138938903809, 5.729439735412598]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 10.0, 14.0, 18.0, 19.0, 48.0, 59.0, 102.0, 114.0, 187.0, 277.0, 400.0, 555.0, 838.0, 1280.0, 1922.0, 2968.0, 4512.0, 7112.0, 11599.0, 18891.0, 31221.0, 51440.0, 86402.0, 137925.0, 191145.0, 180859.0, 123982.0, 76179.0, 45625.0, 27295.0, 16741.0, 10368.0, 6439.0, 4059.0, 2698.0, 1708.0, 1189.0, 753.0, 517.0, 356.0, 262.0, 147.0, 93.0, 78.0, 56.0, 38.0, 23.0, 11.0, 11.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.396484375, -1.3526763916015625, -1.308868408203125, -1.2650604248046875, -1.22125244140625, -1.1774444580078125, -1.133636474609375, -1.0898284912109375, -1.0460205078125, -1.0022125244140625, -0.958404541015625, -0.9145965576171875, -0.87078857421875, -0.8269805908203125, -0.783172607421875, -0.7393646240234375, -0.695556640625, -0.6517486572265625, -0.607940673828125, -0.5641326904296875, -0.52032470703125, -0.4765167236328125, -0.432708740234375, -0.3889007568359375, -0.3450927734375, -0.3012847900390625, -0.257476806640625, -0.2136688232421875, -0.16986083984375, -0.1260528564453125, -0.082244873046875, -0.0384368896484375, 0.00537109375, 0.0491790771484375, 0.092987060546875, 0.1367950439453125, 0.18060302734375, 0.2244110107421875, 0.268218994140625, 0.3120269775390625, 0.3558349609375, 0.3996429443359375, 0.443450927734375, 0.4872589111328125, 0.53106689453125, 0.5748748779296875, 0.618682861328125, 0.6624908447265625, 0.706298828125, 0.7501068115234375, 0.793914794921875, 0.8377227783203125, 0.88153076171875, 0.9253387451171875, 0.969146728515625, 1.0129547119140625, 1.0567626953125, 1.1005706787109375, 1.144378662109375, 1.1881866455078125, 1.23199462890625, 1.2758026123046875, 1.319610595703125, 1.3634185791015625, 1.4072265625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 6.0, 9.0, 16.0, 15.0, 10.0, 24.0, 21.0, 18.0, 21.0, 38.0, 32.0, 36.0, 50.0, 31.0, 42.0, 47.0, 42.0, 46.0, 41.0, 43.0, 57.0, 36.0, 31.0, 50.0, 27.0, 19.0, 21.0, 17.0, 28.0, 23.0, 19.0, 17.0, 18.0, 11.0, 11.0, 6.0, 8.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.63671875, -6.440673828125, -6.24462890625, -6.048583984375, -5.8525390625, -5.656494140625, -5.46044921875, -5.264404296875, -5.068359375, -4.872314453125, -4.67626953125, -4.480224609375, -4.2841796875, -4.088134765625, -3.89208984375, -3.696044921875, -3.5, -3.303955078125, -3.10791015625, -2.911865234375, -2.7158203125, -2.519775390625, -2.32373046875, -2.127685546875, -1.931640625, -1.735595703125, -1.53955078125, -1.343505859375, -1.1474609375, -0.951416015625, -0.75537109375, -0.559326171875, -0.36328125, -0.167236328125, 0.02880859375, 0.224853515625, 0.4208984375, 0.616943359375, 0.81298828125, 1.009033203125, 1.205078125, 1.401123046875, 1.59716796875, 1.793212890625, 1.9892578125, 2.185302734375, 2.38134765625, 2.577392578125, 2.7734375, 2.969482421875, 3.16552734375, 3.361572265625, 3.5576171875, 3.753662109375, 3.94970703125, 4.145751953125, 4.341796875, 4.537841796875, 4.73388671875, 4.929931640625, 5.1259765625, 5.322021484375, 5.51806640625, 5.714111328125, 5.91015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 26.0, 29.0, 31.0, 69.0, 87.0, 139.0, 180.0, 288.0, 408.0, 668.0, 1126.0, 1675.0, 2893.0, 4664.0, 7998.0, 13623.0, 24358.0, 43657.0, 80287.0, 146338.0, 227476.0, 210532.0, 125259.0, 68550.0, 37748.0, 20723.0, 11978.0, 6907.0, 4061.0, 2500.0, 1534.0, 981.0, 558.0, 413.0, 260.0, 164.0, 121.0, 80.0, 42.0, 39.0, 28.0, 16.0, 7.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-1.810546875, -1.7570953369140625, -1.703643798828125, -1.6501922607421875, -1.59674072265625, -1.5432891845703125, -1.489837646484375, -1.4363861083984375, -1.3829345703125, -1.3294830322265625, -1.276031494140625, -1.2225799560546875, -1.16912841796875, -1.1156768798828125, -1.062225341796875, -1.0087738037109375, -0.955322265625, -0.9018707275390625, -0.848419189453125, -0.7949676513671875, -0.74151611328125, -0.6880645751953125, -0.634613037109375, -0.5811614990234375, -0.5277099609375, -0.4742584228515625, -0.420806884765625, -0.3673553466796875, -0.31390380859375, -0.2604522705078125, -0.207000732421875, -0.1535491943359375, -0.10009765625, -0.0466461181640625, 0.006805419921875, 0.0602569580078125, 0.11370849609375, 0.1671600341796875, 0.220611572265625, 0.2740631103515625, 0.3275146484375, 0.3809661865234375, 0.434417724609375, 0.4878692626953125, 0.54132080078125, 0.5947723388671875, 0.648223876953125, 0.7016754150390625, 0.755126953125, 0.8085784912109375, 0.862030029296875, 0.9154815673828125, 0.96893310546875, 1.0223846435546875, 1.075836181640625, 1.1292877197265625, 1.1827392578125, 1.2361907958984375, 1.289642333984375, 1.3430938720703125, 1.39654541015625, 1.4499969482421875, 1.503448486328125, 1.5569000244140625, 1.6103515625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 16.0, 13.0, 10.0, 11.0, 14.0, 28.0, 17.0, 22.0, 21.0, 27.0, 28.0, 27.0, 39.0, 39.0, 44.0, 43.0, 34.0, 37.0, 36.0, 46.0, 51.0, 32.0, 31.0, 21.0, 32.0, 26.0, 33.0, 27.0, 23.0, 17.0, 22.0, 19.0, 19.0, 14.0, 14.0, 10.0, 10.0, 5.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.318359375, -3.2122802734375, -3.106201171875, -3.0001220703125, -2.89404296875, -2.7879638671875, -2.681884765625, -2.5758056640625, -2.4697265625, -2.3636474609375, -2.257568359375, -2.1514892578125, -2.04541015625, -1.9393310546875, -1.833251953125, -1.7271728515625, -1.62109375, -1.5150146484375, -1.408935546875, -1.3028564453125, -1.19677734375, -1.0906982421875, -0.984619140625, -0.8785400390625, -0.7724609375, -0.6663818359375, -0.560302734375, -0.4542236328125, -0.34814453125, -0.2420654296875, -0.135986328125, -0.0299072265625, 0.076171875, 0.1822509765625, 0.288330078125, 0.3944091796875, 0.50048828125, 0.6065673828125, 0.712646484375, 0.8187255859375, 0.9248046875, 1.0308837890625, 1.136962890625, 1.2430419921875, 1.34912109375, 1.4552001953125, 1.561279296875, 1.6673583984375, 1.7734375, 1.8795166015625, 1.985595703125, 2.0916748046875, 2.19775390625, 2.3038330078125, 2.409912109375, 2.5159912109375, 2.6220703125, 2.7281494140625, 2.834228515625, 2.9403076171875, 3.04638671875, 3.1524658203125, 3.258544921875, 3.3646240234375, 3.470703125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 10.0, 12.0, 13.0, 18.0, 20.0, 29.0, 55.0, 100.0, 127.0, 205.0, 268.0, 417.0, 690.0, 1028.0, 1800.0, 3098.0, 5721.0, 11769.0, 27272.0, 73973.0, 237806.0, 420358.0, 167648.0, 53842.0, 21089.0, 9683.0, 4780.0, 2616.0, 1442.0, 967.0, 596.0, 325.0, 232.0, 191.0, 114.0, 75.0, 46.0, 39.0, 17.0, 24.0, 13.0, 5.0, 4.0, 10.0, 7.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.78125, -0.7597579956054688, -0.7382659912109375, -0.7167739868164062, -0.695281982421875, -0.6737899780273438, -0.6522979736328125, -0.6308059692382812, -0.60931396484375, -0.5878219604492188, -0.5663299560546875, -0.5448379516601562, -0.523345947265625, -0.5018539428710938, -0.4803619384765625, -0.45886993408203125, -0.4373779296875, -0.41588592529296875, -0.3943939208984375, -0.37290191650390625, -0.351409912109375, -0.32991790771484375, -0.3084259033203125, -0.28693389892578125, -0.26544189453125, -0.24394989013671875, -0.2224578857421875, -0.20096588134765625, -0.179473876953125, -0.15798187255859375, -0.1364898681640625, -0.11499786376953125, -0.093505859375, -0.07201385498046875, -0.0505218505859375, -0.02902984619140625, -0.007537841796875, 0.01395416259765625, 0.0354461669921875, 0.05693817138671875, 0.07843017578125, 0.09992218017578125, 0.1214141845703125, 0.14290618896484375, 0.164398193359375, 0.18589019775390625, 0.2073822021484375, 0.22887420654296875, 0.2503662109375, 0.27185821533203125, 0.2933502197265625, 0.31484222412109375, 0.336334228515625, 0.35782623291015625, 0.3793182373046875, 0.40081024169921875, 0.42230224609375, 0.44379425048828125, 0.4652862548828125, 0.48677825927734375, 0.508270263671875, 0.5297622680664062, 0.5512542724609375, 0.5727462768554688, 0.59423828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 13.0, 6.0, 9.0, 12.0, 21.0, 24.0, 37.0, 35.0, 56.0, 70.0, 56.0, 87.0, 73.0, 65.0, 78.0, 63.0, 63.0, 43.0, 42.0, 29.0, 31.0, 20.0, 20.0, 7.0, 9.0, 7.0, 7.0, 8.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5822391510009766e-05, -3.466568887233734e-05, -3.350898623466492e-05, -3.235228359699249e-05, -3.119558095932007e-05, -3.0038878321647644e-05, -2.888217568397522e-05, -2.7725473046302795e-05, -2.656877040863037e-05, -2.5412067770957947e-05, -2.4255365133285522e-05, -2.3098662495613098e-05, -2.1941959857940674e-05, -2.078525722026825e-05, -1.9628554582595825e-05, -1.84718519449234e-05, -1.7315149307250977e-05, -1.6158446669578552e-05, -1.5001744031906128e-05, -1.3845041394233704e-05, -1.268833875656128e-05, -1.1531636118888855e-05, -1.037493348121643e-05, -9.218230843544006e-06, -8.061528205871582e-06, -6.904825568199158e-06, -5.748122930526733e-06, -4.591420292854309e-06, -3.4347176551818848e-06, -2.2780150175094604e-06, -1.1213123798370361e-06, 3.5390257835388184e-08, 1.1920928955078125e-06, 2.348795533180237e-06, 3.505498170852661e-06, 4.6622008085250854e-06, 5.81890344619751e-06, 6.975606083869934e-06, 8.132308721542358e-06, 9.289011359214783e-06, 1.0445713996887207e-05, 1.1602416634559631e-05, 1.2759119272232056e-05, 1.391582190990448e-05, 1.5072524547576904e-05, 1.622922718524933e-05, 1.7385929822921753e-05, 1.8542632460594177e-05, 1.96993350982666e-05, 2.0856037735939026e-05, 2.201274037361145e-05, 2.3169443011283875e-05, 2.43261456489563e-05, 2.5482848286628723e-05, 2.6639550924301147e-05, 2.7796253561973572e-05, 2.8952956199645996e-05, 3.010965883731842e-05, 3.1266361474990845e-05, 3.242306411266327e-05, 3.357976675033569e-05, 3.473646938800812e-05, 3.589317202568054e-05, 3.7049874663352966e-05, 3.820657730102539e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 8.0, 13.0, 20.0, 26.0, 30.0, 52.0, 66.0, 99.0, 125.0, 202.0, 280.0, 429.0, 596.0, 890.0, 1308.0, 1943.0, 3022.0, 5083.0, 8602.0, 15757.0, 30742.0, 66124.0, 150366.0, 294873.0, 247504.0, 113559.0, 50525.0, 24272.0, 12708.0, 7076.0, 4203.0, 2723.0, 1744.0, 1115.0, 758.0, 478.0, 374.0, 243.0, 182.0, 111.0, 88.0, 59.0, 51.0, 29.0, 26.0, 19.0, 15.0, 13.0, 5.0, 2.0, 2.0, 1.0, 4.0, 3.0], "bins": [-0.82177734375, -0.7974853515625, -0.773193359375, -0.7489013671875, -0.724609375, -0.7003173828125, -0.676025390625, -0.6517333984375, -0.62744140625, -0.6031494140625, -0.578857421875, -0.5545654296875, -0.5302734375, -0.5059814453125, -0.481689453125, -0.4573974609375, -0.43310546875, -0.4088134765625, -0.384521484375, -0.3602294921875, -0.3359375, -0.3116455078125, -0.287353515625, -0.2630615234375, -0.23876953125, -0.2144775390625, -0.190185546875, -0.1658935546875, -0.1416015625, -0.1173095703125, -0.093017578125, -0.0687255859375, -0.04443359375, -0.0201416015625, 0.004150390625, 0.0284423828125, 0.052734375, 0.0770263671875, 0.101318359375, 0.1256103515625, 0.14990234375, 0.1741943359375, 0.198486328125, 0.2227783203125, 0.2470703125, 0.2713623046875, 0.295654296875, 0.3199462890625, 0.34423828125, 0.3685302734375, 0.392822265625, 0.4171142578125, 0.44140625, 0.4656982421875, 0.489990234375, 0.5142822265625, 0.53857421875, 0.5628662109375, 0.587158203125, 0.6114501953125, 0.6357421875, 0.6600341796875, 0.684326171875, 0.7086181640625, 0.73291015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 8.0, 9.0, 14.0, 16.0, 15.0, 19.0, 33.0, 38.0, 62.0, 59.0, 74.0, 103.0, 142.0, 98.0, 69.0, 51.0, 35.0, 33.0, 20.0, 23.0, 14.0, 23.0, 8.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.278076171875, -0.2706108093261719, -0.26314544677734375, -0.2556800842285156, -0.2482147216796875, -0.24074935913085938, -0.23328399658203125, -0.22581863403320312, -0.218353271484375, -0.21088790893554688, -0.20342254638671875, -0.19595718383789062, -0.1884918212890625, -0.18102645874023438, -0.17356109619140625, -0.16609573364257812, -0.15863037109375, -0.15116500854492188, -0.14369964599609375, -0.13623428344726562, -0.1287689208984375, -0.12130355834960938, -0.11383819580078125, -0.10637283325195312, -0.098907470703125, -0.09144210815429688, -0.08397674560546875, -0.07651138305664062, -0.0690460205078125, -0.061580657958984375, -0.05411529541015625, -0.046649932861328125, -0.0391845703125, -0.031719207763671875, -0.02425384521484375, -0.016788482666015625, -0.0093231201171875, -0.001857757568359375, 0.00560760498046875, 0.013072967529296875, 0.020538330078125, 0.028003692626953125, 0.03546905517578125, 0.042934417724609375, 0.0503997802734375, 0.057865142822265625, 0.06533050537109375, 0.07279586791992188, 0.08026123046875, 0.08772659301757812, 0.09519195556640625, 0.10265731811523438, 0.1101226806640625, 0.11758804321289062, 0.12505340576171875, 0.13251876831054688, 0.139984130859375, 0.14744949340820312, 0.15491485595703125, 0.16238021850585938, 0.1698455810546875, 0.17731094360351562, 0.18477630615234375, 0.19224166870117188, 0.19970703125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 10.0, 18.0, 22.0, 30.0, 41.0, 33.0, 37.0, 43.0, 47.0, 56.0, 36.0, 41.0, 48.0, 42.0, 55.0, 46.0, 45.0, 42.0, 34.0, 52.0, 39.0, 26.0, 16.0, 31.0, 13.0, 12.0, 12.0, 12.0, 9.0, 7.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.763997077941895, -8.492717742919922, -8.221439361572266, -7.950160503387451, -7.678881645202637, -7.407602310180664, -7.13632345199585, -6.865044593811035, -6.593765735626221, -6.322486877441406, -6.051208019256592, -5.779929161071777, -5.508649826049805, -5.237371444702148, -4.966092109680176, -4.694813251495361, -4.423534393310547, -4.152255535125732, -3.880976676940918, -3.6096975803375244, -3.33841872215271, -3.0671398639678955, -2.795860767364502, -2.5245819091796875, -2.253303050994873, -1.9820241928100586, -1.7107452154159546, -1.4394662380218506, -1.1681873798370361, -0.8969085216522217, -0.6256295442581177, -0.35435056686401367, -0.08307266235351562, 0.1882062554359436, 0.45948517322540283, 0.7307640910148621, 1.0020430088043213, 1.2733218669891357, 1.5446008443832397, 1.8158798217773438, 2.087158679962158, 2.3584375381469727, 2.629716396331787, 2.9009954929351807, 3.172274351119995, 3.4435532093048096, 3.714832305908203, 3.9861111640930176, 4.257390022277832, 4.5286688804626465, 4.799947738647461, 5.071226596832275, 5.34250545501709, 5.6137847900390625, 5.885063648223877, 6.156342506408691, 6.427621364593506, 6.69890022277832, 6.970179080963135, 7.241457939147949, 7.512737274169922, 7.784015655517578, 8.05529499053955, 8.326574325561523, 8.59785270690918]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 6.0, 11.0, 7.0, 14.0, 18.0, 14.0, 20.0, 30.0, 24.0, 31.0, 32.0, 37.0, 39.0, 49.0, 41.0, 49.0, 47.0, 51.0, 60.0, 49.0, 42.0, 44.0, 41.0, 33.0, 38.0, 34.0, 31.0, 20.0, 13.0, 18.0, 20.0, 5.0, 9.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.703939437866211, -6.509706020355225, -6.31547212600708, -6.121238708496094, -5.927004814147949, -5.732771396636963, -5.538537979125977, -5.344304084777832, -5.1500701904296875, -4.955836772918701, -4.761602878570557, -4.56736946105957, -4.373135566711426, -4.1789021492004395, -3.984668493270874, -3.7904348373413086, -3.5962014198303223, -3.401967763900757, -3.2077341079711914, -3.013500690460205, -2.8192667961120605, -2.625033378601074, -2.430799722671509, -2.2365660667419434, -2.042332410812378, -1.8480987548828125, -1.653865098953247, -1.4596315622329712, -1.2653979063034058, -1.0711642503738403, -0.8769307136535645, -0.682697057723999, -0.4884629249572754, -0.29422929883003235, -0.0999956727027893, 0.09423792362213135, 0.2884715795516968, 0.4827052354812622, 0.6769387722015381, 0.8711724281311035, 1.065406084060669, 1.2596397399902344, 1.4538733959197998, 1.6481069326400757, 1.8423405885696411, 2.036574363708496, 2.2308077812194824, 2.425041437149048, 2.6192750930786133, 2.8135087490081787, 3.007742404937744, 3.2019758224487305, 3.396209716796875, 3.5904431343078613, 3.7846767902374268, 3.978910446166992, 4.173144340515137, 4.367377758026123, 4.561611652374268, 4.755845069885254, 4.950078964233398, 5.144312381744385, 5.338545799255371, 5.532779693603516, 5.727013111114502]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 7.0, 11.0, 22.0, 30.0, 51.0, 80.0, 145.0, 247.0, 317.0, 598.0, 1049.0, 1654.0, 2525.0, 3951.0, 6292.0, 9449.0, 14332.0, 21140.0, 30289.0, 41643.0, 55553.0, 71009.0, 85769.0, 95841.0, 102028.0, 100508.0, 92960.0, 79853.0, 64658.0, 50309.0, 37287.0, 26196.0, 18295.0, 12168.0, 8104.0, 5177.0, 3474.0, 2166.0, 1331.0, 776.0, 476.0, 312.0, 206.0, 115.0, 62.0, 40.0, 30.0, 12.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.912811279296875, -2.80413818359375, -2.695465087890625, -2.5867919921875, -2.478118896484375, -2.36944580078125, -2.260772705078125, -2.152099609375, -2.043426513671875, -1.93475341796875, -1.826080322265625, -1.7174072265625, -1.608734130859375, -1.50006103515625, -1.391387939453125, -1.28271484375, -1.174041748046875, -1.06536865234375, -0.956695556640625, -0.8480224609375, -0.739349365234375, -0.63067626953125, -0.522003173828125, -0.413330078125, -0.304656982421875, -0.19598388671875, -0.087310791015625, 0.0213623046875, 0.130035400390625, 0.23870849609375, 0.347381591796875, 0.4560546875, 0.564727783203125, 0.67340087890625, 0.782073974609375, 0.8907470703125, 0.999420166015625, 1.10809326171875, 1.216766357421875, 1.325439453125, 1.434112548828125, 1.54278564453125, 1.651458740234375, 1.7601318359375, 1.868804931640625, 1.97747802734375, 2.086151123046875, 2.19482421875, 2.303497314453125, 2.41217041015625, 2.520843505859375, 2.6295166015625, 2.738189697265625, 2.84686279296875, 2.955535888671875, 3.064208984375, 3.172882080078125, 3.28155517578125, 3.390228271484375, 3.4989013671875, 3.607574462890625, 3.71624755859375, 3.824920654296875, 3.93359375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 12.0, 8.0, 6.0, 12.0, 14.0, 18.0, 20.0, 20.0, 44.0, 24.0, 37.0, 42.0, 36.0, 44.0, 44.0, 46.0, 56.0, 37.0, 56.0, 37.0, 55.0, 44.0, 49.0, 38.0, 19.0, 26.0, 23.0, 22.0, 24.0, 18.0, 13.0, 15.0, 9.0, 5.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.4815673828125, -6.275634765625, -6.0697021484375, -5.86376953125, -5.6578369140625, -5.451904296875, -5.2459716796875, -5.0400390625, -4.8341064453125, -4.628173828125, -4.4222412109375, -4.21630859375, -4.0103759765625, -3.804443359375, -3.5985107421875, -3.392578125, -3.1866455078125, -2.980712890625, -2.7747802734375, -2.56884765625, -2.3629150390625, -2.156982421875, -1.9510498046875, -1.7451171875, -1.5391845703125, -1.333251953125, -1.1273193359375, -0.92138671875, -0.7154541015625, -0.509521484375, -0.3035888671875, -0.09765625, 0.1082763671875, 0.314208984375, 0.5201416015625, 0.72607421875, 0.9320068359375, 1.137939453125, 1.3438720703125, 1.5498046875, 1.7557373046875, 1.961669921875, 2.1676025390625, 2.37353515625, 2.5794677734375, 2.785400390625, 2.9913330078125, 3.197265625, 3.4031982421875, 3.609130859375, 3.8150634765625, 4.02099609375, 4.2269287109375, 4.432861328125, 4.6387939453125, 4.8447265625, 5.0506591796875, 5.256591796875, 5.4625244140625, 5.66845703125, 5.8743896484375, 6.080322265625, 6.2862548828125, 6.4921875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 14.0, 16.0, 27.0, 33.0, 72.0, 91.0, 146.0, 248.0, 378.0, 594.0, 913.0, 1388.0, 2186.0, 3173.0, 4752.0, 7060.0, 10329.0, 14696.0, 20764.0, 28174.0, 37303.0, 48306.0, 59222.0, 70581.0, 80328.0, 86985.0, 89547.0, 87138.0, 80466.0, 71124.0, 59988.0, 48752.0, 38060.0, 28414.0, 20730.0, 14917.0, 10376.0, 7058.0, 4792.0, 3241.0, 2209.0, 1357.0, 924.0, 608.0, 373.0, 248.0, 158.0, 91.0, 73.0, 50.0, 33.0, 22.0, 14.0, 4.0, 3.0, 3.0, 3.0, 2.0], "bins": [-3.12890625, -3.032684326171875, -2.93646240234375, -2.840240478515625, -2.7440185546875, -2.647796630859375, -2.55157470703125, -2.455352783203125, -2.359130859375, -2.262908935546875, -2.16668701171875, -2.070465087890625, -1.9742431640625, -1.878021240234375, -1.78179931640625, -1.685577392578125, -1.58935546875, -1.493133544921875, -1.39691162109375, -1.300689697265625, -1.2044677734375, -1.108245849609375, -1.01202392578125, -0.915802001953125, -0.819580078125, -0.723358154296875, -0.62713623046875, -0.530914306640625, -0.4346923828125, -0.338470458984375, -0.24224853515625, -0.146026611328125, -0.0498046875, 0.046417236328125, 0.14263916015625, 0.238861083984375, 0.3350830078125, 0.431304931640625, 0.52752685546875, 0.623748779296875, 0.719970703125, 0.816192626953125, 0.91241455078125, 1.008636474609375, 1.1048583984375, 1.201080322265625, 1.29730224609375, 1.393524169921875, 1.48974609375, 1.585968017578125, 1.68218994140625, 1.778411865234375, 1.8746337890625, 1.970855712890625, 2.06707763671875, 2.163299560546875, 2.259521484375, 2.355743408203125, 2.45196533203125, 2.548187255859375, 2.6444091796875, 2.740631103515625, 2.83685302734375, 2.933074951171875, 3.029296875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 8.0, 2.0, 11.0, 8.0, 11.0, 13.0, 18.0, 16.0, 22.0, 21.0, 29.0, 31.0, 27.0, 28.0, 30.0, 37.0, 38.0, 44.0, 35.0, 40.0, 42.0, 38.0, 41.0, 43.0, 47.0, 41.0, 25.0, 34.0, 29.0, 39.0, 27.0, 21.0, 21.0, 16.0, 9.0, 9.0, 8.0, 12.0, 9.0, 4.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.310546875, -3.198699951171875, -3.08685302734375, -2.975006103515625, -2.8631591796875, -2.751312255859375, -2.63946533203125, -2.527618408203125, -2.415771484375, -2.303924560546875, -2.19207763671875, -2.080230712890625, -1.9683837890625, -1.856536865234375, -1.74468994140625, -1.632843017578125, -1.52099609375, -1.409149169921875, -1.29730224609375, -1.185455322265625, -1.0736083984375, -0.961761474609375, -0.84991455078125, -0.738067626953125, -0.626220703125, -0.514373779296875, -0.40252685546875, -0.290679931640625, -0.1788330078125, -0.066986083984375, 0.04486083984375, 0.156707763671875, 0.2685546875, 0.380401611328125, 0.49224853515625, 0.604095458984375, 0.7159423828125, 0.827789306640625, 0.93963623046875, 1.051483154296875, 1.163330078125, 1.275177001953125, 1.38702392578125, 1.498870849609375, 1.6107177734375, 1.722564697265625, 1.83441162109375, 1.946258544921875, 2.05810546875, 2.169952392578125, 2.28179931640625, 2.393646240234375, 2.5054931640625, 2.617340087890625, 2.72918701171875, 2.841033935546875, 2.952880859375, 3.064727783203125, 3.17657470703125, 3.288421630859375, 3.4002685546875, 3.512115478515625, 3.62396240234375, 3.735809326171875, 3.84765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 8.0, 20.0, 18.0, 28.0, 42.0, 45.0, 87.0, 127.0, 164.0, 230.0, 370.0, 594.0, 826.0, 1366.0, 2069.0, 3408.0, 5233.0, 8527.0, 13709.0, 21914.0, 34443.0, 52678.0, 76116.0, 103096.0, 124857.0, 134277.0, 127312.0, 104674.0, 79374.0, 55010.0, 35964.0, 23064.0, 14398.0, 8954.0, 5634.0, 3476.0, 2259.0, 1426.0, 900.0, 584.0, 418.0, 260.0, 180.0, 129.0, 90.0, 57.0, 42.0, 30.0, 18.0, 15.0, 11.0, 7.0, 9.0, 2.0, 3.0, 0.0, 4.0], "bins": [-2.5234375, -2.4459228515625, -2.368408203125, -2.2908935546875, -2.21337890625, -2.1358642578125, -2.058349609375, -1.9808349609375, -1.9033203125, -1.8258056640625, -1.748291015625, -1.6707763671875, -1.59326171875, -1.5157470703125, -1.438232421875, -1.3607177734375, -1.283203125, -1.2056884765625, -1.128173828125, -1.0506591796875, -0.97314453125, -0.8956298828125, -0.818115234375, -0.7406005859375, -0.6630859375, -0.5855712890625, -0.508056640625, -0.4305419921875, -0.35302734375, -0.2755126953125, -0.197998046875, -0.1204833984375, -0.04296875, 0.0345458984375, 0.112060546875, 0.1895751953125, 0.26708984375, 0.3446044921875, 0.422119140625, 0.4996337890625, 0.5771484375, 0.6546630859375, 0.732177734375, 0.8096923828125, 0.88720703125, 0.9647216796875, 1.042236328125, 1.1197509765625, 1.197265625, 1.2747802734375, 1.352294921875, 1.4298095703125, 1.50732421875, 1.5848388671875, 1.662353515625, 1.7398681640625, 1.8173828125, 1.8948974609375, 1.972412109375, 2.0499267578125, 2.12744140625, 2.2049560546875, 2.282470703125, 2.3599853515625, 2.4375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 6.0, 15.0, 14.0, 19.0, 25.0, 24.0, 27.0, 39.0, 33.0, 47.0, 57.0, 67.0, 67.0, 91.0, 65.0, 63.0, 40.0, 54.0, 42.0, 32.0, 37.0, 31.0, 22.0, 16.0, 17.0, 11.0, 12.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004189014434814453, -0.0004082620143890381, -0.00039762258529663086, -0.00038698315620422363, -0.0003763437271118164, -0.0003657042980194092, -0.00035506486892700195, -0.0003444254398345947, -0.0003337860107421875, -0.0003231465816497803, -0.00031250715255737305, -0.0003018677234649658, -0.0002912282943725586, -0.00028058886528015137, -0.00026994943618774414, -0.0002593100070953369, -0.0002486705780029297, -0.00023803114891052246, -0.00022739171981811523, -0.000216752290725708, -0.00020611286163330078, -0.00019547343254089355, -0.00018483400344848633, -0.0001741945743560791, -0.00016355514526367188, -0.00015291571617126465, -0.00014227628707885742, -0.0001316368579864502, -0.00012099742889404297, -0.00011035799980163574, -9.971857070922852e-05, -8.907914161682129e-05, -7.843971252441406e-05, -6.780028343200684e-05, -5.716085433959961e-05, -4.652142524719238e-05, -3.5881996154785156e-05, -2.524256706237793e-05, -1.4603137969970703e-05, -3.9637088775634766e-06, 6.67572021484375e-06, 1.7315149307250977e-05, 2.7954578399658203e-05, 3.859400749206543e-05, 4.9233436584472656e-05, 5.987286567687988e-05, 7.051229476928711e-05, 8.115172386169434e-05, 9.179115295410156e-05, 0.00010243058204650879, 0.00011307001113891602, 0.00012370944023132324, 0.00013434886932373047, 0.0001449882984161377, 0.00015562772750854492, 0.00016626715660095215, 0.00017690658569335938, 0.0001875460147857666, 0.00019818544387817383, 0.00020882487297058105, 0.00021946430206298828, 0.0002301037311553955, 0.00024074316024780273, 0.00025138258934020996, 0.0002620220184326172]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 11.0, 12.0, 11.0, 21.0, 34.0, 49.0, 72.0, 120.0, 203.0, 283.0, 509.0, 748.0, 1404.0, 2288.0, 4190.0, 7770.0, 14576.0, 28134.0, 53884.0, 97557.0, 155561.0, 196851.0, 184605.0, 132630.0, 77970.0, 41693.0, 21781.0, 11475.0, 6103.0, 3484.0, 1882.0, 1005.0, 625.0, 382.0, 226.0, 141.0, 103.0, 46.0, 43.0, 18.0, 16.0, 14.0, 8.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.1468505859375, -4.024169921875, -3.9014892578125, -3.77880859375, -3.6561279296875, -3.533447265625, -3.4107666015625, -3.2880859375, -3.1654052734375, -3.042724609375, -2.9200439453125, -2.79736328125, -2.6746826171875, -2.552001953125, -2.4293212890625, -2.306640625, -2.1839599609375, -2.061279296875, -1.9385986328125, -1.81591796875, -1.6932373046875, -1.570556640625, -1.4478759765625, -1.3251953125, -1.2025146484375, -1.079833984375, -0.9571533203125, -0.83447265625, -0.7117919921875, -0.589111328125, -0.4664306640625, -0.34375, -0.2210693359375, -0.098388671875, 0.0242919921875, 0.14697265625, 0.2696533203125, 0.392333984375, 0.5150146484375, 0.6376953125, 0.7603759765625, 0.883056640625, 1.0057373046875, 1.12841796875, 1.2510986328125, 1.373779296875, 1.4964599609375, 1.619140625, 1.7418212890625, 1.864501953125, 1.9871826171875, 2.10986328125, 2.2325439453125, 2.355224609375, 2.4779052734375, 2.6005859375, 2.7232666015625, 2.845947265625, 2.9686279296875, 3.09130859375, 3.2139892578125, 3.336669921875, 3.4593505859375, 3.58203125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 3.0, 6.0, 4.0, 12.0, 22.0, 14.0, 25.0, 18.0, 24.0, 25.0, 51.0, 41.0, 50.0, 49.0, 51.0, 74.0, 65.0, 72.0, 57.0, 52.0, 53.0, 43.0, 29.0, 30.0, 27.0, 22.0, 19.0, 11.0, 12.0, 11.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87255859375, -0.8431015014648438, -0.8136444091796875, -0.7841873168945312, -0.754730224609375, -0.7252731323242188, -0.6958160400390625, -0.6663589477539062, -0.63690185546875, -0.6074447631835938, -0.5779876708984375, -0.5485305786132812, -0.519073486328125, -0.48961639404296875, -0.4601593017578125, -0.43070220947265625, -0.4012451171875, -0.37178802490234375, -0.3423309326171875, -0.31287384033203125, -0.283416748046875, -0.25395965576171875, -0.2245025634765625, -0.19504547119140625, -0.16558837890625, -0.13613128662109375, -0.1066741943359375, -0.07721710205078125, -0.047760009765625, -0.01830291748046875, 0.0111541748046875, 0.04061126708984375, 0.070068359375, 0.09952545166015625, 0.1289825439453125, 0.15843963623046875, 0.187896728515625, 0.21735382080078125, 0.2468109130859375, 0.27626800537109375, 0.30572509765625, 0.33518218994140625, 0.3646392822265625, 0.39409637451171875, 0.423553466796875, 0.45301055908203125, 0.4824676513671875, 0.5119247436523438, 0.5413818359375, 0.5708389282226562, 0.6002960205078125, 0.6297531127929688, 0.659210205078125, 0.6886672973632812, 0.7181243896484375, 0.7475814819335938, 0.77703857421875, 0.8064956665039062, 0.8359527587890625, 0.8654098510742188, 0.894866943359375, 0.9243240356445312, 0.9537811279296875, 0.9832382202148438, 1.0126953125]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 2.0, 5.0, 17.0, 15.0, 16.0, 19.0, 30.0, 34.0, 31.0, 37.0, 47.0, 41.0, 36.0, 47.0, 56.0, 42.0, 40.0, 39.0, 43.0, 44.0, 42.0, 48.0, 33.0, 39.0, 17.0, 30.0, 21.0, 22.0, 22.0, 14.0, 5.0, 11.0, 14.0, 8.0, 4.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.10930347442627, -7.853832244873047, -7.598361015319824, -7.34289026260376, -7.087419033050537, -6.8319478034973145, -6.57647705078125, -6.321005821228027, -6.065534591674805, -5.810063362121582, -5.554592132568359, -5.299121379852295, -5.043650150299072, -4.78817892074585, -4.532708168029785, -4.2772369384765625, -4.02176570892334, -3.766294479370117, -3.5108234882354736, -3.25535249710083, -2.9998812675476074, -2.7444100379943848, -2.488939046859741, -2.2334680557250977, -1.977996826171875, -1.722525715827942, -1.4670546054840088, -1.2115834951400757, -0.9561123847961426, -0.7006412744522095, -0.44517016410827637, -0.18969905376434326, 0.06577301025390625, 0.32124412059783936, 0.5767152309417725, 0.8321863412857056, 1.0876574516296387, 1.3431285619735718, 1.5985996723175049, 1.854070782661438, 2.109541893005371, 2.3650131225585938, 2.6204841136932373, 2.875955104827881, 3.1314263343811035, 3.386897563934326, 3.6423685550689697, 3.8978395462036133, 4.153310775756836, 4.408782005310059, 4.664253234863281, 4.919723987579346, 5.175195217132568, 5.430666446685791, 5.6861371994018555, 5.941608428955078, 6.197079658508301, 6.452550888061523, 6.708022117614746, 6.9634928703308105, 7.218964099884033, 7.474435329437256, 7.72990608215332, 7.985377311706543, 8.240848541259766]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 10.0, 17.0, 15.0, 15.0, 32.0, 19.0, 20.0, 35.0, 27.0, 31.0, 35.0, 29.0, 52.0, 41.0, 54.0, 50.0, 50.0, 43.0, 49.0, 42.0, 33.0, 44.0, 40.0, 37.0, 29.0, 23.0, 17.0, 18.0, 17.0, 10.0, 11.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.037112236022949, -6.83136510848999, -6.625617980957031, -6.419870853424072, -6.214123725891113, -6.008376121520996, -5.802629470825195, -5.596881866455078, -5.391134738922119, -5.18538761138916, -4.979640483856201, -4.773893356323242, -4.568146228790283, -4.362399101257324, -4.156651496887207, -3.950904369354248, -3.745157480239868, -3.539410352706909, -3.33366322517395, -3.127915859222412, -2.922168731689453, -2.716421604156494, -2.510674476623535, -2.304927349090576, -2.099180221557617, -1.8934330940246582, -1.6876858472824097, -1.4819387197494507, -1.2761914730072021, -1.0704443454742432, -0.8646972179412842, -0.6589499711990356, -0.4532027244567871, -0.24745555222034454, -0.04170837998390198, 0.1640387773513794, 0.36978596448898315, 0.5755331516265869, 0.7812802791595459, 0.9870275259017944, 1.1927746534347534, 1.3985217809677124, 1.604269027709961, 1.81001615524292, 2.015763282775879, 2.221510410308838, 2.427257537841797, 2.633004903793335, 2.838752031326294, 3.044499158859253, 3.250246286392212, 3.45599365234375, 3.661740779876709, 3.867487907409668, 4.073235034942627, 4.278982162475586, 4.484729290008545, 4.690476417541504, 4.896223545074463, 5.101970672607422, 5.307717800140381, 5.51346492767334, 5.719212532043457, 5.924959659576416, 6.130706787109375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 25.0, 33.0, 53.0, 84.0, 129.0, 205.0, 341.0, 545.0, 797.0, 1391.0, 2377.0, 3697.0, 6123.0, 10170.0, 16467.0, 27065.0, 43757.0, 70466.0, 109666.0, 166196.0, 240421.0, 327676.0, 413422.0, 476480.0, 495881.0, 461312.0, 389177.0, 302140.0, 216725.0, 150108.0, 97728.0, 62982.0, 39451.0, 23800.0, 14747.0, 8985.0, 5366.0, 3401.0, 1991.0, 1172.0, 680.0, 409.0, 259.0, 154.0, 87.0, 52.0, 41.0, 7.0, 13.0, 10.0, 1.0, 5.0, 3.0], "bins": [-7.05859375, -6.8590087890625, -6.659423828125, -6.4598388671875, -6.26025390625, -6.0606689453125, -5.861083984375, -5.6614990234375, -5.4619140625, -5.2623291015625, -5.062744140625, -4.8631591796875, -4.66357421875, -4.4639892578125, -4.264404296875, -4.0648193359375, -3.865234375, -3.6656494140625, -3.466064453125, -3.2664794921875, -3.06689453125, -2.8673095703125, -2.667724609375, -2.4681396484375, -2.2685546875, -2.0689697265625, -1.869384765625, -1.6697998046875, -1.47021484375, -1.2706298828125, -1.071044921875, -0.8714599609375, -0.671875, -0.4722900390625, -0.272705078125, -0.0731201171875, 0.12646484375, 0.3260498046875, 0.525634765625, 0.7252197265625, 0.9248046875, 1.1243896484375, 1.323974609375, 1.5235595703125, 1.72314453125, 1.9227294921875, 2.122314453125, 2.3218994140625, 2.521484375, 2.7210693359375, 2.920654296875, 3.1202392578125, 3.31982421875, 3.5194091796875, 3.718994140625, 3.9185791015625, 4.1181640625, 4.3177490234375, 4.517333984375, 4.7169189453125, 4.91650390625, 5.1160888671875, 5.315673828125, 5.5152587890625, 5.71484375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 7.0, 8.0, 10.0, 12.0, 10.0, 18.0, 20.0, 23.0, 24.0, 27.0, 28.0, 41.0, 45.0, 22.0, 39.0, 28.0, 43.0, 38.0, 46.0, 41.0, 51.0, 57.0, 44.0, 41.0, 32.0, 26.0, 35.0, 20.0, 25.0, 22.0, 20.0, 20.0, 15.0, 15.0, 9.0, 6.0, 3.0, 5.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5, -5.32708740234375, -5.1541748046875, -4.98126220703125, -4.808349609375, -4.63543701171875, -4.4625244140625, -4.28961181640625, -4.11669921875, -3.94378662109375, -3.7708740234375, -3.59796142578125, -3.425048828125, -3.25213623046875, -3.0792236328125, -2.90631103515625, -2.7333984375, -2.56048583984375, -2.3875732421875, -2.21466064453125, -2.041748046875, -1.86883544921875, -1.6959228515625, -1.52301025390625, -1.35009765625, -1.17718505859375, -1.0042724609375, -0.83135986328125, -0.658447265625, -0.48553466796875, -0.3126220703125, -0.13970947265625, 0.033203125, 0.20611572265625, 0.3790283203125, 0.55194091796875, 0.724853515625, 0.89776611328125, 1.0706787109375, 1.24359130859375, 1.41650390625, 1.58941650390625, 1.7623291015625, 1.93524169921875, 2.108154296875, 2.28106689453125, 2.4539794921875, 2.62689208984375, 2.7998046875, 2.97271728515625, 3.1456298828125, 3.31854248046875, 3.491455078125, 3.66436767578125, 3.8372802734375, 4.01019287109375, 4.18310546875, 4.35601806640625, 4.5289306640625, 4.70184326171875, 4.874755859375, 5.04766845703125, 5.2205810546875, 5.39349365234375, 5.56640625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 8.0, 13.0, 20.0, 33.0, 48.0, 69.0, 148.0, 180.0, 306.0, 456.0, 812.0, 1245.0, 2072.0, 3383.0, 5498.0, 8758.0, 14622.0, 22904.0, 36415.0, 58289.0, 88215.0, 132699.0, 189978.0, 260808.0, 337730.0, 406040.0, 449886.0, 456567.0, 423390.0, 362168.0, 286106.0, 212510.0, 150954.0, 101780.0, 66985.0, 42504.0, 26945.0, 16938.0, 10212.0, 6290.0, 3918.0, 2444.0, 1478.0, 924.0, 603.0, 353.0, 213.0, 149.0, 88.0, 52.0, 27.0, 18.0, 17.0, 11.0, 5.0, 4.0, 3.0, 2.0, 1.0], "bins": [-7.16796875, -6.94512939453125, -6.7222900390625, -6.49945068359375, -6.276611328125, -6.05377197265625, -5.8309326171875, -5.60809326171875, -5.38525390625, -5.16241455078125, -4.9395751953125, -4.71673583984375, -4.493896484375, -4.27105712890625, -4.0482177734375, -3.82537841796875, -3.6025390625, -3.37969970703125, -3.1568603515625, -2.93402099609375, -2.711181640625, -2.48834228515625, -2.2655029296875, -2.04266357421875, -1.81982421875, -1.59698486328125, -1.3741455078125, -1.15130615234375, -0.928466796875, -0.70562744140625, -0.4827880859375, -0.25994873046875, -0.037109375, 0.18572998046875, 0.4085693359375, 0.63140869140625, 0.854248046875, 1.07708740234375, 1.2999267578125, 1.52276611328125, 1.74560546875, 1.96844482421875, 2.1912841796875, 2.41412353515625, 2.636962890625, 2.85980224609375, 3.0826416015625, 3.30548095703125, 3.5283203125, 3.75115966796875, 3.9739990234375, 4.19683837890625, 4.419677734375, 4.64251708984375, 4.8653564453125, 5.08819580078125, 5.31103515625, 5.53387451171875, 5.7567138671875, 5.97955322265625, 6.202392578125, 6.42523193359375, 6.6480712890625, 6.87091064453125, 7.09375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 1.0, 3.0, 1.0, 4.0, 11.0, 12.0, 11.0, 16.0, 16.0, 26.0, 37.0, 34.0, 29.0, 57.0, 63.0, 57.0, 89.0, 84.0, 131.0, 133.0, 129.0, 155.0, 174.0, 173.0, 156.0, 171.0, 188.0, 182.0, 189.0, 190.0, 170.0, 176.0, 147.0, 160.0, 125.0, 125.0, 120.0, 93.0, 69.0, 76.0, 71.0, 50.0, 35.0, 28.0, 20.0, 22.0, 15.0, 9.0, 15.0, 6.0, 10.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.623046875, -2.5360107421875, -2.448974609375, -2.3619384765625, -2.27490234375, -2.1878662109375, -2.100830078125, -2.0137939453125, -1.9267578125, -1.8397216796875, -1.752685546875, -1.6656494140625, -1.57861328125, -1.4915771484375, -1.404541015625, -1.3175048828125, -1.23046875, -1.1434326171875, -1.056396484375, -0.9693603515625, -0.88232421875, -0.7952880859375, -0.708251953125, -0.6212158203125, -0.5341796875, -0.4471435546875, -0.360107421875, -0.2730712890625, -0.18603515625, -0.0989990234375, -0.011962890625, 0.0750732421875, 0.162109375, 0.2491455078125, 0.336181640625, 0.4232177734375, 0.51025390625, 0.5972900390625, 0.684326171875, 0.7713623046875, 0.8583984375, 0.9454345703125, 1.032470703125, 1.1195068359375, 1.20654296875, 1.2935791015625, 1.380615234375, 1.4676513671875, 1.5546875, 1.6417236328125, 1.728759765625, 1.8157958984375, 1.90283203125, 1.9898681640625, 2.076904296875, 2.1639404296875, 2.2509765625, 2.3380126953125, 2.425048828125, 2.5120849609375, 2.59912109375, 2.6861572265625, 2.773193359375, 2.8602294921875, 2.947265625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 7.0, 5.0, 9.0, 18.0, 21.0, 26.0, 32.0, 23.0, 35.0, 32.0, 39.0, 46.0, 45.0, 59.0, 60.0, 47.0, 58.0, 57.0, 53.0, 46.0, 39.0, 38.0, 31.0, 25.0, 20.0, 21.0, 24.0, 15.0, 18.0, 10.0, 11.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-12.073060035705566, -11.724485397338867, -11.375911712646484, -11.027337074279785, -10.678762435913086, -10.330188751220703, -9.981614112854004, -9.633039474487305, -9.284465789794922, -8.935891151428223, -8.58731746673584, -8.23874282836914, -7.8901686668396, -7.541594505310059, -7.193019866943359, -6.844445705413818, -6.495871543884277, -6.147297382354736, -5.798723220825195, -5.450148582458496, -5.101574420928955, -4.753000259399414, -4.404425621032715, -4.055851459503174, -3.707277297973633, -3.358703136444092, -3.0101287364959717, -2.6615543365478516, -2.3129801750183105, -1.96440589427948, -1.6158316135406494, -1.2672572135925293, -0.9186840057373047, -0.5701097249984741, -0.22153544425964355, 0.127038836479187, 0.4756131172180176, 0.8241873979568481, 1.1727616786956787, 1.5213360786437988, 1.8699102401733398, 2.218484401702881, 2.567058801651001, 2.915633201599121, 3.264207363128662, 3.612781524658203, 3.9613559246063232, 4.309930324554443, 4.658504486083984, 5.007078647613525, 5.355652809143066, 5.704227447509766, 6.052801609039307, 6.401375770568848, 6.749950408935547, 7.098524570465088, 7.447098731994629, 7.79567289352417, 8.144247055053711, 8.49282169342041, 8.84139633178711, 9.189970016479492, 9.538544654846191, 9.88711929321289, 10.235692977905273]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 0.0, 11.0, 11.0, 12.0, 4.0, 11.0, 15.0, 15.0, 27.0, 20.0, 26.0, 49.0, 26.0, 31.0, 29.0, 46.0, 38.0, 43.0, 44.0, 35.0, 57.0, 51.0, 36.0, 44.0, 31.0, 41.0, 33.0, 32.0, 26.0, 34.0, 14.0, 20.0, 12.0, 20.0, 11.0, 7.0, 9.0, 5.0, 2.0, 5.0, 4.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.456097602844238, -7.230588912963867, -7.005080223083496, -6.779571533203125, -6.554063320159912, -6.328554630279541, -6.10304594039917, -5.877537250518799, -5.652029037475586, -5.426520347595215, -5.201011657714844, -4.975502967834473, -4.74999475479126, -4.524486064910889, -4.298977375030518, -4.0734686851501465, -3.8479599952697754, -3.6224513053894043, -3.3969428539276123, -3.171434164047241, -2.945925712585449, -2.720417022705078, -2.494908332824707, -2.269399642944336, -2.043891191482544, -1.8183826208114624, -1.5928740501403809, -1.3673653602600098, -1.1418567895889282, -0.9163482189178467, -0.6908395290374756, -0.46533095836639404, -0.2398228645324707, -0.014314264059066772, 0.21119433641433716, 0.4367029666900635, 0.662211537361145, 0.8877201080322266, 1.1132287979125977, 1.3387373685836792, 1.5642459392547607, 1.7897545099258423, 2.015263080596924, 2.240771770477295, 2.466280460357666, 2.691788911819458, 2.917297601699829, 3.142806053161621, 3.368314743041992, 3.5938234329223633, 3.8193318843841553, 4.0448408126831055, 4.270349025726318, 4.4958577156066895, 4.7213664054870605, 4.946875095367432, 5.1723833084106445, 5.397891998291016, 5.623400688171387, 5.848909378051758, 6.074417591094971, 6.299926280975342, 6.525434970855713, 6.750943660736084, 6.976452350616455]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 10.0, 17.0, 13.0, 28.0, 31.0, 48.0, 61.0, 111.0, 152.0, 240.0, 355.0, 509.0, 729.0, 1126.0, 1640.0, 2664.0, 4199.0, 6613.0, 10510.0, 17119.0, 28089.0, 47070.0, 80103.0, 132370.0, 192447.0, 191034.0, 131689.0, 79372.0, 46608.0, 27845.0, 16849.0, 10492.0, 6507.0, 4153.0, 2698.0, 1679.0, 1054.0, 758.0, 492.0, 346.0, 240.0, 147.0, 117.0, 67.0, 52.0, 36.0, 23.0, 17.0, 9.0, 6.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.70703125, -1.6552886962890625, -1.603546142578125, -1.5518035888671875, -1.50006103515625, -1.4483184814453125, -1.396575927734375, -1.3448333740234375, -1.2930908203125, -1.2413482666015625, -1.189605712890625, -1.1378631591796875, -1.08612060546875, -1.0343780517578125, -0.982635498046875, -0.9308929443359375, -0.879150390625, -0.8274078369140625, -0.775665283203125, -0.7239227294921875, -0.67218017578125, -0.6204376220703125, -0.568695068359375, -0.5169525146484375, -0.4652099609375, -0.4134674072265625, -0.361724853515625, -0.3099822998046875, -0.25823974609375, -0.2064971923828125, -0.154754638671875, -0.1030120849609375, -0.05126953125, 0.0004730224609375, 0.052215576171875, 0.1039581298828125, 0.15570068359375, 0.2074432373046875, 0.259185791015625, 0.3109283447265625, 0.3626708984375, 0.4144134521484375, 0.466156005859375, 0.5178985595703125, 0.56964111328125, 0.6213836669921875, 0.673126220703125, 0.7248687744140625, 0.776611328125, 0.8283538818359375, 0.880096435546875, 0.9318389892578125, 0.98358154296875, 1.0353240966796875, 1.087066650390625, 1.1388092041015625, 1.1905517578125, 1.2422943115234375, 1.294036865234375, 1.3457794189453125, 1.39752197265625, 1.4492645263671875, 1.501007080078125, 1.5527496337890625, 1.6044921875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 7.0, 5.0, 9.0, 12.0, 8.0, 18.0, 20.0, 21.0, 26.0, 23.0, 29.0, 29.0, 43.0, 33.0, 28.0, 44.0, 40.0, 44.0, 45.0, 50.0, 50.0, 43.0, 43.0, 33.0, 37.0, 43.0, 20.0, 31.0, 20.0, 22.0, 20.0, 17.0, 17.0, 16.0, 5.0, 7.0, 12.0, 1.0, 6.0, 5.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.640625, -7.3946533203125, -7.148681640625, -6.9027099609375, -6.65673828125, -6.4107666015625, -6.164794921875, -5.9188232421875, -5.6728515625, -5.4268798828125, -5.180908203125, -4.9349365234375, -4.68896484375, -4.4429931640625, -4.197021484375, -3.9510498046875, -3.705078125, -3.4591064453125, -3.213134765625, -2.9671630859375, -2.72119140625, -2.4752197265625, -2.229248046875, -1.9832763671875, -1.7373046875, -1.4913330078125, -1.245361328125, -0.9993896484375, -0.75341796875, -0.5074462890625, -0.261474609375, -0.0155029296875, 0.23046875, 0.4764404296875, 0.722412109375, 0.9683837890625, 1.21435546875, 1.4603271484375, 1.706298828125, 1.9522705078125, 2.1982421875, 2.4442138671875, 2.690185546875, 2.9361572265625, 3.18212890625, 3.4281005859375, 3.674072265625, 3.9200439453125, 4.166015625, 4.4119873046875, 4.657958984375, 4.9039306640625, 5.14990234375, 5.3958740234375, 5.641845703125, 5.8878173828125, 6.1337890625, 6.3797607421875, 6.625732421875, 6.8717041015625, 7.11767578125, 7.3636474609375, 7.609619140625, 7.8555908203125, 8.1015625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 14.0, 17.0, 11.0, 32.0, 50.0, 68.0, 100.0, 131.0, 199.0, 342.0, 476.0, 834.0, 1332.0, 2090.0, 3817.0, 6646.0, 11916.0, 22178.0, 41570.0, 79408.0, 149606.0, 236420.0, 217529.0, 127628.0, 67588.0, 35279.0, 18883.0, 10294.0, 5609.0, 3334.0, 1945.0, 1183.0, 724.0, 422.0, 298.0, 176.0, 139.0, 78.0, 48.0, 45.0, 31.0, 19.0, 14.0, 8.0, 11.0, 0.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9423828125, -1.8773651123046875, -1.812347412109375, -1.7473297119140625, -1.68231201171875, -1.6172943115234375, -1.552276611328125, -1.4872589111328125, -1.4222412109375, -1.3572235107421875, -1.292205810546875, -1.2271881103515625, -1.16217041015625, -1.0971527099609375, -1.032135009765625, -0.9671173095703125, -0.902099609375, -0.8370819091796875, -0.772064208984375, -0.7070465087890625, -0.64202880859375, -0.5770111083984375, -0.511993408203125, -0.4469757080078125, -0.3819580078125, -0.3169403076171875, -0.251922607421875, -0.1869049072265625, -0.12188720703125, -0.0568695068359375, 0.008148193359375, 0.0731658935546875, 0.13818359375, 0.2032012939453125, 0.268218994140625, 0.3332366943359375, 0.39825439453125, 0.4632720947265625, 0.528289794921875, 0.5933074951171875, 0.6583251953125, 0.7233428955078125, 0.788360595703125, 0.8533782958984375, 0.91839599609375, 0.9834136962890625, 1.048431396484375, 1.1134490966796875, 1.178466796875, 1.2434844970703125, 1.308502197265625, 1.3735198974609375, 1.43853759765625, 1.5035552978515625, 1.568572998046875, 1.6335906982421875, 1.6986083984375, 1.7636260986328125, 1.828643798828125, 1.8936614990234375, 1.95867919921875, 2.0236968994140625, 2.088714599609375, 2.1537322998046875, 2.21875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 16.0, 7.0, 13.0, 12.0, 14.0, 11.0, 12.0, 26.0, 30.0, 25.0, 27.0, 18.0, 36.0, 36.0, 31.0, 28.0, 35.0, 32.0, 39.0, 34.0, 44.0, 34.0, 41.0, 45.0, 43.0, 33.0, 23.0, 25.0, 27.0, 23.0, 20.0, 18.0, 21.0, 21.0, 7.0, 14.0, 14.0, 12.0, 10.0, 4.0, 4.0, 12.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.919921875, -3.787567138671875, -3.65521240234375, -3.522857666015625, -3.3905029296875, -3.258148193359375, -3.12579345703125, -2.993438720703125, -2.861083984375, -2.728729248046875, -2.59637451171875, -2.464019775390625, -2.3316650390625, -2.199310302734375, -2.06695556640625, -1.934600830078125, -1.80224609375, -1.669891357421875, -1.53753662109375, -1.405181884765625, -1.2728271484375, -1.140472412109375, -1.00811767578125, -0.875762939453125, -0.743408203125, -0.611053466796875, -0.47869873046875, -0.346343994140625, -0.2139892578125, -0.081634521484375, 0.05072021484375, 0.183074951171875, 0.3154296875, 0.447784423828125, 0.58013916015625, 0.712493896484375, 0.8448486328125, 0.977203369140625, 1.10955810546875, 1.241912841796875, 1.374267578125, 1.506622314453125, 1.63897705078125, 1.771331787109375, 1.9036865234375, 2.036041259765625, 2.16839599609375, 2.300750732421875, 2.43310546875, 2.565460205078125, 2.69781494140625, 2.830169677734375, 2.9625244140625, 3.094879150390625, 3.22723388671875, 3.359588623046875, 3.491943359375, 3.624298095703125, 3.75665283203125, 3.889007568359375, 4.0213623046875, 4.153717041015625, 4.28607177734375, 4.418426513671875, 4.55078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 10.0, 6.0, 12.0, 15.0, 21.0, 27.0, 34.0, 53.0, 71.0, 97.0, 161.0, 248.0, 440.0, 760.0, 1344.0, 2952.0, 6426.0, 16677.0, 53704.0, 234290.0, 517715.0, 152275.0, 38030.0, 12674.0, 5219.0, 2421.0, 1192.0, 652.0, 336.0, 241.0, 121.0, 88.0, 55.0, 52.0, 30.0, 29.0, 18.0, 14.0, 14.0, 5.0, 14.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.2900390625, -1.2545623779296875, -1.219085693359375, -1.1836090087890625, -1.14813232421875, -1.1126556396484375, -1.077178955078125, -1.0417022705078125, -1.0062255859375, -0.9707489013671875, -0.935272216796875, -0.8997955322265625, -0.86431884765625, -0.8288421630859375, -0.793365478515625, -0.7578887939453125, -0.722412109375, -0.6869354248046875, -0.651458740234375, -0.6159820556640625, -0.58050537109375, -0.5450286865234375, -0.509552001953125, -0.4740753173828125, -0.4385986328125, -0.4031219482421875, -0.367645263671875, -0.3321685791015625, -0.29669189453125, -0.2612152099609375, -0.225738525390625, -0.1902618408203125, -0.15478515625, -0.1193084716796875, -0.083831787109375, -0.0483551025390625, -0.01287841796875, 0.0225982666015625, 0.058074951171875, 0.0935516357421875, 0.1290283203125, 0.1645050048828125, 0.199981689453125, 0.2354583740234375, 0.27093505859375, 0.3064117431640625, 0.341888427734375, 0.3773651123046875, 0.412841796875, 0.4483184814453125, 0.483795166015625, 0.5192718505859375, 0.55474853515625, 0.5902252197265625, 0.625701904296875, 0.6611785888671875, 0.6966552734375, 0.7321319580078125, 0.767608642578125, 0.8030853271484375, 0.83856201171875, 0.8740386962890625, 0.909515380859375, 0.9449920654296875, 0.98046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 7.0, 3.0, 16.0, 15.0, 8.0, 11.0, 26.0, 28.0, 36.0, 36.0, 51.0, 36.0, 42.0, 61.0, 53.0, 62.0, 40.0, 59.0, 57.0, 51.0, 39.0, 42.0, 37.0, 34.0, 36.0, 27.0, 18.0, 9.0, 17.0, 11.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.759695053100586e-05, -2.651941031217575e-05, -2.5441870093345642e-05, -2.4364329874515533e-05, -2.3286789655685425e-05, -2.2209249436855316e-05, -2.1131709218025208e-05, -2.00541689991951e-05, -1.897662878036499e-05, -1.789908856153488e-05, -1.6821548342704773e-05, -1.5744008123874664e-05, -1.4666467905044556e-05, -1.3588927686214447e-05, -1.2511387467384338e-05, -1.143384724855423e-05, -1.0356307029724121e-05, -9.278766810894012e-06, -8.201226592063904e-06, -7.123686373233795e-06, -6.0461461544036865e-06, -4.968605935573578e-06, -3.891065716743469e-06, -2.8135254979133606e-06, -1.735985279083252e-06, -6.584450602531433e-07, 4.1909515857696533e-07, 1.496635377407074e-06, 2.5741755962371826e-06, 3.6517158150672913e-06, 4.7292560338974e-06, 5.8067962527275085e-06, 6.884336471557617e-06, 7.961876690387726e-06, 9.039416909217834e-06, 1.0116957128047943e-05, 1.1194497346878052e-05, 1.227203756570816e-05, 1.3349577784538269e-05, 1.4427118003368378e-05, 1.5504658222198486e-05, 1.6582198441028595e-05, 1.7659738659858704e-05, 1.8737278878688812e-05, 1.981481909751892e-05, 2.089235931634903e-05, 2.1969899535179138e-05, 2.3047439754009247e-05, 2.4124979972839355e-05, 2.5202520191669464e-05, 2.6280060410499573e-05, 2.735760062932968e-05, 2.843514084815979e-05, 2.95126810669899e-05, 3.059022128582001e-05, 3.1667761504650116e-05, 3.2745301723480225e-05, 3.382284194231033e-05, 3.490038216114044e-05, 3.597792237997055e-05, 3.705546259880066e-05, 3.813300281763077e-05, 3.9210543036460876e-05, 4.0288083255290985e-05, 4.1365623474121094e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 14.0, 13.0, 15.0, 22.0, 25.0, 40.0, 48.0, 82.0, 103.0, 141.0, 220.0, 317.0, 495.0, 771.0, 1257.0, 1983.0, 3495.0, 6383.0, 12373.0, 24934.0, 54649.0, 130626.0, 291593.0, 286714.0, 127404.0, 53261.0, 24260.0, 11975.0, 6228.0, 3534.0, 2028.0, 1266.0, 773.0, 491.0, 299.0, 208.0, 143.0, 94.0, 75.0, 56.0, 52.0, 22.0, 18.0, 15.0, 14.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.064453125, -1.0311737060546875, -0.997894287109375, -0.9646148681640625, -0.93133544921875, -0.8980560302734375, -0.864776611328125, -0.8314971923828125, -0.7982177734375, -0.7649383544921875, -0.731658935546875, -0.6983795166015625, -0.66510009765625, -0.6318206787109375, -0.598541259765625, -0.5652618408203125, -0.531982421875, -0.4987030029296875, -0.465423583984375, -0.4321441650390625, -0.39886474609375, -0.3655853271484375, -0.332305908203125, -0.2990264892578125, -0.2657470703125, -0.2324676513671875, -0.199188232421875, -0.1659088134765625, -0.13262939453125, -0.0993499755859375, -0.066070556640625, -0.0327911376953125, 0.00048828125, 0.0337677001953125, 0.067047119140625, 0.1003265380859375, 0.13360595703125, 0.1668853759765625, 0.200164794921875, 0.2334442138671875, 0.2667236328125, 0.3000030517578125, 0.333282470703125, 0.3665618896484375, 0.39984130859375, 0.4331207275390625, 0.466400146484375, 0.4996795654296875, 0.532958984375, 0.5662384033203125, 0.599517822265625, 0.6327972412109375, 0.66607666015625, 0.6993560791015625, 0.732635498046875, 0.7659149169921875, 0.7991943359375, 0.8324737548828125, 0.865753173828125, 0.8990325927734375, 0.93231201171875, 0.9655914306640625, 0.998870849609375, 1.0321502685546875, 1.0654296875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 8.0, 10.0, 12.0, 11.0, 10.0, 9.0, 17.0, 15.0, 25.0, 20.0, 35.0, 43.0, 62.0, 76.0, 111.0, 98.0, 86.0, 70.0, 45.0, 39.0, 27.0, 27.0, 20.0, 20.0, 12.0, 10.0, 7.0, 14.0, 7.0, 10.0, 8.0, 3.0, 8.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.294189453125, -0.2862052917480469, -0.27822113037109375, -0.2702369689941406, -0.2622528076171875, -0.2542686462402344, -0.24628448486328125, -0.23830032348632812, -0.230316162109375, -0.22233200073242188, -0.21434783935546875, -0.20636367797851562, -0.1983795166015625, -0.19039535522460938, -0.18241119384765625, -0.17442703247070312, -0.16644287109375, -0.15845870971679688, -0.15047454833984375, -0.14249038696289062, -0.1345062255859375, -0.12652206420898438, -0.11853790283203125, -0.11055374145507812, -0.102569580078125, -0.09458541870117188, -0.08660125732421875, -0.07861709594726562, -0.0706329345703125, -0.06264877319335938, -0.05466461181640625, -0.046680450439453125, -0.0386962890625, -0.030712127685546875, -0.02272796630859375, -0.014743804931640625, -0.0067596435546875, 0.001224517822265625, 0.00920867919921875, 0.017192840576171875, 0.025177001953125, 0.033161163330078125, 0.04114532470703125, 0.049129486083984375, 0.0571136474609375, 0.06509780883789062, 0.07308197021484375, 0.08106613159179688, 0.08905029296875, 0.09703445434570312, 0.10501861572265625, 0.11300277709960938, 0.1209869384765625, 0.12897109985351562, 0.13695526123046875, 0.14493942260742188, 0.152923583984375, 0.16090774536132812, 0.16889190673828125, 0.17687606811523438, 0.1848602294921875, 0.19284439086914062, 0.20082855224609375, 0.20881271362304688, 0.216796875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 8.0, 17.0, 19.0, 23.0, 30.0, 30.0, 27.0, 41.0, 35.0, 44.0, 47.0, 48.0, 65.0, 55.0, 49.0, 66.0, 47.0, 44.0, 48.0, 37.0, 26.0, 32.0, 18.0, 23.0, 18.0, 22.0, 15.0, 9.0, 15.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-12.130864143371582, -11.783266067504883, -11.4356689453125, -11.0880708694458, -10.740472793579102, -10.392874717712402, -10.045276641845703, -9.69767951965332, -9.350081443786621, -9.002483367919922, -8.654886245727539, -8.30728816986084, -7.959690093994141, -7.612092018127441, -7.2644944190979, -6.916896820068359, -6.56929874420166, -6.221700668334961, -5.87410306930542, -5.526505470275879, -5.17890739440918, -4.8313093185424805, -4.4837117195129395, -4.136114120483398, -3.788516044616699, -3.440918207168579, -3.093320369720459, -2.745722532272339, -2.3981246948242188, -2.0505268573760986, -1.7029290199279785, -1.3553311824798584, -1.0077342987060547, -0.6601364612579346, -0.31253862380981445, 0.035059213638305664, 0.3826570510864258, 0.7302548885345459, 1.077852725982666, 1.4254505634307861, 1.7730484008789062, 2.1206462383270264, 2.4682440757751465, 2.8158419132232666, 3.1634397506713867, 3.511037588119507, 3.858635425567627, 4.206233024597168, 4.553831100463867, 4.901429176330566, 5.249026775360107, 5.596624374389648, 5.944222450256348, 6.291820526123047, 6.639418125152588, 6.987015724182129, 7.334613800048828, 7.682211875915527, 8.029809951782227, 8.37740707397461, 8.725005149841309, 9.072603225708008, 9.42020034790039, 9.76779842376709, 10.115396499633789]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 2.0, 7.0, 11.0, 12.0, 5.0, 10.0, 16.0, 15.0, 23.0, 22.0, 23.0, 43.0, 32.0, 34.0, 25.0, 45.0, 42.0, 35.0, 52.0, 35.0, 49.0, 52.0, 40.0, 49.0, 27.0, 41.0, 38.0, 31.0, 24.0, 36.0, 17.0, 16.0, 15.0, 17.0, 12.0, 9.0, 10.0, 5.0, 2.0, 6.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.47013521194458, -7.243905067443848, -7.017674922943115, -6.791444778442383, -6.565214157104492, -6.338984489440918, -6.112753868103027, -5.886523723602295, -5.6602935791015625, -5.43406343460083, -5.207833290100098, -4.981603145599365, -4.755373001098633, -4.529142379760742, -4.30291223526001, -4.076682090759277, -3.850451946258545, -3.6242218017578125, -3.39799165725708, -3.1717612743377686, -2.945531129837036, -2.7193009853363037, -2.493070602416992, -2.2668404579162598, -2.0406103134155273, -1.814380168914795, -1.588149905204773, -1.361919641494751, -1.1356894969940186, -0.9094593524932861, -0.6832290887832642, -0.4569988250732422, -0.23076820373535156, -0.004537999629974365, 0.22169220447540283, 0.44792240858078003, 0.6741526126861572, 0.9003827571868896, 1.1266130208969116, 1.3528432846069336, 1.579073429107666, 1.8053035736083984, 2.031533718109131, 2.2577641010284424, 2.483994245529175, 2.7102243900299072, 2.9364547729492188, 3.162684917449951, 3.3889150619506836, 3.615145206451416, 3.8413753509521484, 4.067605495452881, 4.293835639953613, 4.520066261291504, 4.746296405792236, 4.972526550292969, 5.198756694793701, 5.424986839294434, 5.651216983795166, 5.877447128295898, 6.103677749633789, 6.329907417297363, 6.556138038635254, 6.782368183135986, 7.008598327636719]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 9.0, 13.0, 18.0, 33.0, 36.0, 69.0, 99.0, 163.0, 263.0, 425.0, 668.0, 973.0, 1566.0, 2332.0, 3740.0, 5764.0, 8882.0, 13170.0, 19482.0, 28085.0, 39300.0, 53078.0, 67883.0, 82291.0, 94117.0, 101567.0, 101543.0, 94101.0, 82687.0, 67988.0, 52851.0, 39268.0, 28111.0, 19456.0, 13458.0, 8948.0, 5850.0, 3693.0, 2344.0, 1476.0, 969.0, 642.0, 405.0, 270.0, 184.0, 92.0, 70.0, 45.0, 36.0, 20.0, 8.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.171875, -4.04150390625, -3.9111328125, -3.78076171875, -3.650390625, -3.52001953125, -3.3896484375, -3.25927734375, -3.12890625, -2.99853515625, -2.8681640625, -2.73779296875, -2.607421875, -2.47705078125, -2.3466796875, -2.21630859375, -2.0859375, -1.95556640625, -1.8251953125, -1.69482421875, -1.564453125, -1.43408203125, -1.3037109375, -1.17333984375, -1.04296875, -0.91259765625, -0.7822265625, -0.65185546875, -0.521484375, -0.39111328125, -0.2607421875, -0.13037109375, 0.0, 0.13037109375, 0.2607421875, 0.39111328125, 0.521484375, 0.65185546875, 0.7822265625, 0.91259765625, 1.04296875, 1.17333984375, 1.3037109375, 1.43408203125, 1.564453125, 1.69482421875, 1.8251953125, 1.95556640625, 2.0859375, 2.21630859375, 2.3466796875, 2.47705078125, 2.607421875, 2.73779296875, 2.8681640625, 2.99853515625, 3.12890625, 3.25927734375, 3.3896484375, 3.52001953125, 3.650390625, 3.78076171875, 3.9111328125, 4.04150390625, 4.171875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 10.0, 13.0, 15.0, 12.0, 20.0, 19.0, 18.0, 20.0, 27.0, 25.0, 25.0, 25.0, 37.0, 27.0, 46.0, 41.0, 34.0, 34.0, 32.0, 40.0, 36.0, 51.0, 34.0, 34.0, 34.0, 27.0, 36.0, 21.0, 30.0, 18.0, 22.0, 20.0, 16.0, 10.0, 10.0, 7.0, 11.0, 8.0, 6.0, 5.0, 9.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.75390625, -6.53973388671875, -6.3255615234375, -6.11138916015625, -5.897216796875, -5.68304443359375, -5.4688720703125, -5.25469970703125, -5.04052734375, -4.82635498046875, -4.6121826171875, -4.39801025390625, -4.183837890625, -3.96966552734375, -3.7554931640625, -3.54132080078125, -3.3271484375, -3.11297607421875, -2.8988037109375, -2.68463134765625, -2.470458984375, -2.25628662109375, -2.0421142578125, -1.82794189453125, -1.61376953125, -1.39959716796875, -1.1854248046875, -0.97125244140625, -0.757080078125, -0.54290771484375, -0.3287353515625, -0.11456298828125, 0.099609375, 0.31378173828125, 0.5279541015625, 0.74212646484375, 0.956298828125, 1.17047119140625, 1.3846435546875, 1.59881591796875, 1.81298828125, 2.02716064453125, 2.2413330078125, 2.45550537109375, 2.669677734375, 2.88385009765625, 3.0980224609375, 3.31219482421875, 3.5263671875, 3.74053955078125, 3.9547119140625, 4.16888427734375, 4.383056640625, 4.59722900390625, 4.8114013671875, 5.02557373046875, 5.23974609375, 5.45391845703125, 5.6680908203125, 5.88226318359375, 6.096435546875, 6.31060791015625, 6.5247802734375, 6.73895263671875, 6.953125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 18.0, 21.0, 29.0, 62.0, 75.0, 126.0, 188.0, 298.0, 426.0, 707.0, 1134.0, 1695.0, 2743.0, 4331.0, 6805.0, 10234.0, 15359.0, 22613.0, 32567.0, 44600.0, 59340.0, 74595.0, 88859.0, 99380.0, 103408.0, 100135.0, 90773.0, 76188.0, 61458.0, 46354.0, 33697.0, 23686.0, 16324.0, 10849.0, 7050.0, 4385.0, 2927.0, 1824.0, 1224.0, 747.0, 489.0, 305.0, 178.0, 127.0, 84.0, 50.0, 26.0, 17.0, 16.0, 10.0, 6.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.10546875, -3.97113037109375, -3.8367919921875, -3.70245361328125, -3.568115234375, -3.43377685546875, -3.2994384765625, -3.16510009765625, -3.03076171875, -2.89642333984375, -2.7620849609375, -2.62774658203125, -2.493408203125, -2.35906982421875, -2.2247314453125, -2.09039306640625, -1.9560546875, -1.82171630859375, -1.6873779296875, -1.55303955078125, -1.418701171875, -1.28436279296875, -1.1500244140625, -1.01568603515625, -0.88134765625, -0.74700927734375, -0.6126708984375, -0.47833251953125, -0.343994140625, -0.20965576171875, -0.0753173828125, 0.05902099609375, 0.193359375, 0.32769775390625, 0.4620361328125, 0.59637451171875, 0.730712890625, 0.86505126953125, 0.9993896484375, 1.13372802734375, 1.26806640625, 1.40240478515625, 1.5367431640625, 1.67108154296875, 1.805419921875, 1.93975830078125, 2.0740966796875, 2.20843505859375, 2.3427734375, 2.47711181640625, 2.6114501953125, 2.74578857421875, 2.880126953125, 3.01446533203125, 3.1488037109375, 3.28314208984375, 3.41748046875, 3.55181884765625, 3.6861572265625, 3.82049560546875, 3.954833984375, 4.08917236328125, 4.2235107421875, 4.35784912109375, 4.4921875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 9.0, 17.0, 16.0, 16.0, 17.0, 13.0, 31.0, 12.0, 31.0, 23.0, 26.0, 36.0, 45.0, 45.0, 32.0, 39.0, 40.0, 54.0, 45.0, 50.0, 43.0, 34.0, 45.0, 31.0, 30.0, 37.0, 26.0, 21.0, 23.0, 12.0, 13.0, 11.0, 17.0, 14.0, 8.0, 5.0, 5.0, 3.0, 10.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2265625, -5.06829833984375, -4.9100341796875, -4.75177001953125, -4.593505859375, -4.43524169921875, -4.2769775390625, -4.11871337890625, -3.96044921875, -3.80218505859375, -3.6439208984375, -3.48565673828125, -3.327392578125, -3.16912841796875, -3.0108642578125, -2.85260009765625, -2.6943359375, -2.53607177734375, -2.3778076171875, -2.21954345703125, -2.061279296875, -1.90301513671875, -1.7447509765625, -1.58648681640625, -1.42822265625, -1.26995849609375, -1.1116943359375, -0.95343017578125, -0.795166015625, -0.63690185546875, -0.4786376953125, -0.32037353515625, -0.162109375, -0.00384521484375, 0.1544189453125, 0.31268310546875, 0.470947265625, 0.62921142578125, 0.7874755859375, 0.94573974609375, 1.10400390625, 1.26226806640625, 1.4205322265625, 1.57879638671875, 1.737060546875, 1.89532470703125, 2.0535888671875, 2.21185302734375, 2.3701171875, 2.52838134765625, 2.6866455078125, 2.84490966796875, 3.003173828125, 3.16143798828125, 3.3197021484375, 3.47796630859375, 3.63623046875, 3.79449462890625, 3.9527587890625, 4.11102294921875, 4.269287109375, 4.42755126953125, 4.5858154296875, 4.74407958984375, 4.90234375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 3.0, 6.0, 14.0, 21.0, 42.0, 37.0, 66.0, 77.0, 118.0, 179.0, 272.0, 405.0, 622.0, 944.0, 1555.0, 2596.0, 4416.0, 7419.0, 13691.0, 25079.0, 45054.0, 76121.0, 115602.0, 152489.0, 166539.0, 149499.0, 113028.0, 73663.0, 43252.0, 24124.0, 13234.0, 7336.0, 4130.0, 2532.0, 1521.0, 967.0, 632.0, 421.0, 284.0, 167.0, 123.0, 96.0, 55.0, 34.0, 23.0, 23.0, 14.0, 9.0, 5.0, 4.0, 6.0, 1.0, 4.0, 2.0], "bins": [-3.62890625, -3.52362060546875, -3.4183349609375, -3.31304931640625, -3.207763671875, -3.10247802734375, -2.9971923828125, -2.89190673828125, -2.78662109375, -2.68133544921875, -2.5760498046875, -2.47076416015625, -2.365478515625, -2.26019287109375, -2.1549072265625, -2.04962158203125, -1.9443359375, -1.83905029296875, -1.7337646484375, -1.62847900390625, -1.523193359375, -1.41790771484375, -1.3126220703125, -1.20733642578125, -1.10205078125, -0.99676513671875, -0.8914794921875, -0.78619384765625, -0.680908203125, -0.57562255859375, -0.4703369140625, -0.36505126953125, -0.259765625, -0.15447998046875, -0.0491943359375, 0.05609130859375, 0.161376953125, 0.26666259765625, 0.3719482421875, 0.47723388671875, 0.58251953125, 0.68780517578125, 0.7930908203125, 0.89837646484375, 1.003662109375, 1.10894775390625, 1.2142333984375, 1.31951904296875, 1.4248046875, 1.53009033203125, 1.6353759765625, 1.74066162109375, 1.845947265625, 1.95123291015625, 2.0565185546875, 2.16180419921875, 2.26708984375, 2.37237548828125, 2.4776611328125, 2.58294677734375, 2.688232421875, 2.79351806640625, 2.8988037109375, 3.00408935546875, 3.109375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 5.0, 6.0, 7.0, 10.0, 12.0, 17.0, 17.0, 19.0, 33.0, 41.0, 39.0, 51.0, 52.0, 58.0, 62.0, 59.0, 71.0, 53.0, 55.0, 53.0, 47.0, 47.0, 35.0, 28.0, 26.0, 23.0, 17.0, 15.0, 9.0, 8.0, 8.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00037097930908203125, -0.0003603808581829071, -0.00034978240728378296, -0.0003391839563846588, -0.00032858550548553467, -0.0003179870545864105, -0.0003073886036872864, -0.00029679015278816223, -0.0002861917018890381, -0.00027559325098991394, -0.0002649948000907898, -0.00025439634919166565, -0.0002437978982925415, -0.00023319944739341736, -0.0002226009964942932, -0.00021200254559516907, -0.00020140409469604492, -0.00019080564379692078, -0.00018020719289779663, -0.00016960874199867249, -0.00015901029109954834, -0.0001484118402004242, -0.00013781338930130005, -0.0001272149384021759, -0.00011661648750305176, -0.00010601803660392761, -9.541958570480347e-05, -8.482113480567932e-05, -7.422268390655518e-05, -6.362423300743103e-05, -5.3025782108306885e-05, -4.242733120918274e-05, -3.1828880310058594e-05, -2.1230429410934448e-05, -1.0631978511810303e-05, -3.3527612686157227e-08, 1.0564923286437988e-05, 2.1163374185562134e-05, 3.176182508468628e-05, 4.2360275983810425e-05, 5.295872688293457e-05, 6.355717778205872e-05, 7.415562868118286e-05, 8.475407958030701e-05, 9.535253047943115e-05, 0.0001059509813785553, 0.00011654943227767944, 0.0001271478831768036, 0.00013774633407592773, 0.00014834478497505188, 0.00015894323587417603, 0.00016954168677330017, 0.00018014013767242432, 0.00019073858857154846, 0.0002013370394706726, 0.00021193549036979675, 0.0002225339412689209, 0.00023313239216804504, 0.0002437308430671692, 0.00025432929396629333, 0.0002649277448654175, 0.0002755261957645416, 0.00028612464666366577, 0.0002967230975627899, 0.00030732154846191406]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 14.0, 11.0, 22.0, 23.0, 43.0, 58.0, 106.0, 129.0, 212.0, 316.0, 456.0, 767.0, 1129.0, 1833.0, 3303.0, 6028.0, 12304.0, 26500.0, 58727.0, 118097.0, 194502.0, 228210.0, 185176.0, 109093.0, 52611.0, 23963.0, 11246.0, 5735.0, 3104.0, 1800.0, 1028.0, 724.0, 418.0, 291.0, 192.0, 119.0, 86.0, 62.0, 39.0, 25.0, 20.0, 16.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.23046875, -5.07403564453125, -4.9176025390625, -4.76116943359375, -4.604736328125, -4.44830322265625, -4.2918701171875, -4.13543701171875, -3.97900390625, -3.82257080078125, -3.6661376953125, -3.50970458984375, -3.353271484375, -3.19683837890625, -3.0404052734375, -2.88397216796875, -2.7275390625, -2.57110595703125, -2.4146728515625, -2.25823974609375, -2.101806640625, -1.94537353515625, -1.7889404296875, -1.63250732421875, -1.47607421875, -1.31964111328125, -1.1632080078125, -1.00677490234375, -0.850341796875, -0.69390869140625, -0.5374755859375, -0.38104248046875, -0.224609375, -0.06817626953125, 0.0882568359375, 0.24468994140625, 0.401123046875, 0.55755615234375, 0.7139892578125, 0.87042236328125, 1.02685546875, 1.18328857421875, 1.3397216796875, 1.49615478515625, 1.652587890625, 1.80902099609375, 1.9654541015625, 2.12188720703125, 2.2783203125, 2.43475341796875, 2.5911865234375, 2.74761962890625, 2.904052734375, 3.06048583984375, 3.2169189453125, 3.37335205078125, 3.52978515625, 3.68621826171875, 3.8426513671875, 3.99908447265625, 4.155517578125, 4.31195068359375, 4.4683837890625, 4.62481689453125, 4.78125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 9.0, 7.0, 11.0, 7.0, 16.0, 14.0, 23.0, 18.0, 23.0, 39.0, 39.0, 37.0, 36.0, 33.0, 52.0, 59.0, 45.0, 47.0, 45.0, 55.0, 46.0, 49.0, 37.0, 35.0, 34.0, 24.0, 27.0, 21.0, 19.0, 12.0, 10.0, 8.0, 7.0, 6.0, 8.0, 6.0, 7.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.95361328125, -0.9244384765625, -0.895263671875, -0.8660888671875, -0.8369140625, -0.8077392578125, -0.778564453125, -0.7493896484375, -0.72021484375, -0.6910400390625, -0.661865234375, -0.6326904296875, -0.603515625, -0.5743408203125, -0.545166015625, -0.5159912109375, -0.48681640625, -0.4576416015625, -0.428466796875, -0.3992919921875, -0.3701171875, -0.3409423828125, -0.311767578125, -0.2825927734375, -0.25341796875, -0.2242431640625, -0.195068359375, -0.1658935546875, -0.13671875, -0.1075439453125, -0.078369140625, -0.0491943359375, -0.02001953125, 0.0091552734375, 0.038330078125, 0.0675048828125, 0.0966796875, 0.1258544921875, 0.155029296875, 0.1842041015625, 0.21337890625, 0.2425537109375, 0.271728515625, 0.3009033203125, 0.330078125, 0.3592529296875, 0.388427734375, 0.4176025390625, 0.44677734375, 0.4759521484375, 0.505126953125, 0.5343017578125, 0.5634765625, 0.5926513671875, 0.621826171875, 0.6510009765625, 0.68017578125, 0.7093505859375, 0.738525390625, 0.7677001953125, 0.796875, 0.8260498046875, 0.855224609375, 0.8843994140625, 0.91357421875]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 6.0, 17.0, 10.0, 22.0, 22.0, 22.0, 31.0, 24.0, 37.0, 37.0, 47.0, 48.0, 55.0, 48.0, 50.0, 56.0, 48.0, 52.0, 61.0, 48.0, 33.0, 36.0, 33.0, 27.0, 21.0, 16.0, 22.0, 12.0, 7.0, 8.0, 6.0, 9.0, 8.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.98258113861084, -11.630254745483398, -11.277929306030273, -10.925602912902832, -10.57327651977539, -10.220951080322266, -9.868624687194824, -9.516298294067383, -9.163972854614258, -8.811646461486816, -8.459321022033691, -8.10699462890625, -7.754668712615967, -7.402342796325684, -7.050016403198242, -6.697690486907959, -6.345364570617676, -5.993038654327393, -5.640712738037109, -5.288386344909668, -4.936060428619385, -4.583734512329102, -4.23140811920166, -3.879082202911377, -3.5267562866210938, -3.1744303703308105, -2.8221042156219482, -2.469778060913086, -2.1174521446228027, -1.76512610912323, -1.4128000736236572, -1.060473918914795, -0.7081480026245117, -0.35582196712493896, -0.003495931625366211, 0.34883010387420654, 0.7011561393737793, 1.053482174873352, 1.4058082103729248, 1.758134365081787, 2.1104602813720703, 2.4627861976623535, 2.815112352371216, 3.167438507080078, 3.5197644233703613, 3.8720903396606445, 4.224416732788086, 4.576742649078369, 4.929068565368652, 5.2813944816589355, 5.633720397949219, 5.98604679107666, 6.338372707366943, 6.690698623657227, 7.043025016784668, 7.395350933074951, 7.747676849365234, 8.100003242492676, 8.4523286819458, 8.804655075073242, 9.156980514526367, 9.509306907653809, 9.86163330078125, 10.213958740234375, 10.566285133361816]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 9.0, 9.0, 6.0, 11.0, 13.0, 16.0, 14.0, 13.0, 16.0, 23.0, 27.0, 29.0, 32.0, 33.0, 41.0, 38.0, 50.0, 43.0, 44.0, 50.0, 33.0, 45.0, 32.0, 38.0, 36.0, 24.0, 23.0, 31.0, 34.0, 20.0, 29.0, 22.0, 14.0, 18.0, 14.0, 13.0, 10.0, 10.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0], "bins": [-7.4137349128723145, -7.188457012176514, -6.963178634643555, -6.737900733947754, -6.512622833251953, -6.287344455718994, -6.062066555023193, -5.836788177490234, -5.611510276794434, -5.386232376098633, -5.160953998565674, -4.935676097869873, -4.710397720336914, -4.485119819641113, -4.2598419189453125, -4.034564018249512, -3.8092856407165527, -3.584007501602173, -3.358729362487793, -3.133451461791992, -2.9081733226776123, -2.6828951835632324, -2.4576172828674316, -2.2323391437530518, -2.007061004638672, -1.781782865524292, -1.5565048456192017, -1.3312268257141113, -1.1059486865997314, -0.8806705474853516, -0.6553925275802612, -0.4301145076751709, -0.2048358917236328, 0.020442187786102295, 0.2457202672958374, 0.4709983468055725, 0.6962764263153076, 0.9215545654296875, 1.1468325853347778, 1.3721106052398682, 1.597388744354248, 1.822666883468628, 2.047945022583008, 2.2732229232788086, 2.4985010623931885, 2.7237792015075684, 2.949057102203369, 3.174335241317749, 3.399613380432129, 3.624891519546509, 3.8501696586608887, 4.0754475593566895, 4.300725936889648, 4.526003837585449, 4.75128173828125, 4.976559638977051, 5.20183801651001, 5.4271159172058105, 5.6523942947387695, 5.87767219543457, 6.102950096130371, 6.32822847366333, 6.553506374359131, 6.77878475189209, 7.004062652587891]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 6.0, 11.0, 22.0, 28.0, 30.0, 51.0, 88.0, 132.0, 235.0, 378.0, 570.0, 889.0, 1398.0, 2257.0, 3777.0, 6240.0, 9785.0, 16307.0, 26556.0, 42328.0, 67516.0, 105505.0, 159355.0, 233683.0, 323280.0, 416206.0, 488708.0, 510099.0, 473967.0, 395356.0, 300167.0, 213948.0, 144380.0, 94864.0, 59795.0, 37513.0, 22980.0, 14143.0, 8469.0, 5115.0, 3166.0, 1930.0, 1138.0, 732.0, 463.0, 294.0, 160.0, 107.0, 62.0, 33.0, 26.0, 15.0, 11.0, 8.0, 4.0, 2.0, 2.0], "bins": [-9.015625, -8.7532958984375, -8.490966796875, -8.2286376953125, -7.96630859375, -7.7039794921875, -7.441650390625, -7.1793212890625, -6.9169921875, -6.6546630859375, -6.392333984375, -6.1300048828125, -5.86767578125, -5.6053466796875, -5.343017578125, -5.0806884765625, -4.818359375, -4.5560302734375, -4.293701171875, -4.0313720703125, -3.76904296875, -3.5067138671875, -3.244384765625, -2.9820556640625, -2.7197265625, -2.4573974609375, -2.195068359375, -1.9327392578125, -1.67041015625, -1.4080810546875, -1.145751953125, -0.8834228515625, -0.62109375, -0.3587646484375, -0.096435546875, 0.1658935546875, 0.42822265625, 0.6905517578125, 0.952880859375, 1.2152099609375, 1.4775390625, 1.7398681640625, 2.002197265625, 2.2645263671875, 2.52685546875, 2.7891845703125, 3.051513671875, 3.3138427734375, 3.576171875, 3.8385009765625, 4.100830078125, 4.3631591796875, 4.62548828125, 4.8878173828125, 5.150146484375, 5.4124755859375, 5.6748046875, 5.9371337890625, 6.199462890625, 6.4617919921875, 6.72412109375, 6.9864501953125, 7.248779296875, 7.5111083984375, 7.7734375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 9.0, 4.0, 6.0, 9.0, 7.0, 6.0, 14.0, 14.0, 15.0, 27.0, 27.0, 28.0, 20.0, 35.0, 24.0, 47.0, 46.0, 41.0, 46.0, 53.0, 56.0, 33.0, 46.0, 30.0, 35.0, 35.0, 37.0, 32.0, 28.0, 27.0, 24.0, 24.0, 29.0, 14.0, 12.0, 13.0, 17.0, 6.0, 6.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33984375, -7.10791015625, -6.8759765625, -6.64404296875, -6.412109375, -6.18017578125, -5.9482421875, -5.71630859375, -5.484375, -5.25244140625, -5.0205078125, -4.78857421875, -4.556640625, -4.32470703125, -4.0927734375, -3.86083984375, -3.62890625, -3.39697265625, -3.1650390625, -2.93310546875, -2.701171875, -2.46923828125, -2.2373046875, -2.00537109375, -1.7734375, -1.54150390625, -1.3095703125, -1.07763671875, -0.845703125, -0.61376953125, -0.3818359375, -0.14990234375, 0.08203125, 0.31396484375, 0.5458984375, 0.77783203125, 1.009765625, 1.24169921875, 1.4736328125, 1.70556640625, 1.9375, 2.16943359375, 2.4013671875, 2.63330078125, 2.865234375, 3.09716796875, 3.3291015625, 3.56103515625, 3.79296875, 4.02490234375, 4.2568359375, 4.48876953125, 4.720703125, 4.95263671875, 5.1845703125, 5.41650390625, 5.6484375, 5.88037109375, 6.1123046875, 6.34423828125, 6.576171875, 6.80810546875, 7.0400390625, 7.27197265625, 7.50390625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 13.0, 20.0, 45.0, 73.0, 120.0, 214.0, 313.0, 472.0, 796.0, 1313.0, 2121.0, 3719.0, 5919.0, 9913.0, 16172.0, 26155.0, 41564.0, 66298.0, 102518.0, 153259.0, 222093.0, 299119.0, 381474.0, 447007.0, 477693.0, 462363.0, 406672.0, 327092.0, 245658.0, 172676.0, 117537.0, 76947.0, 48616.0, 30452.0, 18658.0, 11386.0, 6955.0, 4294.0, 2576.0, 1590.0, 961.0, 563.0, 361.0, 211.0, 127.0, 69.0, 42.0, 23.0, 20.0, 19.0, 6.0, 0.0, 3.0, 0.0, 3.0], "bins": [-10.3671875, -10.0592041015625, -9.751220703125, -9.4432373046875, -9.13525390625, -8.8272705078125, -8.519287109375, -8.2113037109375, -7.9033203125, -7.5953369140625, -7.287353515625, -6.9793701171875, -6.67138671875, -6.3634033203125, -6.055419921875, -5.7474365234375, -5.439453125, -5.1314697265625, -4.823486328125, -4.5155029296875, -4.20751953125, -3.8995361328125, -3.591552734375, -3.2835693359375, -2.9755859375, -2.6676025390625, -2.359619140625, -2.0516357421875, -1.74365234375, -1.4356689453125, -1.127685546875, -0.8197021484375, -0.51171875, -0.2037353515625, 0.104248046875, 0.4122314453125, 0.72021484375, 1.0281982421875, 1.336181640625, 1.6441650390625, 1.9521484375, 2.2601318359375, 2.568115234375, 2.8760986328125, 3.18408203125, 3.4920654296875, 3.800048828125, 4.1080322265625, 4.416015625, 4.7239990234375, 5.031982421875, 5.3399658203125, 5.64794921875, 5.9559326171875, 6.263916015625, 6.5718994140625, 6.8798828125, 7.1878662109375, 7.495849609375, 7.8038330078125, 8.11181640625, 8.4197998046875, 8.727783203125, 9.0357666015625, 9.34375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 7.0, 10.0, 21.0, 30.0, 22.0, 40.0, 63.0, 46.0, 79.0, 97.0, 99.0, 128.0, 154.0, 166.0, 176.0, 184.0, 208.0, 198.0, 204.0, 214.0, 203.0, 183.0, 200.0, 186.0, 182.0, 170.0, 146.0, 117.0, 100.0, 76.0, 70.0, 60.0, 56.0, 51.0, 33.0, 24.0, 16.0, 13.0, 11.0, 10.0, 4.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2578125, -4.12603759765625, -3.9942626953125, -3.86248779296875, -3.730712890625, -3.59893798828125, -3.4671630859375, -3.33538818359375, -3.20361328125, -3.07183837890625, -2.9400634765625, -2.80828857421875, -2.676513671875, -2.54473876953125, -2.4129638671875, -2.28118896484375, -2.1494140625, -2.01763916015625, -1.8858642578125, -1.75408935546875, -1.622314453125, -1.49053955078125, -1.3587646484375, -1.22698974609375, -1.09521484375, -0.96343994140625, -0.8316650390625, -0.69989013671875, -0.568115234375, -0.43634033203125, -0.3045654296875, -0.17279052734375, -0.041015625, 0.09075927734375, 0.2225341796875, 0.35430908203125, 0.486083984375, 0.61785888671875, 0.7496337890625, 0.88140869140625, 1.01318359375, 1.14495849609375, 1.2767333984375, 1.40850830078125, 1.540283203125, 1.67205810546875, 1.8038330078125, 1.93560791015625, 2.0673828125, 2.19915771484375, 2.3309326171875, 2.46270751953125, 2.594482421875, 2.72625732421875, 2.8580322265625, 2.98980712890625, 3.12158203125, 3.25335693359375, 3.3851318359375, 3.51690673828125, 3.648681640625, 3.78045654296875, 3.9122314453125, 4.04400634765625, 4.17578125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 2.0, 3.0, 9.0, 9.0, 10.0, 9.0, 9.0, 19.0, 18.0, 17.0, 24.0, 32.0, 42.0, 51.0, 50.0, 52.0, 53.0, 51.0, 39.0, 49.0, 49.0, 60.0, 50.0, 56.0, 47.0, 28.0, 25.0, 23.0, 30.0, 24.0, 7.0, 7.0, 11.0, 10.0, 4.0, 2.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.964387893676758, -17.475332260131836, -16.986276626586914, -16.497220993041992, -16.00816535949707, -15.519109725952148, -15.030054092407227, -14.540998458862305, -14.051942825317383, -13.562887191772461, -13.073831558227539, -12.584775924682617, -12.095720291137695, -11.606664657592773, -11.117609024047852, -10.62855339050293, -10.139497756958008, -9.650442123413086, -9.161386489868164, -8.672330856323242, -8.18327522277832, -7.694219589233398, -7.205163955688477, -6.716108322143555, -6.227052688598633, -5.737997055053711, -5.248941421508789, -4.759885787963867, -4.270830154418945, -3.7817745208740234, -3.2927188873291016, -2.8036632537841797, -2.314608573913574, -1.8255529403686523, -1.3364973068237305, -0.8474416732788086, -0.3583860397338867, 0.13066959381103516, 0.619725227355957, 1.108780860900879, 1.5978364944458008, 2.0868921279907227, 2.5759477615356445, 3.0650033950805664, 3.5540590286254883, 4.04311466217041, 4.532170295715332, 5.021225929260254, 5.510281562805176, 5.999337196350098, 6.4883928298950195, 6.977448463439941, 7.466504096984863, 7.955559730529785, 8.444615364074707, 8.933670997619629, 9.42272663116455, 9.911782264709473, 10.400837898254395, 10.889893531799316, 11.378949165344238, 11.86800479888916, 12.357060432434082, 12.846116065979004, 13.335171699523926]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 9.0, 6.0, 7.0, 15.0, 16.0, 18.0, 24.0, 16.0, 26.0, 27.0, 30.0, 34.0, 38.0, 37.0, 43.0, 44.0, 49.0, 57.0, 56.0, 51.0, 42.0, 39.0, 34.0, 39.0, 28.0, 26.0, 30.0, 21.0, 22.0, 24.0, 16.0, 19.0, 11.0, 13.0, 8.0, 5.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-10.519302368164062, -10.202309608459473, -9.885316848754883, -9.56832504272461, -9.25133228302002, -8.93433952331543, -8.61734676361084, -8.30035400390625, -7.983362197875977, -7.666369438171387, -7.349377155303955, -7.032384395599365, -6.715392112731934, -6.398399353027344, -6.081406593322754, -5.764414310455322, -5.447421550750732, -5.130428791046143, -4.813436508178711, -4.496443748474121, -4.1794514656066895, -3.8624587059020996, -3.545466184616089, -3.228473663330078, -2.9114811420440674, -2.5944886207580566, -2.277496099472046, -1.9605034589767456, -1.6435109376907349, -1.3265184164047241, -1.0095257759094238, -0.6925332546234131, -0.37554073333740234, -0.058548182249069214, 0.2584443688392639, 0.5754369497299194, 0.8924294710159302, 1.209421992301941, 1.5264146327972412, 1.843407154083252, 2.1603996753692627, 2.4773921966552734, 2.794384717941284, 3.111377239227295, 3.4283699989318848, 3.7453622817993164, 4.062355041503906, 4.379347801208496, 4.696340084075928, 5.013332843780518, 5.330325126647949, 5.647317886352539, 5.964310169219971, 6.2813029289245605, 6.598295211791992, 6.915287971496582, 7.232280731201172, 7.549273490905762, 7.866265773773193, 8.183258056640625, 8.500250816345215, 8.817243576049805, 9.134236335754395, 9.451229095458984, 9.768220901489258]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 5.0, 13.0, 18.0, 30.0, 39.0, 38.0, 67.0, 92.0, 145.0, 252.0, 346.0, 473.0, 706.0, 1153.0, 1928.0, 2929.0, 4750.0, 7789.0, 12969.0, 22486.0, 39165.0, 69854.0, 121584.0, 187161.0, 207991.0, 152492.0, 90550.0, 51453.0, 29158.0, 16837.0, 10051.0, 5964.0, 3682.0, 2282.0, 1415.0, 930.0, 568.0, 353.0, 253.0, 176.0, 137.0, 84.0, 46.0, 42.0, 30.0, 25.0, 11.0, 10.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-2.38671875, -2.310302734375, -2.23388671875, -2.157470703125, -2.0810546875, -2.004638671875, -1.92822265625, -1.851806640625, -1.775390625, -1.698974609375, -1.62255859375, -1.546142578125, -1.4697265625, -1.393310546875, -1.31689453125, -1.240478515625, -1.1640625, -1.087646484375, -1.01123046875, -0.934814453125, -0.8583984375, -0.781982421875, -0.70556640625, -0.629150390625, -0.552734375, -0.476318359375, -0.39990234375, -0.323486328125, -0.2470703125, -0.170654296875, -0.09423828125, -0.017822265625, 0.05859375, 0.135009765625, 0.21142578125, 0.287841796875, 0.3642578125, 0.440673828125, 0.51708984375, 0.593505859375, 0.669921875, 0.746337890625, 0.82275390625, 0.899169921875, 0.9755859375, 1.052001953125, 1.12841796875, 1.204833984375, 1.28125, 1.357666015625, 1.43408203125, 1.510498046875, 1.5869140625, 1.663330078125, 1.73974609375, 1.816162109375, 1.892578125, 1.968994140625, 2.04541015625, 2.121826171875, 2.1982421875, 2.274658203125, 2.35107421875, 2.427490234375, 2.50390625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 1.0, 6.0, 4.0, 5.0, 18.0, 13.0, 17.0, 17.0, 19.0, 22.0, 25.0, 32.0, 38.0, 35.0, 43.0, 37.0, 55.0, 68.0, 43.0, 49.0, 54.0, 45.0, 53.0, 41.0, 33.0, 36.0, 34.0, 30.0, 20.0, 26.0, 21.0, 17.0, 14.0, 11.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3515625, -11.96435546875, -11.5771484375, -11.18994140625, -10.802734375, -10.41552734375, -10.0283203125, -9.64111328125, -9.25390625, -8.86669921875, -8.4794921875, -8.09228515625, -7.705078125, -7.31787109375, -6.9306640625, -6.54345703125, -6.15625, -5.76904296875, -5.3818359375, -4.99462890625, -4.607421875, -4.22021484375, -3.8330078125, -3.44580078125, -3.05859375, -2.67138671875, -2.2841796875, -1.89697265625, -1.509765625, -1.12255859375, -0.7353515625, -0.34814453125, 0.0390625, 0.42626953125, 0.8134765625, 1.20068359375, 1.587890625, 1.97509765625, 2.3623046875, 2.74951171875, 3.13671875, 3.52392578125, 3.9111328125, 4.29833984375, 4.685546875, 5.07275390625, 5.4599609375, 5.84716796875, 6.234375, 6.62158203125, 7.0087890625, 7.39599609375, 7.783203125, 8.17041015625, 8.5576171875, 8.94482421875, 9.33203125, 9.71923828125, 10.1064453125, 10.49365234375, 10.880859375, 11.26806640625, 11.6552734375, 12.04248046875, 12.4296875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 11.0, 12.0, 16.0, 30.0, 35.0, 59.0, 85.0, 151.0, 251.0, 379.0, 617.0, 1103.0, 2083.0, 4174.0, 8606.0, 18270.0, 40845.0, 96188.0, 223586.0, 325367.0, 185059.0, 77915.0, 33796.0, 14949.0, 7196.0, 3538.0, 1769.0, 1019.0, 555.0, 344.0, 195.0, 134.0, 77.0, 47.0, 36.0, 23.0, 14.0, 9.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.623046875, -3.499725341796875, -3.37640380859375, -3.253082275390625, -3.1297607421875, -3.006439208984375, -2.88311767578125, -2.759796142578125, -2.636474609375, -2.513153076171875, -2.38983154296875, -2.266510009765625, -2.1431884765625, -2.019866943359375, -1.89654541015625, -1.773223876953125, -1.64990234375, -1.526580810546875, -1.40325927734375, -1.279937744140625, -1.1566162109375, -1.033294677734375, -0.90997314453125, -0.786651611328125, -0.663330078125, -0.540008544921875, -0.41668701171875, -0.293365478515625, -0.1700439453125, -0.046722412109375, 0.07659912109375, 0.199920654296875, 0.3232421875, 0.446563720703125, 0.56988525390625, 0.693206787109375, 0.8165283203125, 0.939849853515625, 1.06317138671875, 1.186492919921875, 1.309814453125, 1.433135986328125, 1.55645751953125, 1.679779052734375, 1.8031005859375, 1.926422119140625, 2.04974365234375, 2.173065185546875, 2.29638671875, 2.419708251953125, 2.54302978515625, 2.666351318359375, 2.7896728515625, 2.912994384765625, 3.03631591796875, 3.159637451171875, 3.282958984375, 3.406280517578125, 3.52960205078125, 3.652923583984375, 3.7762451171875, 3.899566650390625, 4.02288818359375, 4.146209716796875, 4.26953125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 5.0, 13.0, 16.0, 16.0, 15.0, 27.0, 18.0, 20.0, 32.0, 26.0, 25.0, 31.0, 38.0, 47.0, 35.0, 26.0, 43.0, 48.0, 32.0, 33.0, 38.0, 34.0, 40.0, 45.0, 30.0, 44.0, 23.0, 33.0, 15.0, 18.0, 18.0, 12.0, 21.0, 19.0, 11.0, 6.0, 5.0, 4.0, 7.0, 4.0, 3.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 4.0], "bins": [-6.94921875, -6.74627685546875, -6.5433349609375, -6.34039306640625, -6.137451171875, -5.93450927734375, -5.7315673828125, -5.52862548828125, -5.32568359375, -5.12274169921875, -4.9197998046875, -4.71685791015625, -4.513916015625, -4.31097412109375, -4.1080322265625, -3.90509033203125, -3.7021484375, -3.49920654296875, -3.2962646484375, -3.09332275390625, -2.890380859375, -2.68743896484375, -2.4844970703125, -2.28155517578125, -2.07861328125, -1.87567138671875, -1.6727294921875, -1.46978759765625, -1.266845703125, -1.06390380859375, -0.8609619140625, -0.65802001953125, -0.455078125, -0.25213623046875, -0.0491943359375, 0.15374755859375, 0.356689453125, 0.55963134765625, 0.7625732421875, 0.96551513671875, 1.16845703125, 1.37139892578125, 1.5743408203125, 1.77728271484375, 1.980224609375, 2.18316650390625, 2.3861083984375, 2.58905029296875, 2.7919921875, 2.99493408203125, 3.1978759765625, 3.40081787109375, 3.603759765625, 3.80670166015625, 4.0096435546875, 4.21258544921875, 4.41552734375, 4.61846923828125, 4.8214111328125, 5.02435302734375, 5.227294921875, 5.43023681640625, 5.6331787109375, 5.83612060546875, 6.0390625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 13.0, 11.0, 17.0, 33.0, 41.0, 35.0, 82.0, 94.0, 139.0, 175.0, 299.0, 394.0, 607.0, 1022.0, 1589.0, 2593.0, 4414.0, 8327.0, 16096.0, 36962.0, 97389.0, 271655.0, 359010.0, 147793.0, 52973.0, 21959.0, 10611.0, 5599.0, 3150.0, 1867.0, 1241.0, 767.0, 491.0, 360.0, 233.0, 144.0, 128.0, 75.0, 57.0, 29.0, 26.0, 12.0, 15.0, 7.0, 6.0, 6.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.99267578125, -0.9598007202148438, -0.9269256591796875, -0.8940505981445312, -0.861175537109375, -0.8283004760742188, -0.7954254150390625, -0.7625503540039062, -0.72967529296875, -0.6968002319335938, -0.6639251708984375, -0.6310501098632812, -0.598175048828125, -0.5652999877929688, -0.5324249267578125, -0.49954986572265625, -0.4666748046875, -0.43379974365234375, -0.4009246826171875, -0.36804962158203125, -0.335174560546875, -0.30229949951171875, -0.2694244384765625, -0.23654937744140625, -0.20367431640625, -0.17079925537109375, -0.1379241943359375, -0.10504913330078125, -0.072174072265625, -0.03929901123046875, -0.0064239501953125, 0.02645111083984375, 0.059326171875, 0.09220123291015625, 0.1250762939453125, 0.15795135498046875, 0.190826416015625, 0.22370147705078125, 0.2565765380859375, 0.28945159912109375, 0.32232666015625, 0.35520172119140625, 0.3880767822265625, 0.42095184326171875, 0.453826904296875, 0.48670196533203125, 0.5195770263671875, 0.5524520874023438, 0.5853271484375, 0.6182022094726562, 0.6510772705078125, 0.6839523315429688, 0.716827392578125, 0.7497024536132812, 0.7825775146484375, 0.8154525756835938, 0.84832763671875, 0.8812026977539062, 0.9140777587890625, 0.9469528198242188, 0.979827880859375, 1.0127029418945312, 1.0455780029296875, 1.0784530639648438, 1.111328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 7.0, 3.0, 4.0, 10.0, 10.0, 9.0, 14.0, 16.0, 31.0, 24.0, 34.0, 38.0, 46.0, 46.0, 56.0, 43.0, 61.0, 46.0, 71.0, 53.0, 58.0, 54.0, 43.0, 42.0, 30.0, 31.0, 24.0, 19.0, 17.0, 14.0, 10.0, 8.0, 6.0, 10.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.416704177856445e-05, -4.277750849723816e-05, -4.1387975215911865e-05, -3.999844193458557e-05, -3.860890865325928e-05, -3.7219375371932983e-05, -3.582984209060669e-05, -3.4440308809280396e-05, -3.30507755279541e-05, -3.166124224662781e-05, -3.0271708965301514e-05, -2.888217568397522e-05, -2.7492642402648926e-05, -2.6103109121322632e-05, -2.4713575839996338e-05, -2.3324042558670044e-05, -2.193450927734375e-05, -2.0544975996017456e-05, -1.9155442714691162e-05, -1.7765909433364868e-05, -1.6376376152038574e-05, -1.498684287071228e-05, -1.3597309589385986e-05, -1.2207776308059692e-05, -1.0818243026733398e-05, -9.428709745407104e-06, -8.03917646408081e-06, -6.649643182754517e-06, -5.260109901428223e-06, -3.870576620101929e-06, -2.4810433387756348e-06, -1.0915100574493408e-06, 2.980232238769531e-07, 1.687556505203247e-06, 3.077089786529541e-06, 4.466623067855835e-06, 5.856156349182129e-06, 7.245689630508423e-06, 8.635222911834717e-06, 1.002475619316101e-05, 1.1414289474487305e-05, 1.2803822755813599e-05, 1.4193356037139893e-05, 1.5582889318466187e-05, 1.697242259979248e-05, 1.8361955881118774e-05, 1.975148916244507e-05, 2.1141022443771362e-05, 2.2530555725097656e-05, 2.392008900642395e-05, 2.5309622287750244e-05, 2.6699155569076538e-05, 2.8088688850402832e-05, 2.9478222131729126e-05, 3.086775541305542e-05, 3.2257288694381714e-05, 3.364682197570801e-05, 3.50363552570343e-05, 3.6425888538360596e-05, 3.781542181968689e-05, 3.9204955101013184e-05, 4.059448838233948e-05, 4.198402166366577e-05, 4.3373554944992065e-05, 4.476308822631836e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 8.0, 12.0, 8.0, 5.0, 9.0, 14.0, 17.0, 47.0, 42.0, 81.0, 100.0, 149.0, 262.0, 365.0, 623.0, 945.0, 1573.0, 2669.0, 4628.0, 8303.0, 14681.0, 26793.0, 50322.0, 97269.0, 183340.0, 260226.0, 185421.0, 97699.0, 51022.0, 27101.0, 14881.0, 8175.0, 4735.0, 2634.0, 1646.0, 1004.0, 607.0, 391.0, 250.0, 174.0, 104.0, 62.0, 49.0, 31.0, 22.0, 20.0, 9.0, 3.0, 11.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.1875, -1.149810791015625, -1.11212158203125, -1.074432373046875, -1.0367431640625, -0.999053955078125, -0.96136474609375, -0.923675537109375, -0.885986328125, -0.848297119140625, -0.81060791015625, -0.772918701171875, -0.7352294921875, -0.697540283203125, -0.65985107421875, -0.622161865234375, -0.58447265625, -0.546783447265625, -0.50909423828125, -0.471405029296875, -0.4337158203125, -0.396026611328125, -0.35833740234375, -0.320648193359375, -0.282958984375, -0.245269775390625, -0.20758056640625, -0.169891357421875, -0.1322021484375, -0.094512939453125, -0.05682373046875, -0.019134521484375, 0.0185546875, 0.056243896484375, 0.09393310546875, 0.131622314453125, 0.1693115234375, 0.207000732421875, 0.24468994140625, 0.282379150390625, 0.320068359375, 0.357757568359375, 0.39544677734375, 0.433135986328125, 0.4708251953125, 0.508514404296875, 0.54620361328125, 0.583892822265625, 0.62158203125, 0.659271240234375, 0.69696044921875, 0.734649658203125, 0.7723388671875, 0.810028076171875, 0.84771728515625, 0.885406494140625, 0.923095703125, 0.960784912109375, 0.99847412109375, 1.036163330078125, 1.0738525390625, 1.111541748046875, 1.14923095703125, 1.186920166015625, 1.224609375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 4.0, 12.0, 15.0, 11.0, 15.0, 20.0, 25.0, 21.0, 37.0, 26.0, 36.0, 45.0, 41.0, 35.0, 44.0, 45.0, 50.0, 58.0, 47.0, 47.0, 42.0, 39.0, 46.0, 39.0, 40.0, 26.0, 18.0, 12.0, 18.0, 13.0, 17.0, 14.0, 9.0, 6.0, 5.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.2235107421875, -0.2171344757080078, -0.21075820922851562, -0.20438194274902344, -0.19800567626953125, -0.19162940979003906, -0.18525314331054688, -0.1788768768310547, -0.1725006103515625, -0.1661243438720703, -0.15974807739257812, -0.15337181091308594, -0.14699554443359375, -0.14061927795410156, -0.13424301147460938, -0.1278667449951172, -0.121490478515625, -0.11511421203613281, -0.10873794555664062, -0.10236167907714844, -0.09598541259765625, -0.08960914611816406, -0.08323287963867188, -0.07685661315917969, -0.0704803466796875, -0.06410408020019531, -0.057727813720703125, -0.05135154724121094, -0.04497528076171875, -0.03859901428222656, -0.032222747802734375, -0.025846481323242188, -0.01947021484375, -0.013093948364257812, -0.006717681884765625, -0.0003414154052734375, 0.00603485107421875, 0.012411117553710938, 0.018787384033203125, 0.025163650512695312, 0.0315399169921875, 0.03791618347167969, 0.044292449951171875, 0.05066871643066406, 0.05704498291015625, 0.06342124938964844, 0.06979751586914062, 0.07617378234863281, 0.082550048828125, 0.08892631530761719, 0.09530258178710938, 0.10167884826660156, 0.10805511474609375, 0.11443138122558594, 0.12080764770507812, 0.1271839141845703, 0.1335601806640625, 0.1399364471435547, 0.14631271362304688, 0.15268898010253906, 0.15906524658203125, 0.16544151306152344, 0.17181777954101562, 0.1781940460205078, 0.1845703125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 8.0, 12.0, 5.0, 15.0, 17.0, 14.0, 15.0, 24.0, 36.0, 38.0, 48.0, 50.0, 50.0, 55.0, 53.0, 43.0, 47.0, 58.0, 52.0, 46.0, 58.0, 53.0, 29.0, 26.0, 17.0, 33.0, 24.0, 8.0, 8.0, 11.0, 12.0, 3.0, 2.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-18.235641479492188, -17.740930557250977, -17.246217727661133, -16.751506805419922, -16.25679588317871, -15.762084007263184, -15.267372131347656, -14.772661209106445, -14.277950286865234, -13.783238410949707, -13.288527488708496, -12.793815612792969, -12.299104690551758, -11.80439281463623, -11.309680938720703, -10.814970016479492, -10.320258140563965, -9.825546264648438, -9.330835342407227, -8.8361234664917, -8.341412544250488, -7.846700668334961, -7.351989269256592, -6.857277870178223, -6.3625664710998535, -5.867855072021484, -5.373143672943115, -4.878432273864746, -4.383720397949219, -3.8890092372894287, -3.3942975997924805, -2.8995862007141113, -2.404874801635742, -1.910163402557373, -1.4154518842697144, -0.9207403659820557, -0.4260289669036865, 0.06868243217468262, 0.5633940696716309, 1.05810546875, 1.5528168678283691, 2.0475282669067383, 2.5422396659851074, 3.0369513034820557, 3.531662702560425, 4.026373863220215, 4.521085739135742, 5.015797138214111, 5.5105085372924805, 6.00521993637085, 6.499931335449219, 6.994643211364746, 7.489354133605957, 7.984066009521484, 8.478776931762695, 8.973488807678223, 9.46820068359375, 9.962912559509277, 10.457623481750488, 10.952335357666016, 11.447046279907227, 11.941758155822754, 12.436470031738281, 12.931180953979492, 13.425891876220703]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 9.0, 7.0, 5.0, 15.0, 14.0, 20.0, 22.0, 14.0, 28.0, 29.0, 32.0, 32.0, 37.0, 38.0, 41.0, 46.0, 48.0, 61.0, 56.0, 50.0, 41.0, 40.0, 34.0, 37.0, 31.0, 27.0, 29.0, 19.0, 23.0, 22.0, 18.0, 18.0, 12.0, 13.0, 7.0, 5.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-10.522765159606934, -10.20352840423584, -9.884291648864746, -9.565054893493652, -9.245818138122559, -8.926582336425781, -8.607345581054688, -8.288108825683594, -7.9688720703125, -7.649635314941406, -7.3303985595703125, -7.011161804199219, -6.691925525665283, -6.3726887702941895, -6.053452014923096, -5.73421573638916, -5.414978504180908, -5.0957417488098145, -4.776504993438721, -4.457268714904785, -4.138031959533691, -3.8187952041625977, -3.499558448791504, -3.1803219318389893, -2.8610851764678955, -2.5418484210968018, -2.222611904144287, -1.9033751487731934, -1.5841385126113892, -1.264901876449585, -0.9456651210784912, -0.6264286041259766, -0.3071918487548828, 0.012044817209243774, 0.33128148317337036, 0.6505181789398193, 0.9697548151016235, 1.2889914512634277, 1.6082282066345215, 1.9274647235870361, 2.24670147895813, 2.5659382343292236, 2.8851747512817383, 3.204411506652832, 3.523648262023926, 3.8428847789764404, 4.162121772766113, 4.481358051300049, 4.800594806671143, 5.119831562042236, 5.43906831741333, 5.758304595947266, 6.077541351318359, 6.396778106689453, 6.716014862060547, 7.035251617431641, 7.354488372802734, 7.673725128173828, 7.992961883544922, 8.312198638916016, 8.63143539428711, 8.950672149658203, 9.269908905029297, 9.589144706726074, 9.908381462097168]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 3.0, 18.0, 20.0, 30.0, 48.0, 77.0, 115.0, 151.0, 281.0, 407.0, 648.0, 1055.0, 1658.0, 2631.0, 4452.0, 7116.0, 11307.0, 17589.0, 28148.0, 41880.0, 60275.0, 81745.0, 103248.0, 117860.0, 122332.0, 114786.0, 97021.0, 75347.0, 54491.0, 37142.0, 24424.0, 15758.0, 10023.0, 6183.0, 3810.0, 2334.0, 1460.0, 898.0, 636.0, 408.0, 265.0, 161.0, 94.0, 73.0, 52.0, 33.0, 27.0, 10.0, 12.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.8671875, -6.66131591796875, -6.4554443359375, -6.24957275390625, -6.043701171875, -5.83782958984375, -5.6319580078125, -5.42608642578125, -5.22021484375, -5.01434326171875, -4.8084716796875, -4.60260009765625, -4.396728515625, -4.19085693359375, -3.9849853515625, -3.77911376953125, -3.5732421875, -3.36737060546875, -3.1614990234375, -2.95562744140625, -2.749755859375, -2.54388427734375, -2.3380126953125, -2.13214111328125, -1.92626953125, -1.72039794921875, -1.5145263671875, -1.30865478515625, -1.102783203125, -0.89691162109375, -0.6910400390625, -0.48516845703125, -0.279296875, -0.07342529296875, 0.1324462890625, 0.33831787109375, 0.544189453125, 0.75006103515625, 0.9559326171875, 1.16180419921875, 1.36767578125, 1.57354736328125, 1.7794189453125, 1.98529052734375, 2.191162109375, 2.39703369140625, 2.6029052734375, 2.80877685546875, 3.0146484375, 3.22052001953125, 3.4263916015625, 3.63226318359375, 3.838134765625, 4.04400634765625, 4.2498779296875, 4.45574951171875, 4.66162109375, 4.86749267578125, 5.0733642578125, 5.27923583984375, 5.485107421875, 5.69097900390625, 5.8968505859375, 6.10272216796875, 6.30859375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 1.0, 7.0, 13.0, 8.0, 9.0, 16.0, 22.0, 24.0, 22.0, 21.0, 22.0, 31.0, 21.0, 36.0, 47.0, 38.0, 47.0, 42.0, 52.0, 39.0, 41.0, 45.0, 42.0, 39.0, 44.0, 31.0, 35.0, 29.0, 31.0, 21.0, 22.0, 20.0, 16.0, 13.0, 12.0, 5.0, 8.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.347412109375, -9.00732421875, -8.667236328125, -8.3271484375, -7.987060546875, -7.64697265625, -7.306884765625, -6.966796875, -6.626708984375, -6.28662109375, -5.946533203125, -5.6064453125, -5.266357421875, -4.92626953125, -4.586181640625, -4.24609375, -3.906005859375, -3.56591796875, -3.225830078125, -2.8857421875, -2.545654296875, -2.20556640625, -1.865478515625, -1.525390625, -1.185302734375, -0.84521484375, -0.505126953125, -0.1650390625, 0.175048828125, 0.51513671875, 0.855224609375, 1.1953125, 1.535400390625, 1.87548828125, 2.215576171875, 2.5556640625, 2.895751953125, 3.23583984375, 3.575927734375, 3.916015625, 4.256103515625, 4.59619140625, 4.936279296875, 5.2763671875, 5.616455078125, 5.95654296875, 6.296630859375, 6.63671875, 6.976806640625, 7.31689453125, 7.656982421875, 7.9970703125, 8.337158203125, 8.67724609375, 9.017333984375, 9.357421875, 9.697509765625, 10.03759765625, 10.377685546875, 10.7177734375, 11.057861328125, 11.39794921875, 11.738037109375, 12.078125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 16.0, 17.0, 20.0, 33.0, 51.0, 95.0, 132.0, 203.0, 313.0, 386.0, 700.0, 1013.0, 1469.0, 2254.0, 3445.0, 5075.0, 7502.0, 11366.0, 16955.0, 25075.0, 35830.0, 48868.0, 64784.0, 81688.0, 96345.0, 104928.0, 106115.0, 99489.0, 86079.0, 70264.0, 53610.0, 38963.0, 27705.0, 18923.0, 12962.0, 8700.0, 5662.0, 3866.0, 2469.0, 1701.0, 1159.0, 791.0, 529.0, 358.0, 225.0, 153.0, 82.0, 65.0, 44.0, 36.0, 15.0, 19.0, 3.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.8828125, -5.68768310546875, -5.4925537109375, -5.29742431640625, -5.102294921875, -4.90716552734375, -4.7120361328125, -4.51690673828125, -4.32177734375, -4.12664794921875, -3.9315185546875, -3.73638916015625, -3.541259765625, -3.34613037109375, -3.1510009765625, -2.95587158203125, -2.7607421875, -2.56561279296875, -2.3704833984375, -2.17535400390625, -1.980224609375, -1.78509521484375, -1.5899658203125, -1.39483642578125, -1.19970703125, -1.00457763671875, -0.8094482421875, -0.61431884765625, -0.419189453125, -0.22406005859375, -0.0289306640625, 0.16619873046875, 0.361328125, 0.55645751953125, 0.7515869140625, 0.94671630859375, 1.141845703125, 1.33697509765625, 1.5321044921875, 1.72723388671875, 1.92236328125, 2.11749267578125, 2.3126220703125, 2.50775146484375, 2.702880859375, 2.89801025390625, 3.0931396484375, 3.28826904296875, 3.4833984375, 3.67852783203125, 3.8736572265625, 4.06878662109375, 4.263916015625, 4.45904541015625, 4.6541748046875, 4.84930419921875, 5.04443359375, 5.23956298828125, 5.4346923828125, 5.62982177734375, 5.824951171875, 6.02008056640625, 6.2152099609375, 6.41033935546875, 6.60546875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 6.0, 5.0, 4.0, 8.0, 14.0, 12.0, 14.0, 12.0, 16.0, 24.0, 24.0, 28.0, 26.0, 27.0, 39.0, 45.0, 32.0, 29.0, 32.0, 37.0, 33.0, 37.0, 54.0, 36.0, 34.0, 32.0, 40.0, 34.0, 32.0, 36.0, 31.0, 24.0, 22.0, 17.0, 18.0, 15.0, 11.0, 14.0, 10.0, 8.0, 5.0, 6.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.95703125, -5.76654052734375, -5.5760498046875, -5.38555908203125, -5.195068359375, -5.00457763671875, -4.8140869140625, -4.62359619140625, -4.43310546875, -4.24261474609375, -4.0521240234375, -3.86163330078125, -3.671142578125, -3.48065185546875, -3.2901611328125, -3.09967041015625, -2.9091796875, -2.71868896484375, -2.5281982421875, -2.33770751953125, -2.147216796875, -1.95672607421875, -1.7662353515625, -1.57574462890625, -1.38525390625, -1.19476318359375, -1.0042724609375, -0.81378173828125, -0.623291015625, -0.43280029296875, -0.2423095703125, -0.05181884765625, 0.138671875, 0.32916259765625, 0.5196533203125, 0.71014404296875, 0.900634765625, 1.09112548828125, 1.2816162109375, 1.47210693359375, 1.66259765625, 1.85308837890625, 2.0435791015625, 2.23406982421875, 2.424560546875, 2.61505126953125, 2.8055419921875, 2.99603271484375, 3.1865234375, 3.37701416015625, 3.5675048828125, 3.75799560546875, 3.948486328125, 4.13897705078125, 4.3294677734375, 4.51995849609375, 4.71044921875, 4.90093994140625, 5.0914306640625, 5.28192138671875, 5.472412109375, 5.66290283203125, 5.8533935546875, 6.04388427734375, 6.234375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 9.0, 13.0, 11.0, 17.0, 28.0, 34.0, 40.0, 60.0, 89.0, 120.0, 211.0, 250.0, 385.0, 612.0, 907.0, 1357.0, 2170.0, 3546.0, 6014.0, 11302.0, 26493.0, 76743.0, 204053.0, 319813.0, 236103.0, 94898.0, 32489.0, 13154.0, 6769.0, 3822.0, 2392.0, 1593.0, 989.0, 646.0, 464.0, 303.0, 214.0, 130.0, 75.0, 68.0, 54.0, 26.0, 31.0, 15.0, 13.0, 7.0, 7.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.96484375, -8.671875, -8.37890625, -8.0859375, -7.79296875, -7.5, -7.20703125, -6.9140625, -6.62109375, -6.328125, -6.03515625, -5.7421875, -5.44921875, -5.15625, -4.86328125, -4.5703125, -4.27734375, -3.984375, -3.69140625, -3.3984375, -3.10546875, -2.8125, -2.51953125, -2.2265625, -1.93359375, -1.640625, -1.34765625, -1.0546875, -0.76171875, -0.46875, -0.17578125, 0.1171875, 0.41015625, 0.703125, 0.99609375, 1.2890625, 1.58203125, 1.875, 2.16796875, 2.4609375, 2.75390625, 3.046875, 3.33984375, 3.6328125, 3.92578125, 4.21875, 4.51171875, 4.8046875, 5.09765625, 5.390625, 5.68359375, 5.9765625, 6.26953125, 6.5625, 6.85546875, 7.1484375, 7.44140625, 7.734375, 8.02734375, 8.3203125, 8.61328125, 8.90625, 9.19921875, 9.4921875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 0.0, 1.0, 7.0, 17.0, 15.0, 10.0, 20.0, 35.0, 30.0, 35.0, 44.0, 72.0, 73.0, 87.0, 82.0, 75.0, 68.0, 70.0, 52.0, 48.0, 37.0, 23.0, 28.0, 15.0, 15.0, 7.0, 6.0, 3.0, 12.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0007181167602539062, -0.0006967037916183472, -0.0006752908229827881, -0.000653877854347229, -0.0006324648857116699, -0.0006110519170761108, -0.0005896389484405518, -0.0005682259798049927, -0.0005468130111694336, -0.0005254000425338745, -0.0005039870738983154, -0.00048257410526275635, -0.00046116113662719727, -0.0004397481679916382, -0.0004183351993560791, -0.00039692223072052, -0.00037550926208496094, -0.00035409629344940186, -0.0003326833248138428, -0.0003112703561782837, -0.0002898573875427246, -0.00026844441890716553, -0.00024703145027160645, -0.00022561848163604736, -0.00020420551300048828, -0.0001827925443649292, -0.00016137957572937012, -0.00013996660709381104, -0.00011855363845825195, -9.714066982269287e-05, -7.572770118713379e-05, -5.431473255157471e-05, -3.2901763916015625e-05, -1.1488795280456543e-05, 9.924173355102539e-06, 3.133714199066162e-05, 5.27501106262207e-05, 7.416307926177979e-05, 9.557604789733887e-05, 0.00011698901653289795, 0.00013840198516845703, 0.0001598149538040161, 0.0001812279224395752, 0.00020264089107513428, 0.00022405385971069336, 0.00024546682834625244, 0.0002668797969818115, 0.0002882927656173706, 0.0003097057342529297, 0.00033111870288848877, 0.00035253167152404785, 0.00037394464015960693, 0.000395357608795166, 0.0004167705774307251, 0.0004381835460662842, 0.00045959651470184326, 0.00048100948333740234, 0.0005024224519729614, 0.0005238354206085205, 0.0005452483892440796, 0.0005666613578796387, 0.0005880743265151978, 0.0006094872951507568, 0.0006309002637863159, 0.000652313232421875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 3.0, 3.0, 2.0, 6.0, 8.0, 25.0, 23.0, 34.0, 51.0, 60.0, 92.0, 162.0, 174.0, 279.0, 410.0, 573.0, 871.0, 1351.0, 2048.0, 3360.0, 5848.0, 11481.0, 26637.0, 75846.0, 208719.0, 332809.0, 231120.0, 87313.0, 30113.0, 12575.0, 6423.0, 3608.0, 2224.0, 1431.0, 902.0, 612.0, 391.0, 277.0, 208.0, 150.0, 104.0, 68.0, 47.0, 35.0, 27.0, 17.0, 15.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-10.5625, -10.247802734375, -9.93310546875, -9.618408203125, -9.3037109375, -8.989013671875, -8.67431640625, -8.359619140625, -8.044921875, -7.730224609375, -7.41552734375, -7.100830078125, -6.7861328125, -6.471435546875, -6.15673828125, -5.842041015625, -5.52734375, -5.212646484375, -4.89794921875, -4.583251953125, -4.2685546875, -3.953857421875, -3.63916015625, -3.324462890625, -3.009765625, -2.695068359375, -2.38037109375, -2.065673828125, -1.7509765625, -1.436279296875, -1.12158203125, -0.806884765625, -0.4921875, -0.177490234375, 0.13720703125, 0.451904296875, 0.7666015625, 1.081298828125, 1.39599609375, 1.710693359375, 2.025390625, 2.340087890625, 2.65478515625, 2.969482421875, 3.2841796875, 3.598876953125, 3.91357421875, 4.228271484375, 4.54296875, 4.857666015625, 5.17236328125, 5.487060546875, 5.8017578125, 6.116455078125, 6.43115234375, 6.745849609375, 7.060546875, 7.375244140625, 7.68994140625, 8.004638671875, 8.3193359375, 8.634033203125, 8.94873046875, 9.263427734375, 9.578125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 8.0, 17.0, 15.0, 43.0, 46.0, 66.0, 76.0, 88.0, 111.0, 107.0, 90.0, 76.0, 68.0, 62.0, 35.0, 24.0, 20.0, 11.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.482421875, -2.4072265625, -2.33203125, -2.2568359375, -2.181640625, -2.1064453125, -2.03125, -1.9560546875, -1.880859375, -1.8056640625, -1.73046875, -1.6552734375, -1.580078125, -1.5048828125, -1.4296875, -1.3544921875, -1.279296875, -1.2041015625, -1.12890625, -1.0537109375, -0.978515625, -0.9033203125, -0.828125, -0.7529296875, -0.677734375, -0.6025390625, -0.52734375, -0.4521484375, -0.376953125, -0.3017578125, -0.2265625, -0.1513671875, -0.076171875, -0.0009765625, 0.07421875, 0.1494140625, 0.224609375, 0.2998046875, 0.375, 0.4501953125, 0.525390625, 0.6005859375, 0.67578125, 0.7509765625, 0.826171875, 0.9013671875, 0.9765625, 1.0517578125, 1.126953125, 1.2021484375, 1.27734375, 1.3525390625, 1.427734375, 1.5029296875, 1.578125, 1.6533203125, 1.728515625, 1.8037109375, 1.87890625, 1.9541015625, 2.029296875, 2.1044921875, 2.1796875, 2.2548828125, 2.330078125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 5.0, 3.0, 5.0, 12.0, 7.0, 10.0, 7.0, 10.0, 16.0, 21.0, 16.0, 25.0, 26.0, 41.0, 34.0, 51.0, 45.0, 52.0, 47.0, 53.0, 57.0, 49.0, 37.0, 57.0, 60.0, 32.0, 42.0, 29.0, 31.0, 17.0, 21.0, 20.0, 13.0, 16.0, 11.0, 5.0, 2.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-17.63814353942871, -17.150489807128906, -16.662837982177734, -16.17518424987793, -15.687530517578125, -15.199877738952637, -14.712224960327148, -14.224571228027344, -13.736917495727539, -13.24926471710205, -12.761610984802246, -12.273958206176758, -11.786304473876953, -11.298651695251465, -10.810998916625977, -10.323345184326172, -9.835692405700684, -9.348039627075195, -8.86038589477539, -8.372733116149902, -7.885079383850098, -7.397426605224609, -6.909773349761963, -6.422120094299316, -5.93446683883667, -5.446813583374023, -4.959160327911377, -4.4715070724487305, -3.983854055404663, -3.4962007999420166, -3.008547782897949, -2.5208945274353027, -2.0332422256469727, -1.5455889701843262, -1.0579358339309692, -0.5702826976776123, -0.08262944221496582, 0.40502381324768066, 0.892676830291748, 1.3803300857543945, 1.867983341217041, 2.3556365966796875, 2.843289852142334, 3.3309428691864014, 3.818596124649048, 4.306249618530273, 4.793902397155762, 5.281555652618408, 5.769208908081055, 6.256862163543701, 6.744515419006348, 7.232168197631836, 7.719821929931641, 8.207474708557129, 8.695127487182617, 9.182781219482422, 9.670434951782227, 10.158087730407715, 10.64574146270752, 11.133394241333008, 11.621047973632812, 12.1087007522583, 12.596353530883789, 13.084007263183594, 13.571660041809082]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 14.0, 20.0, 19.0, 23.0, 20.0, 25.0, 21.0, 27.0, 31.0, 32.0, 45.0, 36.0, 37.0, 47.0, 61.0, 43.0, 54.0, 44.0, 36.0, 44.0, 35.0, 39.0, 31.0, 30.0, 20.0, 29.0, 14.0, 15.0, 27.0, 10.0, 17.0, 7.0, 5.0, 7.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.576552391052246, -11.220346450805664, -10.864141464233398, -10.507935523986816, -10.151729583740234, -9.795523643493652, -9.43931770324707, -9.083112716674805, -8.726906776428223, -8.37070083618164, -8.014495849609375, -7.658289909362793, -7.302083969116211, -6.945878028869629, -6.589672565460205, -6.233467102050781, -5.877261161804199, -5.521055221557617, -5.164849758148193, -4.8086442947387695, -4.4524383544921875, -4.0962324142456055, -3.7400269508361816, -3.3838212490081787, -3.027615547180176, -2.671409845352173, -2.31520414352417, -1.958998441696167, -1.602792739868164, -1.2465870380401611, -0.8903813362121582, -0.5341756343841553, -0.17796993255615234, 0.17823576927185059, 0.5344414710998535, 0.8906471729278564, 1.2468528747558594, 1.6030585765838623, 1.9592642784118652, 2.315469980239868, 2.671675682067871, 3.027881383895874, 3.384087085723877, 3.74029278755188, 4.096498489379883, 4.452704429626465, 4.808909893035889, 5.1651153564453125, 5.5213212966918945, 5.877527236938477, 6.2337327003479, 6.589938163757324, 6.946144104003906, 7.302350044250488, 7.658555507659912, 8.014760971069336, 8.370966911315918, 8.7271728515625, 9.083377838134766, 9.439583778381348, 9.79578971862793, 10.151995658874512, 10.508201599121094, 10.86440658569336, 11.220612525939941]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 5.0, 12.0, 15.0, 28.0, 34.0, 64.0, 73.0, 164.0, 251.0, 429.0, 663.0, 1093.0, 1908.0, 3012.0, 5242.0, 8895.0, 15874.0, 28181.0, 50543.0, 90216.0, 161531.0, 282277.0, 466215.0, 674167.0, 761500.0, 637497.0, 424777.0, 253315.0, 144332.0, 80599.0, 44420.0, 24742.0, 13795.0, 7819.0, 4393.0, 2598.0, 1474.0, 846.0, 524.0, 292.0, 182.0, 107.0, 69.0, 45.0, 28.0, 15.0, 9.0, 11.0, 5.0, 3.0, 0.0, 3.0, 3.0], "bins": [-18.203125, -17.6888427734375, -17.174560546875, -16.6602783203125, -16.14599609375, -15.6317138671875, -15.117431640625, -14.6031494140625, -14.0888671875, -13.5745849609375, -13.060302734375, -12.5460205078125, -12.03173828125, -11.5174560546875, -11.003173828125, -10.4888916015625, -9.974609375, -9.4603271484375, -8.946044921875, -8.4317626953125, -7.91748046875, -7.4031982421875, -6.888916015625, -6.3746337890625, -5.8603515625, -5.3460693359375, -4.831787109375, -4.3175048828125, -3.80322265625, -3.2889404296875, -2.774658203125, -2.2603759765625, -1.74609375, -1.2318115234375, -0.717529296875, -0.2032470703125, 0.31103515625, 0.8253173828125, 1.339599609375, 1.8538818359375, 2.3681640625, 2.8824462890625, 3.396728515625, 3.9110107421875, 4.42529296875, 4.9395751953125, 5.453857421875, 5.9681396484375, 6.482421875, 6.9967041015625, 7.510986328125, 8.0252685546875, 8.53955078125, 9.0538330078125, 9.568115234375, 10.0823974609375, 10.5966796875, 11.1109619140625, 11.625244140625, 12.1395263671875, 12.65380859375, 13.1680908203125, 13.682373046875, 14.1966552734375, 14.7109375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 6.0, 10.0, 12.0, 14.0, 32.0, 23.0, 33.0, 34.0, 38.0, 43.0, 37.0, 45.0, 46.0, 44.0, 51.0, 51.0, 50.0, 54.0, 47.0, 46.0, 35.0, 36.0, 27.0, 27.0, 31.0, 22.0, 20.0, 22.0, 8.0, 10.0, 13.0, 4.0, 8.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5546875, -12.14013671875, -11.7255859375, -11.31103515625, -10.896484375, -10.48193359375, -10.0673828125, -9.65283203125, -9.23828125, -8.82373046875, -8.4091796875, -7.99462890625, -7.580078125, -7.16552734375, -6.7509765625, -6.33642578125, -5.921875, -5.50732421875, -5.0927734375, -4.67822265625, -4.263671875, -3.84912109375, -3.4345703125, -3.02001953125, -2.60546875, -2.19091796875, -1.7763671875, -1.36181640625, -0.947265625, -0.53271484375, -0.1181640625, 0.29638671875, 0.7109375, 1.12548828125, 1.5400390625, 1.95458984375, 2.369140625, 2.78369140625, 3.1982421875, 3.61279296875, 4.02734375, 4.44189453125, 4.8564453125, 5.27099609375, 5.685546875, 6.10009765625, 6.5146484375, 6.92919921875, 7.34375, 7.75830078125, 8.1728515625, 8.58740234375, 9.001953125, 9.41650390625, 9.8310546875, 10.24560546875, 10.66015625, 11.07470703125, 11.4892578125, 11.90380859375, 12.318359375, 12.73291015625, 13.1474609375, 13.56201171875, 13.9765625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 7.0, 16.0, 12.0, 38.0, 60.0, 95.0, 179.0, 299.0, 459.0, 701.0, 1160.0, 1916.0, 3342.0, 5397.0, 9348.0, 15538.0, 26876.0, 45022.0, 75697.0, 126391.0, 205365.0, 318866.0, 458834.0, 590108.0, 633314.0, 551285.0, 408646.0, 275974.0, 175414.0, 107265.0, 64423.0, 37828.0, 22313.0, 12947.0, 7611.0, 4612.0, 2738.0, 1657.0, 1031.0, 562.0, 347.0, 218.0, 143.0, 77.0, 62.0, 33.0, 19.0, 14.0, 3.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.46875, -16.892822265625, -16.31689453125, -15.740966796875, -15.1650390625, -14.589111328125, -14.01318359375, -13.437255859375, -12.861328125, -12.285400390625, -11.70947265625, -11.133544921875, -10.5576171875, -9.981689453125, -9.40576171875, -8.829833984375, -8.25390625, -7.677978515625, -7.10205078125, -6.526123046875, -5.9501953125, -5.374267578125, -4.79833984375, -4.222412109375, -3.646484375, -3.070556640625, -2.49462890625, -1.918701171875, -1.3427734375, -0.766845703125, -0.19091796875, 0.385009765625, 0.9609375, 1.536865234375, 2.11279296875, 2.688720703125, 3.2646484375, 3.840576171875, 4.41650390625, 4.992431640625, 5.568359375, 6.144287109375, 6.72021484375, 7.296142578125, 7.8720703125, 8.447998046875, 9.02392578125, 9.599853515625, 10.17578125, 10.751708984375, 11.32763671875, 11.903564453125, 12.4794921875, 13.055419921875, 13.63134765625, 14.207275390625, 14.783203125, 15.359130859375, 15.93505859375, 16.510986328125, 17.0869140625, 17.662841796875, 18.23876953125, 18.814697265625, 19.390625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 8.0, 7.0, 12.0, 18.0, 20.0, 42.0, 45.0, 65.0, 64.0, 78.0, 109.0, 132.0, 153.0, 195.0, 192.0, 214.0, 222.0, 240.0, 247.0, 242.0, 225.0, 244.0, 207.0, 190.0, 141.0, 151.0, 131.0, 102.0, 74.0, 67.0, 51.0, 41.0, 27.0, 24.0, 24.0, 13.0, 16.0, 5.0, 7.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.70703125, -7.48394775390625, -7.2608642578125, -7.03778076171875, -6.814697265625, -6.59161376953125, -6.3685302734375, -6.14544677734375, -5.92236328125, -5.69927978515625, -5.4761962890625, -5.25311279296875, -5.030029296875, -4.80694580078125, -4.5838623046875, -4.36077880859375, -4.1376953125, -3.91461181640625, -3.6915283203125, -3.46844482421875, -3.245361328125, -3.02227783203125, -2.7991943359375, -2.57611083984375, -2.35302734375, -2.12994384765625, -1.9068603515625, -1.68377685546875, -1.460693359375, -1.23760986328125, -1.0145263671875, -0.79144287109375, -0.568359375, -0.34527587890625, -0.1221923828125, 0.10089111328125, 0.323974609375, 0.54705810546875, 0.7701416015625, 0.99322509765625, 1.21630859375, 1.43939208984375, 1.6624755859375, 1.88555908203125, 2.108642578125, 2.33172607421875, 2.5548095703125, 2.77789306640625, 3.0009765625, 3.22406005859375, 3.4471435546875, 3.67022705078125, 3.893310546875, 4.11639404296875, 4.3394775390625, 4.56256103515625, 4.78564453125, 5.00872802734375, 5.2318115234375, 5.45489501953125, 5.677978515625, 5.90106201171875, 6.1241455078125, 6.34722900390625, 6.5703125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 12.0, 17.0, 17.0, 19.0, 24.0, 28.0, 31.0, 44.0, 48.0, 54.0, 45.0, 57.0, 64.0, 53.0, 44.0, 55.0, 47.0, 46.0, 37.0, 49.0, 26.0, 26.0, 19.0, 21.0, 15.0, 18.0, 14.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.725021362304688, -24.89894676208496, -24.072872161865234, -23.246797561645508, -22.42072296142578, -21.594648361206055, -20.768573760986328, -19.9424991607666, -19.116424560546875, -18.29034996032715, -17.464275360107422, -16.638200759887695, -15.812126159667969, -14.986051559448242, -14.159976959228516, -13.333902359008789, -12.507826805114746, -11.68175220489502, -10.855677604675293, -10.029603004455566, -9.20352840423584, -8.377452850341797, -7.5513787269592285, -6.725304126739502, -5.899229526519775, -5.073154926300049, -4.247080326080322, -3.4210054874420166, -2.59493088722229, -1.7688560485839844, -0.9427814483642578, -0.11670684814453125, 0.7093677520751953, 1.5354423522949219, 2.3615169525146484, 3.187591791152954, 4.013666152954102, 4.839741230010986, 5.665815830230713, 6.4918904304504395, 7.317965030670166, 8.14404010772705, 8.970114707946777, 9.796189308166504, 10.62226390838623, 11.448338508605957, 12.274413108825684, 13.10048770904541, 13.926562309265137, 14.752636909484863, 15.57871150970459, 16.404787063598633, 17.23086166381836, 18.056936264038086, 18.883010864257812, 19.70908546447754, 20.535160064697266, 21.361234664916992, 22.18730926513672, 23.013383865356445, 23.839458465576172, 24.6655330657959, 25.491607666015625, 26.31768226623535, 27.143756866455078]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 4.0, 11.0, 12.0, 17.0, 19.0, 25.0, 29.0, 27.0, 28.0, 18.0, 34.0, 29.0, 35.0, 42.0, 42.0, 42.0, 48.0, 43.0, 40.0, 50.0, 40.0, 43.0, 32.0, 43.0, 24.0, 25.0, 22.0, 26.0, 19.0, 21.0, 21.0, 8.0, 9.0, 13.0, 5.0, 11.0, 5.0, 5.0, 4.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.536376953125, -16.035737991333008, -15.5350980758667, -15.03445816040039, -14.533819198608398, -14.033180236816406, -13.532540321350098, -13.031900405883789, -12.531261444091797, -12.030622482299805, -11.529982566833496, -11.029342651367188, -10.528703689575195, -10.028064727783203, -9.527424812316895, -9.026784896850586, -8.526145935058594, -8.025506973266602, -7.524867057800293, -7.024227619171143, -6.523588180541992, -6.022948741912842, -5.522309303283691, -5.021669864654541, -4.521030426025391, -4.02039098739624, -3.51975154876709, -3.0191121101379395, -2.518472671508789, -2.0178332328796387, -1.5171937942504883, -1.016554355621338, -0.5159130096435547, -0.015273571014404297, 0.4853658676147461, 0.9860053062438965, 1.4866447448730469, 1.9872841835021973, 2.4879236221313477, 2.988563060760498, 3.4892024993896484, 3.989841938018799, 4.490481376647949, 4.9911208152771, 5.49176025390625, 5.9923996925354, 6.493039131164551, 6.993678569793701, 7.494318008422852, 7.994957447052002, 8.495596885681152, 8.996236801147461, 9.496875762939453, 9.997514724731445, 10.498154640197754, 10.998794555664062, 11.499433517456055, 12.000072479248047, 12.500712394714355, 13.001352310180664, 13.501991271972656, 14.002630233764648, 14.503270149230957, 15.003910064697266, 15.504549026489258]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 8.0, 10.0, 19.0, 22.0, 29.0, 49.0, 94.0, 129.0, 198.0, 290.0, 416.0, 581.0, 1031.0, 1535.0, 2325.0, 3716.0, 5961.0, 10132.0, 16847.0, 29404.0, 52331.0, 96816.0, 175595.0, 240462.0, 180521.0, 100727.0, 54413.0, 30397.0, 17106.0, 10255.0, 6273.0, 3952.0, 2408.0, 1633.0, 965.0, 655.0, 432.0, 262.0, 186.0, 121.0, 89.0, 49.0, 36.0, 28.0, 20.0, 11.0, 6.0, 7.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.912109375, -3.783966064453125, -3.65582275390625, -3.527679443359375, -3.3995361328125, -3.271392822265625, -3.14324951171875, -3.015106201171875, -2.886962890625, -2.758819580078125, -2.63067626953125, -2.502532958984375, -2.3743896484375, -2.246246337890625, -2.11810302734375, -1.989959716796875, -1.86181640625, -1.733673095703125, -1.60552978515625, -1.477386474609375, -1.3492431640625, -1.221099853515625, -1.09295654296875, -0.964813232421875, -0.836669921875, -0.708526611328125, -0.58038330078125, -0.452239990234375, -0.3240966796875, -0.195953369140625, -0.06781005859375, 0.060333251953125, 0.1884765625, 0.316619873046875, 0.44476318359375, 0.572906494140625, 0.7010498046875, 0.829193115234375, 0.95733642578125, 1.085479736328125, 1.213623046875, 1.341766357421875, 1.46990966796875, 1.598052978515625, 1.7261962890625, 1.854339599609375, 1.98248291015625, 2.110626220703125, 2.23876953125, 2.366912841796875, 2.49505615234375, 2.623199462890625, 2.7513427734375, 2.879486083984375, 3.00762939453125, 3.135772705078125, 3.263916015625, 3.392059326171875, 3.52020263671875, 3.648345947265625, 3.7764892578125, 3.904632568359375, 4.03277587890625, 4.160919189453125, 4.2890625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 7.0, 4.0, 9.0, 4.0, 9.0, 7.0, 13.0, 18.0, 14.0, 15.0, 24.0, 20.0, 33.0, 28.0, 37.0, 29.0, 31.0, 40.0, 45.0, 35.0, 40.0, 52.0, 43.0, 35.0, 40.0, 45.0, 36.0, 36.0, 37.0, 27.0, 29.0, 26.0, 20.0, 18.0, 15.0, 16.0, 11.0, 12.0, 8.0, 8.0, 10.0, 7.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.236572265625, -16.67626953125, -16.115966796875, -15.5556640625, -14.995361328125, -14.43505859375, -13.874755859375, -13.314453125, -12.754150390625, -12.19384765625, -11.633544921875, -11.0732421875, -10.512939453125, -9.95263671875, -9.392333984375, -8.83203125, -8.271728515625, -7.71142578125, -7.151123046875, -6.5908203125, -6.030517578125, -5.47021484375, -4.909912109375, -4.349609375, -3.789306640625, -3.22900390625, -2.668701171875, -2.1083984375, -1.548095703125, -0.98779296875, -0.427490234375, 0.1328125, 0.693115234375, 1.25341796875, 1.813720703125, 2.3740234375, 2.934326171875, 3.49462890625, 4.054931640625, 4.615234375, 5.175537109375, 5.73583984375, 6.296142578125, 6.8564453125, 7.416748046875, 7.97705078125, 8.537353515625, 9.09765625, 9.657958984375, 10.21826171875, 10.778564453125, 11.3388671875, 11.899169921875, 12.45947265625, 13.019775390625, 13.580078125, 14.140380859375, 14.70068359375, 15.260986328125, 15.8212890625, 16.381591796875, 16.94189453125, 17.502197265625, 18.0625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 7.0, 16.0, 23.0, 26.0, 31.0, 56.0, 66.0, 120.0, 177.0, 233.0, 407.0, 605.0, 1021.0, 1885.0, 3419.0, 7092.0, 15608.0, 36270.0, 86955.0, 202260.0, 331288.0, 204808.0, 88221.0, 36782.0, 15820.0, 7129.0, 3500.0, 1902.0, 1008.0, 637.0, 412.0, 228.0, 171.0, 105.0, 78.0, 47.0, 45.0, 21.0, 23.0, 19.0, 4.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.421875, -6.23577880859375, -6.0496826171875, -5.86358642578125, -5.677490234375, -5.49139404296875, -5.3052978515625, -5.11920166015625, -4.93310546875, -4.74700927734375, -4.5609130859375, -4.37481689453125, -4.188720703125, -4.00262451171875, -3.8165283203125, -3.63043212890625, -3.4443359375, -3.25823974609375, -3.0721435546875, -2.88604736328125, -2.699951171875, -2.51385498046875, -2.3277587890625, -2.14166259765625, -1.95556640625, -1.76947021484375, -1.5833740234375, -1.39727783203125, -1.211181640625, -1.02508544921875, -0.8389892578125, -0.65289306640625, -0.466796875, -0.28070068359375, -0.0946044921875, 0.09149169921875, 0.277587890625, 0.46368408203125, 0.6497802734375, 0.83587646484375, 1.02197265625, 1.20806884765625, 1.3941650390625, 1.58026123046875, 1.766357421875, 1.95245361328125, 2.1385498046875, 2.32464599609375, 2.5107421875, 2.69683837890625, 2.8829345703125, 3.06903076171875, 3.255126953125, 3.44122314453125, 3.6273193359375, 3.81341552734375, 3.99951171875, 4.18560791015625, 4.3717041015625, 4.55780029296875, 4.743896484375, 4.92999267578125, 5.1160888671875, 5.30218505859375, 5.48828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 7.0, 7.0, 22.0, 13.0, 9.0, 17.0, 19.0, 17.0, 21.0, 25.0, 23.0, 26.0, 42.0, 36.0, 27.0, 40.0, 27.0, 48.0, 53.0, 37.0, 42.0, 29.0, 35.0, 31.0, 27.0, 25.0, 36.0, 37.0, 30.0, 26.0, 20.0, 27.0, 16.0, 24.0, 17.0, 6.0, 12.0, 10.0, 12.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.53125, -8.2156982421875, -7.900146484375, -7.5845947265625, -7.26904296875, -6.9534912109375, -6.637939453125, -6.3223876953125, -6.0068359375, -5.6912841796875, -5.375732421875, -5.0601806640625, -4.74462890625, -4.4290771484375, -4.113525390625, -3.7979736328125, -3.482421875, -3.1668701171875, -2.851318359375, -2.5357666015625, -2.22021484375, -1.9046630859375, -1.589111328125, -1.2735595703125, -0.9580078125, -0.6424560546875, -0.326904296875, -0.0113525390625, 0.30419921875, 0.6197509765625, 0.935302734375, 1.2508544921875, 1.56640625, 1.8819580078125, 2.197509765625, 2.5130615234375, 2.82861328125, 3.1441650390625, 3.459716796875, 3.7752685546875, 4.0908203125, 4.4063720703125, 4.721923828125, 5.0374755859375, 5.35302734375, 5.6685791015625, 5.984130859375, 6.2996826171875, 6.615234375, 6.9307861328125, 7.246337890625, 7.5618896484375, 7.87744140625, 8.1929931640625, 8.508544921875, 8.8240966796875, 9.1396484375, 9.4552001953125, 9.770751953125, 10.0863037109375, 10.40185546875, 10.7174072265625, 11.032958984375, 11.3485107421875, 11.6640625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 8.0, 14.0, 12.0, 32.0, 46.0, 72.0, 102.0, 144.0, 218.0, 365.0, 578.0, 830.0, 1508.0, 2624.0, 4919.0, 9918.0, 22174.0, 56433.0, 166351.0, 402533.0, 242603.0, 80594.0, 29574.0, 12777.0, 6072.0, 3280.0, 1857.0, 1092.0, 624.0, 415.0, 263.0, 142.0, 112.0, 75.0, 50.0, 33.0, 22.0, 22.0, 13.0, 10.0, 11.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.24609375, -1.2111587524414062, -1.1762237548828125, -1.1412887573242188, -1.106353759765625, -1.0714187622070312, -1.0364837646484375, -1.0015487670898438, -0.96661376953125, -0.9316787719726562, -0.8967437744140625, -0.8618087768554688, -0.826873779296875, -0.7919387817382812, -0.7570037841796875, -0.7220687866210938, -0.6871337890625, -0.6521987915039062, -0.6172637939453125, -0.5823287963867188, -0.547393798828125, -0.5124588012695312, -0.4775238037109375, -0.44258880615234375, -0.40765380859375, -0.37271881103515625, -0.3377838134765625, -0.30284881591796875, -0.267913818359375, -0.23297882080078125, -0.1980438232421875, -0.16310882568359375, -0.128173828125, -0.09323883056640625, -0.0583038330078125, -0.02336883544921875, 0.011566162109375, 0.04650115966796875, 0.0814361572265625, 0.11637115478515625, 0.15130615234375, 0.18624114990234375, 0.2211761474609375, 0.25611114501953125, 0.291046142578125, 0.32598114013671875, 0.3609161376953125, 0.39585113525390625, 0.4307861328125, 0.46572113037109375, 0.5006561279296875, 0.5355911254882812, 0.570526123046875, 0.6054611206054688, 0.6403961181640625, 0.6753311157226562, 0.71026611328125, 0.7452011108398438, 0.7801361083984375, 0.8150711059570312, 0.850006103515625, 0.8849411010742188, 0.9198760986328125, 0.9548110961914062, 0.98974609375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 9.0, 9.0, 12.0, 19.0, 15.0, 21.0, 22.0, 31.0, 21.0, 32.0, 45.0, 46.0, 47.0, 46.0, 54.0, 57.0, 69.0, 64.0, 50.0, 45.0, 41.0, 50.0, 39.0, 35.0, 22.0, 18.0, 18.0, 15.0, 7.0, 16.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5239925384521484e-05, -4.342477768659592e-05, -4.160962998867035e-05, -3.979448229074478e-05, -3.7979334592819214e-05, -3.6164186894893646e-05, -3.434903919696808e-05, -3.253389149904251e-05, -3.071874380111694e-05, -2.8903596103191376e-05, -2.7088448405265808e-05, -2.527330070734024e-05, -2.3458153009414673e-05, -2.1643005311489105e-05, -1.9827857613563538e-05, -1.801270991563797e-05, -1.6197562217712402e-05, -1.4382414519786835e-05, -1.2567266821861267e-05, -1.07521191239357e-05, -8.936971426010132e-06, -7.121823728084564e-06, -5.306676030158997e-06, -3.491528332233429e-06, -1.6763806343078613e-06, 1.387670636177063e-07, 1.953914761543274e-06, 3.7690624594688416e-06, 5.584210157394409e-06, 7.399357855319977e-06, 9.214505553245544e-06, 1.1029653251171112e-05, 1.284480094909668e-05, 1.4659948647022247e-05, 1.6475096344947815e-05, 1.8290244042873383e-05, 2.010539174079895e-05, 2.1920539438724518e-05, 2.3735687136650085e-05, 2.5550834834575653e-05, 2.736598253250122e-05, 2.918113023042679e-05, 3.0996277928352356e-05, 3.2811425626277924e-05, 3.462657332420349e-05, 3.644172102212906e-05, 3.8256868720054626e-05, 4.0072016417980194e-05, 4.188716411590576e-05, 4.370231181383133e-05, 4.55174595117569e-05, 4.7332607209682465e-05, 4.914775490760803e-05, 5.09629026055336e-05, 5.277805030345917e-05, 5.4593198001384735e-05, 5.64083456993103e-05, 5.822349339723587e-05, 6.003864109516144e-05, 6.1853788793087e-05, 6.366893649101257e-05, 6.548408418893814e-05, 6.729923188686371e-05, 6.911437958478928e-05, 7.092952728271484e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 10.0, 6.0, 15.0, 19.0, 29.0, 37.0, 68.0, 98.0, 170.0, 252.0, 410.0, 665.0, 1146.0, 1899.0, 3388.0, 6521.0, 12345.0, 25863.0, 58299.0, 142829.0, 331676.0, 267569.0, 107554.0, 44990.0, 20431.0, 9903.0, 5264.0, 2939.0, 1661.0, 955.0, 583.0, 319.0, 218.0, 149.0, 94.0, 55.0, 36.0, 23.0, 25.0, 13.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7021484375, -1.65185546875, -1.6015625, -1.55126953125, -1.5009765625, -1.45068359375, -1.400390625, -1.35009765625, -1.2998046875, -1.24951171875, -1.19921875, -1.14892578125, -1.0986328125, -1.04833984375, -0.998046875, -0.94775390625, -0.8974609375, -0.84716796875, -0.796875, -0.74658203125, -0.6962890625, -0.64599609375, -0.595703125, -0.54541015625, -0.4951171875, -0.44482421875, -0.39453125, -0.34423828125, -0.2939453125, -0.24365234375, -0.193359375, -0.14306640625, -0.0927734375, -0.04248046875, 0.0078125, 0.05810546875, 0.1083984375, 0.15869140625, 0.208984375, 0.25927734375, 0.3095703125, 0.35986328125, 0.41015625, 0.46044921875, 0.5107421875, 0.56103515625, 0.611328125, 0.66162109375, 0.7119140625, 0.76220703125, 0.8125, 0.86279296875, 0.9130859375, 0.96337890625, 1.013671875, 1.06396484375, 1.1142578125, 1.16455078125, 1.21484375, 1.26513671875, 1.3154296875, 1.36572265625, 1.416015625, 1.46630859375, 1.5166015625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 9.0, 18.0, 12.0, 24.0, 23.0, 26.0, 32.0, 48.0, 73.0, 86.0, 102.0, 88.0, 95.0, 68.0, 65.0, 38.0, 29.0, 24.0, 27.0, 16.0, 11.0, 14.0, 10.0, 8.0, 8.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3515625, -0.34032440185546875, -0.3290863037109375, -0.31784820556640625, -0.306610107421875, -0.29537200927734375, -0.2841339111328125, -0.27289581298828125, -0.26165771484375, -0.25041961669921875, -0.2391815185546875, -0.22794342041015625, -0.216705322265625, -0.20546722412109375, -0.1942291259765625, -0.18299102783203125, -0.1717529296875, -0.16051483154296875, -0.1492767333984375, -0.13803863525390625, -0.126800537109375, -0.11556243896484375, -0.1043243408203125, -0.09308624267578125, -0.08184814453125, -0.07061004638671875, -0.0593719482421875, -0.04813385009765625, -0.036895751953125, -0.02565765380859375, -0.0144195556640625, -0.00318145751953125, 0.008056640625, 0.01929473876953125, 0.0305328369140625, 0.04177093505859375, 0.053009033203125, 0.06424713134765625, 0.0754852294921875, 0.08672332763671875, 0.09796142578125, 0.10919952392578125, 0.1204376220703125, 0.13167572021484375, 0.142913818359375, 0.15415191650390625, 0.1653900146484375, 0.17662811279296875, 0.1878662109375, 0.19910430908203125, 0.2103424072265625, 0.22158050537109375, 0.232818603515625, 0.24405670166015625, 0.2552947998046875, 0.26653289794921875, 0.27777099609375, 0.28900909423828125, 0.3002471923828125, 0.31148529052734375, 0.322723388671875, 0.33396148681640625, 0.3451995849609375, 0.35643768310546875, 0.36767578125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 5.0, 7.0, 9.0, 10.0, 14.0, 18.0, 22.0, 15.0, 25.0, 28.0, 30.0, 43.0, 49.0, 57.0, 50.0, 52.0, 67.0, 46.0, 55.0, 47.0, 44.0, 47.0, 40.0, 43.0, 31.0, 21.0, 23.0, 20.0, 18.0, 11.0, 15.0, 8.0, 9.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.85535430908203, -25.023740768432617, -24.192127227783203, -23.360515594482422, -22.528902053833008, -21.697288513183594, -20.865676879882812, -20.0340633392334, -19.202449798583984, -18.37083625793457, -17.539222717285156, -16.707611083984375, -15.875997543334961, -15.044384002685547, -14.21277141571045, -13.381158828735352, -12.549545288085938, -11.717931747436523, -10.886319160461426, -10.054706573486328, -9.223093032836914, -8.3914794921875, -7.559866905212402, -6.7282538414001465, -5.896640777587891, -5.065027713775635, -4.233414649963379, -3.401801586151123, -2.570188522338867, -1.7385754585266113, -0.9069623947143555, -0.07534933090209961, 0.7562618255615234, 1.5878748893737793, 2.419487953186035, 3.251101016998291, 4.082714080810547, 4.914327144622803, 5.745940208435059, 6.5775532722473145, 7.40916633605957, 8.240779876708984, 9.072392463684082, 9.90400505065918, 10.735618591308594, 11.567232131958008, 12.398844718933105, 13.230457305908203, 14.062070846557617, 14.893684387207031, 15.725296974182129, 16.556909561157227, 17.38852310180664, 18.220136642456055, 19.05175018310547, 19.88336181640625, 20.714975357055664, 21.546588897705078, 22.37820053100586, 23.209814071655273, 24.041427612304688, 24.8730411529541, 25.704654693603516, 26.536266326904297, 27.36787986755371]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 7.0, 7.0, 11.0, 13.0, 15.0, 18.0, 26.0, 28.0, 28.0, 24.0, 25.0, 31.0, 29.0, 35.0, 45.0, 40.0, 42.0, 48.0, 43.0, 43.0, 47.0, 40.0, 44.0, 32.0, 42.0, 24.0, 24.0, 25.0, 28.0, 20.0, 16.0, 22.0, 8.0, 9.0, 14.0, 4.0, 10.0, 5.0, 6.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.82365608215332, -16.316802978515625, -15.809948921203613, -15.303094863891602, -14.796241760253906, -14.289387702941895, -13.782533645629883, -13.275680541992188, -12.768826484680176, -12.261972427368164, -11.755119323730469, -11.248265266418457, -10.741411209106445, -10.23455810546875, -9.727704048156738, -9.220849990844727, -8.713996887207031, -8.20714282989502, -7.700289726257324, -7.1934356689453125, -6.686582088470459, -6.1797285079956055, -5.672874450683594, -5.16602087020874, -4.659167289733887, -4.152313709259033, -3.6454598903656006, -3.138606071472168, -2.6317524909973145, -2.124898910522461, -1.6180450916290283, -1.1111912727355957, -0.6043376922607422, -0.09748399257659912, 0.40936970710754395, 0.916223406791687, 1.42307710647583, 1.9299306869506836, 2.436784505844116, 2.943638324737549, 3.4504919052124023, 3.957345485687256, 4.464199066162109, 4.971053123474121, 5.477906703948975, 5.984760284423828, 6.49161434173584, 6.998467922210693, 7.505321502685547, 8.012175559997559, 8.519028663635254, 9.025882720947266, 9.532735824584961, 10.039589881896973, 10.546443939208984, 11.05329704284668, 11.560151100158691, 12.067005157470703, 12.573858261108398, 13.08071231842041, 13.587566375732422, 14.094419479370117, 14.601273536682129, 15.10812759399414, 15.614980697631836]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 5.0, 9.0, 18.0, 25.0, 40.0, 61.0, 102.0, 113.0, 201.0, 276.0, 436.0, 620.0, 942.0, 1449.0, 2144.0, 3367.0, 5425.0, 8863.0, 14251.0, 24064.0, 39697.0, 64724.0, 99214.0, 135284.0, 158342.0, 151582.0, 119922.0, 82618.0, 52738.0, 31782.0, 19031.0, 11579.0, 6980.0, 4341.0, 2838.0, 1736.0, 1211.0, 809.0, 576.0, 360.0, 230.0, 179.0, 98.0, 68.0, 71.0, 34.0, 33.0, 16.0, 15.0, 9.0, 8.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0], "bins": [-13.8984375, -13.4610595703125, -13.023681640625, -12.5863037109375, -12.14892578125, -11.7115478515625, -11.274169921875, -10.8367919921875, -10.3994140625, -9.9620361328125, -9.524658203125, -9.0872802734375, -8.64990234375, -8.2125244140625, -7.775146484375, -7.3377685546875, -6.900390625, -6.4630126953125, -6.025634765625, -5.5882568359375, -5.15087890625, -4.7135009765625, -4.276123046875, -3.8387451171875, -3.4013671875, -2.9639892578125, -2.526611328125, -2.0892333984375, -1.65185546875, -1.2144775390625, -0.777099609375, -0.3397216796875, 0.09765625, 0.5350341796875, 0.972412109375, 1.4097900390625, 1.84716796875, 2.2845458984375, 2.721923828125, 3.1593017578125, 3.5966796875, 4.0340576171875, 4.471435546875, 4.9088134765625, 5.34619140625, 5.7835693359375, 6.220947265625, 6.6583251953125, 7.095703125, 7.5330810546875, 7.970458984375, 8.4078369140625, 8.84521484375, 9.2825927734375, 9.719970703125, 10.1573486328125, 10.5947265625, 11.0321044921875, 11.469482421875, 11.9068603515625, 12.34423828125, 12.7816162109375, 13.218994140625, 13.6563720703125, 14.09375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 2.0, 3.0, 7.0, 11.0, 6.0, 3.0, 9.0, 18.0, 20.0, 17.0, 24.0, 22.0, 27.0, 21.0, 33.0, 32.0, 33.0, 46.0, 31.0, 40.0, 44.0, 35.0, 50.0, 49.0, 41.0, 36.0, 47.0, 40.0, 31.0, 28.0, 21.0, 21.0, 32.0, 24.0, 16.0, 12.0, 13.0, 7.0, 14.0, 4.0, 8.0, 2.0, 6.0, 8.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.265625, -15.720458984375, -15.17529296875, -14.630126953125, -14.0849609375, -13.539794921875, -12.99462890625, -12.449462890625, -11.904296875, -11.359130859375, -10.81396484375, -10.268798828125, -9.7236328125, -9.178466796875, -8.63330078125, -8.088134765625, -7.54296875, -6.997802734375, -6.45263671875, -5.907470703125, -5.3623046875, -4.817138671875, -4.27197265625, -3.726806640625, -3.181640625, -2.636474609375, -2.09130859375, -1.546142578125, -1.0009765625, -0.455810546875, 0.08935546875, 0.634521484375, 1.1796875, 1.724853515625, 2.27001953125, 2.815185546875, 3.3603515625, 3.905517578125, 4.45068359375, 4.995849609375, 5.541015625, 6.086181640625, 6.63134765625, 7.176513671875, 7.7216796875, 8.266845703125, 8.81201171875, 9.357177734375, 9.90234375, 10.447509765625, 10.99267578125, 11.537841796875, 12.0830078125, 12.628173828125, 13.17333984375, 13.718505859375, 14.263671875, 14.808837890625, 15.35400390625, 15.899169921875, 16.4443359375, 16.989501953125, 17.53466796875, 18.079833984375, 18.625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 10.0, 15.0, 23.0, 33.0, 64.0, 72.0, 132.0, 181.0, 233.0, 441.0, 682.0, 1020.0, 1711.0, 2785.0, 4509.0, 7514.0, 12694.0, 21799.0, 38302.0, 71337.0, 128453.0, 194217.0, 208427.0, 153164.0, 87746.0, 48125.0, 26338.0, 15403.0, 8828.0, 5439.0, 3289.0, 2021.0, 1273.0, 823.0, 493.0, 332.0, 186.0, 153.0, 80.0, 66.0, 44.0, 29.0, 18.0, 13.0, 10.0, 7.0, 3.0, 2.0, 2.0, 1.0, 4.0], "bins": [-26.90625, -26.141357421875, -25.37646484375, -24.611572265625, -23.8466796875, -23.081787109375, -22.31689453125, -21.552001953125, -20.787109375, -20.022216796875, -19.25732421875, -18.492431640625, -17.7275390625, -16.962646484375, -16.19775390625, -15.432861328125, -14.66796875, -13.903076171875, -13.13818359375, -12.373291015625, -11.6083984375, -10.843505859375, -10.07861328125, -9.313720703125, -8.548828125, -7.783935546875, -7.01904296875, -6.254150390625, -5.4892578125, -4.724365234375, -3.95947265625, -3.194580078125, -2.4296875, -1.664794921875, -0.89990234375, -0.135009765625, 0.6298828125, 1.394775390625, 2.15966796875, 2.924560546875, 3.689453125, 4.454345703125, 5.21923828125, 5.984130859375, 6.7490234375, 7.513916015625, 8.27880859375, 9.043701171875, 9.80859375, 10.573486328125, 11.33837890625, 12.103271484375, 12.8681640625, 13.633056640625, 14.39794921875, 15.162841796875, 15.927734375, 16.692626953125, 17.45751953125, 18.222412109375, 18.9873046875, 19.752197265625, 20.51708984375, 21.281982421875, 22.046875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 9.0, 13.0, 10.0, 18.0, 14.0, 17.0, 23.0, 33.0, 34.0, 32.0, 24.0, 36.0, 40.0, 31.0, 36.0, 32.0, 42.0, 57.0, 46.0, 35.0, 48.0, 42.0, 27.0, 31.0, 24.0, 35.0, 26.0, 29.0, 23.0, 18.0, 21.0, 18.0, 16.0, 10.0, 6.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.34375, -10.009521484375, -9.67529296875, -9.341064453125, -9.0068359375, -8.672607421875, -8.33837890625, -8.004150390625, -7.669921875, -7.335693359375, -7.00146484375, -6.667236328125, -6.3330078125, -5.998779296875, -5.66455078125, -5.330322265625, -4.99609375, -4.661865234375, -4.32763671875, -3.993408203125, -3.6591796875, -3.324951171875, -2.99072265625, -2.656494140625, -2.322265625, -1.988037109375, -1.65380859375, -1.319580078125, -0.9853515625, -0.651123046875, -0.31689453125, 0.017333984375, 0.3515625, 0.685791015625, 1.02001953125, 1.354248046875, 1.6884765625, 2.022705078125, 2.35693359375, 2.691162109375, 3.025390625, 3.359619140625, 3.69384765625, 4.028076171875, 4.3623046875, 4.696533203125, 5.03076171875, 5.364990234375, 5.69921875, 6.033447265625, 6.36767578125, 6.701904296875, 7.0361328125, 7.370361328125, 7.70458984375, 8.038818359375, 8.373046875, 8.707275390625, 9.04150390625, 9.375732421875, 9.7099609375, 10.044189453125, 10.37841796875, 10.712646484375, 11.046875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 6.0, 14.0, 22.0, 25.0, 45.0, 87.0, 106.0, 203.0, 309.0, 518.0, 806.0, 1284.0, 2070.0, 3483.0, 5641.0, 9139.0, 14768.0, 23693.0, 36814.0, 54761.0, 77116.0, 101145.0, 119514.0, 127746.0, 122465.0, 103540.0, 81023.0, 57734.0, 38758.0, 24921.0, 15596.0, 9686.0, 5890.0, 3751.0, 2226.0, 1374.0, 827.0, 559.0, 337.0, 199.0, 135.0, 71.0, 65.0, 32.0, 18.0, 11.0, 9.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.98626708984375, -3.8514404296875, -3.71661376953125, -3.581787109375, -3.44696044921875, -3.3121337890625, -3.17730712890625, -3.04248046875, -2.90765380859375, -2.7728271484375, -2.63800048828125, -2.503173828125, -2.36834716796875, -2.2335205078125, -2.09869384765625, -1.9638671875, -1.82904052734375, -1.6942138671875, -1.55938720703125, -1.424560546875, -1.28973388671875, -1.1549072265625, -1.02008056640625, -0.88525390625, -0.75042724609375, -0.6156005859375, -0.48077392578125, -0.345947265625, -0.21112060546875, -0.0762939453125, 0.05853271484375, 0.193359375, 0.32818603515625, 0.4630126953125, 0.59783935546875, 0.732666015625, 0.86749267578125, 1.0023193359375, 1.13714599609375, 1.27197265625, 1.40679931640625, 1.5416259765625, 1.67645263671875, 1.811279296875, 1.94610595703125, 2.0809326171875, 2.21575927734375, 2.3505859375, 2.48541259765625, 2.6202392578125, 2.75506591796875, 2.889892578125, 3.02471923828125, 3.1595458984375, 3.29437255859375, 3.42919921875, 3.56402587890625, 3.6988525390625, 3.83367919921875, 3.968505859375, 4.10333251953125, 4.2381591796875, 4.37298583984375, 4.5078125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 9.0, 3.0, 15.0, 12.0, 14.0, 33.0, 25.0, 32.0, 42.0, 45.0, 45.0, 41.0, 49.0, 55.0, 50.0, 66.0, 47.0, 56.0, 35.0, 57.0, 40.0, 43.0, 31.0, 23.0, 21.0, 15.0, 12.0, 19.0, 11.0, 7.0, 8.0, 4.0, 6.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005626678466796875, -0.0005427002906799316, -0.0005227327346801758, -0.0005027651786804199, -0.00048279762268066406, -0.0004628300666809082, -0.00044286251068115234, -0.0004228949546813965, -0.0004029273986816406, -0.00038295984268188477, -0.0003629922866821289, -0.00034302473068237305, -0.0003230571746826172, -0.00030308961868286133, -0.00028312206268310547, -0.0002631545066833496, -0.00024318695068359375, -0.0002232193946838379, -0.00020325183868408203, -0.00018328428268432617, -0.0001633167266845703, -0.00014334917068481445, -0.0001233816146850586, -0.00010341405868530273, -8.344650268554688e-05, -6.347894668579102e-05, -4.3511390686035156e-05, -2.3543834686279297e-05, -3.5762786865234375e-06, 1.6391277313232422e-05, 3.635883331298828e-05, 5.632638931274414e-05, 7.62939453125e-05, 9.626150131225586e-05, 0.00011622905731201172, 0.00013619661331176758, 0.00015616416931152344, 0.0001761317253112793, 0.00019609928131103516, 0.00021606683731079102, 0.00023603439331054688, 0.00025600194931030273, 0.0002759695053100586, 0.00029593706130981445, 0.0003159046173095703, 0.00033587217330932617, 0.00035583972930908203, 0.0003758072853088379, 0.00039577484130859375, 0.0004157423973083496, 0.00043570995330810547, 0.00045567750930786133, 0.0004756450653076172, 0.000495612621307373, 0.0005155801773071289, 0.0005355477333068848, 0.0005555152893066406, 0.0005754828453063965, 0.0005954504013061523, 0.0006154179573059082, 0.0006353855133056641, 0.0006553530693054199, 0.0006753206253051758, 0.0006952881813049316, 0.0007152557373046875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 12.0, 12.0, 13.0, 30.0, 58.0, 61.0, 107.0, 137.0, 237.0, 413.0, 607.0, 986.0, 1594.0, 2623.0, 4662.0, 7495.0, 12281.0, 19785.0, 31897.0, 48446.0, 69765.0, 93936.0, 114920.0, 126316.0, 126040.0, 112129.0, 88951.0, 65175.0, 44550.0, 28895.0, 18306.0, 10978.0, 6732.0, 4050.0, 2463.0, 1470.0, 909.0, 593.0, 332.0, 212.0, 132.0, 86.0, 50.0, 46.0, 28.0, 13.0, 10.0, 4.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.98773193359375, -3.8543701171875, -3.72100830078125, -3.587646484375, -3.45428466796875, -3.3209228515625, -3.18756103515625, -3.05419921875, -2.92083740234375, -2.7874755859375, -2.65411376953125, -2.520751953125, -2.38739013671875, -2.2540283203125, -2.12066650390625, -1.9873046875, -1.85394287109375, -1.7205810546875, -1.58721923828125, -1.453857421875, -1.32049560546875, -1.1871337890625, -1.05377197265625, -0.92041015625, -0.78704833984375, -0.6536865234375, -0.52032470703125, -0.386962890625, -0.25360107421875, -0.1202392578125, 0.01312255859375, 0.146484375, 0.27984619140625, 0.4132080078125, 0.54656982421875, 0.679931640625, 0.81329345703125, 0.9466552734375, 1.08001708984375, 1.21337890625, 1.34674072265625, 1.4801025390625, 1.61346435546875, 1.746826171875, 1.88018798828125, 2.0135498046875, 2.14691162109375, 2.2802734375, 2.41363525390625, 2.5469970703125, 2.68035888671875, 2.813720703125, 2.94708251953125, 3.0804443359375, 3.21380615234375, 3.34716796875, 3.48052978515625, 3.6138916015625, 3.74725341796875, 3.880615234375, 4.01397705078125, 4.1473388671875, 4.28070068359375, 4.4140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 8.0, 14.0, 16.0, 15.0, 24.0, 22.0, 24.0, 22.0, 30.0, 43.0, 65.0, 56.0, 50.0, 56.0, 57.0, 49.0, 40.0, 45.0, 44.0, 46.0, 49.0, 35.0, 27.0, 26.0, 20.0, 11.0, 22.0, 11.0, 11.0, 13.0, 12.0, 11.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4091796875, -1.3601226806640625, -1.311065673828125, -1.2620086669921875, -1.21295166015625, -1.1638946533203125, -1.114837646484375, -1.0657806396484375, -1.0167236328125, -0.9676666259765625, -0.918609619140625, -0.8695526123046875, -0.82049560546875, -0.7714385986328125, -0.722381591796875, -0.6733245849609375, -0.624267578125, -0.5752105712890625, -0.526153564453125, -0.4770965576171875, -0.42803955078125, -0.3789825439453125, -0.329925537109375, -0.2808685302734375, -0.2318115234375, -0.1827545166015625, -0.133697509765625, -0.0846405029296875, -0.03558349609375, 0.0134735107421875, 0.062530517578125, 0.1115875244140625, 0.16064453125, 0.2097015380859375, 0.258758544921875, 0.3078155517578125, 0.35687255859375, 0.4059295654296875, 0.454986572265625, 0.5040435791015625, 0.5531005859375, 0.6021575927734375, 0.651214599609375, 0.7002716064453125, 0.74932861328125, 0.7983856201171875, 0.847442626953125, 0.8964996337890625, 0.945556640625, 0.9946136474609375, 1.043670654296875, 1.0927276611328125, 1.14178466796875, 1.1908416748046875, 1.239898681640625, 1.2889556884765625, 1.3380126953125, 1.3870697021484375, 1.436126708984375, 1.4851837158203125, 1.53424072265625, 1.5832977294921875, 1.632354736328125, 1.6814117431640625, 1.73046875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 7.0, 8.0, 13.0, 15.0, 13.0, 19.0, 24.0, 26.0, 30.0, 37.0, 36.0, 36.0, 42.0, 45.0, 47.0, 52.0, 50.0, 50.0, 46.0, 40.0, 46.0, 43.0, 41.0, 32.0, 26.0, 22.0, 26.0, 19.0, 19.0, 22.0, 10.0, 7.0, 9.0, 4.0, 1.0, 10.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.880517959594727, -23.07769012451172, -22.274864196777344, -21.472036361694336, -20.669208526611328, -19.86638069152832, -19.063552856445312, -18.260726928710938, -17.45789909362793, -16.655071258544922, -15.85224437713623, -15.049417495727539, -14.246589660644531, -13.443761825561523, -12.640934944152832, -11.83810806274414, -11.035280227661133, -10.232452392578125, -9.429625511169434, -8.626798629760742, -7.823970794677734, -7.021143436431885, -6.218316078186035, -5.4154887199401855, -4.612661361694336, -3.8098340034484863, -3.0070066452026367, -2.204179286956787, -1.4013519287109375, -0.5985245704650879, 0.20430278778076172, 1.0071301460266113, 1.8099594116210938, 2.6127867698669434, 3.415614128112793, 4.218441486358643, 5.021268844604492, 5.824096202850342, 6.626923561096191, 7.429750919342041, 8.23257827758789, 9.035406112670898, 9.83823299407959, 10.641059875488281, 11.443887710571289, 12.246715545654297, 13.049542427062988, 13.85236930847168, 14.655197143554688, 15.458024978637695, 16.260852813720703, 17.063678741455078, 17.866506576538086, 18.669334411621094, 19.47216033935547, 20.274988174438477, 21.077816009521484, 21.880643844604492, 22.6834716796875, 23.486297607421875, 24.289125442504883, 25.09195327758789, 25.894779205322266, 26.697607040405273, 27.50043487548828]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 0.0, 4.0, 2.0, 4.0, 9.0, 10.0, 11.0, 12.0, 14.0, 16.0, 16.0, 30.0, 23.0, 18.0, 24.0, 39.0, 27.0, 51.0, 33.0, 51.0, 36.0, 38.0, 47.0, 38.0, 43.0, 54.0, 35.0, 42.0, 40.0, 34.0, 29.0, 27.0, 19.0, 27.0, 18.0, 14.0, 11.0, 12.0, 7.0, 13.0, 6.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.928369522094727, -18.264009475708008, -17.599651336669922, -16.935291290283203, -16.270931243896484, -15.606571197509766, -14.942212104797363, -14.277853012084961, -13.613492965698242, -12.949132919311523, -12.284773826599121, -11.620414733886719, -10.9560546875, -10.291694641113281, -9.627335548400879, -8.962976455688477, -8.298616409301758, -7.634256839752197, -6.969897270202637, -6.305537700653076, -5.641178131103516, -4.976818561553955, -4.3124589920043945, -3.648099422454834, -2.9837398529052734, -2.319380283355713, -1.6550207138061523, -0.9906611442565918, -0.32630157470703125, 0.3380579948425293, 1.0024175643920898, 1.6667771339416504, 2.3311386108398438, 2.9954981803894043, 3.659857749938965, 4.324217319488525, 4.988576889038086, 5.6529364585876465, 6.317296028137207, 6.981655597686768, 7.646015167236328, 8.310375213623047, 8.97473430633545, 9.639093399047852, 10.30345344543457, 10.967813491821289, 11.632172584533691, 12.296531677246094, 12.960891723632812, 13.625251770019531, 14.289610862731934, 14.953969955444336, 15.618330001831055, 16.282690048217773, 16.94704818725586, 17.611408233642578, 18.275768280029297, 18.940128326416016, 19.604488372802734, 20.26884651184082, 20.93320655822754, 21.597566604614258, 22.261924743652344, 22.926284790039062, 23.59064483642578]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 3.0, 7.0, 8.0, 15.0, 17.0, 17.0, 26.0, 36.0, 46.0, 65.0, 85.0, 123.0, 164.0, 208.0, 332.0, 436.0, 701.0, 906.0, 1304.0, 1947.0, 2906.0, 4318.0, 6882.0, 476493.0, 10099.0, 5475.0, 3597.0, 2507.0, 1730.0, 1121.0, 775.0, 522.0, 374.0, 279.0, 185.0, 156.0, 104.0, 81.0, 53.0, 41.0, 37.0, 21.0, 13.0, 13.0, 13.0, 9.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-262.853271484375, -255.07308959960938, -247.29290771484375, -239.51272583007812, -231.7325439453125, -223.95236206054688, -216.17218017578125, -208.39199829101562, -200.61181640625, -192.83163452148438, -185.05145263671875, -177.27127075195312, -169.4910888671875, -161.71090698242188, -153.93072509765625, -146.15054321289062, -138.37037658691406, -130.59019470214844, -122.81001281738281, -115.02983093261719, -107.24964904785156, -99.46946716308594, -91.68929290771484, -83.90911102294922, -76.1289291381836, -68.34874725341797, -60.568565368652344, -52.788387298583984, -45.00820541381836, -37.228023529052734, -29.447845458984375, -21.66766357421875, -13.887481689453125, -6.107300758361816, 1.6728801727294922, 9.453060150146484, 17.23324203491211, 25.013423919677734, 32.793601989746094, 40.57378387451172, 48.353965759277344, 56.13414764404297, 63.914329528808594, 71.69450378417969, 79.47468566894531, 87.25486755371094, 95.03504943847656, 102.81523132324219, 110.59541320800781, 118.37559509277344, 126.15577697753906, 133.9359588623047, 141.7161407470703, 149.49632263183594, 157.2764892578125, 165.05667114257812, 172.83685302734375, 180.61703491210938, 188.397216796875, 196.17739868164062, 203.95758056640625, 211.73776245117188, 219.5179443359375, 227.29812622070312, 235.07830810546875]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 0.0, 4.0, 3.0, 4.0, 8.0, 8.0, 15.0, 12.0, 14.0, 14.0, 17.0, 29.0, 24.0, 22.0, 26.0, 34.0, 37.0, 49.0, 26.0, 51.0, 39.0, 44.0, 1068.0, 42.0, 40.0, 47.0, 38.0, 45.0, 38.0, 38.0, 25.0, 24.0, 21.0, 26.0, 17.0, 14.0, 10.0, 10.0, 9.0, 11.0, 5.0, 5.0, 5.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-569.2527465820312, -549.275390625, -529.298095703125, -509.3207702636719, -489.34344482421875, -469.3661193847656, -449.3887939453125, -429.4114685058594, -409.43414306640625, -389.4568176269531, -369.4794921875, -349.5021667480469, -329.52484130859375, -309.5475158691406, -289.5701904296875, -269.5928649902344, -249.61553955078125, -229.63821411132812, -209.660888671875, -189.68356323242188, -169.70623779296875, -149.72891235351562, -129.7515869140625, -109.77426147460938, -89.79693603515625, -69.81961059570312, -49.84228515625, -29.864959716796875, -9.88763427734375, 10.089691162109375, 30.0670166015625, 50.044342041015625, 70.02166748046875, 89.99899291992188, 109.976318359375, 129.95364379882812, 149.93096923828125, 169.90829467773438, 189.8856201171875, 209.86294555664062, 229.84027099609375, 249.81759643554688, 269.794921875, 289.7722473144531, 309.74957275390625, 329.7268981933594, 349.7042236328125, 369.6815490722656, 389.65887451171875, 409.6361999511719, 429.613525390625, 449.5908508300781, 469.56817626953125, 489.5455017089844, 509.5228271484375, 529.5001220703125, 549.4774780273438, 569.454833984375, 589.43212890625, 609.409423828125, 629.3867797851562, 649.3641357421875, 669.3414306640625, 689.3187255859375, 709.2960815429688]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 11.0, 4.0, 13.0, 12.0, 23.0, 19.0, 25.0, 30.0, 39.0, 57.0, 61.0, 83.0, 115.0, 169.0, 187.0, 270.0, 332.0, 454.0, 768.0, 1085.0, 1634.0, 2553.0, 4024.0, 6090.0, 8545.0, 11610.0, 17066.0, 25962.0, 329084.0, 30730356.0, 46675.0, 33437.0, 14869.0, 7545.0, 4124.0, 2577.0, 1621.0, 1047.0, 640.0, 405.0, 292.0, 210.0, 119.0, 82.0, 59.0, 44.0, 29.0, 20.0, 19.0, 11.0, 10.0, 3.0, 2.0, 1.0, 3.0], "bins": [-342.8861999511719, -333.8775329589844, -324.86883544921875, -315.86016845703125, -306.8514709472656, -297.8428039550781, -288.8341064453125, -279.825439453125, -270.8167724609375, -261.80810546875, -252.79940795898438, -243.7907257080078, -234.78204345703125, -225.77337646484375, -216.7646942138672, -207.75601196289062, -198.747314453125, -189.73863220214844, -180.72994995117188, -171.7212677001953, -162.71258544921875, -153.70391845703125, -144.6952362060547, -135.68655395507812, -126.67787170410156, -117.669189453125, -108.66050720214844, -99.6518325805664, -90.64315032958984, -81.63446807861328, -72.62579345703125, -63.61711120605469, -54.60844421386719, -45.599761962890625, -36.59108352661133, -27.5824031829834, -18.57372283935547, -9.565040588378906, -0.5563621520996094, 8.452316284179688, 17.46099853515625, 26.46967887878418, 35.47835922241211, 44.487037658691406, 53.49571990966797, 62.50440216064453, 71.51307678222656, 80.52175903320312, 89.53044128417969, 98.53912353515625, 107.54780578613281, 116.55648040771484, 125.5651626586914, 134.5738525390625, 143.58251953125, 152.59120178222656, 161.59988403320312, 170.6085662841797, 179.61724853515625, 188.6259307861328, 197.63461303710938, 206.64328002929688, 215.65196228027344, 224.66064453125, 233.66932678222656]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 8.0, 8.0, 6.0, 26.0, 30.0, 37.0, 63.0, 61.0, 107.0, 143.0, 202.0, 329.0, 444.0, 621.0, 894.0, 1354.0, 2017.0, 3146.0, 4826.0, 7562.0, 11852.0, 20052.0, 35450.0, 67156.0, 138020.0, 322803.0, 933733.0, 2966787.0, 1090137.0, 363266.0, 151850.0, 73041.0, 38556.0, 21264.0, 12682.0, 7813.0, 4975.0, 3415.0, 2162.0, 1516.0, 925.0, 633.0, 425.0, 270.0, 221.0, 161.0, 105.0, 80.0, 66.0, 37.0, 30.0, 25.0, 11.0, 12.0, 10.0, 5.0, 5.0, 5.0, 1.0, 4.0], "bins": [-11.640625, -11.2718505859375, -10.903076171875, -10.5343017578125, -10.16552734375, -9.7967529296875, -9.427978515625, -9.0592041015625, -8.6904296875, -8.3216552734375, -7.952880859375, -7.5841064453125, -7.21533203125, -6.8465576171875, -6.477783203125, -6.1090087890625, -5.740234375, -5.3714599609375, -5.002685546875, -4.6339111328125, -4.26513671875, -3.8963623046875, -3.527587890625, -3.1588134765625, -2.7900390625, -2.4212646484375, -2.052490234375, -1.6837158203125, -1.31494140625, -0.9461669921875, -0.577392578125, -0.2086181640625, 0.16015625, 0.5289306640625, 0.897705078125, 1.2664794921875, 1.63525390625, 2.0040283203125, 2.372802734375, 2.7415771484375, 3.1103515625, 3.4791259765625, 3.847900390625, 4.2166748046875, 4.58544921875, 4.9542236328125, 5.322998046875, 5.6917724609375, 6.060546875, 6.4293212890625, 6.798095703125, 7.1668701171875, 7.53564453125, 7.9044189453125, 8.273193359375, 8.6419677734375, 9.0107421875, 9.3795166015625, 9.748291015625, 10.1170654296875, 10.48583984375, 10.8546142578125, 11.223388671875, 11.5921630859375, 11.9609375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 7.0, 5.0, 7.0, 6.0, 12.0, 10.0, 17.0, 30.0, 16.0, 27.0, 28.0, 25.0, 33.0, 30.0, 34.0, 35.0, 39.0, 43.0, 86.0, 400.0, 425.0, 194.0, 102.0, 68.0, 42.0, 44.0, 48.0, 33.0, 29.0, 24.0, 17.0, 16.0, 21.0, 13.0, 13.0, 13.0, 10.0, 9.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.515625, -22.83984375, -22.1640625, -21.48828125, -20.8125, -20.13671875, -19.4609375, -18.78515625, -18.109375, -17.43359375, -16.7578125, -16.08203125, -15.40625, -14.73046875, -14.0546875, -13.37890625, -12.703125, -12.02734375, -11.3515625, -10.67578125, -10.0, -9.32421875, -8.6484375, -7.97265625, -7.296875, -6.62109375, -5.9453125, -5.26953125, -4.59375, -3.91796875, -3.2421875, -2.56640625, -1.890625, -1.21484375, -0.5390625, 0.13671875, 0.8125, 1.48828125, 2.1640625, 2.83984375, 3.515625, 4.19140625, 4.8671875, 5.54296875, 6.21875, 6.89453125, 7.5703125, 8.24609375, 8.921875, 9.59765625, 10.2734375, 10.94921875, 11.625, 12.30078125, 12.9765625, 13.65234375, 14.328125, 15.00390625, 15.6796875, 16.35546875, 17.03125, 17.70703125, 18.3828125, 19.05859375, 19.734375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 11.0, 19.0, 36.0, 49.0, 47.0, 82.0, 117.0, 162.0, 229.0, 302.0, 571.0, 876.0, 1395.0, 2356.0, 4273.0, 7873.0, 15766.0, 36341.0, 99453.0, 359812.0, 3019000.0, 2259936.0, 324117.0, 92091.0, 34082.0, 14838.0, 7519.0, 3975.0, 2172.0, 1399.0, 883.0, 510.0, 370.0, 263.0, 155.0, 98.0, 60.0, 34.0, 38.0, 39.0, 26.0, 14.0, 10.0, 8.0, 8.0, 6.0, 0.0, 1.0, 5.0, 0.0, 4.0, 2.0], "bins": [-20.609375, -19.984130859375, -19.35888671875, -18.733642578125, -18.1083984375, -17.483154296875, -16.85791015625, -16.232666015625, -15.607421875, -14.982177734375, -14.35693359375, -13.731689453125, -13.1064453125, -12.481201171875, -11.85595703125, -11.230712890625, -10.60546875, -9.980224609375, -9.35498046875, -8.729736328125, -8.1044921875, -7.479248046875, -6.85400390625, -6.228759765625, -5.603515625, -4.978271484375, -4.35302734375, -3.727783203125, -3.1025390625, -2.477294921875, -1.85205078125, -1.226806640625, -0.6015625, 0.023681640625, 0.64892578125, 1.274169921875, 1.8994140625, 2.524658203125, 3.14990234375, 3.775146484375, 4.400390625, 5.025634765625, 5.65087890625, 6.276123046875, 6.9013671875, 7.526611328125, 8.15185546875, 8.777099609375, 9.40234375, 10.027587890625, 10.65283203125, 11.278076171875, 11.9033203125, 12.528564453125, 13.15380859375, 13.779052734375, 14.404296875, 15.029541015625, 15.65478515625, 16.280029296875, 16.9052734375, 17.530517578125, 18.15576171875, 18.781005859375, 19.40625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 8.0, 2.0, 4.0, 11.0, 9.0, 13.0, 14.0, 22.0, 21.0, 28.0, 32.0, 37.0, 33.0, 47.0, 45.0, 62.0, 84.0, 461.0, 537.0, 165.0, 76.0, 57.0, 46.0, 31.0, 28.0, 34.0, 20.0, 21.0, 17.0, 10.0, 13.0, 11.0, 9.0, 4.0, 1.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.015625, -26.931396484375, -25.84716796875, -24.762939453125, -23.6787109375, -22.594482421875, -21.51025390625, -20.426025390625, -19.341796875, -18.257568359375, -17.17333984375, -16.089111328125, -15.0048828125, -13.920654296875, -12.83642578125, -11.752197265625, -10.66796875, -9.583740234375, -8.49951171875, -7.415283203125, -6.3310546875, -5.246826171875, -4.16259765625, -3.078369140625, -1.994140625, -0.909912109375, 0.17431640625, 1.258544921875, 2.3427734375, 3.427001953125, 4.51123046875, 5.595458984375, 6.6796875, 7.763916015625, 8.84814453125, 9.932373046875, 11.0166015625, 12.100830078125, 13.18505859375, 14.269287109375, 15.353515625, 16.437744140625, 17.52197265625, 18.606201171875, 19.6904296875, 20.774658203125, 21.85888671875, 22.943115234375, 24.02734375, 25.111572265625, 26.19580078125, 27.280029296875, 28.3642578125, 29.448486328125, 30.53271484375, 31.616943359375, 32.701171875, 33.785400390625, 34.86962890625, 35.953857421875, 37.0380859375, 38.122314453125, 39.20654296875, 40.290771484375, 41.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 11.0, 4.0, 9.0, 19.0, 17.0, 31.0, 30.0, 41.0, 37.0, 49.0, 88.0, 110.0, 139.0, 225.0, 320.0, 398.0, 592.0, 1103.0, 1766.0, 3329.0, 6911.0, 18645.0, 88253.0, 6040959.0, 94348.0, 18993.0, 6898.0, 3218.0, 1733.0, 1017.0, 629.0, 383.0, 268.0, 251.0, 170.0, 92.0, 64.0, 60.0, 42.0, 40.0, 29.0, 24.0, 14.0, 26.0, 20.0, 12.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-147.375, -142.841796875, -138.30859375, -133.775390625, -129.2421875, -124.708984375, -120.17578125, -115.642578125, -111.109375, -106.576171875, -102.04296875, -97.509765625, -92.9765625, -88.443359375, -83.91015625, -79.376953125, -74.84375, -70.310546875, -65.77734375, -61.244140625, -56.7109375, -52.177734375, -47.64453125, -43.111328125, -38.578125, -34.044921875, -29.51171875, -24.978515625, -20.4453125, -15.912109375, -11.37890625, -6.845703125, -2.3125, 2.220703125, 6.75390625, 11.287109375, 15.8203125, 20.353515625, 24.88671875, 29.419921875, 33.953125, 38.486328125, 43.01953125, 47.552734375, 52.0859375, 56.619140625, 61.15234375, 65.685546875, 70.21875, 74.751953125, 79.28515625, 83.818359375, 88.3515625, 92.884765625, 97.41796875, 101.951171875, 106.484375, 111.017578125, 115.55078125, 120.083984375, 124.6171875, 129.150390625, 133.68359375, 138.216796875, 142.75]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 4.0, 1.0, 5.0, 5.0, 11.0, 8.0, 10.0, 12.0, 13.0, 28.0, 25.0, 34.0, 38.0, 35.0, 58.0, 60.0, 87.0, 271.0, 789.0, 157.0, 71.0, 46.0, 59.0, 38.0, 38.0, 24.0, 25.0, 11.0, 10.0, 17.0, 5.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.5625, -70.49267578125, -68.4228515625, -66.35302734375, -64.283203125, -62.21337890625, -60.1435546875, -58.07373046875, -56.00390625, -53.93408203125, -51.8642578125, -49.79443359375, -47.724609375, -45.65478515625, -43.5849609375, -41.51513671875, -39.4453125, -37.37548828125, -35.3056640625, -33.23583984375, -31.166015625, -29.09619140625, -27.0263671875, -24.95654296875, -22.88671875, -20.81689453125, -18.7470703125, -16.67724609375, -14.607421875, -12.53759765625, -10.4677734375, -8.39794921875, -6.328125, -4.25830078125, -2.1884765625, -0.11865234375, 1.951171875, 4.02099609375, 6.0908203125, 8.16064453125, 10.23046875, 12.30029296875, 14.3701171875, 16.43994140625, 18.509765625, 20.57958984375, 22.6494140625, 24.71923828125, 26.7890625, 28.85888671875, 30.9287109375, 32.99853515625, 35.068359375, 37.13818359375, 39.2080078125, 41.27783203125, 43.34765625, 45.41748046875, 47.4873046875, 49.55712890625, 51.626953125, 53.69677734375, 55.7666015625, 57.83642578125, 59.90625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 13.0, 59.0, 740.0, 130.0, 34.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-805.911865234375, -774.5433349609375, -743.1748046875, -711.8062133789062, -680.4376831054688, -649.0691528320312, -617.7006225585938, -586.33203125, -554.9635009765625, -523.594970703125, -492.2264099121094, -460.8578796386719, -429.48931884765625, -398.12078857421875, -366.75225830078125, -335.3836975097656, -304.0151672363281, -272.6466369628906, -241.278076171875, -209.9095458984375, -178.54098510742188, -147.17245483398438, -115.80390930175781, -84.43536376953125, -53.06681823730469, -21.698274612426758, 9.670269012451172, 41.03881072998047, 72.40735626220703, 103.77589416503906, 135.14443969726562, 166.5129852294922, 197.88153076171875, 229.2500762939453, 260.6186218261719, 291.9871520996094, 323.355712890625, 354.7242431640625, 386.0927734375, 417.4613342285156, 448.82989501953125, 480.19842529296875, 511.5669860839844, 542.935546875, 574.3040771484375, 605.672607421875, 637.0411376953125, 668.40966796875, 699.7781982421875, 731.146728515625, 762.5152587890625, 793.8838500976562, 825.2523803710938, 856.6209106445312, 887.9894409179688, 919.3580322265625, 950.7265625, 982.0950927734375, 1013.463623046875, 1044.8321533203125, 1076.20068359375, 1107.5693359375, 1138.9378662109375, 1170.306396484375, 1201.6749267578125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 10.0, 14.0, 13.0, 66.0, 669.0, 144.0, 42.0, 12.0, 8.0, 5.0, 3.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1166.099365234375, -1104.119384765625, -1042.139404296875, -980.159423828125, -918.179443359375, -856.199462890625, -794.219482421875, -732.239501953125, -670.259521484375, -608.279541015625, -546.299560546875, -484.319580078125, -422.339599609375, -360.359619140625, -298.379638671875, -236.399658203125, -174.419677734375, -112.439697265625, -50.459716796875, 11.520263671875, 73.500244140625, 135.480224609375, 197.460205078125, 259.440185546875, 321.420166015625, 383.400146484375, 445.380126953125, 507.360107421875, 569.340087890625, 631.320068359375, 693.300048828125, 755.280029296875, 817.260009765625, 879.239990234375, 941.219970703125, 1003.199951171875, 1065.179931640625, 1127.159912109375, 1189.139892578125, 1251.119873046875, 1313.099853515625, 1375.079833984375, 1437.059814453125, 1499.039794921875, 1561.019775390625, 1622.999755859375, 1684.979736328125, 1746.959716796875, 1808.939697265625, 1870.919677734375, 1932.899658203125, 1994.879638671875, 2056.859619140625, 2118.839599609375, 2180.819580078125, 2242.799560546875, 2304.779541015625, 2366.759521484375, 2428.739501953125, 2490.719482421875, 2552.699462890625, 2614.679443359375, 2676.659423828125, 2738.639404296875, 2800.619384765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 9.0, 9.0, 15.0, 26.0, 56.0, 88.0, 138.0, 263.0, 452.0, 843.0, 1383.0, 2848.0, 6448.0, 19902.0, 114055.0, 3885934.0, 117633.0, 26486.0, 9265.0, 3880.0, 1750.0, 992.0, 534.0, 349.0, 231.0, 125.0, 119.0, 85.0, 82.0, 56.0, 40.0, 27.0, 29.0, 16.0, 26.0, 22.0, 20.0, 11.0, 7.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.04296875, -2.87841796875, -2.7138671875, -2.54931640625, -2.384765625, -2.22021484375, -2.0556640625, -1.89111328125, -1.7265625, -1.56201171875, -1.3974609375, -1.23291015625, -1.068359375, -0.90380859375, -0.7392578125, -0.57470703125, -0.41015625, -0.24560546875, -0.0810546875, 0.08349609375, 0.248046875, 0.41259765625, 0.5771484375, 0.74169921875, 0.90625, 1.07080078125, 1.2353515625, 1.39990234375, 1.564453125, 1.72900390625, 1.8935546875, 2.05810546875, 2.22265625, 2.38720703125, 2.5517578125, 2.71630859375, 2.880859375, 3.04541015625, 3.2099609375, 3.37451171875, 3.5390625, 3.70361328125, 3.8681640625, 4.03271484375, 4.197265625, 4.36181640625, 4.5263671875, 4.69091796875, 4.85546875, 5.02001953125, 5.1845703125, 5.34912109375, 5.513671875, 5.67822265625, 5.8427734375, 6.00732421875, 6.171875, 6.33642578125, 6.5009765625, 6.66552734375, 6.830078125, 6.99462890625, 7.1591796875, 7.32373046875, 7.48828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 17.0, 13.0, 15.0, 96.0, 530.0, 222.0, 30.0, 20.0, 13.0, 9.0, 14.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361572265625, -0.3413047790527344, -0.32103729248046875, -0.3007698059082031, -0.2805023193359375, -0.2602348327636719, -0.23996734619140625, -0.21969985961914062, -0.199432373046875, -0.17916488647460938, -0.15889739990234375, -0.13862991333007812, -0.1183624267578125, -0.09809494018554688, -0.07782745361328125, -0.057559967041015625, -0.03729248046875, -0.017024993896484375, 0.00324249267578125, 0.023509979248046875, 0.0437774658203125, 0.06404495239257812, 0.08431243896484375, 0.10457992553710938, 0.124847412109375, 0.14511489868164062, 0.16538238525390625, 0.18564987182617188, 0.2059173583984375, 0.22618484497070312, 0.24645233154296875, 0.2667198181152344, 0.2869873046875, 0.3072547912597656, 0.32752227783203125, 0.3477897644042969, 0.3680572509765625, 0.3883247375488281, 0.40859222412109375, 0.4288597106933594, 0.449127197265625, 0.4693946838378906, 0.48966217041015625, 0.5099296569824219, 0.5301971435546875, 0.5504646301269531, 0.5707321166992188, 0.5909996032714844, 0.61126708984375, 0.6315345764160156, 0.6518020629882812, 0.6720695495605469, 0.6923370361328125, 0.7126045227050781, 0.7328720092773438, 0.7531394958496094, 0.773406982421875, 0.7936744689941406, 0.8139419555664062, 0.8342094421386719, 0.8544769287109375, 0.8747444152832031, 0.8950119018554688, 0.9152793884277344, 0.935546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 7.0, 10.0, 16.0, 22.0, 30.0, 29.0, 67.0, 77.0, 151.0, 220.0, 399.0, 659.0, 1323.0, 2902.0, 6965.0, 20457.0, 79052.0, 623635.0, 3160936.0, 233068.0, 43142.0, 12296.0, 4540.0, 1942.0, 936.0, 554.0, 322.0, 179.0, 121.0, 77.0, 51.0, 28.0, 21.0, 13.0, 10.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01171875, -3.8912353515625, -3.770751953125, -3.6502685546875, -3.52978515625, -3.4093017578125, -3.288818359375, -3.1683349609375, -3.0478515625, -2.9273681640625, -2.806884765625, -2.6864013671875, -2.56591796875, -2.4454345703125, -2.324951171875, -2.2044677734375, -2.083984375, -1.9635009765625, -1.843017578125, -1.7225341796875, -1.60205078125, -1.4815673828125, -1.361083984375, -1.2406005859375, -1.1201171875, -0.9996337890625, -0.879150390625, -0.7586669921875, -0.63818359375, -0.5177001953125, -0.397216796875, -0.2767333984375, -0.15625, -0.0357666015625, 0.084716796875, 0.2052001953125, 0.32568359375, 0.4461669921875, 0.566650390625, 0.6871337890625, 0.8076171875, 0.9281005859375, 1.048583984375, 1.1690673828125, 1.28955078125, 1.4100341796875, 1.530517578125, 1.6510009765625, 1.771484375, 1.8919677734375, 2.012451171875, 2.1329345703125, 2.25341796875, 2.3739013671875, 2.494384765625, 2.6148681640625, 2.7353515625, 2.8558349609375, 2.976318359375, 3.0968017578125, 3.21728515625, 3.3377685546875, 3.458251953125, 3.5787353515625, 3.69921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 9.0, 9.0, 7.0, 17.0, 24.0, 28.0, 32.0, 42.0, 44.0, 56.0, 92.0, 102.0, 174.0, 216.0, 351.0, 723.0, 741.0, 421.0, 254.0, 195.0, 121.0, 106.0, 76.0, 57.0, 40.0, 39.0, 21.0, 17.0, 14.0, 7.0, 6.0, 3.0, 4.0, 1.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8671875, -0.8409194946289062, -0.8146514892578125, -0.7883834838867188, -0.762115478515625, -0.7358474731445312, -0.7095794677734375, -0.6833114624023438, -0.65704345703125, -0.6307754516601562, -0.6045074462890625, -0.5782394409179688, -0.551971435546875, -0.5257034301757812, -0.4994354248046875, -0.47316741943359375, -0.4468994140625, -0.42063140869140625, -0.3943634033203125, -0.36809539794921875, -0.341827392578125, -0.31555938720703125, -0.2892913818359375, -0.26302337646484375, -0.23675537109375, -0.21048736572265625, -0.1842193603515625, -0.15795135498046875, -0.131683349609375, -0.10541534423828125, -0.0791473388671875, -0.05287933349609375, -0.026611328125, -0.00034332275390625, 0.0259246826171875, 0.05219268798828125, 0.078460693359375, 0.10472869873046875, 0.1309967041015625, 0.15726470947265625, 0.18353271484375, 0.20980072021484375, 0.2360687255859375, 0.26233673095703125, 0.288604736328125, 0.31487274169921875, 0.3411407470703125, 0.36740875244140625, 0.3936767578125, 0.41994476318359375, 0.4462127685546875, 0.47248077392578125, 0.498748779296875, 0.5250167846679688, 0.5512847900390625, 0.5775527954101562, 0.60382080078125, 0.6300888061523438, 0.6563568115234375, 0.6826248168945312, 0.708892822265625, 0.7351608276367188, 0.7614288330078125, 0.7876968383789062, 0.81396484375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 10.0, 28.0, 110.0, 370.0, 394.0, 70.0, 26.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.71318817138672, -33.79825210571289, -32.88331604003906, -31.968379974365234, -31.053443908691406, -30.138507843017578, -29.22357177734375, -28.308635711669922, -27.393699645996094, -26.478763580322266, -25.563827514648438, -24.64889144897461, -23.73395538330078, -22.819019317626953, -21.904083251953125, -20.989147186279297, -20.07421112060547, -19.15927505493164, -18.244338989257812, -17.329402923583984, -16.414466857910156, -15.499530792236328, -14.5845947265625, -13.669658660888672, -12.754720687866211, -11.839784622192383, -10.924848556518555, -10.009912490844727, -9.094976425170898, -8.18004035949707, -7.265103816986084, -6.350167751312256, -5.435232162475586, -4.520296096801758, -3.6053600311279297, -2.6904237270355225, -1.7754876613616943, -0.8605513572692871, 0.054384708404541016, 0.9693207740783691, 1.8842568397521973, 2.7991929054260254, 3.7141289710998535, 4.62906551361084, 5.544001579284668, 6.458937644958496, 7.373873710632324, 8.288809776306152, 9.20374584197998, 10.118681907653809, 11.033617973327637, 11.948554039001465, 12.863490104675293, 13.778427124023438, 14.693363189697266, 15.608299255371094, 16.523235321044922, 17.43817138671875, 18.353107452392578, 19.268043518066406, 20.182979583740234, 21.097915649414062, 22.01285171508789, 22.92778778076172, 23.842723846435547]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 8.0, 14.0, 21.0, 25.0, 45.0, 42.0, 60.0, 58.0, 78.0, 71.0, 103.0, 79.0, 85.0, 75.0, 54.0, 47.0, 39.0, 30.0, 26.0, 17.0, 12.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.087030410766602, -11.82918930053711, -11.571348190307617, -11.313507080078125, -11.055665969848633, -10.79782485961914, -10.539983749389648, -10.282142639160156, -10.024301528930664, -9.766460418701172, -9.50861930847168, -9.250778198242188, -8.992937088012695, -8.735095977783203, -8.477254867553711, -8.219413757324219, -7.961572647094727, -7.703731536865234, -7.445890426635742, -7.18804931640625, -6.930208206176758, -6.672367095947266, -6.414525985717773, -6.156684875488281, -5.898843765258789, -5.641002655029297, -5.383161544799805, -5.1253204345703125, -4.86747932434082, -4.609638214111328, -4.351797103881836, -4.093955993652344, -3.8361148834228516, -3.5782737731933594, -3.320432662963867, -3.062591552734375, -2.804750442504883, -2.5469093322753906, -2.2890682220458984, -2.0312271118164062, -1.773386001586914, -1.5155448913574219, -1.2577037811279297, -0.9998626708984375, -0.7420215606689453, -0.4841804504394531, -0.22633934020996094, 0.03150177001953125, 0.28934288024902344, 0.5471839904785156, 0.8050251007080078, 1.0628662109375, 1.3207073211669922, 1.5785484313964844, 1.8363895416259766, 2.0942306518554688, 2.352071762084961, 2.609912872314453, 2.8677539825439453, 3.1255950927734375, 3.3834362030029297, 3.641277313232422, 3.899118423461914, 4.156959533691406, 4.414800643920898]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 6.0, 3.0, 5.0, 10.0, 12.0, 11.0, 13.0, 16.0, 22.0, 29.0, 58.0, 85.0, 103.0, 123.0, 242.0, 332.0, 553.0, 812.0, 1440.0, 2819.0, 6290.0, 17858.0, 106927.0, 804252.0, 79225.0, 15564.0, 5651.0, 2525.0, 1311.0, 784.0, 498.0, 325.0, 202.0, 128.0, 85.0, 71.0, 45.0, 29.0, 19.0, 23.0, 14.0, 8.0, 9.0, 5.0, 6.0, 7.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-3.603515625, -3.5018310546875, -3.400146484375, -3.2984619140625, -3.19677734375, -3.0950927734375, -2.993408203125, -2.8917236328125, -2.7900390625, -2.6883544921875, -2.586669921875, -2.4849853515625, -2.38330078125, -2.2816162109375, -2.179931640625, -2.0782470703125, -1.9765625, -1.8748779296875, -1.773193359375, -1.6715087890625, -1.56982421875, -1.4681396484375, -1.366455078125, -1.2647705078125, -1.1630859375, -1.0614013671875, -0.959716796875, -0.8580322265625, -0.75634765625, -0.6546630859375, -0.552978515625, -0.4512939453125, -0.349609375, -0.2479248046875, -0.146240234375, -0.0445556640625, 0.05712890625, 0.1588134765625, 0.260498046875, 0.3621826171875, 0.4638671875, 0.5655517578125, 0.667236328125, 0.7689208984375, 0.87060546875, 0.9722900390625, 1.073974609375, 1.1756591796875, 1.27734375, 1.3790283203125, 1.480712890625, 1.5823974609375, 1.68408203125, 1.7857666015625, 1.887451171875, 1.9891357421875, 2.0908203125, 2.1925048828125, 2.294189453125, 2.3958740234375, 2.49755859375, 2.5992431640625, 2.700927734375, 2.8026123046875, 2.904296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 11.0, 8.0, 8.0, 5.0, 24.0, 45.0, 85.0, 158.0, 213.0, 172.0, 118.0, 55.0, 25.0, 20.0, 14.0, 10.0, 4.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3589286804199219, -0.34505462646484375, -0.3311805725097656, -0.3173065185546875, -0.3034324645996094, -0.28955841064453125, -0.2756843566894531, -0.261810302734375, -0.24793624877929688, -0.23406219482421875, -0.22018814086914062, -0.2063140869140625, -0.19244003295898438, -0.17856597900390625, -0.16469192504882812, -0.15081787109375, -0.13694381713867188, -0.12306976318359375, -0.10919570922851562, -0.0953216552734375, -0.08144760131835938, -0.06757354736328125, -0.053699493408203125, -0.039825439453125, -0.025951385498046875, -0.01207733154296875, 0.001796722412109375, 0.0156707763671875, 0.029544830322265625, 0.04341888427734375, 0.057292938232421875, 0.0711669921875, 0.08504104614257812, 0.09891510009765625, 0.11278915405273438, 0.1266632080078125, 0.14053726196289062, 0.15441131591796875, 0.16828536987304688, 0.182159423828125, 0.19603347778320312, 0.20990753173828125, 0.22378158569335938, 0.2376556396484375, 0.2515296936035156, 0.26540374755859375, 0.2792778015136719, 0.29315185546875, 0.3070259094238281, 0.32089996337890625, 0.3347740173339844, 0.3486480712890625, 0.3625221252441406, 0.37639617919921875, 0.3902702331542969, 0.404144287109375, 0.4180183410644531, 0.43189239501953125, 0.4457664489746094, 0.4596405029296875, 0.4735145568847656, 0.48738861083984375, 0.5012626647949219, 0.51513671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 9.0, 12.0, 11.0, 10.0, 28.0, 49.0, 58.0, 81.0, 124.0, 183.0, 336.0, 568.0, 1003.0, 2326.0, 5937.0, 22967.0, 180363.0, 747077.0, 67383.0, 12451.0, 4001.0, 1539.0, 819.0, 468.0, 268.0, 155.0, 100.0, 74.0, 40.0, 37.0, 19.0, 10.0, 12.0, 8.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.31640625, -5.165771484375, -5.01513671875, -4.864501953125, -4.7138671875, -4.563232421875, -4.41259765625, -4.261962890625, -4.111328125, -3.960693359375, -3.81005859375, -3.659423828125, -3.5087890625, -3.358154296875, -3.20751953125, -3.056884765625, -2.90625, -2.755615234375, -2.60498046875, -2.454345703125, -2.3037109375, -2.153076171875, -2.00244140625, -1.851806640625, -1.701171875, -1.550537109375, -1.39990234375, -1.249267578125, -1.0986328125, -0.947998046875, -0.79736328125, -0.646728515625, -0.49609375, -0.345458984375, -0.19482421875, -0.044189453125, 0.1064453125, 0.257080078125, 0.40771484375, 0.558349609375, 0.708984375, 0.859619140625, 1.01025390625, 1.160888671875, 1.3115234375, 1.462158203125, 1.61279296875, 1.763427734375, 1.9140625, 2.064697265625, 2.21533203125, 2.365966796875, 2.5166015625, 2.667236328125, 2.81787109375, 2.968505859375, 3.119140625, 3.269775390625, 3.42041015625, 3.571044921875, 3.7216796875, 3.872314453125, 4.02294921875, 4.173583984375, 4.32421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 1.0, 3.0, 11.0, 1.0, 5.0, 7.0, 14.0, 13.0, 15.0, 20.0, 19.0, 16.0, 20.0, 24.0, 28.0, 16.0, 32.0, 24.0, 26.0, 38.0, 34.0, 36.0, 44.0, 36.0, 33.0, 43.0, 36.0, 40.0, 35.0, 33.0, 30.0, 27.0, 28.0, 24.0, 26.0, 29.0, 22.0, 20.0, 15.0, 12.0, 15.0, 9.0, 4.0, 3.0, 7.0, 3.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.3203125, -1.2780609130859375, -1.235809326171875, -1.1935577392578125, -1.15130615234375, -1.1090545654296875, -1.066802978515625, -1.0245513916015625, -0.9822998046875, -0.9400482177734375, -0.897796630859375, -0.8555450439453125, -0.81329345703125, -0.7710418701171875, -0.728790283203125, -0.6865386962890625, -0.644287109375, -0.6020355224609375, -0.559783935546875, -0.5175323486328125, -0.47528076171875, -0.4330291748046875, -0.390777587890625, -0.3485260009765625, -0.3062744140625, -0.2640228271484375, -0.221771240234375, -0.1795196533203125, -0.13726806640625, -0.0950164794921875, -0.052764892578125, -0.0105133056640625, 0.03173828125, 0.0739898681640625, 0.116241455078125, 0.1584930419921875, 0.20074462890625, 0.2429962158203125, 0.285247802734375, 0.3274993896484375, 0.3697509765625, 0.4120025634765625, 0.454254150390625, 0.4965057373046875, 0.53875732421875, 0.5810089111328125, 0.623260498046875, 0.6655120849609375, 0.707763671875, 0.7500152587890625, 0.792266845703125, 0.8345184326171875, 0.87677001953125, 0.9190216064453125, 0.961273193359375, 1.0035247802734375, 1.0457763671875, 1.0880279541015625, 1.130279541015625, 1.1725311279296875, 1.21478271484375, 1.2570343017578125, 1.299285888671875, 1.3415374755859375, 1.3837890625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 8.0, 9.0, 5.0, 5.0, 9.0, 9.0, 13.0, 24.0, 28.0, 43.0, 52.0, 80.0, 128.0, 137.0, 262.0, 372.0, 614.0, 1113.0, 2482.0, 6704.0, 33085.0, 890968.0, 94817.0, 10618.0, 3310.0, 1536.0, 779.0, 445.0, 249.0, 172.0, 144.0, 88.0, 80.0, 53.0, 31.0, 22.0, 19.0, 17.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.28515625, -5.1129150390625, -4.940673828125, -4.7684326171875, -4.59619140625, -4.4239501953125, -4.251708984375, -4.0794677734375, -3.9072265625, -3.7349853515625, -3.562744140625, -3.3905029296875, -3.21826171875, -3.0460205078125, -2.873779296875, -2.7015380859375, -2.529296875, -2.3570556640625, -2.184814453125, -2.0125732421875, -1.84033203125, -1.6680908203125, -1.495849609375, -1.3236083984375, -1.1513671875, -0.9791259765625, -0.806884765625, -0.6346435546875, -0.46240234375, -0.2901611328125, -0.117919921875, 0.0543212890625, 0.2265625, 0.3988037109375, 0.571044921875, 0.7432861328125, 0.91552734375, 1.0877685546875, 1.260009765625, 1.4322509765625, 1.6044921875, 1.7767333984375, 1.948974609375, 2.1212158203125, 2.29345703125, 2.4656982421875, 2.637939453125, 2.8101806640625, 2.982421875, 3.1546630859375, 3.326904296875, 3.4991455078125, 3.67138671875, 3.8436279296875, 4.015869140625, 4.1881103515625, 4.3603515625, 4.5325927734375, 4.704833984375, 4.8770751953125, 5.04931640625, 5.2215576171875, 5.393798828125, 5.5660400390625, 5.73828125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 11.0, 13.0, 18.0, 29.0, 34.0, 53.0, 60.0, 102.0, 154.0, 153.0, 99.0, 56.0, 46.0, 31.0, 29.0, 18.0, 17.0, 7.0, 11.0, 7.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009164810180664062, -0.0008859634399414062, -0.0008554458618164062, -0.0008249282836914062, -0.0007944107055664062, -0.0007638931274414062, -0.0007333755493164062, -0.0007028579711914062, -0.0006723403930664062, -0.0006418228149414062, -0.0006113052368164062, -0.0005807876586914062, -0.0005502700805664062, -0.0005197525024414062, -0.0004892349243164062, -0.00045871734619140625, -0.00042819976806640625, -0.00039768218994140625, -0.00036716461181640625, -0.00033664703369140625, -0.00030612945556640625, -0.00027561187744140625, -0.00024509429931640625, -0.00021457672119140625, -0.00018405914306640625, -0.00015354156494140625, -0.00012302398681640625, -9.250640869140625e-05, -6.198883056640625e-05, -3.147125244140625e-05, -9.5367431640625e-07, 2.956390380859375e-05, 6.008148193359375e-05, 9.059906005859375e-05, 0.00012111663818359375, 0.00015163421630859375, 0.00018215179443359375, 0.00021266937255859375, 0.00024318695068359375, 0.00027370452880859375, 0.00030422210693359375, 0.00033473968505859375, 0.00036525726318359375, 0.00039577484130859375, 0.00042629241943359375, 0.00045680999755859375, 0.00048732757568359375, 0.0005178451538085938, 0.0005483627319335938, 0.0005788803100585938, 0.0006093978881835938, 0.0006399154663085938, 0.0006704330444335938, 0.0007009506225585938, 0.0007314682006835938, 0.0007619857788085938, 0.0007925033569335938, 0.0008230209350585938, 0.0008535385131835938, 0.0008840560913085938, 0.0009145736694335938, 0.0009450912475585938, 0.0009756088256835938, 0.0010061264038085938, 0.0010366439819335938]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 12.0, 15.0, 28.0, 34.0, 40.0, 60.0, 81.0, 130.0, 198.0, 329.0, 508.0, 869.0, 1840.0, 3929.0, 10319.0, 41872.0, 760766.0, 190279.0, 23644.0, 7242.0, 2957.0, 1444.0, 713.0, 438.0, 256.0, 183.0, 117.0, 76.0, 47.0, 30.0, 21.0, 21.0, 10.0, 10.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.9140625, -5.73919677734375, -5.5643310546875, -5.38946533203125, -5.214599609375, -5.03973388671875, -4.8648681640625, -4.69000244140625, -4.51513671875, -4.34027099609375, -4.1654052734375, -3.99053955078125, -3.815673828125, -3.64080810546875, -3.4659423828125, -3.29107666015625, -3.1162109375, -2.94134521484375, -2.7664794921875, -2.59161376953125, -2.416748046875, -2.24188232421875, -2.0670166015625, -1.89215087890625, -1.71728515625, -1.54241943359375, -1.3675537109375, -1.19268798828125, -1.017822265625, -0.84295654296875, -0.6680908203125, -0.49322509765625, -0.318359375, -0.14349365234375, 0.0313720703125, 0.20623779296875, 0.381103515625, 0.55596923828125, 0.7308349609375, 0.90570068359375, 1.08056640625, 1.25543212890625, 1.4302978515625, 1.60516357421875, 1.780029296875, 1.95489501953125, 2.1297607421875, 2.30462646484375, 2.4794921875, 2.65435791015625, 2.8292236328125, 3.00408935546875, 3.178955078125, 3.35382080078125, 3.5286865234375, 3.70355224609375, 3.87841796875, 4.05328369140625, 4.2281494140625, 4.40301513671875, 4.577880859375, 4.75274658203125, 4.9276123046875, 5.10247802734375, 5.27734375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 5.0, 6.0, 7.0, 6.0, 7.0, 8.0, 20.0, 19.0, 10.0, 20.0, 25.0, 42.0, 51.0, 81.0, 110.0, 122.0, 113.0, 89.0, 65.0, 52.0, 25.0, 12.0, 20.0, 20.0, 8.0, 5.0, 9.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.900390625, -1.842376708984375, -1.78436279296875, -1.726348876953125, -1.6683349609375, -1.610321044921875, -1.55230712890625, -1.494293212890625, -1.436279296875, -1.378265380859375, -1.32025146484375, -1.262237548828125, -1.2042236328125, -1.146209716796875, -1.08819580078125, -1.030181884765625, -0.97216796875, -0.914154052734375, -0.85614013671875, -0.798126220703125, -0.7401123046875, -0.682098388671875, -0.62408447265625, -0.566070556640625, -0.508056640625, -0.450042724609375, -0.39202880859375, -0.334014892578125, -0.2760009765625, -0.217987060546875, -0.15997314453125, -0.101959228515625, -0.0439453125, 0.014068603515625, 0.07208251953125, 0.130096435546875, 0.1881103515625, 0.246124267578125, 0.30413818359375, 0.362152099609375, 0.420166015625, 0.478179931640625, 0.53619384765625, 0.594207763671875, 0.6522216796875, 0.710235595703125, 0.76824951171875, 0.826263427734375, 0.88427734375, 0.942291259765625, 1.00030517578125, 1.058319091796875, 1.1163330078125, 1.174346923828125, 1.23236083984375, 1.290374755859375, 1.348388671875, 1.406402587890625, 1.46441650390625, 1.522430419921875, 1.5804443359375, 1.638458251953125, 1.69647216796875, 1.754486083984375, 1.8125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 18.0, 19.0, 36.0, 44.0, 64.0, 100.0, 172.0, 167.0, 128.0, 74.0, 56.0, 28.0, 12.0, 12.0, 8.0, 8.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.69040870666504, -18.105138778686523, -17.51987075805664, -16.934600830078125, -16.34933090209961, -15.764062881469727, -15.178792953491211, -14.593523979187012, -14.008255004882812, -13.422986030578613, -12.837717056274414, -12.252447128295898, -11.6671781539917, -11.0819091796875, -10.496639251708984, -9.911370277404785, -9.326101303100586, -8.740832328796387, -8.155563354492188, -7.570293426513672, -6.985024452209473, -6.399755477905273, -5.814486026763916, -5.229216575622559, -4.643947601318359, -4.05867862701416, -3.4734091758728027, -2.8881399631500244, -2.302870750427246, -1.7176015377044678, -1.1323323249816895, -0.547062873840332, 0.0382080078125, 0.6234772205352783, 1.2087464332580566, 1.794015645980835, 2.3792848587036133, 2.9645540714263916, 3.54982328414917, 4.135092735290527, 4.720361709594727, 5.305630683898926, 5.890900135040283, 6.476169586181641, 7.06143856048584, 7.646707534790039, 8.231977462768555, 8.817246437072754, 9.402515411376953, 9.987784385681152, 10.573053359985352, 11.158323287963867, 11.743592262268066, 12.328861236572266, 12.914131164550781, 13.49940013885498, 14.08466911315918, 14.669938087463379, 15.255207061767578, 15.840476989746094, 16.42574691772461, 17.011014938354492, 17.596284866333008, 18.18155288696289, 18.766822814941406]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 10.0, 5.0, 6.0, 11.0, 15.0, 18.0, 40.0, 62.0, 79.0, 136.0, 148.0, 139.0, 105.0, 75.0, 50.0, 29.0, 13.0, 16.0, 8.0, 11.0, 2.0, 2.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.372894287109375, -22.3516788482666, -21.330463409423828, -20.309247970581055, -19.28803253173828, -18.26681900024414, -17.245603561401367, -16.224388122558594, -15.20317268371582, -14.181957244873047, -13.160741806030273, -12.139527320861816, -11.118311882019043, -10.09709644317627, -9.075881958007812, -8.054666519165039, -7.033451080322266, -6.012235641479492, -4.991020679473877, -3.9698054790496826, -2.9485902786254883, -1.9273748397827148, -0.9061598777770996, 0.11505508422851562, 1.136270523071289, 2.1574857234954834, 3.1787009239196777, 4.199915885925293, 5.221131324768066, 6.24234676361084, 7.263561725616455, 8.28477668762207, 9.30599594116211, 10.327211380004883, 11.348426818847656, 12.369641304016113, 13.390856742858887, 14.41207218170166, 15.433286666870117, 16.45450210571289, 17.475717544555664, 18.496932983398438, 19.51814842224121, 20.539363861083984, 21.560577392578125, 22.58179473876953, 23.603008270263672, 24.624223709106445, 25.64543914794922, 26.666654586791992, 27.687870025634766, 28.70908546447754, 29.730300903320312, 30.751514434814453, 31.772729873657227, 32.7939453125, 33.815162658691406, 34.83637619018555, 35.85759353637695, 36.878807067871094, 37.9000244140625, 38.92123794555664, 39.94245529174805, 40.96366882324219, 41.98488235473633]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 3.0, 14.0, 11.0, 28.0, 67.0, 693.0, 4167444.0, 25249.0, 556.0, 117.0, 40.0, 17.0, 22.0, 8.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.46875, -42.75830078125, -40.0478515625, -37.33740234375, -34.626953125, -31.91650390625, -29.2060546875, -26.49560546875, -23.78515625, -21.07470703125, -18.3642578125, -15.65380859375, -12.943359375, -10.23291015625, -7.5224609375, -4.81201171875, -2.1015625, 0.60888671875, 3.3193359375, 6.02978515625, 8.740234375, 11.45068359375, 14.1611328125, 16.87158203125, 19.58203125, 22.29248046875, 25.0029296875, 27.71337890625, 30.423828125, 33.13427734375, 35.8447265625, 38.55517578125, 41.265625, 43.97607421875, 46.6865234375, 49.39697265625, 52.107421875, 54.81787109375, 57.5283203125, 60.23876953125, 62.94921875, 65.65966796875, 68.3701171875, 71.08056640625, 73.791015625, 76.50146484375, 79.2119140625, 81.92236328125, 84.6328125, 87.34326171875, 90.0537109375, 92.76416015625, 95.474609375, 98.18505859375, 100.8955078125, 103.60595703125, 106.31640625, 109.02685546875, 111.7373046875, 114.44775390625, 117.158203125, 119.86865234375, 122.5791015625, 125.28955078125, 128.0]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 13.0, 13.0, 20.0, 28.0, 49.0, 66.0, 91.0, 133.0, 128.0, 102.0, 107.0, 64.0, 44.0, 27.0, 15.0, 20.0, 9.0, 9.0, 11.0, 9.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2731895446777344, -0.26293182373046875, -0.2526741027832031, -0.2424163818359375, -0.23215866088867188, -0.22190093994140625, -0.21164321899414062, -0.201385498046875, -0.19112777709960938, -0.18087005615234375, -0.17061233520507812, -0.1603546142578125, -0.15009689331054688, -0.13983917236328125, -0.12958145141601562, -0.11932373046875, -0.10906600952148438, -0.09880828857421875, -0.08855056762695312, -0.0782928466796875, -0.06803512573242188, -0.05777740478515625, -0.047519683837890625, -0.037261962890625, -0.027004241943359375, -0.01674652099609375, -0.006488800048828125, 0.0037689208984375, 0.014026641845703125, 0.02428436279296875, 0.034542083740234375, 0.0447998046875, 0.055057525634765625, 0.06531524658203125, 0.07557296752929688, 0.0858306884765625, 0.09608840942382812, 0.10634613037109375, 0.11660385131835938, 0.126861572265625, 0.13711929321289062, 0.14737701416015625, 0.15763473510742188, 0.1678924560546875, 0.17815017700195312, 0.18840789794921875, 0.19866561889648438, 0.20892333984375, 0.21918106079101562, 0.22943878173828125, 0.23969650268554688, 0.2499542236328125, 0.2602119445800781, 0.27046966552734375, 0.2807273864746094, 0.290985107421875, 0.3012428283691406, 0.31150054931640625, 0.3217582702636719, 0.3320159912109375, 0.3422737121582031, 0.35253143310546875, 0.3627891540527344, 0.373046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 9.0, 19.0, 15.0, 36.0, 61.0, 111.0, 258.0, 547.0, 2397.0, 79251.0, 4098544.0, 11699.0, 957.0, 227.0, 89.0, 39.0, 18.0, 5.0, 6.0, 4.0, 1.0], "bins": [-44.28125, -43.4501953125, -42.619140625, -41.7880859375, -40.95703125, -40.1259765625, -39.294921875, -38.4638671875, -37.6328125, -36.8017578125, -35.970703125, -35.1396484375, -34.30859375, -33.4775390625, -32.646484375, -31.8154296875, -30.984375, -30.1533203125, -29.322265625, -28.4912109375, -27.66015625, -26.8291015625, -25.998046875, -25.1669921875, -24.3359375, -23.5048828125, -22.673828125, -21.8427734375, -21.01171875, -20.1806640625, -19.349609375, -18.5185546875, -17.6875, -16.8564453125, -16.025390625, -15.1943359375, -14.36328125, -13.5322265625, -12.701171875, -11.8701171875, -11.0390625, -10.2080078125, -9.376953125, -8.5458984375, -7.71484375, -6.8837890625, -6.052734375, -5.2216796875, -4.390625, -3.5595703125, -2.728515625, -1.8974609375, -1.06640625, -0.2353515625, 0.595703125, 1.4267578125, 2.2578125, 3.0888671875, 3.919921875, 4.7509765625, 5.58203125, 6.4130859375, 7.244140625, 8.0751953125, 8.90625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 5.0, 11.0, 2.0, 11.0, 18.0, 12.0, 19.0, 24.0, 28.0, 38.0, 55.0, 117.0, 244.0, 691.0, 1775.0, 497.0, 177.0, 105.0, 53.0, 42.0, 28.0, 24.0, 17.0, 12.0, 14.0, 11.0, 6.0, 10.0, 4.0, 7.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5030899047851562, -0.4817657470703125, -0.46044158935546875, -0.439117431640625, -0.41779327392578125, -0.3964691162109375, -0.37514495849609375, -0.35382080078125, -0.33249664306640625, -0.3111724853515625, -0.28984832763671875, -0.268524169921875, -0.24720001220703125, -0.2258758544921875, -0.20455169677734375, -0.1832275390625, -0.16190338134765625, -0.1405792236328125, -0.11925506591796875, -0.097930908203125, -0.07660675048828125, -0.0552825927734375, -0.03395843505859375, -0.01263427734375, 0.00868988037109375, 0.0300140380859375, 0.05133819580078125, 0.072662353515625, 0.09398651123046875, 0.1153106689453125, 0.13663482666015625, 0.157958984375, 0.17928314208984375, 0.2006072998046875, 0.22193145751953125, 0.243255615234375, 0.26457977294921875, 0.2859039306640625, 0.30722808837890625, 0.32855224609375, 0.34987640380859375, 0.3712005615234375, 0.39252471923828125, 0.413848876953125, 0.43517303466796875, 0.4564971923828125, 0.47782135009765625, 0.4991455078125, 0.5204696655273438, 0.5417938232421875, 0.5631179809570312, 0.584442138671875, 0.6057662963867188, 0.6270904541015625, 0.6484146118164062, 0.66973876953125, 0.6910629272460938, 0.7123870849609375, 0.7337112426757812, 0.755035400390625, 0.7763595581054688, 0.7976837158203125, 0.8190078735351562, 0.84033203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 30.0, 821.0, 163.0, 4.0], "bins": [-187.39723205566406, -184.3671875, -181.33714294433594, -178.30709838867188, -175.2770538330078, -172.24700927734375, -169.21697998046875, -166.18692016601562, -163.15689086914062, -160.12684631347656, -157.0968017578125, -154.06675720214844, -151.03671264648438, -148.0066680908203, -144.97662353515625, -141.94659423828125, -138.91653442382812, -135.88648986816406, -132.8564453125, -129.82640075683594, -126.7963638305664, -123.76631927490234, -120.73627471923828, -117.70623016357422, -114.67619323730469, -111.64614868164062, -108.61610412597656, -105.5860595703125, -102.55602264404297, -99.5259780883789, -96.49593353271484, -93.46588897705078, -90.43584442138672, -87.40579986572266, -84.3757553100586, -81.34571838378906, -78.315673828125, -75.28562927246094, -72.25558471679688, -69.22554016113281, -66.19549560546875, -63.16545104980469, -60.13541030883789, -57.10536575317383, -54.075321197509766, -51.04528045654297, -48.015235900878906, -44.985191345214844, -41.95515060424805, -38.925106048583984, -35.89506530761719, -32.865020751953125, -29.834976196289062, -26.804933547973633, -23.774890899658203, -20.74484634399414, -17.71480369567871, -14.684760093688965, -11.654716491699219, -8.624673843383789, -5.594630241394043, -2.564586639404297, 0.4654560089111328, 3.4955005645751953, 6.525543212890625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 7.0, 8.0, 14.0, 33.0, 38.0, 54.0, 85.0, 115.0, 144.0, 136.0, 123.0, 97.0, 63.0, 38.0, 21.0, 12.0, 5.0, 4.0, 4.0, 2.0, 3.0, 3.0], "bins": [-12.344409942626953, -12.103334426879883, -11.862258911132812, -11.621184349060059, -11.380108833312988, -11.139033317565918, -10.897957801818848, -10.656882286071777, -10.415807723999023, -10.174732208251953, -9.933656692504883, -9.692582130432129, -9.451506614685059, -9.210431098937988, -8.969355583190918, -8.728280067443848, -8.487204551696777, -8.246129035949707, -8.005053520202637, -7.763978481292725, -7.5229034423828125, -7.281827926635742, -7.040752410888672, -6.799676895141602, -6.5586018562316895, -6.317526340484619, -6.076451301574707, -5.835375785827637, -5.594300270080566, -5.353225231170654, -5.112149715423584, -4.871074676513672, -4.629999160766602, -4.388923645019531, -4.147848606109619, -3.906773090362549, -3.6656978130340576, -3.4246225357055664, -3.183547019958496, -2.942471742630005, -2.7013962268829346, -2.4603209495544434, -2.219245433807373, -1.9781701564788818, -1.7370948791503906, -1.4960196018218994, -1.2549442052841187, -1.013868808746338, -0.7727935314178467, -0.5317181944847107, -0.2906428575515747, -0.04956752061843872, 0.19150781631469727, 0.4325830936431885, 0.6736584901809692, 0.91473388671875, 1.1558091640472412, 1.3968844413757324, 1.6379598379135132, 1.879035234451294, 2.120110511779785, 2.3611857891082764, 2.6022610664367676, 2.843336582183838, 3.084411859512329]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 13.0, 14.0, 15.0, 28.0, 27.0, 58.0, 89.0, 151.0, 291.0, 495.0, 895.0, 1748.0, 3550.0, 8104.0, 23178.0, 117428.0, 748147.0, 107417.0, 22212.0, 7574.0, 3490.0, 1600.0, 869.0, 455.0, 304.0, 154.0, 93.0, 49.0, 31.0, 17.0, 19.0, 11.0, 11.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.12109375, -6.91455078125, -6.7080078125, -6.50146484375, -6.294921875, -6.08837890625, -5.8818359375, -5.67529296875, -5.46875, -5.26220703125, -5.0556640625, -4.84912109375, -4.642578125, -4.43603515625, -4.2294921875, -4.02294921875, -3.81640625, -3.60986328125, -3.4033203125, -3.19677734375, -2.990234375, -2.78369140625, -2.5771484375, -2.37060546875, -2.1640625, -1.95751953125, -1.7509765625, -1.54443359375, -1.337890625, -1.13134765625, -0.9248046875, -0.71826171875, -0.51171875, -0.30517578125, -0.0986328125, 0.10791015625, 0.314453125, 0.52099609375, 0.7275390625, 0.93408203125, 1.140625, 1.34716796875, 1.5537109375, 1.76025390625, 1.966796875, 2.17333984375, 2.3798828125, 2.58642578125, 2.79296875, 2.99951171875, 3.2060546875, 3.41259765625, 3.619140625, 3.82568359375, 4.0322265625, 4.23876953125, 4.4453125, 4.65185546875, 4.8583984375, 5.06494140625, 5.271484375, 5.47802734375, 5.6845703125, 5.89111328125, 6.09765625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 6.0, 3.0, 10.0, 17.0, 26.0, 18.0, 25.0, 43.0, 77.0, 79.0, 92.0, 96.0, 94.0, 75.0, 72.0, 64.0, 49.0, 29.0, 21.0, 21.0, 14.0, 19.0, 4.0, 17.0, 10.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2210693359375, -0.21160316467285156, -0.20213699340820312, -0.1926708221435547, -0.18320465087890625, -0.1737384796142578, -0.16427230834960938, -0.15480613708496094, -0.1453399658203125, -0.13587379455566406, -0.12640762329101562, -0.11694145202636719, -0.10747528076171875, -0.09800910949707031, -0.08854293823242188, -0.07907676696777344, -0.069610595703125, -0.06014442443847656, -0.050678253173828125, -0.04121208190917969, -0.03174591064453125, -0.022279739379882812, -0.012813568115234375, -0.0033473968505859375, 0.0061187744140625, 0.015584945678710938, 0.025051116943359375, 0.03451728820800781, 0.04398345947265625, 0.05344963073730469, 0.06291580200195312, 0.07238197326660156, 0.08184814453125, 0.09131431579589844, 0.10078048706054688, 0.11024665832519531, 0.11971282958984375, 0.1291790008544922, 0.13864517211914062, 0.14811134338378906, 0.1575775146484375, 0.16704368591308594, 0.17650985717773438, 0.1859760284423828, 0.19544219970703125, 0.2049083709716797, 0.21437454223632812, 0.22384071350097656, 0.233306884765625, 0.24277305603027344, 0.2522392272949219, 0.2617053985595703, 0.27117156982421875, 0.2806377410888672, 0.2901039123535156, 0.29957008361816406, 0.3090362548828125, 0.31850242614746094, 0.3279685974121094, 0.3374347686767578, 0.34690093994140625, 0.3563671112060547, 0.3658332824707031, 0.37529945373535156, 0.384765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 3.0, 9.0, 7.0, 8.0, 7.0, 12.0, 15.0, 13.0, 14.0, 27.0, 26.0, 43.0, 137.0, 1007.0, 23216.0, 1013671.0, 9329.0, 669.0, 127.0, 39.0, 26.0, 23.0, 15.0, 15.0, 12.0, 11.0, 12.0, 8.0, 4.0, 8.0, 9.0, 7.0, 1.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.0, -15.4736328125, -14.947265625, -14.4208984375, -13.89453125, -13.3681640625, -12.841796875, -12.3154296875, -11.7890625, -11.2626953125, -10.736328125, -10.2099609375, -9.68359375, -9.1572265625, -8.630859375, -8.1044921875, -7.578125, -7.0517578125, -6.525390625, -5.9990234375, -5.47265625, -4.9462890625, -4.419921875, -3.8935546875, -3.3671875, -2.8408203125, -2.314453125, -1.7880859375, -1.26171875, -0.7353515625, -0.208984375, 0.3173828125, 0.84375, 1.3701171875, 1.896484375, 2.4228515625, 2.94921875, 3.4755859375, 4.001953125, 4.5283203125, 5.0546875, 5.5810546875, 6.107421875, 6.6337890625, 7.16015625, 7.6865234375, 8.212890625, 8.7392578125, 9.265625, 9.7919921875, 10.318359375, 10.8447265625, 11.37109375, 11.8974609375, 12.423828125, 12.9501953125, 13.4765625, 14.0029296875, 14.529296875, 15.0556640625, 15.58203125, 16.1083984375, 16.634765625, 17.1611328125, 17.6875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 6.0, 6.0, 10.0, 11.0, 6.0, 14.0, 21.0, 18.0, 14.0, 23.0, 24.0, 36.0, 29.0, 29.0, 28.0, 37.0, 37.0, 48.0, 42.0, 48.0, 43.0, 49.0, 32.0, 41.0, 34.0, 24.0, 26.0, 41.0, 27.0, 33.0, 20.0, 24.0, 17.0, 10.0, 16.0, 11.0, 14.0, 11.0, 8.0, 6.0, 2.0, 10.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.9638671875, -0.933074951171875, -0.90228271484375, -0.871490478515625, -0.8406982421875, -0.809906005859375, -0.77911376953125, -0.748321533203125, -0.717529296875, -0.686737060546875, -0.65594482421875, -0.625152587890625, -0.5943603515625, -0.563568115234375, -0.53277587890625, -0.501983642578125, -0.47119140625, -0.440399169921875, -0.40960693359375, -0.378814697265625, -0.3480224609375, -0.317230224609375, -0.28643798828125, -0.255645751953125, -0.224853515625, -0.194061279296875, -0.16326904296875, -0.132476806640625, -0.1016845703125, -0.070892333984375, -0.04010009765625, -0.009307861328125, 0.021484375, 0.052276611328125, 0.08306884765625, 0.113861083984375, 0.1446533203125, 0.175445556640625, 0.20623779296875, 0.237030029296875, 0.267822265625, 0.298614501953125, 0.32940673828125, 0.360198974609375, 0.3909912109375, 0.421783447265625, 0.45257568359375, 0.483367919921875, 0.51416015625, 0.544952392578125, 0.57574462890625, 0.606536865234375, 0.6373291015625, 0.668121337890625, 0.69891357421875, 0.729705810546875, 0.760498046875, 0.791290283203125, 0.82208251953125, 0.852874755859375, 0.8836669921875, 0.914459228515625, 0.94525146484375, 0.976043701171875, 1.0068359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 1.0, 9.0, 6.0, 10.0, 12.0, 22.0, 39.0, 91.0, 316.0, 2570.0, 1032859.0, 11791.0, 572.0, 136.0, 39.0, 18.0, 13.0, 16.0, 2.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-59.84375, -58.0673828125, -56.291015625, -54.5146484375, -52.73828125, -50.9619140625, -49.185546875, -47.4091796875, -45.6328125, -43.8564453125, -42.080078125, -40.3037109375, -38.52734375, -36.7509765625, -34.974609375, -33.1982421875, -31.421875, -29.6455078125, -27.869140625, -26.0927734375, -24.31640625, -22.5400390625, -20.763671875, -18.9873046875, -17.2109375, -15.4345703125, -13.658203125, -11.8818359375, -10.10546875, -8.3291015625, -6.552734375, -4.7763671875, -3.0, -1.2236328125, 0.552734375, 2.3291015625, 4.10546875, 5.8818359375, 7.658203125, 9.4345703125, 11.2109375, 12.9873046875, 14.763671875, 16.5400390625, 18.31640625, 20.0927734375, 21.869140625, 23.6455078125, 25.421875, 27.1982421875, 28.974609375, 30.7509765625, 32.52734375, 34.3037109375, 36.080078125, 37.8564453125, 39.6328125, 41.4091796875, 43.185546875, 44.9619140625, 46.73828125, 48.5146484375, 50.291015625, 52.0673828125, 53.84375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 10.0, 10.0, 9.0, 8.0, 13.0, 17.0, 22.0, 20.0, 42.0, 42.0, 66.0, 115.0, 176.0, 132.0, 75.0, 53.0, 33.0, 23.0, 15.0, 18.0, 11.0, 15.0, 11.0, 11.0, 6.0, 4.0, 7.0, 9.0, 0.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0018968582153320312, -0.0018364638090133667, -0.0017760694026947021, -0.0017156749963760376, -0.001655280590057373, -0.0015948861837387085, -0.001534491777420044, -0.0014740973711013794, -0.0014137029647827148, -0.0013533085584640503, -0.0012929141521453857, -0.0012325197458267212, -0.0011721253395080566, -0.001111730933189392, -0.0010513365268707275, -0.000990942120552063, -0.0009305477142333984, -0.0008701533079147339, -0.0008097589015960693, -0.0007493644952774048, -0.0006889700889587402, -0.0006285756826400757, -0.0005681812763214111, -0.0005077868700027466, -0.00044739246368408203, -0.0003869980573654175, -0.00032660365104675293, -0.0002662092447280884, -0.00020581483840942383, -0.00014542043209075928, -8.502602577209473e-05, -2.4631619453430176e-05, 3.5762786865234375e-05, 9.615719318389893e-05, 0.00015655159950256348, 0.00021694600582122803, 0.0002773404121398926, 0.00033773481845855713, 0.0003981292247772217, 0.00045852363109588623, 0.0005189180374145508, 0.0005793124437332153, 0.0006397068500518799, 0.0007001012563705444, 0.000760495662689209, 0.0008208900690078735, 0.0008812844753265381, 0.0009416788816452026, 0.0010020732879638672, 0.0010624676942825317, 0.0011228621006011963, 0.0011832565069198608, 0.0012436509132385254, 0.00130404531955719, 0.0013644397258758545, 0.001424834132194519, 0.0014852285385131836, 0.0015456229448318481, 0.0016060173511505127, 0.0016664117574691772, 0.0017268061637878418, 0.0017872005701065063, 0.001847594976425171, 0.0019079893827438354, 0.0019683837890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 6.0, 5.0, 6.0, 10.0, 29.0, 38.0, 50.0, 69.0, 122.0, 145.0, 200.0, 418.0, 793.0, 1512.0, 3066.0, 7218.0, 24338.0, 737191.0, 242260.0, 19126.0, 5811.0, 2617.0, 1299.0, 761.0, 459.0, 287.0, 209.0, 139.0, 95.0, 87.0, 56.0, 32.0, 26.0, 22.0, 17.0, 8.0, 10.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.390625, -16.827880859375, -16.26513671875, -15.702392578125, -15.1396484375, -14.576904296875, -14.01416015625, -13.451416015625, -12.888671875, -12.325927734375, -11.76318359375, -11.200439453125, -10.6376953125, -10.074951171875, -9.51220703125, -8.949462890625, -8.38671875, -7.823974609375, -7.26123046875, -6.698486328125, -6.1357421875, -5.572998046875, -5.01025390625, -4.447509765625, -3.884765625, -3.322021484375, -2.75927734375, -2.196533203125, -1.6337890625, -1.071044921875, -0.50830078125, 0.054443359375, 0.6171875, 1.179931640625, 1.74267578125, 2.305419921875, 2.8681640625, 3.430908203125, 3.99365234375, 4.556396484375, 5.119140625, 5.681884765625, 6.24462890625, 6.807373046875, 7.3701171875, 7.932861328125, 8.49560546875, 9.058349609375, 9.62109375, 10.183837890625, 10.74658203125, 11.309326171875, 11.8720703125, 12.434814453125, 12.99755859375, 13.560302734375, 14.123046875, 14.685791015625, 15.24853515625, 15.811279296875, 16.3740234375, 16.936767578125, 17.49951171875, 18.062255859375, 18.625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 0.0, 4.0, 6.0, 2.0, 5.0, 10.0, 15.0, 22.0, 47.0, 196.0, 417.0, 124.0, 56.0, 25.0, 20.0, 14.0, 9.0, 9.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.1109619140625, -7.714111328125, -7.3172607421875, -6.92041015625, -6.5235595703125, -6.126708984375, -5.7298583984375, -5.3330078125, -4.9361572265625, -4.539306640625, -4.1424560546875, -3.74560546875, -3.3487548828125, -2.951904296875, -2.5550537109375, -2.158203125, -1.7613525390625, -1.364501953125, -0.9676513671875, -0.57080078125, -0.1739501953125, 0.222900390625, 0.6197509765625, 1.0166015625, 1.4134521484375, 1.810302734375, 2.2071533203125, 2.60400390625, 3.0008544921875, 3.397705078125, 3.7945556640625, 4.19140625, 4.5882568359375, 4.985107421875, 5.3819580078125, 5.77880859375, 6.1756591796875, 6.572509765625, 6.9693603515625, 7.3662109375, 7.7630615234375, 8.159912109375, 8.5567626953125, 8.95361328125, 9.3504638671875, 9.747314453125, 10.1441650390625, 10.541015625, 10.9378662109375, 11.334716796875, 11.7315673828125, 12.12841796875, 12.5252685546875, 12.922119140625, 13.3189697265625, 13.7158203125, 14.1126708984375, 14.509521484375, 14.9063720703125, 15.30322265625, 15.7000732421875, 16.096923828125, 16.4937744140625, 16.890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 15.0, 27.0, 58.0, 105.0, 216.0, 277.0, 170.0, 64.0, 26.0, 12.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.28681182861328, -56.87620544433594, -55.465599060058594, -54.05499267578125, -52.64439010620117, -51.23378372192383, -49.823177337646484, -48.41257095336914, -47.00196838378906, -45.59136199951172, -44.180755615234375, -42.77014923095703, -41.35954666137695, -39.94894027709961, -38.538333892822266, -37.12772750854492, -35.71712112426758, -34.306514739990234, -32.89590835571289, -31.48530387878418, -30.07469940185547, -28.664093017578125, -27.25348663330078, -25.842880249023438, -24.432275772094727, -23.021669387817383, -21.611064910888672, -20.200458526611328, -18.789852142333984, -17.379247665405273, -15.96864128112793, -14.558035850524902, -13.147428512573242, -11.736823081970215, -10.326217651367188, -8.915611267089844, -7.505005836486816, -6.094400405883789, -4.683794021606445, -3.273188591003418, -1.8625831604003906, -0.4519774913787842, 0.9586281776428223, 2.369234085083008, 3.779839515686035, 5.1904449462890625, 6.601051330566406, 8.011656761169434, 9.422262191772461, 10.832867622375488, 12.243473052978516, 13.65407943725586, 15.064684867858887, 16.475290298461914, 17.885896682739258, 19.29650115966797, 20.707107543945312, 22.117713928222656, 23.528318405151367, 24.93892478942871, 26.349529266357422, 27.760135650634766, 29.17074203491211, 30.581348419189453, 31.991952896118164]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 12.0, 13.0, 21.0, 37.0, 52.0, 53.0, 80.0, 80.0, 102.0, 101.0, 113.0, 78.0, 69.0, 55.0, 43.0, 35.0, 17.0, 18.0, 8.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-40.01461410522461, -39.12533950805664, -38.23606491088867, -37.3467903137207, -36.457515716552734, -35.568241119384766, -34.6789665222168, -33.78969192504883, -32.90041732788086, -32.01114273071289, -31.121868133544922, -30.232593536376953, -29.343318939208984, -28.454044342041016, -27.564769744873047, -26.675495147705078, -25.786218643188477, -24.896944046020508, -24.00766944885254, -23.11839485168457, -22.2291202545166, -21.339845657348633, -20.45056915283203, -19.561294555664062, -18.672019958496094, -17.782745361328125, -16.893470764160156, -16.004196166992188, -15.114921569824219, -14.22564697265625, -13.336371421813965, -12.447096824645996, -11.557823181152344, -10.668548583984375, -9.779273986816406, -8.889999389648438, -8.000724792480469, -7.111449718475342, -6.222174644470215, -5.332900047302246, -4.443625450134277, -3.5543508529663086, -2.6650760173797607, -1.775801181793213, -0.8865265846252441, 0.0027480125427246094, 0.8920230865478516, 1.7812976837158203, 2.670572280883789, 3.559846878051758, 4.449121475219727, 5.3383965492248535, 6.227671146392822, 7.116945743560791, 8.006220817565918, 8.895495414733887, 9.784770011901855, 10.674044609069824, 11.563319206237793, 12.452594757080078, 13.341869354248047, 14.231143951416016, 15.120418548583984, 16.009693145751953, 16.898967742919922]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 8.0, 11.0, 11.0, 16.0, 14.0, 15.0, 20.0, 25.0, 31.0, 37.0, 66.0, 88.0, 146.0, 339.0, 1711.0, 37762.0, 4140124.0, 12641.0, 859.0, 130.0, 41.0, 34.0, 28.0, 10.0, 20.0, 12.0, 6.0, 8.0, 6.0, 10.0, 8.0, 2.0, 4.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-35.9375, -34.921142578125, -33.90478515625, -32.888427734375, -31.8720703125, -30.855712890625, -29.83935546875, -28.822998046875, -27.806640625, -26.790283203125, -25.77392578125, -24.757568359375, -23.7412109375, -22.724853515625, -21.70849609375, -20.692138671875, -19.67578125, -18.659423828125, -17.64306640625, -16.626708984375, -15.6103515625, -14.593994140625, -13.57763671875, -12.561279296875, -11.544921875, -10.528564453125, -9.51220703125, -8.495849609375, -7.4794921875, -6.463134765625, -5.44677734375, -4.430419921875, -3.4140625, -2.397705078125, -1.38134765625, -0.364990234375, 0.6513671875, 1.667724609375, 2.68408203125, 3.700439453125, 4.716796875, 5.733154296875, 6.74951171875, 7.765869140625, 8.7822265625, 9.798583984375, 10.81494140625, 11.831298828125, 12.84765625, 13.864013671875, 14.88037109375, 15.896728515625, 16.9130859375, 17.929443359375, 18.94580078125, 19.962158203125, 20.978515625, 21.994873046875, 23.01123046875, 24.027587890625, 25.0439453125, 26.060302734375, 27.07666015625, 28.093017578125, 29.109375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 7.0, 31.0, 53.0, 113.0, 199.0, 211.0, 185.0, 110.0, 59.0, 23.0, 13.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.5229034423828125, -1.492095947265625, -1.4612884521484375, -1.43048095703125, -1.3996734619140625, -1.368865966796875, -1.3380584716796875, -1.3072509765625, -1.2764434814453125, -1.245635986328125, -1.2148284912109375, -1.18402099609375, -1.1532135009765625, -1.122406005859375, -1.0915985107421875, -1.060791015625, -1.0299835205078125, -0.999176025390625, -0.9683685302734375, -0.93756103515625, -0.9067535400390625, -0.875946044921875, -0.8451385498046875, -0.8143310546875, -0.7835235595703125, -0.752716064453125, -0.7219085693359375, -0.69110107421875, -0.6602935791015625, -0.629486083984375, -0.5986785888671875, -0.56787109375, -0.5370635986328125, -0.506256103515625, -0.4754486083984375, -0.44464111328125, -0.4138336181640625, -0.383026123046875, -0.3522186279296875, -0.3214111328125, -0.2906036376953125, -0.259796142578125, -0.2289886474609375, -0.19818115234375, -0.1673736572265625, -0.136566162109375, -0.1057586669921875, -0.074951171875, -0.0441436767578125, -0.013336181640625, 0.0174713134765625, 0.04827880859375, 0.0790863037109375, 0.109893798828125, 0.1407012939453125, 0.1715087890625, 0.2023162841796875, 0.233123779296875, 0.2639312744140625, 0.29473876953125, 0.3255462646484375, 0.356353759765625, 0.3871612548828125, 0.41796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 12.0, 21.0, 105.0, 1468.0, 4181650.0, 10620.0, 329.0, 65.0, 10.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.71875, -18.58056640625, -16.4423828125, -14.30419921875, -12.166015625, -10.02783203125, -7.8896484375, -5.75146484375, -3.61328125, -1.47509765625, 0.6630859375, 2.80126953125, 4.939453125, 7.07763671875, 9.2158203125, 11.35400390625, 13.4921875, 15.63037109375, 17.7685546875, 19.90673828125, 22.044921875, 24.18310546875, 26.3212890625, 28.45947265625, 30.59765625, 32.73583984375, 34.8740234375, 37.01220703125, 39.150390625, 41.28857421875, 43.4267578125, 45.56494140625, 47.703125, 49.84130859375, 51.9794921875, 54.11767578125, 56.255859375, 58.39404296875, 60.5322265625, 62.67041015625, 64.80859375, 66.94677734375, 69.0849609375, 71.22314453125, 73.361328125, 75.49951171875, 77.6376953125, 79.77587890625, 81.9140625, 84.05224609375, 86.1904296875, 88.32861328125, 90.466796875, 92.60498046875, 94.7431640625, 96.88134765625, 99.01953125, 101.15771484375, 103.2958984375, 105.43408203125, 107.572265625, 109.71044921875, 111.8486328125, 113.98681640625, 116.125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 7.0, 8.0, 13.0, 30.0, 61.0, 92.0, 216.0, 725.0, 2268.0, 359.0, 139.0, 67.0, 31.0, 18.0, 16.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6748046875, -1.6244964599609375, -1.574188232421875, -1.5238800048828125, -1.47357177734375, -1.4232635498046875, -1.372955322265625, -1.3226470947265625, -1.2723388671875, -1.2220306396484375, -1.171722412109375, -1.1214141845703125, -1.07110595703125, -1.0207977294921875, -0.970489501953125, -0.9201812744140625, -0.869873046875, -0.8195648193359375, -0.769256591796875, -0.7189483642578125, -0.66864013671875, -0.6183319091796875, -0.568023681640625, -0.5177154541015625, -0.4674072265625, -0.4170989990234375, -0.366790771484375, -0.3164825439453125, -0.26617431640625, -0.2158660888671875, -0.165557861328125, -0.1152496337890625, -0.06494140625, -0.0146331787109375, 0.035675048828125, 0.0859832763671875, 0.13629150390625, 0.1865997314453125, 0.236907958984375, 0.2872161865234375, 0.3375244140625, 0.3878326416015625, 0.438140869140625, 0.4884490966796875, 0.53875732421875, 0.5890655517578125, 0.639373779296875, 0.6896820068359375, 0.739990234375, 0.7902984619140625, 0.840606689453125, 0.8909149169921875, 0.94122314453125, 0.9915313720703125, 1.041839599609375, 1.0921478271484375, 1.1424560546875, 1.1927642822265625, 1.243072509765625, 1.2933807373046875, 1.34368896484375, 1.3939971923828125, 1.444305419921875, 1.4946136474609375, 1.544921875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 31.0, 978.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.820545196533203, -16.07992172241211, -11.339298248291016, -6.598674774169922, -1.8580513000488281, 2.8825721740722656, 7.623195648193359, 12.363819122314453, 17.104442596435547, 21.84506607055664, 26.585689544677734, 31.326313018798828, 36.06693649291992, 40.807559967041016, 45.54818344116211, 50.2888069152832, 55.0294303894043, 59.77005386352539, 64.51068115234375, 69.25129699707031, 73.99192810058594, 78.7325439453125, 83.47317504882812, 88.21379089355469, 92.95442199707031, 97.6950454711914, 102.4356689453125, 107.1762924194336, 111.91691589355469, 116.65753936767578, 121.39816284179688, 126.13878631591797, 130.87939453125, 135.62002563476562, 140.3606414794922, 145.10125732421875, 149.84188842773438, 154.58251953125, 159.32313537597656, 164.06375122070312, 168.80438232421875, 173.54501342773438, 178.28562927246094, 183.0262451171875, 187.76687622070312, 192.50750732421875, 197.2481231689453, 201.98873901367188, 206.7293701171875, 211.47000122070312, 216.2106170654297, 220.95123291015625, 225.69186401367188, 230.4324951171875, 235.17311096191406, 239.91372680664062, 244.65435791015625, 249.39498901367188, 254.13560485839844, 258.876220703125, 263.6168518066406, 268.35748291015625, 273.09808349609375, 277.8387145996094, 282.579345703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 15.0, 40.0, 65.0, 116.0, 184.0, 203.0, 172.0, 122.0, 54.0, 24.0, 9.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.676932334899902, -7.064642906188965, -6.452353000640869, -5.840063571929932, -5.227773666381836, -4.615484237670898, -4.003194808959961, -3.3909049034118652, -2.7786154747009277, -2.166325807571411, -1.554036259651184, -0.941746711730957, -0.32945704460144043, 0.28283262252807617, 0.8951220512390137, 1.5074119567871094, 2.119701385498047, 2.7319910526275635, 3.34428071975708, 3.9565701484680176, 4.568860054016113, 5.181149482727051, 5.793438911437988, 6.405728816986084, 7.0180182456970215, 7.630307674407959, 8.242597579956055, 8.854887008666992, 9.46717643737793, 10.079465866088867, 10.691755294799805, 11.304045677185059, 11.91633415222168, 12.528623580932617, 13.140913009643555, 13.753202438354492, 14.365492820739746, 14.977782249450684, 15.590071678161621, 16.202362060546875, 16.814651489257812, 17.42694091796875, 18.039230346679688, 18.651519775390625, 19.263809204101562, 19.8760986328125, 20.488388061523438, 21.100679397583008, 21.712966918945312, 22.32525634765625, 22.937545776367188, 23.549835205078125, 24.162124633789062, 24.7744140625, 25.386703491210938, 25.998994827270508, 26.611284255981445, 27.223573684692383, 27.83586311340332, 28.448152542114258, 29.060441970825195, 29.672733306884766, 30.285022735595703, 30.89731216430664, 31.509601593017578]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 6.0, 15.0, 11.0, 11.0, 13.0, 23.0, 14.0, 27.0, 32.0, 38.0, 36.0, 49.0, 43.0, 61.0, 127.0, 9187.0, 1035545.0, 2825.0, 108.0, 51.0, 45.0, 37.0, 40.0, 35.0, 28.0, 26.0, 27.0, 17.0, 10.0, 13.0, 9.0, 10.0, 3.0, 5.0, 6.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.671875, -28.663330078125, -27.65478515625, -26.646240234375, -25.6376953125, -24.629150390625, -23.62060546875, -22.612060546875, -21.603515625, -20.594970703125, -19.58642578125, -18.577880859375, -17.5693359375, -16.560791015625, -15.55224609375, -14.543701171875, -13.53515625, -12.526611328125, -11.51806640625, -10.509521484375, -9.5009765625, -8.492431640625, -7.48388671875, -6.475341796875, -5.466796875, -4.458251953125, -3.44970703125, -2.441162109375, -1.4326171875, -0.424072265625, 0.58447265625, 1.593017578125, 2.6015625, 3.610107421875, 4.61865234375, 5.627197265625, 6.6357421875, 7.644287109375, 8.65283203125, 9.661376953125, 10.669921875, 11.678466796875, 12.68701171875, 13.695556640625, 14.7041015625, 15.712646484375, 16.72119140625, 17.729736328125, 18.73828125, 19.746826171875, 20.75537109375, 21.763916015625, 22.7724609375, 23.781005859375, 24.78955078125, 25.798095703125, 26.806640625, 27.815185546875, 28.82373046875, 29.832275390625, 30.8408203125, 31.849365234375, 32.85791015625, 33.866455078125, 34.875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [6.0, 56.0, 289.0, 480.0, 174.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34765625, -0.244140625, -0.140625, -0.037109375, 0.06640625, 0.169921875, 0.2734375, 0.376953125, 0.48046875, 0.583984375, 0.6875, 0.791015625, 0.89453125, 0.998046875, 1.1015625, 1.205078125, 1.30859375, 1.412109375, 1.515625, 1.619140625, 1.72265625, 1.826171875, 1.9296875, 2.033203125, 2.13671875, 2.240234375, 2.34375, 2.447265625, 2.55078125, 2.654296875, 2.7578125, 2.861328125, 2.96484375, 3.068359375, 3.171875, 3.275390625, 3.37890625, 3.482421875, 3.5859375, 3.689453125, 3.79296875, 3.896484375, 4.0, 4.103515625, 4.20703125, 4.310546875, 4.4140625, 4.517578125, 4.62109375, 4.724609375, 4.828125, 4.931640625, 5.03515625, 5.138671875, 5.2421875, 5.345703125, 5.44921875, 5.552734375, 5.65625, 5.759765625, 5.86328125, 5.966796875, 6.0703125, 6.173828125, 6.27734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 9.0, 7.0, 13.0, 19.0, 24.0, 48.0, 41.0, 58.0, 117.0, 176.0, 408.0, 1028.0, 3581.0, 18721.0, 200893.0, 727699.0, 81639.0, 10383.0, 2201.0, 735.0, 306.0, 151.0, 95.0, 48.0, 33.0, 22.0, 19.0, 14.0, 11.0, 8.0, 10.0, 3.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.2578125, -12.882568359375, -12.50732421875, -12.132080078125, -11.7568359375, -11.381591796875, -11.00634765625, -10.631103515625, -10.255859375, -9.880615234375, -9.50537109375, -9.130126953125, -8.7548828125, -8.379638671875, -8.00439453125, -7.629150390625, -7.25390625, -6.878662109375, -6.50341796875, -6.128173828125, -5.7529296875, -5.377685546875, -5.00244140625, -4.627197265625, -4.251953125, -3.876708984375, -3.50146484375, -3.126220703125, -2.7509765625, -2.375732421875, -2.00048828125, -1.625244140625, -1.25, -0.874755859375, -0.49951171875, -0.124267578125, 0.2509765625, 0.626220703125, 1.00146484375, 1.376708984375, 1.751953125, 2.127197265625, 2.50244140625, 2.877685546875, 3.2529296875, 3.628173828125, 4.00341796875, 4.378662109375, 4.75390625, 5.129150390625, 5.50439453125, 5.879638671875, 6.2548828125, 6.630126953125, 7.00537109375, 7.380615234375, 7.755859375, 8.131103515625, 8.50634765625, 8.881591796875, 9.2568359375, 9.632080078125, 10.00732421875, 10.382568359375, 10.7578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 10.0, 4.0, 4.0, 7.0, 9.0, 16.0, 17.0, 18.0, 41.0, 28.0, 33.0, 43.0, 37.0, 71.0, 52.0, 63.0, 65.0, 61.0, 60.0, 57.0, 44.0, 51.0, 50.0, 33.0, 19.0, 17.0, 18.0, 12.0, 12.0, 10.0, 5.0, 11.0, 3.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.95703125, -5.794189453125, -5.63134765625, -5.468505859375, -5.3056640625, -5.142822265625, -4.97998046875, -4.817138671875, -4.654296875, -4.491455078125, -4.32861328125, -4.165771484375, -4.0029296875, -3.840087890625, -3.67724609375, -3.514404296875, -3.3515625, -3.188720703125, -3.02587890625, -2.863037109375, -2.7001953125, -2.537353515625, -2.37451171875, -2.211669921875, -2.048828125, -1.885986328125, -1.72314453125, -1.560302734375, -1.3974609375, -1.234619140625, -1.07177734375, -0.908935546875, -0.74609375, -0.583251953125, -0.42041015625, -0.257568359375, -0.0947265625, 0.068115234375, 0.23095703125, 0.393798828125, 0.556640625, 0.719482421875, 0.88232421875, 1.045166015625, 1.2080078125, 1.370849609375, 1.53369140625, 1.696533203125, 1.859375, 2.022216796875, 2.18505859375, 2.347900390625, 2.5107421875, 2.673583984375, 2.83642578125, 2.999267578125, 3.162109375, 3.324951171875, 3.48779296875, 3.650634765625, 3.8134765625, 3.976318359375, 4.13916015625, 4.302001953125, 4.46484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 11.0, 19.0, 27.0, 48.0, 54.0, 129.0, 245.0, 619.0, 1500.0, 5269.0, 28477.0, 309865.0, 619278.0, 69417.0, 9595.0, 2393.0, 835.0, 357.0, 174.0, 103.0, 38.0, 43.0, 21.0, 12.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.9344482421875, -6.704833984375, -6.4752197265625, -6.24560546875, -6.0159912109375, -5.786376953125, -5.5567626953125, -5.3271484375, -5.0975341796875, -4.867919921875, -4.6383056640625, -4.40869140625, -4.1790771484375, -3.949462890625, -3.7198486328125, -3.490234375, -3.2606201171875, -3.031005859375, -2.8013916015625, -2.57177734375, -2.3421630859375, -2.112548828125, -1.8829345703125, -1.6533203125, -1.4237060546875, -1.194091796875, -0.9644775390625, -0.73486328125, -0.5052490234375, -0.275634765625, -0.0460205078125, 0.18359375, 0.4132080078125, 0.642822265625, 0.8724365234375, 1.10205078125, 1.3316650390625, 1.561279296875, 1.7908935546875, 2.0205078125, 2.2501220703125, 2.479736328125, 2.7093505859375, 2.93896484375, 3.1685791015625, 3.398193359375, 3.6278076171875, 3.857421875, 4.0870361328125, 4.316650390625, 4.5462646484375, 4.77587890625, 5.0054931640625, 5.235107421875, 5.4647216796875, 5.6943359375, 5.9239501953125, 6.153564453125, 6.3831787109375, 6.61279296875, 6.8424072265625, 7.072021484375, 7.3016357421875, 7.53125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0, 9.0, 9.0, 14.0, 20.0, 26.0, 18.0, 35.0, 36.0, 46.0, 65.0, 57.0, 85.0, 100.0, 71.0, 75.0, 66.0, 62.0, 44.0, 30.0, 16.0, 28.0, 21.0, 12.0, 8.0, 9.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043582916259765625, -0.0004205852746963501, -0.00040534138679504395, -0.0003900974988937378, -0.00037485361099243164, -0.0003596097230911255, -0.00034436583518981934, -0.0003291219472885132, -0.00031387805938720703, -0.0002986341714859009, -0.0002833902835845947, -0.0002681463956832886, -0.0002529025077819824, -0.00023765861988067627, -0.00022241473197937012, -0.00020717084407806396, -0.0001919269561767578, -0.00017668306827545166, -0.0001614391803741455, -0.00014619529247283936, -0.0001309514045715332, -0.00011570751667022705, -0.0001004636287689209, -8.521974086761475e-05, -6.99758529663086e-05, -5.473196506500244e-05, -3.948807716369629e-05, -2.4244189262390137e-05, -9.000301361083984e-06, 6.243586540222168e-06, 2.148747444152832e-05, 3.673136234283447e-05, 5.1975250244140625e-05, 6.721913814544678e-05, 8.246302604675293e-05, 9.770691394805908e-05, 0.00011295080184936523, 0.0001281946897506714, 0.00014343857765197754, 0.0001586824655532837, 0.00017392635345458984, 0.000189170241355896, 0.00020441412925720215, 0.0002196580171585083, 0.00023490190505981445, 0.0002501457929611206, 0.00026538968086242676, 0.0002806335687637329, 0.00029587745666503906, 0.0003111213445663452, 0.00032636523246765137, 0.0003416091203689575, 0.00035685300827026367, 0.0003720968961715698, 0.000387340784072876, 0.00040258467197418213, 0.0004178285598754883, 0.00043307244777679443, 0.0004483163356781006, 0.00046356022357940674, 0.0004788041114807129, 0.000494047999382019, 0.0005092918872833252, 0.0005245357751846313, 0.0005397796630859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 11.0, 8.0, 19.0, 43.0, 88.0, 200.0, 543.0, 1860.0, 12610.0, 269043.0, 722468.0, 36541.0, 3734.0, 886.0, 256.0, 113.0, 64.0, 33.0, 16.0, 10.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.3824462890625, -8.085205078125, -7.7879638671875, -7.49072265625, -7.1934814453125, -6.896240234375, -6.5989990234375, -6.3017578125, -6.0045166015625, -5.707275390625, -5.4100341796875, -5.11279296875, -4.8155517578125, -4.518310546875, -4.2210693359375, -3.923828125, -3.6265869140625, -3.329345703125, -3.0321044921875, -2.73486328125, -2.4376220703125, -2.140380859375, -1.8431396484375, -1.5458984375, -1.2486572265625, -0.951416015625, -0.6541748046875, -0.35693359375, -0.0596923828125, 0.237548828125, 0.5347900390625, 0.83203125, 1.1292724609375, 1.426513671875, 1.7237548828125, 2.02099609375, 2.3182373046875, 2.615478515625, 2.9127197265625, 3.2099609375, 3.5072021484375, 3.804443359375, 4.1016845703125, 4.39892578125, 4.6961669921875, 4.993408203125, 5.2906494140625, 5.587890625, 5.8851318359375, 6.182373046875, 6.4796142578125, 6.77685546875, 7.0740966796875, 7.371337890625, 7.6685791015625, 7.9658203125, 8.2630615234375, 8.560302734375, 8.8575439453125, 9.15478515625, 9.4520263671875, 9.749267578125, 10.0465087890625, 10.34375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 6.0, 19.0, 23.0, 22.0, 34.0, 56.0, 57.0, 83.0, 88.0, 96.0, 91.0, 106.0, 71.0, 60.0, 55.0, 38.0, 26.0, 19.0, 9.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.45501708984375, -2.3670654296875, -2.27911376953125, -2.191162109375, -2.10321044921875, -2.0152587890625, -1.92730712890625, -1.83935546875, -1.75140380859375, -1.6634521484375, -1.57550048828125, -1.487548828125, -1.39959716796875, -1.3116455078125, -1.22369384765625, -1.1357421875, -1.04779052734375, -0.9598388671875, -0.87188720703125, -0.783935546875, -0.69598388671875, -0.6080322265625, -0.52008056640625, -0.43212890625, -0.34417724609375, -0.2562255859375, -0.16827392578125, -0.080322265625, 0.00762939453125, 0.0955810546875, 0.18353271484375, 0.271484375, 0.35943603515625, 0.4473876953125, 0.53533935546875, 0.623291015625, 0.71124267578125, 0.7991943359375, 0.88714599609375, 0.97509765625, 1.06304931640625, 1.1510009765625, 1.23895263671875, 1.326904296875, 1.41485595703125, 1.5028076171875, 1.59075927734375, 1.6787109375, 1.76666259765625, 1.8546142578125, 1.94256591796875, 2.030517578125, 2.11846923828125, 2.2064208984375, 2.29437255859375, 2.38232421875, 2.47027587890625, 2.5582275390625, 2.64617919921875, 2.734130859375, 2.82208251953125, 2.9100341796875, 2.99798583984375, 3.0859375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 12.0, 45.0, 379.0, 531.0, 42.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-345.8863830566406, -339.8394470214844, -333.7925109863281, -327.7455749511719, -321.6986083984375, -315.65167236328125, -309.604736328125, -303.55780029296875, -297.5108642578125, -291.46392822265625, -285.4169921875, -279.37005615234375, -273.3230895996094, -267.2761535644531, -261.2292175292969, -255.18228149414062, -249.13534545898438, -243.08840942382812, -237.0414581298828, -230.99452209472656, -224.9475860595703, -218.90065002441406, -212.85369873046875, -206.8067626953125, -200.7598114013672, -194.71287536621094, -188.66592407226562, -182.61898803710938, -176.57205200195312, -170.52511596679688, -164.47816467285156, -158.4312286376953, -152.38430786132812, -146.33737182617188, -140.29042053222656, -134.2434844970703, -128.19654846191406, -122.14960479736328, -116.1026611328125, -110.05572509765625, -104.00877380371094, -97.96183013916016, -91.9148941040039, -85.86795043945312, -79.82101440429688, -73.7740707397461, -67.72712707519531, -61.68019104003906, -55.63325500488281, -49.5863151550293, -43.53937530517578, -37.492431640625, -31.445493698120117, -25.3985538482666, -19.351612091064453, -13.304672241210938, -7.257732391357422, -1.210792064666748, 4.836148262023926, 10.883089065551758, 16.930028915405273, 22.97696876525879, 29.023910522460938, 35.07085037231445, 41.11779022216797]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 10.0, 9.0, 7.0, 10.0, 11.0, 19.0, 16.0, 29.0, 30.0, 36.0, 43.0, 39.0, 49.0, 42.0, 44.0, 51.0, 51.0, 50.0, 37.0, 60.0, 71.0, 35.0, 45.0, 37.0, 36.0, 36.0, 22.0, 16.0, 12.0, 15.0, 11.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.034114837646484, -29.104551315307617, -28.17498779296875, -27.245426177978516, -26.31586265563965, -25.38629913330078, -24.456735610961914, -23.527172088623047, -22.597610473632812, -21.668046951293945, -20.738483428955078, -19.808921813964844, -18.879358291625977, -17.94979476928711, -17.020231246948242, -16.090667724609375, -15.161105155944824, -14.231541633605957, -13.301979064941406, -12.372415542602539, -11.442852973937988, -10.513289451599121, -9.58372688293457, -8.654163360595703, -7.724600315093994, -6.795037269592285, -5.865474224090576, -4.935911178588867, -4.00634765625, -3.076784610748291, -2.147221565246582, -1.217658519744873, -0.28809547424316406, 0.6414676308631897, 1.5710307359695435, 2.500593900680542, 3.430156946182251, 4.359720230102539, 5.289283275604248, 6.218846321105957, 7.148409366607666, 8.077972412109375, 9.007535934448242, 9.937098503112793, 10.86666202545166, 11.796224594116211, 12.725788116455078, 13.655351638793945, 14.584914207458496, 15.514477729797363, 16.444040298461914, 17.37360382080078, 18.30316734313965, 19.232730865478516, 20.16229248046875, 21.091856002807617, 22.021419525146484, 22.95098304748535, 23.88054656982422, 24.810108184814453, 25.73967170715332, 26.669235229492188, 27.598798751831055, 28.528362274169922, 29.457923889160156]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 10.0, 28.0, 156.0, 2608.0, 4189175.0, 1719.0, 295.0, 126.0, 60.0, 42.0, 29.0, 19.0, 12.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -19.35302734375, -15.7998046875, -12.24658203125, -8.693359375, -5.14013671875, -1.5869140625, 1.96630859375, 5.51953125, 9.07275390625, 12.6259765625, 16.17919921875, 19.732421875, 23.28564453125, 26.8388671875, 30.39208984375, 33.9453125, 37.49853515625, 41.0517578125, 44.60498046875, 48.158203125, 51.71142578125, 55.2646484375, 58.81787109375, 62.37109375, 65.92431640625, 69.4775390625, 73.03076171875, 76.583984375, 80.13720703125, 83.6904296875, 87.24365234375, 90.796875, 94.35009765625, 97.9033203125, 101.45654296875, 105.009765625, 108.56298828125, 112.1162109375, 115.66943359375, 119.22265625, 122.77587890625, 126.3291015625, 129.88232421875, 133.435546875, 136.98876953125, 140.5419921875, 144.09521484375, 147.6484375, 151.20166015625, 154.7548828125, 158.30810546875, 161.861328125, 165.41455078125, 168.9677734375, 172.52099609375, 176.07421875, 179.62744140625, 183.1806640625, 186.73388671875, 190.287109375, 193.84033203125, 197.3935546875, 200.94677734375, 204.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 23.0, 103.0, 253.0, 328.0, 197.0, 83.0, 19.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.720703125, -0.608734130859375, -0.49676513671875, -0.384796142578125, -0.2728271484375, -0.160858154296875, -0.04888916015625, 0.063079833984375, 0.175048828125, 0.287017822265625, 0.39898681640625, 0.510955810546875, 0.6229248046875, 0.734893798828125, 0.84686279296875, 0.958831787109375, 1.07080078125, 1.182769775390625, 1.29473876953125, 1.406707763671875, 1.5186767578125, 1.630645751953125, 1.74261474609375, 1.854583740234375, 1.966552734375, 2.078521728515625, 2.19049072265625, 2.302459716796875, 2.4144287109375, 2.526397705078125, 2.63836669921875, 2.750335693359375, 2.8623046875, 2.974273681640625, 3.08624267578125, 3.198211669921875, 3.3101806640625, 3.422149658203125, 3.53411865234375, 3.646087646484375, 3.758056640625, 3.870025634765625, 3.98199462890625, 4.093963623046875, 4.2059326171875, 4.317901611328125, 4.42987060546875, 4.541839599609375, 4.65380859375, 4.765777587890625, 4.87774658203125, 4.989715576171875, 5.1016845703125, 5.213653564453125, 5.32562255859375, 5.437591552734375, 5.549560546875, 5.661529541015625, 5.77349853515625, 5.885467529296875, 5.9974365234375, 6.109405517578125, 6.22137451171875, 6.333343505859375, 6.4453125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 14.0, 38.0, 78.0, 124.0, 210.0, 799.0, 4190188.0, 1961.0, 341.0, 218.0, 156.0, 84.0, 41.0, 21.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.0625, -77.4072265625, -72.751953125, -68.0966796875, -63.44140625, -58.7861328125, -54.130859375, -49.4755859375, -44.8203125, -40.1650390625, -35.509765625, -30.8544921875, -26.19921875, -21.5439453125, -16.888671875, -12.2333984375, -7.578125, -2.9228515625, 1.732421875, 6.3876953125, 11.04296875, 15.6982421875, 20.353515625, 25.0087890625, 29.6640625, 34.3193359375, 38.974609375, 43.6298828125, 48.28515625, 52.9404296875, 57.595703125, 62.2509765625, 66.90625, 71.5615234375, 76.216796875, 80.8720703125, 85.52734375, 90.1826171875, 94.837890625, 99.4931640625, 104.1484375, 108.8037109375, 113.458984375, 118.1142578125, 122.76953125, 127.4248046875, 132.080078125, 136.7353515625, 141.390625, 146.0458984375, 150.701171875, 155.3564453125, 160.01171875, 164.6669921875, 169.322265625, 173.9775390625, 178.6328125, 183.2880859375, 187.943359375, 192.5986328125, 197.25390625, 201.9091796875, 206.564453125, 211.2197265625, 215.875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 6.0, 16.0, 97.0, 2918.0, 979.0, 50.0, 14.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25390625, -4.81341552734375, -4.3729248046875, -3.93243408203125, -3.491943359375, -3.05145263671875, -2.6109619140625, -2.17047119140625, -1.72998046875, -1.28948974609375, -0.8489990234375, -0.40850830078125, 0.031982421875, 0.47247314453125, 0.9129638671875, 1.35345458984375, 1.7939453125, 2.23443603515625, 2.6749267578125, 3.11541748046875, 3.555908203125, 3.99639892578125, 4.4368896484375, 4.87738037109375, 5.31787109375, 5.75836181640625, 6.1988525390625, 6.63934326171875, 7.079833984375, 7.52032470703125, 7.9608154296875, 8.40130615234375, 8.841796875, 9.28228759765625, 9.7227783203125, 10.16326904296875, 10.603759765625, 11.04425048828125, 11.4847412109375, 11.92523193359375, 12.36572265625, 12.80621337890625, 13.2467041015625, 13.68719482421875, 14.127685546875, 14.56817626953125, 15.0086669921875, 15.44915771484375, 15.8896484375, 16.33013916015625, 16.7706298828125, 17.21112060546875, 17.651611328125, 18.09210205078125, 18.5325927734375, 18.97308349609375, 19.41357421875, 19.85406494140625, 20.2945556640625, 20.73504638671875, 21.175537109375, 21.61602783203125, 22.0565185546875, 22.49700927734375, 22.9375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 9.0, 78.0, 798.0, 116.0, 9.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.74381446838379, -14.134571075439453, -8.5253267288208, -2.9160823822021484, 2.6931610107421875, 8.302404403686523, 13.911649703979492, 19.520891189575195, 25.130136489868164, 30.7393798828125, 36.34862518310547, 41.95787048339844, 47.56711196899414, 53.176353454589844, 58.78559875488281, 64.39484405517578, 70.00408935546875, 75.61333465576172, 81.22257995605469, 86.83181762695312, 92.4410629272461, 98.05030822753906, 103.65955352783203, 109.268798828125, 114.87803649902344, 120.4872817993164, 126.09652709960938, 131.7057647705078, 137.3150177001953, 142.92425537109375, 148.53350830078125, 154.1427459716797, 159.7519989013672, 165.36123657226562, 170.97048950195312, 176.57972717285156, 182.18898010253906, 187.7982177734375, 193.407470703125, 199.01670837402344, 204.62594604492188, 210.2351837158203, 215.8444366455078, 221.45367431640625, 227.06292724609375, 232.6721649169922, 238.28140258789062, 243.89065551757812, 249.49990844726562, 255.10914611816406, 260.7183837890625, 266.32763671875, 271.9368896484375, 277.546142578125, 283.1553649902344, 288.7646179199219, 294.37384033203125, 299.98309326171875, 305.5923156738281, 311.2015686035156, 316.8108215332031, 322.4200439453125, 328.029296875, 333.6385498046875, 339.247802734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 20.0, 32.0, 62.0, 84.0, 121.0, 151.0, 150.0, 142.0, 107.0, 69.0, 31.0, 12.0, 14.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.32392120361328, -75.97357940673828, -73.62324523925781, -71.27290344238281, -68.92256164550781, -66.57222747802734, -64.22188568115234, -61.87154769897461, -59.521209716796875, -57.17087173461914, -54.82052993774414, -52.470191955566406, -50.11985397338867, -47.76951599121094, -45.41917419433594, -43.0688362121582, -40.7184944152832, -38.36815643310547, -36.01781463623047, -33.667476654052734, -31.317138671875, -28.966798782348633, -26.616458892822266, -24.26612091064453, -21.915781021118164, -19.565441131591797, -17.215103149414062, -14.864763259887695, -12.514424324035645, -10.164085388183594, -7.813745498657227, -5.463407516479492, -3.113067626953125, -0.7627284526824951, 1.5876107215881348, 3.9379501342773438, 6.2882890701293945, 8.638628005981445, 10.988967895507812, 13.339305877685547, 15.689645767211914, 18.03998565673828, 20.390323638916016, 22.740663528442383, 25.09100341796875, 27.441341400146484, 29.79168128967285, 32.14202117919922, 34.49235916137695, 36.84269714355469, 39.19303894042969, 41.54337692260742, 43.893714904785156, 46.244056701660156, 48.59439468383789, 50.944732666015625, 53.295074462890625, 55.64541244506836, 57.99575424194336, 60.346092224121094, 62.69643020629883, 65.04676818847656, 67.39710998535156, 69.74745178222656, 72.09778594970703]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 8.0, 15.0, 16.0, 17.0, 29.0, 20.0, 32.0, 51.0, 57.0, 93.0, 170.0, 492.0, 1655.0, 9983.0, 368522.0, 649243.0, 14948.0, 2065.0, 576.0, 209.0, 92.0, 54.0, 31.0, 34.0, 30.0, 23.0, 17.0, 18.0, 14.0, 9.0, 9.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.5625, -34.518798828125, -33.47509765625, -32.431396484375, -31.3876953125, -30.343994140625, -29.30029296875, -28.256591796875, -27.212890625, -26.169189453125, -25.12548828125, -24.081787109375, -23.0380859375, -21.994384765625, -20.95068359375, -19.906982421875, -18.86328125, -17.819580078125, -16.77587890625, -15.732177734375, -14.6884765625, -13.644775390625, -12.60107421875, -11.557373046875, -10.513671875, -9.469970703125, -8.42626953125, -7.382568359375, -6.3388671875, -5.295166015625, -4.25146484375, -3.207763671875, -2.1640625, -1.120361328125, -0.07666015625, 0.967041015625, 2.0107421875, 3.054443359375, 4.09814453125, 5.141845703125, 6.185546875, 7.229248046875, 8.27294921875, 9.316650390625, 10.3603515625, 11.404052734375, 12.44775390625, 13.491455078125, 14.53515625, 15.578857421875, 16.62255859375, 17.666259765625, 18.7099609375, 19.753662109375, 20.79736328125, 21.841064453125, 22.884765625, 23.928466796875, 24.97216796875, 26.015869140625, 27.0595703125, 28.103271484375, 29.14697265625, 30.190673828125, 31.234375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 16.0, 56.0, 78.0, 169.0, 208.0, 218.0, 125.0, 78.0, 36.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -1.99383544921875, -1.8392333984375, -1.68463134765625, -1.530029296875, -1.37542724609375, -1.2208251953125, -1.06622314453125, -0.91162109375, -0.75701904296875, -0.6024169921875, -0.44781494140625, -0.293212890625, -0.13861083984375, 0.0159912109375, 0.17059326171875, 0.3251953125, 0.47979736328125, 0.6343994140625, 0.78900146484375, 0.943603515625, 1.09820556640625, 1.2528076171875, 1.40740966796875, 1.56201171875, 1.71661376953125, 1.8712158203125, 2.02581787109375, 2.180419921875, 2.33502197265625, 2.4896240234375, 2.64422607421875, 2.798828125, 2.95343017578125, 3.1080322265625, 3.26263427734375, 3.417236328125, 3.57183837890625, 3.7264404296875, 3.88104248046875, 4.03564453125, 4.19024658203125, 4.3448486328125, 4.49945068359375, 4.654052734375, 4.80865478515625, 4.9632568359375, 5.11785888671875, 5.2724609375, 5.42706298828125, 5.5816650390625, 5.73626708984375, 5.890869140625, 6.04547119140625, 6.2000732421875, 6.35467529296875, 6.50927734375, 6.66387939453125, 6.8184814453125, 6.97308349609375, 7.127685546875, 7.28228759765625, 7.4368896484375, 7.59149169921875, 7.74609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 12.0, 10.0, 7.0, 18.0, 21.0, 33.0, 51.0, 102.0, 169.0, 398.0, 1312.0, 7270.0, 144745.0, 842423.0, 46525.0, 3845.0, 915.0, 300.0, 139.0, 78.0, 53.0, 40.0, 20.0, 20.0, 11.0, 7.0, 10.0, 7.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.25, -17.60595703125, -16.9619140625, -16.31787109375, -15.673828125, -15.02978515625, -14.3857421875, -13.74169921875, -13.09765625, -12.45361328125, -11.8095703125, -11.16552734375, -10.521484375, -9.87744140625, -9.2333984375, -8.58935546875, -7.9453125, -7.30126953125, -6.6572265625, -6.01318359375, -5.369140625, -4.72509765625, -4.0810546875, -3.43701171875, -2.79296875, -2.14892578125, -1.5048828125, -0.86083984375, -0.216796875, 0.42724609375, 1.0712890625, 1.71533203125, 2.359375, 3.00341796875, 3.6474609375, 4.29150390625, 4.935546875, 5.57958984375, 6.2236328125, 6.86767578125, 7.51171875, 8.15576171875, 8.7998046875, 9.44384765625, 10.087890625, 10.73193359375, 11.3759765625, 12.02001953125, 12.6640625, 13.30810546875, 13.9521484375, 14.59619140625, 15.240234375, 15.88427734375, 16.5283203125, 17.17236328125, 17.81640625, 18.46044921875, 19.1044921875, 19.74853515625, 20.392578125, 21.03662109375, 21.6806640625, 22.32470703125, 22.96875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 9.0, 7.0, 12.0, 15.0, 22.0, 17.0, 28.0, 30.0, 51.0, 50.0, 68.0, 62.0, 57.0, 73.0, 78.0, 70.0, 66.0, 53.0, 43.0, 33.0, 38.0, 27.0, 22.0, 18.0, 8.0, 20.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.20703125, -6.93658447265625, -6.6661376953125, -6.39569091796875, -6.125244140625, -5.85479736328125, -5.5843505859375, -5.31390380859375, -5.04345703125, -4.77301025390625, -4.5025634765625, -4.23211669921875, -3.961669921875, -3.69122314453125, -3.4207763671875, -3.15032958984375, -2.8798828125, -2.60943603515625, -2.3389892578125, -2.06854248046875, -1.798095703125, -1.52764892578125, -1.2572021484375, -0.98675537109375, -0.71630859375, -0.44586181640625, -0.1754150390625, 0.09503173828125, 0.365478515625, 0.63592529296875, 0.9063720703125, 1.17681884765625, 1.447265625, 1.71771240234375, 1.9881591796875, 2.25860595703125, 2.529052734375, 2.79949951171875, 3.0699462890625, 3.34039306640625, 3.61083984375, 3.88128662109375, 4.1517333984375, 4.42218017578125, 4.692626953125, 4.96307373046875, 5.2335205078125, 5.50396728515625, 5.7744140625, 6.04486083984375, 6.3153076171875, 6.58575439453125, 6.856201171875, 7.12664794921875, 7.3970947265625, 7.66754150390625, 7.93798828125, 8.20843505859375, 8.4788818359375, 8.74932861328125, 9.019775390625, 9.29022216796875, 9.5606689453125, 9.83111572265625, 10.1015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 7.0, 6.0, 17.0, 22.0, 32.0, 54.0, 107.0, 175.0, 355.0, 846.0, 2704.0, 13743.0, 219032.0, 766156.0, 37612.0, 5265.0, 1339.0, 516.0, 281.0, 116.0, 61.0, 30.0, 26.0, 19.0, 11.0, 6.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5859375, -12.238525390625, -11.89111328125, -11.543701171875, -11.1962890625, -10.848876953125, -10.50146484375, -10.154052734375, -9.806640625, -9.459228515625, -9.11181640625, -8.764404296875, -8.4169921875, -8.069580078125, -7.72216796875, -7.374755859375, -7.02734375, -6.679931640625, -6.33251953125, -5.985107421875, -5.6376953125, -5.290283203125, -4.94287109375, -4.595458984375, -4.248046875, -3.900634765625, -3.55322265625, -3.205810546875, -2.8583984375, -2.510986328125, -2.16357421875, -1.816162109375, -1.46875, -1.121337890625, -0.77392578125, -0.426513671875, -0.0791015625, 0.268310546875, 0.61572265625, 0.963134765625, 1.310546875, 1.657958984375, 2.00537109375, 2.352783203125, 2.7001953125, 3.047607421875, 3.39501953125, 3.742431640625, 4.08984375, 4.437255859375, 4.78466796875, 5.132080078125, 5.4794921875, 5.826904296875, 6.17431640625, 6.521728515625, 6.869140625, 7.216552734375, 7.56396484375, 7.911376953125, 8.2587890625, 8.606201171875, 8.95361328125, 9.301025390625, 9.6484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 12.0, 6.0, 10.0, 8.0, 12.0, 23.0, 21.0, 25.0, 33.0, 34.0, 44.0, 53.0, 62.0, 74.0, 58.0, 61.0, 59.0, 61.0, 66.0, 48.0, 37.0, 33.0, 29.0, 36.0, 15.0, 14.0, 8.0, 11.0, 11.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003757476806640625, -0.0003602132201194763, -0.00034467875957489014, -0.00032914429903030396, -0.0003136098384857178, -0.0002980753779411316, -0.0002825409173965454, -0.00026700645685195923, -0.00025147199630737305, -0.00023593753576278687, -0.00022040307521820068, -0.0002048686146736145, -0.00018933415412902832, -0.00017379969358444214, -0.00015826523303985596, -0.00014273077249526978, -0.0001271963119506836, -0.00011166185140609741, -9.612739086151123e-05, -8.059293031692505e-05, -6.505846977233887e-05, -4.9524009227752686e-05, -3.3989548683166504e-05, -1.8455088138580322e-05, -2.9206275939941406e-06, 1.2613832950592041e-05, 2.8148293495178223e-05, 4.3682754039764404e-05, 5.9217214584350586e-05, 7.475167512893677e-05, 9.028613567352295e-05, 0.00010582059621810913, 0.00012135505676269531, 0.0001368895173072815, 0.00015242397785186768, 0.00016795843839645386, 0.00018349289894104004, 0.00019902735948562622, 0.0002145618200302124, 0.00023009628057479858, 0.00024563074111938477, 0.00026116520166397095, 0.00027669966220855713, 0.0002922341227531433, 0.0003077685832977295, 0.0003233030438423157, 0.00033883750438690186, 0.00035437196493148804, 0.0003699064254760742, 0.0003854408860206604, 0.0004009753465652466, 0.00041650980710983276, 0.00043204426765441895, 0.0004475787281990051, 0.0004631131887435913, 0.0004786476492881775, 0.0004941821098327637, 0.0005097165703773499, 0.000525251030921936, 0.0005407854914665222, 0.0005563199520111084, 0.0005718544125556946, 0.0005873888731002808, 0.0006029233336448669, 0.0006184577941894531]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 8.0, 14.0, 20.0, 32.0, 28.0, 65.0, 110.0, 168.0, 337.0, 867.0, 2955.0, 17379.0, 414645.0, 583669.0, 22899.0, 3440.0, 1016.0, 377.0, 198.0, 124.0, 74.0, 41.0, 22.0, 20.0, 10.0, 11.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8046875, -9.46728515625, -9.1298828125, -8.79248046875, -8.455078125, -8.11767578125, -7.7802734375, -7.44287109375, -7.10546875, -6.76806640625, -6.4306640625, -6.09326171875, -5.755859375, -5.41845703125, -5.0810546875, -4.74365234375, -4.40625, -4.06884765625, -3.7314453125, -3.39404296875, -3.056640625, -2.71923828125, -2.3818359375, -2.04443359375, -1.70703125, -1.36962890625, -1.0322265625, -0.69482421875, -0.357421875, -0.02001953125, 0.3173828125, 0.65478515625, 0.9921875, 1.32958984375, 1.6669921875, 2.00439453125, 2.341796875, 2.67919921875, 3.0166015625, 3.35400390625, 3.69140625, 4.02880859375, 4.3662109375, 4.70361328125, 5.041015625, 5.37841796875, 5.7158203125, 6.05322265625, 6.390625, 6.72802734375, 7.0654296875, 7.40283203125, 7.740234375, 8.07763671875, 8.4150390625, 8.75244140625, 9.08984375, 9.42724609375, 9.7646484375, 10.10205078125, 10.439453125, 10.77685546875, 11.1142578125, 11.45166015625, 11.7890625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 4.0, 8.0, 8.0, 16.0, 18.0, 26.0, 36.0, 65.0, 84.0, 93.0, 94.0, 121.0, 103.0, 76.0, 55.0, 55.0, 31.0, 31.0, 18.0, 13.0, 6.0, 4.0, 7.0, 3.0, 2.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7265625, -3.613922119140625, -3.50128173828125, -3.388641357421875, -3.2760009765625, -3.163360595703125, -3.05072021484375, -2.938079833984375, -2.825439453125, -2.712799072265625, -2.60015869140625, -2.487518310546875, -2.3748779296875, -2.262237548828125, -2.14959716796875, -2.036956787109375, -1.92431640625, -1.811676025390625, -1.69903564453125, -1.586395263671875, -1.4737548828125, -1.361114501953125, -1.24847412109375, -1.135833740234375, -1.023193359375, -0.910552978515625, -0.79791259765625, -0.685272216796875, -0.5726318359375, -0.459991455078125, -0.34735107421875, -0.234710693359375, -0.1220703125, -0.009429931640625, 0.10321044921875, 0.215850830078125, 0.3284912109375, 0.441131591796875, 0.55377197265625, 0.666412353515625, 0.779052734375, 0.891693115234375, 1.00433349609375, 1.116973876953125, 1.2296142578125, 1.342254638671875, 1.45489501953125, 1.567535400390625, 1.68017578125, 1.792816162109375, 1.90545654296875, 2.018096923828125, 2.1307373046875, 2.243377685546875, 2.35601806640625, 2.468658447265625, 2.581298828125, 2.693939208984375, 2.80657958984375, 2.919219970703125, 3.0318603515625, 3.144500732421875, 3.25714111328125, 3.369781494140625, 3.482421875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 27.0, 509.0, 443.0, 28.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-505.9824523925781, -496.6236572265625, -487.26483154296875, -477.9060363769531, -468.5472106933594, -459.18841552734375, -449.82958984375, -440.4707946777344, -431.11199951171875, -421.7532043457031, -412.3943786621094, -403.03558349609375, -393.6767578125, -384.3179626464844, -374.9591369628906, -365.600341796875, -356.24151611328125, -346.8827209472656, -337.5238952636719, -328.16510009765625, -318.8062744140625, -309.4474792480469, -300.0886535644531, -290.7298583984375, -281.37103271484375, -272.0122375488281, -262.6534118652344, -253.2946014404297, -243.935791015625, -234.57699584960938, -225.2181854248047, -215.859375, -206.50054931640625, -197.14173889160156, -187.78292846679688, -178.4241180419922, -169.0653076171875, -159.70651245117188, -150.3477020263672, -140.9888916015625, -131.6300811767578, -122.27127075195312, -112.91246032714844, -103.55365753173828, -94.1948471069336, -84.8360366821289, -75.47723388671875, -66.11842346191406, -56.759613037109375, -47.40080261230469, -38.041996002197266, -28.68318748474121, -19.324378967285156, -9.965568542480469, -0.6067619323730469, 8.752044677734375, 18.110855102539062, 27.469663619995117, 36.82847213745117, 46.187278747558594, 55.54608917236328, 64.90489959716797, 74.26370239257812, 83.62251281738281, 92.9813232421875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 7.0, 7.0, 7.0, 19.0, 16.0, 27.0, 29.0, 49.0, 53.0, 62.0, 65.0, 72.0, 85.0, 65.0, 62.0, 66.0, 67.0, 48.0, 41.0, 41.0, 28.0, 24.0, 19.0, 17.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.678749084472656, -50.877872467041016, -49.076995849609375, -47.276119232177734, -45.475242614746094, -43.67436599731445, -41.87348937988281, -40.07261276245117, -38.27173614501953, -36.47085952758789, -34.66998291015625, -32.86910629272461, -31.06822967529297, -29.267353057861328, -27.466476440429688, -25.665599822998047, -23.864721298217773, -22.063844680786133, -20.262968063354492, -18.46209144592285, -16.66121482849121, -14.860337257385254, -13.059460639953613, -11.258584022521973, -9.457707405090332, -7.656830787658691, -5.855954170227051, -4.055077075958252, -2.2542004585266113, -0.4533233642578125, 1.3475532531738281, 3.1484298706054688, 4.949306488037109, 6.75018310546875, 8.55105972290039, 10.351936340332031, 12.152812957763672, 13.953690528869629, 15.75456714630127, 17.555442810058594, 19.356319427490234, 21.157196044921875, 22.958072662353516, 24.758949279785156, 26.559825897216797, 28.360702514648438, 30.161579132080078, 31.96245574951172, 33.763336181640625, 35.564212799072266, 37.365089416503906, 39.16596603393555, 40.96684265136719, 42.76771926879883, 44.56859588623047, 46.36947250366211, 48.17034912109375, 49.97122573852539, 51.77210235595703, 53.57297897338867, 55.37385559082031, 57.17473220825195, 58.975608825683594, 60.776485443115234, 62.577362060546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 7.0, 16.0, 42.0, 105.0, 274.0, 1040.0, 8858.0, 490960.0, 3674213.0, 15148.0, 2047.0, 719.0, 321.0, 178.0, 96.0, 65.0, 49.0, 23.0, 39.0, 19.0, 18.0, 14.0, 10.0, 7.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.4453125, -13.2508544921875, -12.056396484375, -10.8619384765625, -9.66748046875, -8.4730224609375, -7.278564453125, -6.0841064453125, -4.8896484375, -3.6951904296875, -2.500732421875, -1.3062744140625, -0.11181640625, 1.0826416015625, 2.277099609375, 3.4715576171875, 4.666015625, 5.8604736328125, 7.054931640625, 8.2493896484375, 9.44384765625, 10.6383056640625, 11.832763671875, 13.0272216796875, 14.2216796875, 15.4161376953125, 16.610595703125, 17.8050537109375, 18.99951171875, 20.1939697265625, 21.388427734375, 22.5828857421875, 23.77734375, 24.9718017578125, 26.166259765625, 27.3607177734375, 28.55517578125, 29.7496337890625, 30.944091796875, 32.1385498046875, 33.3330078125, 34.5274658203125, 35.721923828125, 36.9163818359375, 38.11083984375, 39.3052978515625, 40.499755859375, 41.6942138671875, 42.888671875, 44.0831298828125, 45.277587890625, 46.4720458984375, 47.66650390625, 48.8609619140625, 50.055419921875, 51.2498779296875, 52.4443359375, 53.6387939453125, 54.833251953125, 56.0277099609375, 57.22216796875, 58.4166259765625, 59.611083984375, 60.8055419921875, 62.0]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 8.0, 22.0, 45.0, 72.0, 135.0, 188.0, 196.0, 159.0, 84.0, 47.0, 29.0, 16.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.3079833984375, -1.166748046875, -1.0255126953125, -0.88427734375, -0.7430419921875, -0.601806640625, -0.4605712890625, -0.3193359375, -0.1781005859375, -0.036865234375, 0.1043701171875, 0.24560546875, 0.3868408203125, 0.528076171875, 0.6693115234375, 0.810546875, 0.9517822265625, 1.093017578125, 1.2342529296875, 1.37548828125, 1.5167236328125, 1.657958984375, 1.7991943359375, 1.9404296875, 2.0816650390625, 2.222900390625, 2.3641357421875, 2.50537109375, 2.6466064453125, 2.787841796875, 2.9290771484375, 3.0703125, 3.2115478515625, 3.352783203125, 3.4940185546875, 3.63525390625, 3.7764892578125, 3.917724609375, 4.0589599609375, 4.2001953125, 4.3414306640625, 4.482666015625, 4.6239013671875, 4.76513671875, 4.9063720703125, 5.047607421875, 5.1888427734375, 5.330078125, 5.4713134765625, 5.612548828125, 5.7537841796875, 5.89501953125, 6.0362548828125, 6.177490234375, 6.3187255859375, 6.4599609375, 6.6011962890625, 6.742431640625, 6.8836669921875, 7.02490234375, 7.1661376953125, 7.307373046875, 7.4486083984375, 7.58984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 26.0, 46.0, 94.0, 392.0, 4383.0, 4184032.0, 4383.0, 566.0, 200.0, 83.0, 40.0, 21.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.28125, -39.81005859375, -36.3388671875, -32.86767578125, -29.396484375, -25.92529296875, -22.4541015625, -18.98291015625, -15.51171875, -12.04052734375, -8.5693359375, -5.09814453125, -1.626953125, 1.84423828125, 5.3154296875, 8.78662109375, 12.2578125, 15.72900390625, 19.2001953125, 22.67138671875, 26.142578125, 29.61376953125, 33.0849609375, 36.55615234375, 40.02734375, 43.49853515625, 46.9697265625, 50.44091796875, 53.912109375, 57.38330078125, 60.8544921875, 64.32568359375, 67.796875, 71.26806640625, 74.7392578125, 78.21044921875, 81.681640625, 85.15283203125, 88.6240234375, 92.09521484375, 95.56640625, 99.03759765625, 102.5087890625, 105.97998046875, 109.451171875, 112.92236328125, 116.3935546875, 119.86474609375, 123.3359375, 126.80712890625, 130.2783203125, 133.74951171875, 137.220703125, 140.69189453125, 144.1630859375, 147.63427734375, 151.10546875, 154.57666015625, 158.0478515625, 161.51904296875, 164.990234375, 168.46142578125, 171.9326171875, 175.40380859375, 178.875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 12.0, 27.0, 87.0, 572.0, 3043.0, 251.0, 53.0, 17.0, 8.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.760498046875, -3.39599609375, -3.031494140625, -2.6669921875, -2.302490234375, -1.93798828125, -1.573486328125, -1.208984375, -0.844482421875, -0.47998046875, -0.115478515625, 0.2490234375, 0.613525390625, 0.97802734375, 1.342529296875, 1.70703125, 2.071533203125, 2.43603515625, 2.800537109375, 3.1650390625, 3.529541015625, 3.89404296875, 4.258544921875, 4.623046875, 4.987548828125, 5.35205078125, 5.716552734375, 6.0810546875, 6.445556640625, 6.81005859375, 7.174560546875, 7.5390625, 7.903564453125, 8.26806640625, 8.632568359375, 8.9970703125, 9.361572265625, 9.72607421875, 10.090576171875, 10.455078125, 10.819580078125, 11.18408203125, 11.548583984375, 11.9130859375, 12.277587890625, 12.64208984375, 13.006591796875, 13.37109375, 13.735595703125, 14.10009765625, 14.464599609375, 14.8291015625, 15.193603515625, 15.55810546875, 15.922607421875, 16.287109375, 16.651611328125, 17.01611328125, 17.380615234375, 17.7451171875, 18.109619140625, 18.47412109375, 18.838623046875, 19.203125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 10.0, 11.0, 33.0, 144.0, 351.0, 276.0, 97.0, 40.0, 15.0, 4.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.248306274414062, -15.653608322143555, -14.05890941619873, -12.464210510253906, -10.869512557983398, -9.27481460571289, -7.680115699768066, -6.085416793823242, -4.490718841552734, -2.8960204124450684, -1.3013219833374023, 0.29337644577026367, 1.8880748748779297, 3.4827733039855957, 5.077471733093262, 6.672170639038086, 8.266868591308594, 9.861566543579102, 11.456265449523926, 13.05096435546875, 14.645662307739258, 16.240360260009766, 17.835060119628906, 19.429758071899414, 21.024456024169922, 22.61915397644043, 24.213851928710938, 25.808551788330078, 27.403249740600586, 28.997947692871094, 30.592647552490234, 32.187347412109375, 33.78204345703125, 35.37674331665039, 36.971439361572266, 38.566139221191406, 40.16083526611328, 41.75553512573242, 43.35023498535156, 44.94493103027344, 46.53963088989258, 48.13433074951172, 49.729026794433594, 51.323726654052734, 52.918426513671875, 54.51312255859375, 56.10782241821289, 57.70252227783203, 59.297218322753906, 60.89191818237305, 62.48661422729492, 64.08131408691406, 65.67601013183594, 67.27071380615234, 68.86540985107422, 70.4601058959961, 72.0548095703125, 73.64950561523438, 75.24420928955078, 76.83890533447266, 78.43360137939453, 80.02830505371094, 81.62300109863281, 83.21769714355469, 84.81239318847656]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 10.0, 10.0, 27.0, 25.0, 50.0, 79.0, 98.0, 97.0, 108.0, 127.0, 117.0, 101.0, 59.0, 43.0, 23.0, 11.0, 8.0, 9.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.559661865234375, -43.02756118774414, -41.495460510253906, -39.96336364746094, -38.4312629699707, -36.89916229248047, -35.3670654296875, -33.834964752197266, -32.30286407470703, -30.770763397216797, -29.238664627075195, -27.706565856933594, -26.17446517944336, -24.642364501953125, -23.110265731811523, -21.578166961669922, -20.046066284179688, -18.513965606689453, -16.98186683654785, -15.449767112731934, -13.917667388916016, -12.385567665100098, -10.85346794128418, -9.321368217468262, -7.789268493652344, -6.257168769836426, -4.725069046020508, -3.19296932220459, -1.6608695983886719, -0.1287698745727539, 1.403329849243164, 2.935429573059082, 4.467529296875, 5.999629020690918, 7.531728744506836, 9.063828468322754, 10.595928192138672, 12.12802791595459, 13.660127639770508, 15.192227363586426, 16.724327087402344, 18.256427764892578, 19.78852653503418, 21.32062530517578, 22.852725982666016, 24.38482666015625, 25.91692543029785, 27.449024200439453, 28.981124877929688, 30.513225555419922, 32.045326232910156, 33.577423095703125, 35.10952377319336, 36.641624450683594, 38.17372131347656, 39.7058219909668, 41.23792266845703, 42.770023345947266, 44.3021240234375, 45.83422088623047, 47.3663215637207, 48.89842224121094, 50.430519104003906, 51.96261978149414, 53.494720458984375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 3.0, 13.0, 6.0, 8.0, 17.0, 26.0, 25.0, 39.0, 53.0, 84.0, 118.0, 186.0, 315.0, 602.0, 1623.0, 6656.0, 46702.0, 609101.0, 348427.0, 27529.0, 4487.0, 1267.0, 528.0, 254.0, 136.0, 101.0, 61.0, 45.0, 39.0, 26.0, 17.0, 15.0, 9.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.171875, -19.558349609375, -18.94482421875, -18.331298828125, -17.7177734375, -17.104248046875, -16.49072265625, -15.877197265625, -15.263671875, -14.650146484375, -14.03662109375, -13.423095703125, -12.8095703125, -12.196044921875, -11.58251953125, -10.968994140625, -10.35546875, -9.741943359375, -9.12841796875, -8.514892578125, -7.9013671875, -7.287841796875, -6.67431640625, -6.060791015625, -5.447265625, -4.833740234375, -4.22021484375, -3.606689453125, -2.9931640625, -2.379638671875, -1.76611328125, -1.152587890625, -0.5390625, 0.074462890625, 0.68798828125, 1.301513671875, 1.9150390625, 2.528564453125, 3.14208984375, 3.755615234375, 4.369140625, 4.982666015625, 5.59619140625, 6.209716796875, 6.8232421875, 7.436767578125, 8.05029296875, 8.663818359375, 9.27734375, 9.890869140625, 10.50439453125, 11.117919921875, 11.7314453125, 12.344970703125, 12.95849609375, 13.572021484375, 14.185546875, 14.799072265625, 15.41259765625, 16.026123046875, 16.6396484375, 17.253173828125, 17.86669921875, 18.480224609375, 19.09375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 15.0, 19.0, 42.0, 73.0, 101.0, 138.0, 147.0, 142.0, 122.0, 83.0, 47.0, 38.0, 17.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.398345947265625, -2.23614501953125, -2.073944091796875, -1.9117431640625, -1.749542236328125, -1.58734130859375, -1.425140380859375, -1.262939453125, -1.100738525390625, -0.93853759765625, -0.776336669921875, -0.6141357421875, -0.451934814453125, -0.28973388671875, -0.127532958984375, 0.03466796875, 0.196868896484375, 0.35906982421875, 0.521270751953125, 0.6834716796875, 0.845672607421875, 1.00787353515625, 1.170074462890625, 1.332275390625, 1.494476318359375, 1.65667724609375, 1.818878173828125, 1.9810791015625, 2.143280029296875, 2.30548095703125, 2.467681884765625, 2.6298828125, 2.792083740234375, 2.95428466796875, 3.116485595703125, 3.2786865234375, 3.440887451171875, 3.60308837890625, 3.765289306640625, 3.927490234375, 4.089691162109375, 4.25189208984375, 4.414093017578125, 4.5762939453125, 4.738494873046875, 4.90069580078125, 5.062896728515625, 5.22509765625, 5.387298583984375, 5.54949951171875, 5.711700439453125, 5.8739013671875, 6.036102294921875, 6.19830322265625, 6.360504150390625, 6.522705078125, 6.684906005859375, 6.84710693359375, 7.009307861328125, 7.1715087890625, 7.333709716796875, 7.49591064453125, 7.658111572265625, 7.8203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 8.0, 15.0, 21.0, 30.0, 46.0, 52.0, 102.0, 117.0, 186.0, 312.0, 605.0, 1253.0, 2972.0, 9582.0, 46318.0, 354526.0, 535059.0, 76240.0, 13957.0, 3988.0, 1481.0, 675.0, 354.0, 202.0, 135.0, 91.0, 61.0, 50.0, 33.0, 21.0, 10.0, 14.0, 2.0, 7.0, 8.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.03125, -11.644775390625, -11.25830078125, -10.871826171875, -10.4853515625, -10.098876953125, -9.71240234375, -9.325927734375, -8.939453125, -8.552978515625, -8.16650390625, -7.780029296875, -7.3935546875, -7.007080078125, -6.62060546875, -6.234130859375, -5.84765625, -5.461181640625, -5.07470703125, -4.688232421875, -4.3017578125, -3.915283203125, -3.52880859375, -3.142333984375, -2.755859375, -2.369384765625, -1.98291015625, -1.596435546875, -1.2099609375, -0.823486328125, -0.43701171875, -0.050537109375, 0.3359375, 0.722412109375, 1.10888671875, 1.495361328125, 1.8818359375, 2.268310546875, 2.65478515625, 3.041259765625, 3.427734375, 3.814208984375, 4.20068359375, 4.587158203125, 4.9736328125, 5.360107421875, 5.74658203125, 6.133056640625, 6.51953125, 6.906005859375, 7.29248046875, 7.678955078125, 8.0654296875, 8.451904296875, 8.83837890625, 9.224853515625, 9.611328125, 9.997802734375, 10.38427734375, 10.770751953125, 11.1572265625, 11.543701171875, 11.93017578125, 12.316650390625, 12.703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 11.0, 8.0, 11.0, 12.0, 21.0, 30.0, 18.0, 40.0, 40.0, 31.0, 58.0, 62.0, 47.0, 53.0, 47.0, 61.0, 65.0, 53.0, 51.0, 42.0, 31.0, 38.0, 26.0, 24.0, 18.0, 23.0, 17.0, 7.0, 11.0, 7.0, 4.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.9296875, -8.630615234375, -8.33154296875, -8.032470703125, -7.7333984375, -7.434326171875, -7.13525390625, -6.836181640625, -6.537109375, -6.238037109375, -5.93896484375, -5.639892578125, -5.3408203125, -5.041748046875, -4.74267578125, -4.443603515625, -4.14453125, -3.845458984375, -3.54638671875, -3.247314453125, -2.9482421875, -2.649169921875, -2.35009765625, -2.051025390625, -1.751953125, -1.452880859375, -1.15380859375, -0.854736328125, -0.5556640625, -0.256591796875, 0.04248046875, 0.341552734375, 0.640625, 0.939697265625, 1.23876953125, 1.537841796875, 1.8369140625, 2.135986328125, 2.43505859375, 2.734130859375, 3.033203125, 3.332275390625, 3.63134765625, 3.930419921875, 4.2294921875, 4.528564453125, 4.82763671875, 5.126708984375, 5.42578125, 5.724853515625, 6.02392578125, 6.322998046875, 6.6220703125, 6.921142578125, 7.22021484375, 7.519287109375, 7.818359375, 8.117431640625, 8.41650390625, 8.715576171875, 9.0146484375, 9.313720703125, 9.61279296875, 9.911865234375, 10.2109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 8.0, 9.0, 26.0, 55.0, 76.0, 223.0, 467.0, 1427.0, 5189.0, 36296.0, 622965.0, 355461.0, 20849.0, 3687.0, 1067.0, 387.0, 185.0, 77.0, 35.0, 25.0, 14.0, 11.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.96875, -7.710693359375, -7.45263671875, -7.194580078125, -6.9365234375, -6.678466796875, -6.42041015625, -6.162353515625, -5.904296875, -5.646240234375, -5.38818359375, -5.130126953125, -4.8720703125, -4.614013671875, -4.35595703125, -4.097900390625, -3.83984375, -3.581787109375, -3.32373046875, -3.065673828125, -2.8076171875, -2.549560546875, -2.29150390625, -2.033447265625, -1.775390625, -1.517333984375, -1.25927734375, -1.001220703125, -0.7431640625, -0.485107421875, -0.22705078125, 0.031005859375, 0.2890625, 0.547119140625, 0.80517578125, 1.063232421875, 1.3212890625, 1.579345703125, 1.83740234375, 2.095458984375, 2.353515625, 2.611572265625, 2.86962890625, 3.127685546875, 3.3857421875, 3.643798828125, 3.90185546875, 4.159912109375, 4.41796875, 4.676025390625, 4.93408203125, 5.192138671875, 5.4501953125, 5.708251953125, 5.96630859375, 6.224365234375, 6.482421875, 6.740478515625, 6.99853515625, 7.256591796875, 7.5146484375, 7.772705078125, 8.03076171875, 8.288818359375, 8.546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 7.0, 13.0, 17.0, 30.0, 36.0, 57.0, 92.0, 108.0, 118.0, 116.0, 101.0, 67.0, 64.0, 44.0, 36.0, 26.0, 20.0, 14.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005602836608886719, -0.0005357339978218079, -0.0005111843347549438, -0.00048663467168807983, -0.0004620850086212158, -0.0004375353455543518, -0.0004129856824874878, -0.0003884360194206238, -0.00036388635635375977, -0.00033933669328689575, -0.00031478703022003174, -0.0002902373671531677, -0.0002656877040863037, -0.0002411380410194397, -0.00021658837795257568, -0.00019203871488571167, -0.00016748905181884766, -0.00014293938875198364, -0.00011838972568511963, -9.384006261825562e-05, -6.92903995513916e-05, -4.474073648452759e-05, -2.0191073417663574e-05, 4.3585896492004395e-06, 2.8908252716064453e-05, 5.345791578292847e-05, 7.800757884979248e-05, 0.0001025572419166565, 0.0001271069049835205, 0.00015165656805038452, 0.00017620623111724854, 0.00020075589418411255, 0.00022530555725097656, 0.0002498552203178406, 0.0002744048833847046, 0.0002989545464515686, 0.0003235042095184326, 0.00034805387258529663, 0.00037260353565216064, 0.00039715319871902466, 0.00042170286178588867, 0.0004462525248527527, 0.0004708021879196167, 0.0004953518509864807, 0.0005199015140533447, 0.0005444511771202087, 0.0005690008401870728, 0.0005935505032539368, 0.0006181001663208008, 0.0006426498293876648, 0.0006671994924545288, 0.0006917491555213928, 0.0007162988185882568, 0.0007408484816551208, 0.0007653981447219849, 0.0007899478077888489, 0.0008144974708557129, 0.0008390471339225769, 0.0008635967969894409, 0.0008881464600563049, 0.0009126961231231689, 0.000937245786190033, 0.000961795449256897, 0.000986345112323761, 0.001010894775390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 14.0, 20.0, 18.0, 45.0, 75.0, 108.0, 159.0, 311.0, 632.0, 1402.0, 4005.0, 15341.0, 124911.0, 746046.0, 132491.0, 15893.0, 4151.0, 1452.0, 622.0, 332.0, 194.0, 107.0, 69.0, 38.0, 29.0, 11.0, 8.0, 8.0, 9.0, 4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.23046875, -6.01934814453125, -5.8082275390625, -5.59710693359375, -5.385986328125, -5.17486572265625, -4.9637451171875, -4.75262451171875, -4.54150390625, -4.33038330078125, -4.1192626953125, -3.90814208984375, -3.697021484375, -3.48590087890625, -3.2747802734375, -3.06365966796875, -2.8525390625, -2.64141845703125, -2.4302978515625, -2.21917724609375, -2.008056640625, -1.79693603515625, -1.5858154296875, -1.37469482421875, -1.16357421875, -0.95245361328125, -0.7413330078125, -0.53021240234375, -0.319091796875, -0.10797119140625, 0.1031494140625, 0.31427001953125, 0.525390625, 0.73651123046875, 0.9476318359375, 1.15875244140625, 1.369873046875, 1.58099365234375, 1.7921142578125, 2.00323486328125, 2.21435546875, 2.42547607421875, 2.6365966796875, 2.84771728515625, 3.058837890625, 3.26995849609375, 3.4810791015625, 3.69219970703125, 3.9033203125, 4.11444091796875, 4.3255615234375, 4.53668212890625, 4.747802734375, 4.95892333984375, 5.1700439453125, 5.38116455078125, 5.59228515625, 5.80340576171875, 6.0145263671875, 6.22564697265625, 6.436767578125, 6.64788818359375, 6.8590087890625, 7.07012939453125, 7.28125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 11.0, 5.0, 10.0, 8.0, 15.0, 22.0, 37.0, 55.0, 101.0, 120.0, 138.0, 141.0, 116.0, 82.0, 45.0, 34.0, 12.0, 10.0, 9.0, 7.0, 7.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.26171875, -4.1090087890625, -3.956298828125, -3.8035888671875, -3.65087890625, -3.4981689453125, -3.345458984375, -3.1927490234375, -3.0400390625, -2.8873291015625, -2.734619140625, -2.5819091796875, -2.42919921875, -2.2764892578125, -2.123779296875, -1.9710693359375, -1.818359375, -1.6656494140625, -1.512939453125, -1.3602294921875, -1.20751953125, -1.0548095703125, -0.902099609375, -0.7493896484375, -0.5966796875, -0.4439697265625, -0.291259765625, -0.1385498046875, 0.01416015625, 0.1668701171875, 0.319580078125, 0.4722900390625, 0.625, 0.7777099609375, 0.930419921875, 1.0831298828125, 1.23583984375, 1.3885498046875, 1.541259765625, 1.6939697265625, 1.8466796875, 1.9993896484375, 2.152099609375, 2.3048095703125, 2.45751953125, 2.6102294921875, 2.762939453125, 2.9156494140625, 3.068359375, 3.2210693359375, 3.373779296875, 3.5264892578125, 3.67919921875, 3.8319091796875, 3.984619140625, 4.1373291015625, 4.2900390625, 4.4427490234375, 4.595458984375, 4.7481689453125, 4.90087890625, 5.0535888671875, 5.206298828125, 5.3590087890625, 5.51171875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 29.0, 139.0, 523.0, 258.0, 38.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.63331604003906, -230.5352783203125, -224.43722534179688, -218.3391876220703, -212.24114990234375, -206.14309692382812, -200.04505920410156, -193.947021484375, -187.84896850585938, -181.7509307861328, -175.6528778076172, -169.55484008789062, -163.45680236816406, -157.3587646484375, -151.26071166992188, -145.1626739501953, -139.06463623046875, -132.9665985107422, -126.8685531616211, -120.7705078125, -114.67247009277344, -108.57442474365234, -102.47637939453125, -96.37834167480469, -90.2802963256836, -84.1822509765625, -78.08421325683594, -71.98616790771484, -65.88812255859375, -59.79008483886719, -53.692039489746094, -47.593997955322266, -41.495941162109375, -35.39789962768555, -29.299856185913086, -23.201812744140625, -17.103771209716797, -11.005729675292969, -4.907684326171875, 1.1903572082519531, 7.288398742675781, 13.386441230773926, 19.48448371887207, 25.58252716064453, 31.68056869506836, 37.77861022949219, 43.87665557861328, 49.97469711303711, 56.07273864746094, 62.170780181884766, 68.2688217163086, 74.36686706542969, 80.46490478515625, 86.56295013427734, 92.66099548339844, 98.759033203125, 104.8570785522461, 110.95512390136719, 117.05316162109375, 123.15120697021484, 129.24925231933594, 135.3472900390625, 141.44534301757812, 147.5433807373047, 153.64141845703125]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 15.0, 10.0, 11.0, 13.0, 18.0, 32.0, 33.0, 28.0, 46.0, 54.0, 47.0, 54.0, 54.0, 59.0, 69.0, 50.0, 65.0, 57.0, 57.0, 35.0, 41.0, 37.0, 21.0, 22.0, 21.0, 10.0, 8.0, 8.0, 4.0, 4.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.09480285644531, -59.17831802368164, -57.26183319091797, -55.3453483581543, -53.428863525390625, -51.51238250732422, -49.59589385986328, -47.679412841796875, -45.7629280090332, -43.84644317626953, -41.92995834350586, -40.01347351074219, -38.096988677978516, -36.180503845214844, -34.26402282714844, -32.347537994384766, -30.43105125427246, -28.51456642150879, -26.598081588745117, -24.681598663330078, -22.765113830566406, -20.848628997802734, -18.932144165039062, -17.01565933227539, -15.099175453186035, -13.182690620422363, -11.266206741333008, -9.349721908569336, -7.433237552642822, -5.516753196716309, -3.6002683639526367, -1.6837844848632812, 0.23270034790039062, 2.1491847038269043, 4.065669059753418, 5.98215389251709, 7.8986382484436035, 9.815122604370117, 11.731607437133789, 13.648091316223145, 15.564576148986816, 17.481060028076172, 19.397544860839844, 21.314029693603516, 23.230514526367188, 25.14699935913086, 27.06348419189453, 28.97996711730957, 30.896451950073242, 32.81293487548828, 34.72941970825195, 36.645904541015625, 38.5623893737793, 40.47887420654297, 42.39535903930664, 44.31184387207031, 46.228328704833984, 48.144813537597656, 50.06129837036133, 51.977783203125, 53.89426803588867, 55.810752868652344, 57.72723388671875, 59.64371871948242, 61.560203552246094]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 14.0, 14.0, 25.0, 61.0, 124.0, 273.0, 725.0, 2414.0, 14429.0, 996384.0, 3157931.0, 17037.0, 2905.0, 902.0, 403.0, 238.0, 136.0, 90.0, 53.0, 43.0, 30.0, 18.0, 8.0, 7.0, 7.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.890625, -19.942626953125, -18.99462890625, -18.046630859375, -17.0986328125, -16.150634765625, -15.20263671875, -14.254638671875, -13.306640625, -12.358642578125, -11.41064453125, -10.462646484375, -9.5146484375, -8.566650390625, -7.61865234375, -6.670654296875, -5.72265625, -4.774658203125, -3.82666015625, -2.878662109375, -1.9306640625, -0.982666015625, -0.03466796875, 0.913330078125, 1.861328125, 2.809326171875, 3.75732421875, 4.705322265625, 5.6533203125, 6.601318359375, 7.54931640625, 8.497314453125, 9.4453125, 10.393310546875, 11.34130859375, 12.289306640625, 13.2373046875, 14.185302734375, 15.13330078125, 16.081298828125, 17.029296875, 17.977294921875, 18.92529296875, 19.873291015625, 20.8212890625, 21.769287109375, 22.71728515625, 23.665283203125, 24.61328125, 25.561279296875, 26.50927734375, 27.457275390625, 28.4052734375, 29.353271484375, 30.30126953125, 31.249267578125, 32.197265625, 33.145263671875, 34.09326171875, 35.041259765625, 35.9892578125, 36.937255859375, 37.88525390625, 38.833251953125, 39.78125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 12.0, 5.0, 9.0, 33.0, 35.0, 58.0, 97.0, 114.0, 140.0, 130.0, 122.0, 90.0, 74.0, 38.0, 27.0, 10.0, 5.0, 4.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.007080078125, -1.85400390625, -1.700927734375, -1.5478515625, -1.394775390625, -1.24169921875, -1.088623046875, -0.935546875, -0.782470703125, -0.62939453125, -0.476318359375, -0.3232421875, -0.170166015625, -0.01708984375, 0.135986328125, 0.2890625, 0.442138671875, 0.59521484375, 0.748291015625, 0.9013671875, 1.054443359375, 1.20751953125, 1.360595703125, 1.513671875, 1.666748046875, 1.81982421875, 1.972900390625, 2.1259765625, 2.279052734375, 2.43212890625, 2.585205078125, 2.73828125, 2.891357421875, 3.04443359375, 3.197509765625, 3.3505859375, 3.503662109375, 3.65673828125, 3.809814453125, 3.962890625, 4.115966796875, 4.26904296875, 4.422119140625, 4.5751953125, 4.728271484375, 4.88134765625, 5.034423828125, 5.1875, 5.340576171875, 5.49365234375, 5.646728515625, 5.7998046875, 5.952880859375, 6.10595703125, 6.259033203125, 6.412109375, 6.565185546875, 6.71826171875, 6.871337890625, 7.0244140625, 7.177490234375, 7.33056640625, 7.483642578125, 7.63671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 13.0, 19.0, 33.0, 45.0, 66.0, 65.0, 117.0, 167.0, 577.0, 22519.0, 4167684.0, 2261.0, 324.0, 168.0, 80.0, 63.0, 36.0, 13.0, 15.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.125, -106.6611328125, -104.197265625, -101.7333984375, -99.26953125, -96.8056640625, -94.341796875, -91.8779296875, -89.4140625, -86.9501953125, -84.486328125, -82.0224609375, -79.55859375, -77.0947265625, -74.630859375, -72.1669921875, -69.703125, -67.2392578125, -64.775390625, -62.3115234375, -59.84765625, -57.3837890625, -54.919921875, -52.4560546875, -49.9921875, -47.5283203125, -45.064453125, -42.6005859375, -40.13671875, -37.6728515625, -35.208984375, -32.7451171875, -30.28125, -27.8173828125, -25.353515625, -22.8896484375, -20.42578125, -17.9619140625, -15.498046875, -13.0341796875, -10.5703125, -8.1064453125, -5.642578125, -3.1787109375, -0.71484375, 1.7490234375, 4.212890625, 6.6767578125, 9.140625, 11.6044921875, 14.068359375, 16.5322265625, 18.99609375, 21.4599609375, 23.923828125, 26.3876953125, 28.8515625, 31.3154296875, 33.779296875, 36.2431640625, 38.70703125, 41.1708984375, 43.634765625, 46.0986328125, 48.5625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 36.0, 325.0, 3456.0, 217.0, 34.0, 9.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.453125, -25.8577880859375, -25.262451171875, -24.6671142578125, -24.07177734375, -23.4764404296875, -22.881103515625, -22.2857666015625, -21.6904296875, -21.0950927734375, -20.499755859375, -19.9044189453125, -19.30908203125, -18.7137451171875, -18.118408203125, -17.5230712890625, -16.927734375, -16.3323974609375, -15.737060546875, -15.1417236328125, -14.54638671875, -13.9510498046875, -13.355712890625, -12.7603759765625, -12.1650390625, -11.5697021484375, -10.974365234375, -10.3790283203125, -9.78369140625, -9.1883544921875, -8.593017578125, -7.9976806640625, -7.40234375, -6.8070068359375, -6.211669921875, -5.6163330078125, -5.02099609375, -4.4256591796875, -3.830322265625, -3.2349853515625, -2.6396484375, -2.0443115234375, -1.448974609375, -0.8536376953125, -0.25830078125, 0.3370361328125, 0.932373046875, 1.5277099609375, 2.123046875, 2.7183837890625, 3.313720703125, 3.9090576171875, 4.50439453125, 5.0997314453125, 5.695068359375, 6.2904052734375, 6.8857421875, 7.4810791015625, 8.076416015625, 8.6717529296875, 9.26708984375, 9.8624267578125, 10.457763671875, 11.0531005859375, 11.6484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 16.0, 100.0, 426.0, 361.0, 75.0, 13.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-119.66759490966797, -117.49042510986328, -115.31324768066406, -113.13607788085938, -110.95890808105469, -108.78173828125, -106.60456085205078, -104.4273910522461, -102.25021362304688, -100.07304382324219, -97.89586639404297, -95.71869659423828, -93.5415267944336, -91.36434936523438, -89.18717956542969, -87.010009765625, -84.83283996582031, -82.65567016601562, -80.4784927368164, -78.30132293701172, -76.12415313720703, -73.94697570800781, -71.76980590820312, -69.59263610839844, -67.41546630859375, -65.23829650878906, -63.06112289428711, -60.883949279785156, -58.70677947998047, -56.529605865478516, -54.35243225097656, -52.175262451171875, -49.99808883666992, -47.82091522216797, -45.64374542236328, -43.46657180786133, -41.289398193359375, -39.11222839355469, -36.935054779052734, -34.75788116455078, -32.580711364746094, -30.403539657592773, -28.226367950439453, -26.0491943359375, -23.87202262878418, -21.69485092163086, -19.517677307128906, -17.340505599975586, -15.163333892822266, -12.986162185668945, -10.808989524841309, -8.631816864013672, -6.454645156860352, -4.277473449707031, -2.1003007888793945, 0.07687187194824219, 2.2540435791015625, 4.431215763092041, 6.6083879470825195, 8.785560607910156, 10.962732315063477, 13.139904022216797, 15.317076683044434, 17.49424934387207, 19.67142105102539]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 9.0, 18.0, 28.0, 57.0, 75.0, 105.0, 110.0, 137.0, 129.0, 125.0, 81.0, 65.0, 35.0, 20.0, 8.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.928974151611328, -27.684797286987305, -26.44062042236328, -25.196443557739258, -23.952266693115234, -22.708087921142578, -21.463911056518555, -20.21973419189453, -18.975557327270508, -17.731380462646484, -16.48720359802246, -15.243025779724121, -13.998848915100098, -12.754672050476074, -11.510494232177734, -10.266317367553711, -9.022140502929688, -7.777963638305664, -6.533786296844482, -5.289608955383301, -4.045432090759277, -2.801255226135254, -1.5570778846740723, -0.3129005432128906, 0.9312763214111328, 2.1754534244537354, 3.419630527496338, 4.6638078689575195, 5.907984733581543, 7.152161598205566, 8.396339416503906, 9.64051628112793, 10.884689331054688, 12.128866195678711, 13.373043060302734, 14.617220878601074, 15.861397743225098, 17.105575561523438, 18.34975242614746, 19.593929290771484, 20.838106155395508, 22.08228302001953, 23.326459884643555, 24.570636749267578, 25.814815521240234, 27.058990478515625, 28.30316925048828, 29.547346115112305, 30.791522979736328, 32.035701751708984, 33.279876708984375, 34.52405548095703, 35.76823043823242, 37.01240921020508, 38.25658416748047, 39.500762939453125, 40.74494171142578, 41.98912048339844, 43.23329544067383, 44.477474212646484, 45.721649169921875, 46.96582794189453, 48.21000289916992, 49.45418167114258, 50.69835662841797]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 16.0, 14.0, 21.0, 43.0, 52.0, 75.0, 129.0, 198.0, 348.0, 749.0, 2116.0, 7283.0, 37763.0, 295792.0, 594471.0, 89129.0, 14394.0, 3468.0, 1243.0, 514.0, 239.0, 149.0, 92.0, 62.0, 54.0, 34.0, 25.0, 7.0, 11.0, 9.0, 12.0, 11.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.640625, -12.17626953125, -11.7119140625, -11.24755859375, -10.783203125, -10.31884765625, -9.8544921875, -9.39013671875, -8.92578125, -8.46142578125, -7.9970703125, -7.53271484375, -7.068359375, -6.60400390625, -6.1396484375, -5.67529296875, -5.2109375, -4.74658203125, -4.2822265625, -3.81787109375, -3.353515625, -2.88916015625, -2.4248046875, -1.96044921875, -1.49609375, -1.03173828125, -0.5673828125, -0.10302734375, 0.361328125, 0.82568359375, 1.2900390625, 1.75439453125, 2.21875, 2.68310546875, 3.1474609375, 3.61181640625, 4.076171875, 4.54052734375, 5.0048828125, 5.46923828125, 5.93359375, 6.39794921875, 6.8623046875, 7.32666015625, 7.791015625, 8.25537109375, 8.7197265625, 9.18408203125, 9.6484375, 10.11279296875, 10.5771484375, 11.04150390625, 11.505859375, 11.97021484375, 12.4345703125, 12.89892578125, 13.36328125, 13.82763671875, 14.2919921875, 14.75634765625, 15.220703125, 15.68505859375, 16.1494140625, 16.61376953125, 17.078125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 9.0, 19.0, 33.0, 35.0, 58.0, 66.0, 119.0, 110.0, 119.0, 119.0, 79.0, 82.0, 61.0, 33.0, 30.0, 11.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.891204833984375, -1.76092529296875, -1.630645751953125, -1.5003662109375, -1.370086669921875, -1.23980712890625, -1.109527587890625, -0.979248046875, -0.848968505859375, -0.71868896484375, -0.588409423828125, -0.4581298828125, -0.327850341796875, -0.19757080078125, -0.067291259765625, 0.06298828125, 0.193267822265625, 0.32354736328125, 0.453826904296875, 0.5841064453125, 0.714385986328125, 0.84466552734375, 0.974945068359375, 1.105224609375, 1.235504150390625, 1.36578369140625, 1.496063232421875, 1.6263427734375, 1.756622314453125, 1.88690185546875, 2.017181396484375, 2.1474609375, 2.277740478515625, 2.40802001953125, 2.538299560546875, 2.6685791015625, 2.798858642578125, 2.92913818359375, 3.059417724609375, 3.189697265625, 3.319976806640625, 3.45025634765625, 3.580535888671875, 3.7108154296875, 3.841094970703125, 3.97137451171875, 4.101654052734375, 4.23193359375, 4.362213134765625, 4.49249267578125, 4.622772216796875, 4.7530517578125, 4.883331298828125, 5.01361083984375, 5.143890380859375, 5.274169921875, 5.404449462890625, 5.53472900390625, 5.665008544921875, 5.7952880859375, 5.925567626953125, 6.05584716796875, 6.186126708984375, 6.31640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 12.0, 6.0, 14.0, 11.0, 25.0, 42.0, 62.0, 66.0, 108.0, 162.0, 285.0, 413.0, 723.0, 1514.0, 4008.0, 12240.0, 49789.0, 301559.0, 543773.0, 101753.0, 21034.0, 6134.0, 2366.0, 975.0, 500.0, 318.0, 216.0, 135.0, 79.0, 56.0, 51.0, 25.0, 29.0, 17.0, 10.0, 11.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5859375, -10.210693359375, -9.83544921875, -9.460205078125, -9.0849609375, -8.709716796875, -8.33447265625, -7.959228515625, -7.583984375, -7.208740234375, -6.83349609375, -6.458251953125, -6.0830078125, -5.707763671875, -5.33251953125, -4.957275390625, -4.58203125, -4.206787109375, -3.83154296875, -3.456298828125, -3.0810546875, -2.705810546875, -2.33056640625, -1.955322265625, -1.580078125, -1.204833984375, -0.82958984375, -0.454345703125, -0.0791015625, 0.296142578125, 0.67138671875, 1.046630859375, 1.421875, 1.797119140625, 2.17236328125, 2.547607421875, 2.9228515625, 3.298095703125, 3.67333984375, 4.048583984375, 4.423828125, 4.799072265625, 5.17431640625, 5.549560546875, 5.9248046875, 6.300048828125, 6.67529296875, 7.050537109375, 7.42578125, 7.801025390625, 8.17626953125, 8.551513671875, 8.9267578125, 9.302001953125, 9.67724609375, 10.052490234375, 10.427734375, 10.802978515625, 11.17822265625, 11.553466796875, 11.9287109375, 12.303955078125, 12.67919921875, 13.054443359375, 13.4296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 4.0, 10.0, 1.0, 7.0, 18.0, 18.0, 18.0, 26.0, 22.0, 37.0, 37.0, 45.0, 44.0, 58.0, 57.0, 59.0, 59.0, 52.0, 69.0, 56.0, 43.0, 52.0, 37.0, 33.0, 32.0, 23.0, 19.0, 12.0, 8.0, 8.0, 5.0, 12.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.484375, -9.128662109375, -8.77294921875, -8.417236328125, -8.0615234375, -7.705810546875, -7.35009765625, -6.994384765625, -6.638671875, -6.282958984375, -5.92724609375, -5.571533203125, -5.2158203125, -4.860107421875, -4.50439453125, -4.148681640625, -3.79296875, -3.437255859375, -3.08154296875, -2.725830078125, -2.3701171875, -2.014404296875, -1.65869140625, -1.302978515625, -0.947265625, -0.591552734375, -0.23583984375, 0.119873046875, 0.4755859375, 0.831298828125, 1.18701171875, 1.542724609375, 1.8984375, 2.254150390625, 2.60986328125, 2.965576171875, 3.3212890625, 3.677001953125, 4.03271484375, 4.388427734375, 4.744140625, 5.099853515625, 5.45556640625, 5.811279296875, 6.1669921875, 6.522705078125, 6.87841796875, 7.234130859375, 7.58984375, 7.945556640625, 8.30126953125, 8.656982421875, 9.0126953125, 9.368408203125, 9.72412109375, 10.079833984375, 10.435546875, 10.791259765625, 11.14697265625, 11.502685546875, 11.8583984375, 12.214111328125, 12.56982421875, 12.925537109375, 13.28125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 7.0, 15.0, 26.0, 35.0, 42.0, 103.0, 206.0, 367.0, 830.0, 2363.0, 7976.0, 43871.0, 489353.0, 451525.0, 40497.0, 7498.0, 2203.0, 812.0, 385.0, 204.0, 100.0, 50.0, 31.0, 22.0, 11.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.42578125, -7.20062255859375, -6.9754638671875, -6.75030517578125, -6.525146484375, -6.29998779296875, -6.0748291015625, -5.84967041015625, -5.62451171875, -5.39935302734375, -5.1741943359375, -4.94903564453125, -4.723876953125, -4.49871826171875, -4.2735595703125, -4.04840087890625, -3.8232421875, -3.59808349609375, -3.3729248046875, -3.14776611328125, -2.922607421875, -2.69744873046875, -2.4722900390625, -2.24713134765625, -2.02197265625, -1.79681396484375, -1.5716552734375, -1.34649658203125, -1.121337890625, -0.89617919921875, -0.6710205078125, -0.44586181640625, -0.220703125, 0.00445556640625, 0.2296142578125, 0.45477294921875, 0.679931640625, 0.90509033203125, 1.1302490234375, 1.35540771484375, 1.58056640625, 1.80572509765625, 2.0308837890625, 2.25604248046875, 2.481201171875, 2.70635986328125, 2.9315185546875, 3.15667724609375, 3.3818359375, 3.60699462890625, 3.8321533203125, 4.05731201171875, 4.282470703125, 4.50762939453125, 4.7327880859375, 4.95794677734375, 5.18310546875, 5.40826416015625, 5.6334228515625, 5.85858154296875, 6.083740234375, 6.30889892578125, 6.5340576171875, 6.75921630859375, 6.984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 3.0, 8.0, 9.0, 14.0, 14.0, 15.0, 30.0, 37.0, 42.0, 61.0, 90.0, 117.0, 127.0, 132.0, 70.0, 59.0, 45.0, 36.0, 13.0, 16.0, 17.0, 5.0, 9.0, 5.0, 3.0, 4.0, 1.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010423660278320312, -0.0010165199637413025, -0.0009906738996505737, -0.000964827835559845, -0.0009389817714691162, -0.0009131357073783875, -0.0008872896432876587, -0.0008614435791969299, -0.0008355975151062012, -0.0008097514510154724, -0.0007839053869247437, -0.0007580593228340149, -0.0007322132587432861, -0.0007063671946525574, -0.0006805211305618286, -0.0006546750664710999, -0.0006288290023803711, -0.0006029829382896423, -0.0005771368741989136, -0.0005512908101081848, -0.0005254447460174561, -0.0004995986819267273, -0.00047375261783599854, -0.0004479065537452698, -0.000422060489654541, -0.00039621442556381226, -0.0003703683614730835, -0.00034452229738235474, -0.000318676233291626, -0.0002928301692008972, -0.00026698410511016846, -0.0002411380410194397, -0.00021529197692871094, -0.00018944591283798218, -0.00016359984874725342, -0.00013775378465652466, -0.0001119077205657959, -8.606165647506714e-05, -6.021559238433838e-05, -3.436952829360962e-05, -8.52346420288086e-06, 1.73225998878479e-05, 4.316866397857666e-05, 6.901472806930542e-05, 9.486079216003418e-05, 0.00012070685625076294, 0.0001465529203414917, 0.00017239898443222046, 0.00019824504852294922, 0.00022409111261367798, 0.00024993717670440674, 0.0002757832407951355, 0.00030162930488586426, 0.000327475368976593, 0.0003533214330673218, 0.00037916749715805054, 0.0004050135612487793, 0.00043085962533950806, 0.0004567056894302368, 0.0004825517535209656, 0.0005083978176116943, 0.0005342438817024231, 0.0005600899457931519, 0.0005859360098838806, 0.0006117820739746094]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 10.0, 15.0, 17.0, 25.0, 31.0, 51.0, 88.0, 106.0, 147.0, 265.0, 531.0, 1009.0, 1989.0, 4535.0, 12583.0, 48796.0, 281245.0, 544960.0, 115064.0, 23847.0, 7364.0, 2803.0, 1313.0, 693.0, 392.0, 203.0, 140.0, 80.0, 63.0, 53.0, 35.0, 15.0, 18.0, 14.0, 13.0, 9.0, 4.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.7109375, -4.56927490234375, -4.4276123046875, -4.28594970703125, -4.144287109375, -4.00262451171875, -3.8609619140625, -3.71929931640625, -3.57763671875, -3.43597412109375, -3.2943115234375, -3.15264892578125, -3.010986328125, -2.86932373046875, -2.7276611328125, -2.58599853515625, -2.4443359375, -2.30267333984375, -2.1610107421875, -2.01934814453125, -1.877685546875, -1.73602294921875, -1.5943603515625, -1.45269775390625, -1.31103515625, -1.16937255859375, -1.0277099609375, -0.88604736328125, -0.744384765625, -0.60272216796875, -0.4610595703125, -0.31939697265625, -0.177734375, -0.03607177734375, 0.1055908203125, 0.24725341796875, 0.388916015625, 0.53057861328125, 0.6722412109375, 0.81390380859375, 0.95556640625, 1.09722900390625, 1.2388916015625, 1.38055419921875, 1.522216796875, 1.66387939453125, 1.8055419921875, 1.94720458984375, 2.0888671875, 2.23052978515625, 2.3721923828125, 2.51385498046875, 2.655517578125, 2.79718017578125, 2.9388427734375, 3.08050537109375, 3.22216796875, 3.36383056640625, 3.5054931640625, 3.64715576171875, 3.788818359375, 3.93048095703125, 4.0721435546875, 4.21380615234375, 4.35546875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 6.0, 5.0, 6.0, 1.0, 4.0, 7.0, 15.0, 10.0, 13.0, 23.0, 22.0, 30.0, 47.0, 33.0, 54.0, 70.0, 55.0, 78.0, 75.0, 76.0, 69.0, 66.0, 39.0, 39.0, 27.0, 28.0, 20.0, 17.0, 19.0, 12.0, 6.0, 6.0, 5.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.017578125, -2.925506591796875, -2.83343505859375, -2.741363525390625, -2.6492919921875, -2.557220458984375, -2.46514892578125, -2.373077392578125, -2.281005859375, -2.188934326171875, -2.09686279296875, -2.004791259765625, -1.9127197265625, -1.820648193359375, -1.72857666015625, -1.636505126953125, -1.54443359375, -1.452362060546875, -1.36029052734375, -1.268218994140625, -1.1761474609375, -1.084075927734375, -0.99200439453125, -0.899932861328125, -0.807861328125, -0.715789794921875, -0.62371826171875, -0.531646728515625, -0.4395751953125, -0.347503662109375, -0.25543212890625, -0.163360595703125, -0.0712890625, 0.020782470703125, 0.11285400390625, 0.204925537109375, 0.2969970703125, 0.389068603515625, 0.48114013671875, 0.573211669921875, 0.665283203125, 0.757354736328125, 0.84942626953125, 0.941497802734375, 1.0335693359375, 1.125640869140625, 1.21771240234375, 1.309783935546875, 1.40185546875, 1.493927001953125, 1.58599853515625, 1.678070068359375, 1.7701416015625, 1.862213134765625, 1.95428466796875, 2.046356201171875, 2.138427734375, 2.230499267578125, 2.32257080078125, 2.414642333984375, 2.5067138671875, 2.598785400390625, 2.69085693359375, 2.782928466796875, 2.875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 11.0, 17.0, 17.0, 41.0, 49.0, 75.0, 106.0, 123.0, 153.0, 116.0, 102.0, 77.0, 33.0, 26.0, 10.0, 8.0, 9.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.70413208007812, -63.85623550415039, -62.008338928222656, -60.16044235229492, -58.31254577636719, -56.46464538574219, -54.61675262451172, -52.76885223388672, -50.920955657958984, -49.07305908203125, -47.225162506103516, -45.37726593017578, -43.52936935424805, -41.68147277832031, -39.83357238769531, -37.98567581176758, -36.137779235839844, -34.28988265991211, -32.441986083984375, -30.59408950805664, -28.746191024780273, -26.89829444885254, -25.050397872924805, -23.202499389648438, -21.35460662841797, -19.506710052490234, -17.6588134765625, -15.81091594696045, -13.963018417358398, -12.115121841430664, -10.26722526550293, -8.419327735900879, -6.571430206298828, -4.7235331535339355, -2.875636339187622, -1.0277395248413086, 0.820157527923584, 2.6680545806884766, 4.515951156616211, 6.363848686218262, 8.211745262145996, 10.05964183807373, 11.907539367675781, 13.755435943603516, 15.60333251953125, 17.451229095458984, 19.29912567138672, 21.147024154663086, 22.99492073059082, 24.842817306518555, 26.69071388244629, 28.538612365722656, 30.38650894165039, 32.234405517578125, 34.08230209350586, 35.930198669433594, 37.77809524536133, 39.62599182128906, 41.4738883972168, 43.32178497314453, 45.169681549072266, 47.017578125, 48.865478515625, 50.713375091552734, 52.56127166748047]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 0.0, 6.0, 10.0, 9.0, 13.0, 17.0, 21.0, 21.0, 21.0, 20.0, 20.0, 37.0, 30.0, 32.0, 43.0, 46.0, 36.0, 55.0, 60.0, 50.0, 42.0, 56.0, 51.0, 47.0, 43.0, 40.0, 30.0, 30.0, 16.0, 19.0, 18.0, 16.0, 12.0, 7.0, 10.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.65648651123047, -62.80373001098633, -60.95096969604492, -59.09821319580078, -57.245452880859375, -55.392696380615234, -53.539939880371094, -51.68717956542969, -49.83442306518555, -47.981666564941406, -46.12890625, -44.27614974975586, -42.42339324951172, -40.57063293457031, -38.71787643432617, -36.86511993408203, -35.012359619140625, -33.159603118896484, -31.306842803955078, -29.454086303710938, -27.601327896118164, -25.74856948852539, -23.89581298828125, -22.043054580688477, -20.190296173095703, -18.33753776550293, -16.484779357910156, -14.632022857666016, -12.779264450073242, -10.926506042480469, -9.073748588562012, -7.220991134643555, -5.368236541748047, -3.5154786109924316, -1.6627206802368164, 0.19003725051879883, 2.042795181274414, 3.8955535888671875, 5.7483110427856445, 7.601068496704102, 9.453826904296875, 11.306585311889648, 13.159342765808105, 15.012100219726562, 16.864858627319336, 18.71761703491211, 20.57037353515625, 22.423131942749023, 24.275890350341797, 26.12864875793457, 27.981407165527344, 29.834163665771484, 31.686922073364258, 33.53968048095703, 35.39243698120117, 37.24519348144531, 39.09795379638672, 40.95071029663086, 42.803470611572266, 44.656227111816406, 46.50898742675781, 48.36174392700195, 50.214500427246094, 52.0672607421875, 53.92001724243164]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 18.0, 46.0, 78.0, 167.0, 339.0, 680.0, 1736.0, 5891.0, 31573.0, 642298.0, 3441121.0, 56244.0, 9029.0, 2601.0, 1069.0, 522.0, 256.0, 191.0, 115.0, 90.0, 51.0, 41.0, 40.0, 18.0, 25.0, 6.0, 7.0, 9.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.546875, -7.896240234375, -7.24560546875, -6.594970703125, -5.9443359375, -5.293701171875, -4.64306640625, -3.992431640625, -3.341796875, -2.691162109375, -2.04052734375, -1.389892578125, -0.7392578125, -0.088623046875, 0.56201171875, 1.212646484375, 1.86328125, 2.513916015625, 3.16455078125, 3.815185546875, 4.4658203125, 5.116455078125, 5.76708984375, 6.417724609375, 7.068359375, 7.718994140625, 8.36962890625, 9.020263671875, 9.6708984375, 10.321533203125, 10.97216796875, 11.622802734375, 12.2734375, 12.924072265625, 13.57470703125, 14.225341796875, 14.8759765625, 15.526611328125, 16.17724609375, 16.827880859375, 17.478515625, 18.129150390625, 18.77978515625, 19.430419921875, 20.0810546875, 20.731689453125, 21.38232421875, 22.032958984375, 22.68359375, 23.334228515625, 23.98486328125, 24.635498046875, 25.2861328125, 25.936767578125, 26.58740234375, 27.238037109375, 27.888671875, 28.539306640625, 29.18994140625, 29.840576171875, 30.4912109375, 31.141845703125, 31.79248046875, 32.443115234375, 33.09375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 5.0, 8.0, 24.0, 26.0, 48.0, 55.0, 75.0, 85.0, 108.0, 122.0, 102.0, 92.0, 67.0, 63.0, 50.0, 32.0, 15.0, 5.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.448394775390625, -1.32452392578125, -1.200653076171875, -1.0767822265625, -0.952911376953125, -0.82904052734375, -0.705169677734375, -0.581298828125, -0.457427978515625, -0.33355712890625, -0.209686279296875, -0.0858154296875, 0.038055419921875, 0.16192626953125, 0.285797119140625, 0.40966796875, 0.533538818359375, 0.65740966796875, 0.781280517578125, 0.9051513671875, 1.029022216796875, 1.15289306640625, 1.276763916015625, 1.400634765625, 1.524505615234375, 1.64837646484375, 1.772247314453125, 1.8961181640625, 2.019989013671875, 2.14385986328125, 2.267730712890625, 2.3916015625, 2.515472412109375, 2.63934326171875, 2.763214111328125, 2.8870849609375, 3.010955810546875, 3.13482666015625, 3.258697509765625, 3.382568359375, 3.506439208984375, 3.63031005859375, 3.754180908203125, 3.8780517578125, 4.001922607421875, 4.12579345703125, 4.249664306640625, 4.37353515625, 4.497406005859375, 4.62127685546875, 4.745147705078125, 4.8690185546875, 4.992889404296875, 5.11676025390625, 5.240631103515625, 5.364501953125, 5.488372802734375, 5.61224365234375, 5.736114501953125, 5.8599853515625, 5.983856201171875, 6.10772705078125, 6.231597900390625, 6.35546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 15.0, 10.0, 15.0, 23.0, 39.0, 46.0, 58.0, 79.0, 135.0, 213.0, 525.0, 1850.0, 12170.0, 4011356.0, 160187.0, 5237.0, 1294.0, 465.0, 174.0, 123.0, 79.0, 54.0, 39.0, 29.0, 19.0, 11.0, 12.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.78125, -37.33349609375, -35.8857421875, -34.43798828125, -32.990234375, -31.54248046875, -30.0947265625, -28.64697265625, -27.19921875, -25.75146484375, -24.3037109375, -22.85595703125, -21.408203125, -19.96044921875, -18.5126953125, -17.06494140625, -15.6171875, -14.16943359375, -12.7216796875, -11.27392578125, -9.826171875, -8.37841796875, -6.9306640625, -5.48291015625, -4.03515625, -2.58740234375, -1.1396484375, 0.30810546875, 1.755859375, 3.20361328125, 4.6513671875, 6.09912109375, 7.546875, 8.99462890625, 10.4423828125, 11.89013671875, 13.337890625, 14.78564453125, 16.2333984375, 17.68115234375, 19.12890625, 20.57666015625, 22.0244140625, 23.47216796875, 24.919921875, 26.36767578125, 27.8154296875, 29.26318359375, 30.7109375, 32.15869140625, 33.6064453125, 35.05419921875, 36.501953125, 37.94970703125, 39.3974609375, 40.84521484375, 42.29296875, 43.74072265625, 45.1884765625, 46.63623046875, 48.083984375, 49.53173828125, 50.9794921875, 52.42724609375, 53.875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 7.0, 17.0, 39.0, 114.0, 927.0, 2595.0, 262.0, 60.0, 25.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.828125, -16.288818359375, -15.74951171875, -15.210205078125, -14.6708984375, -14.131591796875, -13.59228515625, -13.052978515625, -12.513671875, -11.974365234375, -11.43505859375, -10.895751953125, -10.3564453125, -9.817138671875, -9.27783203125, -8.738525390625, -8.19921875, -7.659912109375, -7.12060546875, -6.581298828125, -6.0419921875, -5.502685546875, -4.96337890625, -4.424072265625, -3.884765625, -3.345458984375, -2.80615234375, -2.266845703125, -1.7275390625, -1.188232421875, -0.64892578125, -0.109619140625, 0.4296875, 0.968994140625, 1.50830078125, 2.047607421875, 2.5869140625, 3.126220703125, 3.66552734375, 4.204833984375, 4.744140625, 5.283447265625, 5.82275390625, 6.362060546875, 6.9013671875, 7.440673828125, 7.97998046875, 8.519287109375, 9.05859375, 9.597900390625, 10.13720703125, 10.676513671875, 11.2158203125, 11.755126953125, 12.29443359375, 12.833740234375, 13.373046875, 13.912353515625, 14.45166015625, 14.990966796875, 15.5302734375, 16.069580078125, 16.60888671875, 17.148193359375, 17.6875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 9.0, 14.0, 53.0, 160.0, 302.0, 233.0, 133.0, 46.0, 26.0, 11.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.0123291015625, -95.72346496582031, -93.43460083007812, -91.14573669433594, -88.85687255859375, -86.56800079345703, -84.27913665771484, -81.99027252197266, -79.70140838623047, -77.41254425048828, -75.1236801147461, -72.8348159790039, -70.54594421386719, -68.257080078125, -65.96821594238281, -63.679351806640625, -61.39048767089844, -59.10162353515625, -56.81275939941406, -54.52389144897461, -52.23502731323242, -49.946163177490234, -47.65729522705078, -45.368431091308594, -43.079566955566406, -40.79070281982422, -38.50183868408203, -36.21297073364258, -33.92410659790039, -31.635242462158203, -29.346376419067383, -27.057510375976562, -24.76865005493164, -22.479785919189453, -20.190919876098633, -17.902053833007812, -15.613189697265625, -13.324324607849121, -11.035459518432617, -8.746593475341797, -6.457729339599609, -4.1688642501831055, -1.8799991607666016, 0.40886592864990234, 2.6977310180664062, 4.98659610748291, 7.275461196899414, 9.564327239990234, 11.853191375732422, 14.142056465148926, 16.43092155456543, 18.71978759765625, 21.008651733398438, 23.297515869140625, 25.586381912231445, 27.875247955322266, 30.164112091064453, 32.45297622680664, 34.741844177246094, 37.03070831298828, 39.31957244873047, 41.608436584472656, 43.897300720214844, 46.1861686706543, 48.475032806396484]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 12.0, 21.0, 51.0, 66.0, 101.0, 128.0, 123.0, 142.0, 120.0, 100.0, 50.0, 46.0, 25.0, 12.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.96382522583008, -62.1107063293457, -60.257591247558594, -58.40447235107422, -56.551353454589844, -54.69823455810547, -52.84511947631836, -50.992000579833984, -49.138885498046875, -47.2857666015625, -45.43265151977539, -43.579532623291016, -41.72641372680664, -39.87329864501953, -38.020179748535156, -36.16706085205078, -34.313941955566406, -32.46082305908203, -30.60770606994629, -28.754589080810547, -26.901470184326172, -25.04835319519043, -23.195236206054688, -21.342117309570312, -19.48900032043457, -17.635883331298828, -15.782764434814453, -13.929647445678711, -12.076529502868652, -10.223411560058594, -8.370294570922852, -6.517176628112793, -4.6640625, -2.8109447956085205, -0.957827091217041, 0.8952903747558594, 2.748408317565918, 4.601526260375977, 6.454643249511719, 8.307761192321777, 10.160879135131836, 12.013997077941895, 13.867115020751953, 15.720232009887695, 17.573348999023438, 19.426467895507812, 21.279584884643555, 23.132701873779297, 24.985820770263672, 26.838937759399414, 28.69205665588379, 30.54517364501953, 32.398292541503906, 34.25141143798828, 36.10452651977539, 37.957645416259766, 39.810760498046875, 41.66387939453125, 43.51699447631836, 45.370113372802734, 47.22323226928711, 49.07634735107422, 50.929466247558594, 52.78258514404297, 54.635704040527344]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 10.0, 7.0, 4.0, 16.0, 13.0, 28.0, 19.0, 36.0, 56.0, 68.0, 104.0, 149.0, 224.0, 393.0, 679.0, 1358.0, 3280.0, 8829.0, 30299.0, 134305.0, 492459.0, 288494.0, 62158.0, 15837.0, 5283.0, 2019.0, 959.0, 534.0, 287.0, 172.0, 124.0, 100.0, 77.0, 42.0, 43.0, 27.0, 15.0, 11.0, 9.0, 9.0, 4.0, 3.0, 9.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-13.03125, -12.65625, -12.28125, -11.90625, -11.53125, -11.15625, -10.78125, -10.40625, -10.03125, -9.65625, -9.28125, -8.90625, -8.53125, -8.15625, -7.78125, -7.40625, -7.03125, -6.65625, -6.28125, -5.90625, -5.53125, -5.15625, -4.78125, -4.40625, -4.03125, -3.65625, -3.28125, -2.90625, -2.53125, -2.15625, -1.78125, -1.40625, -1.03125, -0.65625, -0.28125, 0.09375, 0.46875, 0.84375, 1.21875, 1.59375, 1.96875, 2.34375, 2.71875, 3.09375, 3.46875, 3.84375, 4.21875, 4.59375, 4.96875, 5.34375, 5.71875, 6.09375, 6.46875, 6.84375, 7.21875, 7.59375, 7.96875, 8.34375, 8.71875, 9.09375, 9.46875, 9.84375, 10.21875, 10.59375, 10.96875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 14.0, 25.0, 29.0, 50.0, 73.0, 62.0, 91.0, 87.0, 107.0, 90.0, 96.0, 70.0, 52.0, 52.0, 26.0, 23.0, 10.0, 12.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.001953125, -1.887847900390625, -1.77374267578125, -1.659637451171875, -1.5455322265625, -1.431427001953125, -1.31732177734375, -1.203216552734375, -1.089111328125, -0.975006103515625, -0.86090087890625, -0.746795654296875, -0.6326904296875, -0.518585205078125, -0.40447998046875, -0.290374755859375, -0.17626953125, -0.062164306640625, 0.05194091796875, 0.166046142578125, 0.2801513671875, 0.394256591796875, 0.50836181640625, 0.622467041015625, 0.736572265625, 0.850677490234375, 0.96478271484375, 1.078887939453125, 1.1929931640625, 1.307098388671875, 1.42120361328125, 1.535308837890625, 1.6494140625, 1.763519287109375, 1.87762451171875, 1.991729736328125, 2.1058349609375, 2.219940185546875, 2.33404541015625, 2.448150634765625, 2.562255859375, 2.676361083984375, 2.79046630859375, 2.904571533203125, 3.0186767578125, 3.132781982421875, 3.24688720703125, 3.360992431640625, 3.47509765625, 3.589202880859375, 3.70330810546875, 3.817413330078125, 3.9315185546875, 4.045623779296875, 4.15972900390625, 4.273834228515625, 4.387939453125, 4.502044677734375, 4.61614990234375, 4.730255126953125, 4.8443603515625, 4.958465576171875, 5.07257080078125, 5.186676025390625, 5.30078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 16.0, 21.0, 28.0, 40.0, 44.0, 57.0, 72.0, 143.0, 172.0, 299.0, 386.0, 646.0, 1105.0, 2054.0, 4250.0, 9521.0, 23298.0, 62036.0, 179541.0, 383294.0, 241753.0, 85488.0, 30929.0, 12166.0, 5238.0, 2450.0, 1288.0, 720.0, 444.0, 297.0, 213.0, 144.0, 86.0, 89.0, 54.0, 41.0, 29.0, 18.0, 23.0, 9.0, 12.0, 5.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.875, -6.65777587890625, -6.4405517578125, -6.22332763671875, -6.006103515625, -5.78887939453125, -5.5716552734375, -5.35443115234375, -5.13720703125, -4.91998291015625, -4.7027587890625, -4.48553466796875, -4.268310546875, -4.05108642578125, -3.8338623046875, -3.61663818359375, -3.3994140625, -3.18218994140625, -2.9649658203125, -2.74774169921875, -2.530517578125, -2.31329345703125, -2.0960693359375, -1.87884521484375, -1.66162109375, -1.44439697265625, -1.2271728515625, -1.00994873046875, -0.792724609375, -0.57550048828125, -0.3582763671875, -0.14105224609375, 0.076171875, 0.29339599609375, 0.5106201171875, 0.72784423828125, 0.945068359375, 1.16229248046875, 1.3795166015625, 1.59674072265625, 1.81396484375, 2.03118896484375, 2.2484130859375, 2.46563720703125, 2.682861328125, 2.90008544921875, 3.1173095703125, 3.33453369140625, 3.5517578125, 3.76898193359375, 3.9862060546875, 4.20343017578125, 4.420654296875, 4.63787841796875, 4.8551025390625, 5.07232666015625, 5.28955078125, 5.50677490234375, 5.7239990234375, 5.94122314453125, 6.158447265625, 6.37567138671875, 6.5928955078125, 6.81011962890625, 7.02734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 5.0, 9.0, 10.0, 5.0, 5.0, 14.0, 26.0, 20.0, 21.0, 26.0, 25.0, 29.0, 33.0, 40.0, 58.0, 46.0, 54.0, 46.0, 50.0, 49.0, 57.0, 44.0, 52.0, 32.0, 47.0, 25.0, 25.0, 38.0, 19.0, 14.0, 19.0, 11.0, 13.0, 7.0, 6.0, 10.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.40869140625, -8.1298828125, -7.85107421875, -7.572265625, -7.29345703125, -7.0146484375, -6.73583984375, -6.45703125, -6.17822265625, -5.8994140625, -5.62060546875, -5.341796875, -5.06298828125, -4.7841796875, -4.50537109375, -4.2265625, -3.94775390625, -3.6689453125, -3.39013671875, -3.111328125, -2.83251953125, -2.5537109375, -2.27490234375, -1.99609375, -1.71728515625, -1.4384765625, -1.15966796875, -0.880859375, -0.60205078125, -0.3232421875, -0.04443359375, 0.234375, 0.51318359375, 0.7919921875, 1.07080078125, 1.349609375, 1.62841796875, 1.9072265625, 2.18603515625, 2.46484375, 2.74365234375, 3.0224609375, 3.30126953125, 3.580078125, 3.85888671875, 4.1376953125, 4.41650390625, 4.6953125, 4.97412109375, 5.2529296875, 5.53173828125, 5.810546875, 6.08935546875, 6.3681640625, 6.64697265625, 6.92578125, 7.20458984375, 7.4833984375, 7.76220703125, 8.041015625, 8.31982421875, 8.5986328125, 8.87744140625, 9.15625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 13.0, 16.0, 18.0, 34.0, 60.0, 117.0, 210.0, 487.0, 1445.0, 5758.0, 41423.0, 733745.0, 243347.0, 16910.0, 3247.0, 944.0, 369.0, 174.0, 78.0, 53.0, 24.0, 27.0, 14.0, 7.0, 8.0, 2.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3671875, -11.978271484375, -11.58935546875, -11.200439453125, -10.8115234375, -10.422607421875, -10.03369140625, -9.644775390625, -9.255859375, -8.866943359375, -8.47802734375, -8.089111328125, -7.7001953125, -7.311279296875, -6.92236328125, -6.533447265625, -6.14453125, -5.755615234375, -5.36669921875, -4.977783203125, -4.5888671875, -4.199951171875, -3.81103515625, -3.422119140625, -3.033203125, -2.644287109375, -2.25537109375, -1.866455078125, -1.4775390625, -1.088623046875, -0.69970703125, -0.310791015625, 0.078125, 0.467041015625, 0.85595703125, 1.244873046875, 1.6337890625, 2.022705078125, 2.41162109375, 2.800537109375, 3.189453125, 3.578369140625, 3.96728515625, 4.356201171875, 4.7451171875, 5.134033203125, 5.52294921875, 5.911865234375, 6.30078125, 6.689697265625, 7.07861328125, 7.467529296875, 7.8564453125, 8.245361328125, 8.63427734375, 9.023193359375, 9.412109375, 9.801025390625, 10.18994140625, 10.578857421875, 10.9677734375, 11.356689453125, 11.74560546875, 12.134521484375, 12.5234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 10.0, 18.0, 19.0, 28.0, 50.0, 65.0, 123.0, 208.0, 197.0, 114.0, 49.0, 33.0, 29.0, 16.0, 15.0, 8.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014829635620117188, -0.0014427155256271362, -0.0014024674892425537, -0.0013622194528579712, -0.0013219714164733887, -0.0012817233800888062, -0.0012414753437042236, -0.0012012273073196411, -0.0011609792709350586, -0.001120731234550476, -0.0010804831981658936, -0.001040235161781311, -0.0009999871253967285, -0.000959739089012146, -0.0009194910526275635, -0.000879243016242981, -0.0008389949798583984, -0.0007987469434738159, -0.0007584989070892334, -0.0007182508707046509, -0.0006780028343200684, -0.0006377547979354858, -0.0005975067615509033, -0.0005572587251663208, -0.0005170106887817383, -0.00047676265239715576, -0.00043651461601257324, -0.0003962665796279907, -0.0003560185432434082, -0.0003157705068588257, -0.00027552247047424316, -0.00023527443408966064, -0.00019502639770507812, -0.0001547783613204956, -0.00011453032493591309, -7.428228855133057e-05, -3.403425216674805e-05, 6.213784217834473e-06, 4.646182060241699e-05, 8.670985698699951e-05, 0.00012695789337158203, 0.00016720592975616455, 0.00020745396614074707, 0.0002477020025253296, 0.0002879500389099121, 0.00032819807529449463, 0.00036844611167907715, 0.00040869414806365967, 0.0004489421844482422, 0.0004891902208328247, 0.0005294382572174072, 0.0005696862936019897, 0.0006099343299865723, 0.0006501823663711548, 0.0006904304027557373, 0.0007306784391403198, 0.0007709264755249023, 0.0008111745119094849, 0.0008514225482940674, 0.0008916705846786499, 0.0009319186210632324, 0.0009721666574478149, 0.0010124146938323975, 0.00105266273021698, 0.0010929107666015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 7.0, 9.0, 14.0, 20.0, 45.0, 63.0, 118.0, 231.0, 381.0, 819.0, 2109.0, 6690.0, 36224.0, 626440.0, 343529.0, 23404.0, 5139.0, 1732.0, 782.0, 352.0, 196.0, 99.0, 60.0, 27.0, 19.0, 11.0, 8.0, 12.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.375, -13.012451171875, -12.64990234375, -12.287353515625, -11.9248046875, -11.562255859375, -11.19970703125, -10.837158203125, -10.474609375, -10.112060546875, -9.74951171875, -9.386962890625, -9.0244140625, -8.661865234375, -8.29931640625, -7.936767578125, -7.57421875, -7.211669921875, -6.84912109375, -6.486572265625, -6.1240234375, -5.761474609375, -5.39892578125, -5.036376953125, -4.673828125, -4.311279296875, -3.94873046875, -3.586181640625, -3.2236328125, -2.861083984375, -2.49853515625, -2.135986328125, -1.7734375, -1.410888671875, -1.04833984375, -0.685791015625, -0.3232421875, 0.039306640625, 0.40185546875, 0.764404296875, 1.126953125, 1.489501953125, 1.85205078125, 2.214599609375, 2.5771484375, 2.939697265625, 3.30224609375, 3.664794921875, 4.02734375, 4.389892578125, 4.75244140625, 5.114990234375, 5.4775390625, 5.840087890625, 6.20263671875, 6.565185546875, 6.927734375, 7.290283203125, 7.65283203125, 8.015380859375, 8.3779296875, 8.740478515625, 9.10302734375, 9.465576171875, 9.828125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 1.0, 6.0, 1.0, 5.0, 8.0, 12.0, 17.0, 26.0, 35.0, 46.0, 72.0, 125.0, 147.0, 134.0, 113.0, 75.0, 64.0, 37.0, 24.0, 12.0, 11.0, 12.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73046875, -6.49945068359375, -6.2684326171875, -6.03741455078125, -5.806396484375, -5.57537841796875, -5.3443603515625, -5.11334228515625, -4.88232421875, -4.65130615234375, -4.4202880859375, -4.18927001953125, -3.958251953125, -3.72723388671875, -3.4962158203125, -3.26519775390625, -3.0341796875, -2.80316162109375, -2.5721435546875, -2.34112548828125, -2.110107421875, -1.87908935546875, -1.6480712890625, -1.41705322265625, -1.18603515625, -0.95501708984375, -0.7239990234375, -0.49298095703125, -0.261962890625, -0.03094482421875, 0.2000732421875, 0.43109130859375, 0.662109375, 0.89312744140625, 1.1241455078125, 1.35516357421875, 1.586181640625, 1.81719970703125, 2.0482177734375, 2.27923583984375, 2.51025390625, 2.74127197265625, 2.9722900390625, 3.20330810546875, 3.434326171875, 3.66534423828125, 3.8963623046875, 4.12738037109375, 4.3583984375, 4.58941650390625, 4.8204345703125, 5.05145263671875, 5.282470703125, 5.51348876953125, 5.7445068359375, 5.97552490234375, 6.20654296875, 6.43756103515625, 6.6685791015625, 6.89959716796875, 7.130615234375, 7.36163330078125, 7.5926513671875, 7.82366943359375, 8.0546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 14.0, 22.0, 42.0, 85.0, 162.0, 231.0, 193.0, 123.0, 69.0, 32.0, 10.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.61470031738281, -62.295997619628906, -58.977298736572266, -55.65859603881836, -52.33989715576172, -49.02119445800781, -45.702491760253906, -42.3837890625, -39.06509017944336, -35.74638748168945, -32.42768859863281, -29.108985900878906, -25.790285110473633, -22.47158432006836, -19.152881622314453, -15.83418083190918, -12.515480041503906, -9.196779251098633, -5.878077507019043, -2.559375762939453, 0.7593250274658203, 4.078025817871094, 7.396728515625, 10.715429306030273, 14.034130096435547, 17.35283088684082, 20.671531677246094, 23.990234375, 27.308935165405273, 30.627635955810547, 33.94633865356445, 37.265037536621094, 40.583740234375, 43.902442932128906, 47.22114181518555, 50.53984451293945, 53.858543395996094, 57.17724609375, 60.495948791503906, 63.81465148925781, 67.13334655761719, 70.4520492553711, 73.770751953125, 77.08944702148438, 80.40814971923828, 83.72685241699219, 87.0455551147461, 90.3642578125, 93.6829605102539, 97.00166320800781, 100.32036590576172, 103.63906860351562, 106.957763671875, 110.2764663696289, 113.59516906738281, 116.91387176513672, 120.23257446289062, 123.55127716064453, 126.86997985839844, 130.1886749267578, 133.50738525390625, 136.82608032226562, 140.144775390625, 143.46348571777344, 146.7821807861328]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 13.0, 11.0, 14.0, 19.0, 26.0, 35.0, 35.0, 41.0, 42.0, 54.0, 59.0, 55.0, 49.0, 59.0, 66.0, 59.0, 51.0, 47.0, 39.0, 39.0, 34.0, 30.0, 22.0, 17.0, 23.0, 10.0, 5.0, 4.0, 7.0, 8.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.30348205566406, -64.3127670288086, -62.322044372558594, -60.33132553100586, -58.340606689453125, -56.349891662597656, -54.359169006347656, -52.36845397949219, -50.37773513793945, -48.38701629638672, -46.396297454833984, -44.40557861328125, -42.414859771728516, -40.42414093017578, -38.43342590332031, -36.44270706176758, -34.451988220214844, -32.46126937866211, -30.470550537109375, -28.47983169555664, -26.48911476135254, -24.498395919799805, -22.50767707824707, -20.51696014404297, -18.52623748779297, -16.535518646240234, -14.544800758361816, -12.554081916809082, -10.563364028930664, -8.57264518737793, -6.581926345825195, -4.591208457946777, -2.6004905700683594, -0.6097720861434937, 1.380946397781372, 3.3716650009155273, 5.3623833656311035, 7.35310173034668, 9.343820571899414, 11.334538459777832, 13.325257301330566, 15.3159761428833, 17.30669403076172, 19.297412872314453, 21.288131713867188, 23.278850555419922, 25.269569396972656, 27.260286331176758, 29.251005172729492, 31.241724014282227, 33.23244094848633, 35.22315979003906, 37.2138786315918, 39.20459747314453, 41.195316314697266, 43.18603515625, 45.176753997802734, 47.16747283935547, 49.1581916809082, 51.14891052246094, 53.13962936401367, 55.130348205566406, 57.121063232421875, 59.11178207397461, 61.102500915527344]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 15.0, 10.0, 32.0, 36.0, 59.0, 104.0, 143.0, 242.0, 384.0, 702.0, 1411.0, 3525.0, 11401.0, 53871.0, 3308029.0, 759722.0, 39069.0, 9349.0, 3141.0, 1263.0, 625.0, 367.0, 227.0, 141.0, 114.0, 67.0, 55.0, 30.0, 39.0, 31.0, 12.0, 13.0, 9.0, 14.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.7265625, -10.2584228515625, -9.790283203125, -9.3221435546875, -8.85400390625, -8.3858642578125, -7.917724609375, -7.4495849609375, -6.9814453125, -6.5133056640625, -6.045166015625, -5.5770263671875, -5.10888671875, -4.6407470703125, -4.172607421875, -3.7044677734375, -3.236328125, -2.7681884765625, -2.300048828125, -1.8319091796875, -1.36376953125, -0.8956298828125, -0.427490234375, 0.0406494140625, 0.5087890625, 0.9769287109375, 1.445068359375, 1.9132080078125, 2.38134765625, 2.8494873046875, 3.317626953125, 3.7857666015625, 4.25390625, 4.7220458984375, 5.190185546875, 5.6583251953125, 6.12646484375, 6.5946044921875, 7.062744140625, 7.5308837890625, 7.9990234375, 8.4671630859375, 8.935302734375, 9.4034423828125, 9.87158203125, 10.3397216796875, 10.807861328125, 11.2760009765625, 11.744140625, 12.2122802734375, 12.680419921875, 13.1485595703125, 13.61669921875, 14.0848388671875, 14.552978515625, 15.0211181640625, 15.4892578125, 15.9573974609375, 16.425537109375, 16.8936767578125, 17.36181640625, 17.8299560546875, 18.298095703125, 18.7662353515625, 19.234375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 18.0, 38.0, 35.0, 33.0, 58.0, 71.0, 86.0, 85.0, 92.0, 95.0, 86.0, 70.0, 52.0, 52.0, 40.0, 32.0, 17.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9111328125, -1.7975921630859375, -1.684051513671875, -1.5705108642578125, -1.45697021484375, -1.3434295654296875, -1.229888916015625, -1.1163482666015625, -1.0028076171875, -0.8892669677734375, -0.775726318359375, -0.6621856689453125, -0.54864501953125, -0.4351043701171875, -0.321563720703125, -0.2080230712890625, -0.094482421875, 0.0190582275390625, 0.132598876953125, 0.2461395263671875, 0.35968017578125, 0.4732208251953125, 0.586761474609375, 0.7003021240234375, 0.8138427734375, 0.9273834228515625, 1.040924072265625, 1.1544647216796875, 1.26800537109375, 1.3815460205078125, 1.495086669921875, 1.6086273193359375, 1.72216796875, 1.8357086181640625, 1.949249267578125, 2.0627899169921875, 2.17633056640625, 2.2898712158203125, 2.403411865234375, 2.5169525146484375, 2.6304931640625, 2.7440338134765625, 2.857574462890625, 2.9711151123046875, 3.08465576171875, 3.1981964111328125, 3.311737060546875, 3.4252777099609375, 3.538818359375, 3.6523590087890625, 3.765899658203125, 3.8794403076171875, 3.99298095703125, 4.1065216064453125, 4.220062255859375, 4.3336029052734375, 4.4471435546875, 4.5606842041015625, 4.674224853515625, 4.7877655029296875, 4.90130615234375, 5.0148468017578125, 5.128387451171875, 5.2419281005859375, 5.35546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 5.0, 10.0, 5.0, 18.0, 26.0, 35.0, 49.0, 76.0, 134.0, 198.0, 283.0, 500.0, 873.0, 1692.0, 3940.0, 11264.0, 41759.0, 281575.0, 3568621.0, 228904.0, 36608.0, 10418.0, 3772.0, 1552.0, 824.0, 456.0, 260.0, 148.0, 92.0, 56.0, 28.0, 30.0, 21.0, 9.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.4266357421875, -9.095458984375, -8.7642822265625, -8.43310546875, -8.1019287109375, -7.770751953125, -7.4395751953125, -7.1083984375, -6.7772216796875, -6.446044921875, -6.1148681640625, -5.78369140625, -5.4525146484375, -5.121337890625, -4.7901611328125, -4.458984375, -4.1278076171875, -3.796630859375, -3.4654541015625, -3.13427734375, -2.8031005859375, -2.471923828125, -2.1407470703125, -1.8095703125, -1.4783935546875, -1.147216796875, -0.8160400390625, -0.48486328125, -0.1536865234375, 0.177490234375, 0.5086669921875, 0.83984375, 1.1710205078125, 1.502197265625, 1.8333740234375, 2.16455078125, 2.4957275390625, 2.826904296875, 3.1580810546875, 3.4892578125, 3.8204345703125, 4.151611328125, 4.4827880859375, 4.81396484375, 5.1451416015625, 5.476318359375, 5.8074951171875, 6.138671875, 6.4698486328125, 6.801025390625, 7.1322021484375, 7.46337890625, 7.7945556640625, 8.125732421875, 8.4569091796875, 8.7880859375, 9.1192626953125, 9.450439453125, 9.7816162109375, 10.11279296875, 10.4439697265625, 10.775146484375, 11.1063232421875, 11.4375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 5.0, 7.0, 12.0, 12.0, 28.0, 36.0, 62.0, 75.0, 115.0, 252.0, 531.0, 1784.0, 602.0, 220.0, 101.0, 71.0, 50.0, 29.0, 20.0, 16.0, 10.0, 12.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.540740966796875, -4.40960693359375, -4.278472900390625, -4.1473388671875, -4.016204833984375, -3.88507080078125, -3.753936767578125, -3.622802734375, -3.491668701171875, -3.36053466796875, -3.229400634765625, -3.0982666015625, -2.967132568359375, -2.83599853515625, -2.704864501953125, -2.57373046875, -2.442596435546875, -2.31146240234375, -2.180328369140625, -2.0491943359375, -1.918060302734375, -1.78692626953125, -1.655792236328125, -1.524658203125, -1.393524169921875, -1.26239013671875, -1.131256103515625, -1.0001220703125, -0.868988037109375, -0.73785400390625, -0.606719970703125, -0.4755859375, -0.344451904296875, -0.21331787109375, -0.082183837890625, 0.0489501953125, 0.180084228515625, 0.31121826171875, 0.442352294921875, 0.573486328125, 0.704620361328125, 0.83575439453125, 0.966888427734375, 1.0980224609375, 1.229156494140625, 1.36029052734375, 1.491424560546875, 1.62255859375, 1.753692626953125, 1.88482666015625, 2.015960693359375, 2.1470947265625, 2.278228759765625, 2.40936279296875, 2.540496826171875, 2.671630859375, 2.802764892578125, 2.93389892578125, 3.065032958984375, 3.1961669921875, 3.327301025390625, 3.45843505859375, 3.589569091796875, 3.720703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 16.0, 10.0, 20.0, 52.0, 133.0, 231.0, 251.0, 153.0, 74.0, 38.0, 12.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.88685989379883, -43.554935455322266, -42.2230110168457, -40.89108657836914, -39.559165954589844, -38.22724151611328, -36.89531707763672, -35.563392639160156, -34.231468200683594, -32.89954376220703, -31.56761932373047, -30.23569679260254, -28.903772354125977, -27.571847915649414, -26.239925384521484, -24.908000946044922, -23.57607650756836, -22.244152069091797, -20.912227630615234, -19.580305099487305, -18.248380661010742, -16.91645622253418, -15.584532737731934, -14.252609252929688, -12.920684814453125, -11.588760375976562, -10.256836891174316, -8.92491340637207, -7.592988967895508, -6.2610650062561035, -4.929141044616699, -3.597217559814453, -2.2652931213378906, -0.9333691596984863, 0.39855480194091797, 1.7304787635803223, 3.0624027252197266, 4.394326686859131, 5.726250648498535, 7.058174133300781, 8.390098571777344, 9.722023010253906, 11.053946495056152, 12.385869979858398, 13.717794418334961, 15.049718856811523, 16.381641387939453, 17.713565826416016, 19.045490264892578, 20.37741470336914, 21.709339141845703, 23.041261672973633, 24.373186111450195, 25.705110549926758, 27.037033081054688, 28.36895751953125, 29.700881958007812, 31.032806396484375, 32.36473083496094, 33.6966552734375, 35.02857971191406, 36.36050033569336, 37.69242477416992, 39.024349212646484, 40.35627365112305]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 12.0, 8.0, 14.0, 9.0, 10.0, 17.0, 20.0, 27.0, 28.0, 32.0, 26.0, 48.0, 45.0, 47.0, 54.0, 58.0, 55.0, 49.0, 47.0, 52.0, 51.0, 45.0, 45.0, 39.0, 32.0, 37.0, 26.0, 22.0, 13.0, 18.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.221168518066406, -19.61266326904297, -19.00415802001953, -18.395652770996094, -17.787145614624023, -17.178640365600586, -16.57013511657715, -15.961629867553711, -15.353124618530273, -14.744619369506836, -14.136113166809082, -13.527607917785645, -12.919102668762207, -12.310596466064453, -11.702091217041016, -11.093585968017578, -10.485079765319824, -9.876574516296387, -9.268068313598633, -8.659563064575195, -8.051057815551758, -7.442552089691162, -6.834046363830566, -6.225541114807129, -5.617035388946533, -5.0085296630859375, -4.4000244140625, -3.7915186882019043, -3.1830132007598877, -2.574507713317871, -1.9660019874572754, -1.357496738433838, -0.7489910125732422, -0.1404854655265808, 0.46802008152008057, 1.0765256881713867, 1.6850311756134033, 2.29353666305542, 2.9020423889160156, 3.510547637939453, 4.119053363800049, 4.7275590896606445, 5.336064338684082, 5.944570064544678, 6.553075790405273, 7.161581039428711, 7.770086765289307, 8.378591537475586, 8.98709774017334, 9.595602989196777, 10.204109191894531, 10.812614440917969, 11.421119689941406, 12.029624938964844, 12.638131141662598, 13.246636390686035, 13.855142593383789, 14.463647842407227, 15.07215404510498, 15.680659294128418, 16.289165496826172, 16.89767074584961, 17.506175994873047, 18.114681243896484, 18.723186492919922]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 9.0, 6.0, 6.0, 9.0, 9.0, 15.0, 20.0, 36.0, 44.0, 62.0, 71.0, 125.0, 203.0, 335.0, 595.0, 1250.0, 2979.0, 8419.0, 28598.0, 124163.0, 480683.0, 307950.0, 66425.0, 16825.0, 5347.0, 2106.0, 930.0, 511.0, 297.0, 149.0, 103.0, 75.0, 57.0, 33.0, 24.0, 27.0, 16.0, 11.0, 7.0, 8.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6640625, -13.259765625, -12.85546875, -12.451171875, -12.046875, -11.642578125, -11.23828125, -10.833984375, -10.4296875, -10.025390625, -9.62109375, -9.216796875, -8.8125, -8.408203125, -8.00390625, -7.599609375, -7.1953125, -6.791015625, -6.38671875, -5.982421875, -5.578125, -5.173828125, -4.76953125, -4.365234375, -3.9609375, -3.556640625, -3.15234375, -2.748046875, -2.34375, -1.939453125, -1.53515625, -1.130859375, -0.7265625, -0.322265625, 0.08203125, 0.486328125, 0.890625, 1.294921875, 1.69921875, 2.103515625, 2.5078125, 2.912109375, 3.31640625, 3.720703125, 4.125, 4.529296875, 4.93359375, 5.337890625, 5.7421875, 6.146484375, 6.55078125, 6.955078125, 7.359375, 7.763671875, 8.16796875, 8.572265625, 8.9765625, 9.380859375, 9.78515625, 10.189453125, 10.59375, 10.998046875, 11.40234375, 11.806640625, 12.2109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 4.0, 12.0, 23.0, 28.0, 39.0, 33.0, 52.0, 69.0, 88.0, 86.0, 99.0, 89.0, 78.0, 64.0, 68.0, 54.0, 40.0, 20.0, 20.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -1.9676513671875, -1.857177734375, -1.7467041015625, -1.63623046875, -1.5257568359375, -1.415283203125, -1.3048095703125, -1.1943359375, -1.0838623046875, -0.973388671875, -0.8629150390625, -0.75244140625, -0.6419677734375, -0.531494140625, -0.4210205078125, -0.310546875, -0.2000732421875, -0.089599609375, 0.0208740234375, 0.13134765625, 0.2418212890625, 0.352294921875, 0.4627685546875, 0.5732421875, 0.6837158203125, 0.794189453125, 0.9046630859375, 1.01513671875, 1.1256103515625, 1.236083984375, 1.3465576171875, 1.45703125, 1.5675048828125, 1.677978515625, 1.7884521484375, 1.89892578125, 2.0093994140625, 2.119873046875, 2.2303466796875, 2.3408203125, 2.4512939453125, 2.561767578125, 2.6722412109375, 2.78271484375, 2.8931884765625, 3.003662109375, 3.1141357421875, 3.224609375, 3.3350830078125, 3.445556640625, 3.5560302734375, 3.66650390625, 3.7769775390625, 3.887451171875, 3.9979248046875, 4.1083984375, 4.2188720703125, 4.329345703125, 4.4398193359375, 4.55029296875, 4.6607666015625, 4.771240234375, 4.8817138671875, 4.9921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 3.0, 4.0, 7.0, 13.0, 16.0, 22.0, 27.0, 39.0, 46.0, 63.0, 100.0, 147.0, 176.0, 296.0, 496.0, 855.0, 1840.0, 5217.0, 20159.0, 100135.0, 455062.0, 367097.0, 73131.0, 15479.0, 4366.0, 1591.0, 738.0, 458.0, 277.0, 210.0, 142.0, 82.0, 79.0, 46.0, 41.0, 20.0, 23.0, 17.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0], "bins": [-12.8671875, -12.5185546875, -12.169921875, -11.8212890625, -11.47265625, -11.1240234375, -10.775390625, -10.4267578125, -10.078125, -9.7294921875, -9.380859375, -9.0322265625, -8.68359375, -8.3349609375, -7.986328125, -7.6376953125, -7.2890625, -6.9404296875, -6.591796875, -6.2431640625, -5.89453125, -5.5458984375, -5.197265625, -4.8486328125, -4.5, -4.1513671875, -3.802734375, -3.4541015625, -3.10546875, -2.7568359375, -2.408203125, -2.0595703125, -1.7109375, -1.3623046875, -1.013671875, -0.6650390625, -0.31640625, 0.0322265625, 0.380859375, 0.7294921875, 1.078125, 1.4267578125, 1.775390625, 2.1240234375, 2.47265625, 2.8212890625, 3.169921875, 3.5185546875, 3.8671875, 4.2158203125, 4.564453125, 4.9130859375, 5.26171875, 5.6103515625, 5.958984375, 6.3076171875, 6.65625, 7.0048828125, 7.353515625, 7.7021484375, 8.05078125, 8.3994140625, 8.748046875, 9.0966796875, 9.4453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 6.0, 3.0, 3.0, 6.0, 21.0, 6.0, 10.0, 21.0, 16.0, 20.0, 28.0, 25.0, 27.0, 24.0, 39.0, 39.0, 40.0, 37.0, 35.0, 32.0, 41.0, 38.0, 44.0, 43.0, 28.0, 51.0, 39.0, 26.0, 35.0, 34.0, 24.0, 17.0, 20.0, 25.0, 12.0, 18.0, 9.0, 9.0, 11.0, 10.0, 5.0, 6.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.51171875, -7.2733154296875, -7.034912109375, -6.7965087890625, -6.55810546875, -6.3197021484375, -6.081298828125, -5.8428955078125, -5.6044921875, -5.3660888671875, -5.127685546875, -4.8892822265625, -4.65087890625, -4.4124755859375, -4.174072265625, -3.9356689453125, -3.697265625, -3.4588623046875, -3.220458984375, -2.9820556640625, -2.74365234375, -2.5052490234375, -2.266845703125, -2.0284423828125, -1.7900390625, -1.5516357421875, -1.313232421875, -1.0748291015625, -0.83642578125, -0.5980224609375, -0.359619140625, -0.1212158203125, 0.1171875, 0.3555908203125, 0.593994140625, 0.8323974609375, 1.07080078125, 1.3092041015625, 1.547607421875, 1.7860107421875, 2.0244140625, 2.2628173828125, 2.501220703125, 2.7396240234375, 2.97802734375, 3.2164306640625, 3.454833984375, 3.6932373046875, 3.931640625, 4.1700439453125, 4.408447265625, 4.6468505859375, 4.88525390625, 5.1236572265625, 5.362060546875, 5.6004638671875, 5.8388671875, 6.0772705078125, 6.315673828125, 6.5540771484375, 6.79248046875, 7.0308837890625, 7.269287109375, 7.5076904296875, 7.74609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 5.0, 12.0, 13.0, 26.0, 33.0, 58.0, 111.0, 196.0, 357.0, 767.0, 1688.0, 3804.0, 10559.0, 39042.0, 215307.0, 595751.0, 138624.0, 28149.0, 8223.0, 3081.0, 1325.0, 675.0, 310.0, 171.0, 101.0, 57.0, 38.0, 17.0, 17.0, 18.0, 2.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.26953125, -7.08013916015625, -6.8907470703125, -6.70135498046875, -6.511962890625, -6.32257080078125, -6.1331787109375, -5.94378662109375, -5.75439453125, -5.56500244140625, -5.3756103515625, -5.18621826171875, -4.996826171875, -4.80743408203125, -4.6180419921875, -4.42864990234375, -4.2392578125, -4.04986572265625, -3.8604736328125, -3.67108154296875, -3.481689453125, -3.29229736328125, -3.1029052734375, -2.91351318359375, -2.72412109375, -2.53472900390625, -2.3453369140625, -2.15594482421875, -1.966552734375, -1.77716064453125, -1.5877685546875, -1.39837646484375, -1.208984375, -1.01959228515625, -0.8302001953125, -0.64080810546875, -0.451416015625, -0.26202392578125, -0.0726318359375, 0.11676025390625, 0.30615234375, 0.49554443359375, 0.6849365234375, 0.87432861328125, 1.063720703125, 1.25311279296875, 1.4425048828125, 1.63189697265625, 1.8212890625, 2.01068115234375, 2.2000732421875, 2.38946533203125, 2.578857421875, 2.76824951171875, 2.9576416015625, 3.14703369140625, 3.33642578125, 3.52581787109375, 3.7152099609375, 3.90460205078125, 4.093994140625, 4.28338623046875, 4.4727783203125, 4.66217041015625, 4.8515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 2.0, 4.0, 11.0, 8.0, 14.0, 11.0, 15.0, 22.0, 32.0, 29.0, 45.0, 51.0, 71.0, 91.0, 134.0, 97.0, 82.0, 63.0, 47.0, 42.0, 27.0, 31.0, 21.0, 6.0, 13.0, 9.0, 3.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006628036499023438, -0.0006380677223205566, -0.0006133317947387695, -0.0005885958671569824, -0.0005638599395751953, -0.0005391240119934082, -0.0005143880844116211, -0.000489652156829834, -0.0004649162292480469, -0.00044018030166625977, -0.00041544437408447266, -0.00039070844650268555, -0.00036597251892089844, -0.00034123659133911133, -0.0003165006637573242, -0.0002917647361755371, -0.00026702880859375, -0.0002422928810119629, -0.00021755695343017578, -0.00019282102584838867, -0.00016808509826660156, -0.00014334917068481445, -0.00011861324310302734, -9.387731552124023e-05, -6.914138793945312e-05, -4.4405460357666016e-05, -1.9669532775878906e-05, 5.066394805908203e-06, 2.9802322387695312e-05, 5.453824996948242e-05, 7.927417755126953e-05, 0.00010401010513305664, 0.00012874603271484375, 0.00015348196029663086, 0.00017821788787841797, 0.00020295381546020508, 0.0002276897430419922, 0.0002524256706237793, 0.0002771615982055664, 0.0003018975257873535, 0.0003266334533691406, 0.00035136938095092773, 0.00037610530853271484, 0.00040084123611450195, 0.00042557716369628906, 0.00045031309127807617, 0.0004750490188598633, 0.0004997849464416504, 0.0005245208740234375, 0.0005492568016052246, 0.0005739927291870117, 0.0005987286567687988, 0.0006234645843505859, 0.000648200511932373, 0.0006729364395141602, 0.0006976723670959473, 0.0007224082946777344, 0.0007471442222595215, 0.0007718801498413086, 0.0007966160774230957, 0.0008213520050048828, 0.0008460879325866699, 0.000870823860168457, 0.0008955597877502441, 0.0009202957153320312]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 8.0, 11.0, 21.0, 22.0, 35.0, 71.0, 151.0, 372.0, 895.0, 3342.0, 24035.0, 603791.0, 393952.0, 17713.0, 2792.0, 765.0, 299.0, 106.0, 65.0, 41.0, 28.0, 14.0, 7.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0546875, -12.6583251953125, -12.261962890625, -11.8656005859375, -11.46923828125, -11.0728759765625, -10.676513671875, -10.2801513671875, -9.8837890625, -9.4874267578125, -9.091064453125, -8.6947021484375, -8.29833984375, -7.9019775390625, -7.505615234375, -7.1092529296875, -6.712890625, -6.3165283203125, -5.920166015625, -5.5238037109375, -5.12744140625, -4.7310791015625, -4.334716796875, -3.9383544921875, -3.5419921875, -3.1456298828125, -2.749267578125, -2.3529052734375, -1.95654296875, -1.5601806640625, -1.163818359375, -0.7674560546875, -0.37109375, 0.0252685546875, 0.421630859375, 0.8179931640625, 1.21435546875, 1.6107177734375, 2.007080078125, 2.4034423828125, 2.7998046875, 3.1961669921875, 3.592529296875, 3.9888916015625, 4.38525390625, 4.7816162109375, 5.177978515625, 5.5743408203125, 5.970703125, 6.3670654296875, 6.763427734375, 7.1597900390625, 7.55615234375, 7.9525146484375, 8.348876953125, 8.7452392578125, 9.1416015625, 9.5379638671875, 9.934326171875, 10.3306884765625, 10.72705078125, 11.1234130859375, 11.519775390625, 11.9161376953125, 12.3125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 4.0, 8.0, 3.0, 7.0, 13.0, 20.0, 15.0, 25.0, 19.0, 29.0, 45.0, 47.0, 54.0, 78.0, 93.0, 86.0, 83.0, 78.0, 59.0, 44.0, 41.0, 30.0, 25.0, 22.0, 10.0, 10.0, 10.0, 3.0, 4.0, 5.0, 6.0, 1.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.0703125, -3.947845458984375, -3.82537841796875, -3.702911376953125, -3.5804443359375, -3.457977294921875, -3.33551025390625, -3.213043212890625, -3.090576171875, -2.968109130859375, -2.84564208984375, -2.723175048828125, -2.6007080078125, -2.478240966796875, -2.35577392578125, -2.233306884765625, -2.11083984375, -1.988372802734375, -1.86590576171875, -1.743438720703125, -1.6209716796875, -1.498504638671875, -1.37603759765625, -1.253570556640625, -1.131103515625, -1.008636474609375, -0.88616943359375, -0.763702392578125, -0.6412353515625, -0.518768310546875, -0.39630126953125, -0.273834228515625, -0.1513671875, -0.028900146484375, 0.09356689453125, 0.216033935546875, 0.3385009765625, 0.460968017578125, 0.58343505859375, 0.705902099609375, 0.828369140625, 0.950836181640625, 1.07330322265625, 1.195770263671875, 1.3182373046875, 1.440704345703125, 1.56317138671875, 1.685638427734375, 1.80810546875, 1.930572509765625, 2.05303955078125, 2.175506591796875, 2.2979736328125, 2.420440673828125, 2.54290771484375, 2.665374755859375, 2.787841796875, 2.910308837890625, 3.03277587890625, 3.155242919921875, 3.2777099609375, 3.400177001953125, 3.52264404296875, 3.645111083984375, 3.767578125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 18.0, 38.0, 80.0, 152.0, 252.0, 205.0, 138.0, 60.0, 26.0, 20.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.47367095947266, -98.92929077148438, -95.3849105834961, -91.84053039550781, -88.296142578125, -84.75177001953125, -81.20738220214844, -77.66300201416016, -74.11862182617188, -70.5742416381836, -67.02986145019531, -63.485477447509766, -59.941097259521484, -56.3967170715332, -52.852333068847656, -49.307952880859375, -45.763572692871094, -42.21919250488281, -38.67481231689453, -35.130428314208984, -31.586048126220703, -28.041667938232422, -24.497285842895508, -20.952903747558594, -17.408523559570312, -13.864142417907715, -10.319761276245117, -6.7753801345825195, -3.230998992919922, 0.3133811950683594, 3.8577632904052734, 7.4021453857421875, 10.946533203125, 14.490914344787598, 18.035295486450195, 21.57967758178711, 25.12405776977539, 28.668437957763672, 32.21282196044922, 35.7572021484375, 39.30158233642578, 42.84596252441406, 46.390342712402344, 49.93472671508789, 53.47910690307617, 57.02348709106445, 60.56787109375, 64.11225128173828, 67.65663146972656, 71.20101165771484, 74.74539184570312, 78.2897720336914, 81.83415222167969, 85.3785400390625, 88.92292022705078, 92.46730041503906, 96.01168060302734, 99.55606079101562, 103.1004409790039, 106.64482116699219, 110.189208984375, 113.73358154296875, 117.27796936035156, 120.82234954833984, 124.36672973632812]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 8.0, 17.0, 14.0, 14.0, 22.0, 29.0, 18.0, 25.0, 40.0, 51.0, 45.0, 35.0, 63.0, 55.0, 56.0, 52.0, 50.0, 47.0, 54.0, 36.0, 39.0, 35.0, 30.0, 28.0, 27.0, 17.0, 22.0, 16.0, 14.0, 15.0, 7.0, 6.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-65.1720199584961, -63.32449722290039, -61.47697448730469, -59.62945556640625, -57.78193283081055, -55.934410095214844, -54.08688735961914, -52.23936462402344, -50.391841888427734, -48.54431915283203, -46.69679641723633, -44.849273681640625, -43.00175476074219, -41.154232025146484, -39.30670928955078, -37.45918655395508, -35.611663818359375, -33.76414108276367, -31.9166202545166, -30.0690975189209, -28.221574783325195, -26.374053955078125, -24.526531219482422, -22.67900848388672, -20.83148956298828, -18.983966827392578, -17.136445999145508, -15.288923263549805, -13.441400527954102, -11.593878746032715, -9.746356964111328, -7.898834228515625, -6.051311492919922, -4.203789234161377, -2.356267213821411, -0.5087451934814453, 1.3387770652770996, 3.1862993240356445, 5.033821105957031, 6.881343841552734, 8.728865623474121, 10.576387405395508, 12.423910140991211, 14.271431922912598, 16.118953704833984, 17.966476440429688, 19.81399917602539, 21.661521911621094, 23.509042739868164, 25.356565475463867, 27.204086303710938, 29.05160903930664, 30.899131774902344, 32.74665451049805, 34.59417724609375, 36.44169616699219, 38.28921890258789, 40.136741638183594, 41.9842643737793, 43.831787109375, 45.67930603027344, 47.52682876586914, 49.374351501464844, 51.22187423706055, 53.06939697265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 15.0, 34.0, 41.0, 92.0, 148.0, 280.0, 556.0, 1371.0, 3948.0, 16514.0, 155462.0, 3890528.0, 105956.0, 13469.0, 3480.0, 1174.0, 532.0, 241.0, 131.0, 93.0, 51.0, 48.0, 27.0, 23.0, 18.0, 12.0, 5.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.96875, -12.36376953125, -11.7587890625, -11.15380859375, -10.548828125, -9.94384765625, -9.3388671875, -8.73388671875, -8.12890625, -7.52392578125, -6.9189453125, -6.31396484375, -5.708984375, -5.10400390625, -4.4990234375, -3.89404296875, -3.2890625, -2.68408203125, -2.0791015625, -1.47412109375, -0.869140625, -0.26416015625, 0.3408203125, 0.94580078125, 1.55078125, 2.15576171875, 2.7607421875, 3.36572265625, 3.970703125, 4.57568359375, 5.1806640625, 5.78564453125, 6.390625, 6.99560546875, 7.6005859375, 8.20556640625, 8.810546875, 9.41552734375, 10.0205078125, 10.62548828125, 11.23046875, 11.83544921875, 12.4404296875, 13.04541015625, 13.650390625, 14.25537109375, 14.8603515625, 15.46533203125, 16.0703125, 16.67529296875, 17.2802734375, 17.88525390625, 18.490234375, 19.09521484375, 19.7001953125, 20.30517578125, 20.91015625, 21.51513671875, 22.1201171875, 22.72509765625, 23.330078125, 23.93505859375, 24.5400390625, 25.14501953125, 25.75]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 9.0, 14.0, 19.0, 25.0, 31.0, 30.0, 58.0, 55.0, 56.0, 80.0, 79.0, 84.0, 93.0, 67.0, 63.0, 60.0, 42.0, 41.0, 30.0, 26.0, 15.0, 9.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.03515625, -1.92578125, -1.81640625, -1.70703125, -1.59765625, -1.48828125, -1.37890625, -1.26953125, -1.16015625, -1.05078125, -0.94140625, -0.83203125, -0.72265625, -0.61328125, -0.50390625, -0.39453125, -0.28515625, -0.17578125, -0.06640625, 0.04296875, 0.15234375, 0.26171875, 0.37109375, 0.48046875, 0.58984375, 0.69921875, 0.80859375, 0.91796875, 1.02734375, 1.13671875, 1.24609375, 1.35546875, 1.46484375, 1.57421875, 1.68359375, 1.79296875, 1.90234375, 2.01171875, 2.12109375, 2.23046875, 2.33984375, 2.44921875, 2.55859375, 2.66796875, 2.77734375, 2.88671875, 2.99609375, 3.10546875, 3.21484375, 3.32421875, 3.43359375, 3.54296875, 3.65234375, 3.76171875, 3.87109375, 3.98046875, 4.08984375, 4.19921875, 4.30859375, 4.41796875, 4.52734375, 4.63671875, 4.74609375, 4.85546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 3.0, 9.0, 7.0, 8.0, 14.0, 10.0, 16.0, 29.0, 35.0, 40.0, 61.0, 115.0, 236.0, 492.0, 1421.0, 5279.0, 32407.0, 590161.0, 3481815.0, 69495.0, 9321.0, 2052.0, 658.0, 238.0, 133.0, 56.0, 46.0, 35.0, 26.0, 23.0, 12.0, 12.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7109375, -11.1827392578125, -10.654541015625, -10.1263427734375, -9.59814453125, -9.0699462890625, -8.541748046875, -8.0135498046875, -7.4853515625, -6.9571533203125, -6.428955078125, -5.9007568359375, -5.37255859375, -4.8443603515625, -4.316162109375, -3.7879638671875, -3.259765625, -2.7315673828125, -2.203369140625, -1.6751708984375, -1.14697265625, -0.6187744140625, -0.090576171875, 0.4376220703125, 0.9658203125, 1.4940185546875, 2.022216796875, 2.5504150390625, 3.07861328125, 3.6068115234375, 4.135009765625, 4.6632080078125, 5.19140625, 5.7196044921875, 6.247802734375, 6.7760009765625, 7.30419921875, 7.8323974609375, 8.360595703125, 8.8887939453125, 9.4169921875, 9.9451904296875, 10.473388671875, 11.0015869140625, 11.52978515625, 12.0579833984375, 12.586181640625, 13.1143798828125, 13.642578125, 14.1707763671875, 14.698974609375, 15.2271728515625, 15.75537109375, 16.2835693359375, 16.811767578125, 17.3399658203125, 17.8681640625, 18.3963623046875, 18.924560546875, 19.4527587890625, 19.98095703125, 20.5091552734375, 21.037353515625, 21.5655517578125, 22.09375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 13.0, 21.0, 22.0, 54.0, 99.0, 175.0, 482.0, 1939.0, 731.0, 241.0, 128.0, 55.0, 48.0, 22.0, 12.0, 13.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.34075927734375, -9.1268310546875, -8.91290283203125, -8.698974609375, -8.48504638671875, -8.2711181640625, -8.05718994140625, -7.84326171875, -7.62933349609375, -7.4154052734375, -7.20147705078125, -6.987548828125, -6.77362060546875, -6.5596923828125, -6.34576416015625, -6.1318359375, -5.91790771484375, -5.7039794921875, -5.49005126953125, -5.276123046875, -5.06219482421875, -4.8482666015625, -4.63433837890625, -4.42041015625, -4.20648193359375, -3.9925537109375, -3.77862548828125, -3.564697265625, -3.35076904296875, -3.1368408203125, -2.92291259765625, -2.708984375, -2.49505615234375, -2.2811279296875, -2.06719970703125, -1.853271484375, -1.63934326171875, -1.4254150390625, -1.21148681640625, -0.99755859375, -0.78363037109375, -0.5697021484375, -0.35577392578125, -0.141845703125, 0.07208251953125, 0.2860107421875, 0.49993896484375, 0.7138671875, 0.92779541015625, 1.1417236328125, 1.35565185546875, 1.569580078125, 1.78350830078125, 1.9974365234375, 2.21136474609375, 2.42529296875, 2.63922119140625, 2.8531494140625, 3.06707763671875, 3.281005859375, 3.49493408203125, 3.7088623046875, 3.92279052734375, 4.13671875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 8.0, 21.0, 16.0, 77.0, 141.0, 210.0, 213.0, 161.0, 97.0, 35.0, 11.0, 8.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-59.77345275878906, -58.35493087768555, -56.93640899658203, -55.51788330078125, -54.099361419677734, -52.68083953857422, -51.26231384277344, -49.84379196166992, -48.425270080566406, -47.00674819946289, -45.588226318359375, -44.169700622558594, -42.75117874145508, -41.33265686035156, -39.91413116455078, -38.495609283447266, -37.07708740234375, -35.658565521240234, -34.24004364013672, -32.82151794433594, -31.402996063232422, -29.984474182128906, -28.565950393676758, -27.14742660522461, -25.728904724121094, -24.310382843017578, -22.89185905456543, -21.47333526611328, -20.054813385009766, -18.63629150390625, -17.2177677154541, -15.79924488067627, -14.380722045898438, -12.962199211120605, -11.543676376342773, -10.125153541564941, -8.70663070678711, -7.288107872009277, -5.869585037231445, -4.451062202453613, -3.0325393676757812, -1.6140165328979492, -0.1954936981201172, 1.2230291366577148, 2.641551971435547, 4.060074806213379, 5.478597640991211, 6.897120475769043, 8.315643310546875, 9.734166145324707, 11.152688980102539, 12.571211814880371, 13.989734649658203, 15.408257484436035, 16.826780319213867, 18.245304107666016, 19.66382598876953, 21.082347869873047, 22.500871658325195, 23.919395446777344, 25.33791732788086, 26.756439208984375, 28.174962997436523, 29.593486785888672, 31.012008666992188]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 12.0, 11.0, 13.0, 9.0, 12.0, 19.0, 29.0, 29.0, 29.0, 31.0, 33.0, 31.0, 53.0, 30.0, 45.0, 44.0, 40.0, 46.0, 51.0, 41.0, 31.0, 50.0, 46.0, 30.0, 31.0, 31.0, 28.0, 25.0, 16.0, 17.0, 13.0, 13.0, 10.0, 12.0, 4.0, 7.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-16.110811233520508, -15.644418716430664, -15.178025245666504, -14.71163272857666, -14.2452392578125, -13.778846740722656, -13.312454223632812, -12.846060752868652, -12.379667282104492, -11.913274765014648, -11.446881294250488, -10.980488777160645, -10.514095306396484, -10.04770278930664, -9.581310272216797, -9.114916801452637, -8.648524284362793, -8.18213176727295, -7.715738296508789, -7.249345779418945, -6.782952308654785, -6.316559791564941, -5.8501667976379395, -5.3837738037109375, -4.9173808097839355, -4.450987815856934, -3.9845948219299316, -3.518202066421509, -3.051809072494507, -2.585416078567505, -2.119023323059082, -1.65263032913208, -1.1862373352050781, -0.719844400882721, -0.25345146656036377, 0.21294140815734863, 0.6793344020843506, 1.1457273960113525, 1.6121201515197754, 2.0785131454467773, 2.5449061393737793, 3.0112991333007812, 3.477692127227783, 3.944084882736206, 4.410477638244629, 4.876871109008789, 5.343263626098633, 5.809656620025635, 6.276049613952637, 6.742442607879639, 7.208835601806641, 7.675228118896484, 8.141621589660645, 8.608014106750488, 9.074407577514648, 9.540800094604492, 10.007192611694336, 10.47358512878418, 10.93997859954834, 11.406371116638184, 11.872764587402344, 12.339157104492188, 12.805549621582031, 13.271943092346191, 13.738336563110352]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 1.0, 3.0, 2.0, 4.0, 8.0, 14.0, 12.0, 18.0, 36.0, 37.0, 61.0, 94.0, 173.0, 325.0, 647.0, 1561.0, 4228.0, 14860.0, 68239.0, 450366.0, 422394.0, 64512.0, 14019.0, 4041.0, 1462.0, 614.0, 309.0, 186.0, 116.0, 72.0, 42.0, 18.0, 20.0, 20.0, 8.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.0625, -17.5740966796875, -17.085693359375, -16.5972900390625, -16.10888671875, -15.6204833984375, -15.132080078125, -14.6436767578125, -14.1552734375, -13.6668701171875, -13.178466796875, -12.6900634765625, -12.20166015625, -11.7132568359375, -11.224853515625, -10.7364501953125, -10.248046875, -9.7596435546875, -9.271240234375, -8.7828369140625, -8.29443359375, -7.8060302734375, -7.317626953125, -6.8292236328125, -6.3408203125, -5.8524169921875, -5.364013671875, -4.8756103515625, -4.38720703125, -3.8988037109375, -3.410400390625, -2.9219970703125, -2.43359375, -1.9451904296875, -1.456787109375, -0.9683837890625, -0.47998046875, 0.0084228515625, 0.496826171875, 0.9852294921875, 1.4736328125, 1.9620361328125, 2.450439453125, 2.9388427734375, 3.42724609375, 3.9156494140625, 4.404052734375, 4.8924560546875, 5.380859375, 5.8692626953125, 6.357666015625, 6.8460693359375, 7.33447265625, 7.8228759765625, 8.311279296875, 8.7996826171875, 9.2880859375, 9.7764892578125, 10.264892578125, 10.7532958984375, 11.24169921875, 11.7301025390625, 12.218505859375, 12.7069091796875, 13.1953125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 10.0, 18.0, 21.0, 23.0, 34.0, 37.0, 54.0, 49.0, 52.0, 82.0, 83.0, 85.0, 82.0, 70.0, 59.0, 50.0, 42.0, 46.0, 34.0, 20.0, 12.0, 11.0, 7.0, 7.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.828857421875, -1.72412109375, -1.619384765625, -1.5146484375, -1.409912109375, -1.30517578125, -1.200439453125, -1.095703125, -0.990966796875, -0.88623046875, -0.781494140625, -0.6767578125, -0.572021484375, -0.46728515625, -0.362548828125, -0.2578125, -0.153076171875, -0.04833984375, 0.056396484375, 0.1611328125, 0.265869140625, 0.37060546875, 0.475341796875, 0.580078125, 0.684814453125, 0.78955078125, 0.894287109375, 0.9990234375, 1.103759765625, 1.20849609375, 1.313232421875, 1.41796875, 1.522705078125, 1.62744140625, 1.732177734375, 1.8369140625, 1.941650390625, 2.04638671875, 2.151123046875, 2.255859375, 2.360595703125, 2.46533203125, 2.570068359375, 2.6748046875, 2.779541015625, 2.88427734375, 2.989013671875, 3.09375, 3.198486328125, 3.30322265625, 3.407958984375, 3.5126953125, 3.617431640625, 3.72216796875, 3.826904296875, 3.931640625, 4.036376953125, 4.14111328125, 4.245849609375, 4.3505859375, 4.455322265625, 4.56005859375, 4.664794921875, 4.76953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 11.0, 8.0, 17.0, 18.0, 23.0, 38.0, 34.0, 62.0, 93.0, 135.0, 197.0, 320.0, 540.0, 1029.0, 2533.0, 8337.0, 41474.0, 289949.0, 592123.0, 89092.0, 15307.0, 3866.0, 1521.0, 698.0, 433.0, 205.0, 163.0, 98.0, 59.0, 42.0, 36.0, 31.0, 9.0, 13.0, 12.0, 8.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.90625, -13.4744873046875, -13.042724609375, -12.6109619140625, -12.17919921875, -11.7474365234375, -11.315673828125, -10.8839111328125, -10.4521484375, -10.0203857421875, -9.588623046875, -9.1568603515625, -8.72509765625, -8.2933349609375, -7.861572265625, -7.4298095703125, -6.998046875, -6.5662841796875, -6.134521484375, -5.7027587890625, -5.27099609375, -4.8392333984375, -4.407470703125, -3.9757080078125, -3.5439453125, -3.1121826171875, -2.680419921875, -2.2486572265625, -1.81689453125, -1.3851318359375, -0.953369140625, -0.5216064453125, -0.08984375, 0.3419189453125, 0.773681640625, 1.2054443359375, 1.63720703125, 2.0689697265625, 2.500732421875, 2.9324951171875, 3.3642578125, 3.7960205078125, 4.227783203125, 4.6595458984375, 5.09130859375, 5.5230712890625, 5.954833984375, 6.3865966796875, 6.818359375, 7.2501220703125, 7.681884765625, 8.1136474609375, 8.54541015625, 8.9771728515625, 9.408935546875, 9.8406982421875, 10.2724609375, 10.7042236328125, 11.135986328125, 11.5677490234375, 11.99951171875, 12.4312744140625, 12.863037109375, 13.2947998046875, 13.7265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 7.0, 5.0, 12.0, 16.0, 23.0, 29.0, 19.0, 35.0, 42.0, 48.0, 63.0, 58.0, 66.0, 62.0, 56.0, 72.0, 53.0, 56.0, 40.0, 45.0, 44.0, 28.0, 21.0, 20.0, 27.0, 15.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5, -12.1453857421875, -11.790771484375, -11.4361572265625, -11.08154296875, -10.7269287109375, -10.372314453125, -10.0177001953125, -9.6630859375, -9.3084716796875, -8.953857421875, -8.5992431640625, -8.24462890625, -7.8900146484375, -7.535400390625, -7.1807861328125, -6.826171875, -6.4715576171875, -6.116943359375, -5.7623291015625, -5.40771484375, -5.0531005859375, -4.698486328125, -4.3438720703125, -3.9892578125, -3.6346435546875, -3.280029296875, -2.9254150390625, -2.57080078125, -2.2161865234375, -1.861572265625, -1.5069580078125, -1.15234375, -0.7977294921875, -0.443115234375, -0.0885009765625, 0.26611328125, 0.6207275390625, 0.975341796875, 1.3299560546875, 1.6845703125, 2.0391845703125, 2.393798828125, 2.7484130859375, 3.10302734375, 3.4576416015625, 3.812255859375, 4.1668701171875, 4.521484375, 4.8760986328125, 5.230712890625, 5.5853271484375, 5.93994140625, 6.2945556640625, 6.649169921875, 7.0037841796875, 7.3583984375, 7.7130126953125, 8.067626953125, 8.4222412109375, 8.77685546875, 9.1314697265625, 9.486083984375, 9.8406982421875, 10.1953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 13.0, 43.0, 43.0, 78.0, 141.0, 319.0, 822.0, 2842.0, 13894.0, 137349.0, 849375.0, 35000.0, 6185.0, 1486.0, 489.0, 217.0, 107.0, 55.0, 32.0, 20.0, 10.0, 10.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.375, -13.955322265625, -13.53564453125, -13.115966796875, -12.6962890625, -12.276611328125, -11.85693359375, -11.437255859375, -11.017578125, -10.597900390625, -10.17822265625, -9.758544921875, -9.3388671875, -8.919189453125, -8.49951171875, -8.079833984375, -7.66015625, -7.240478515625, -6.82080078125, -6.401123046875, -5.9814453125, -5.561767578125, -5.14208984375, -4.722412109375, -4.302734375, -3.883056640625, -3.46337890625, -3.043701171875, -2.6240234375, -2.204345703125, -1.78466796875, -1.364990234375, -0.9453125, -0.525634765625, -0.10595703125, 0.313720703125, 0.7333984375, 1.153076171875, 1.57275390625, 1.992431640625, 2.412109375, 2.831787109375, 3.25146484375, 3.671142578125, 4.0908203125, 4.510498046875, 4.93017578125, 5.349853515625, 5.76953125, 6.189208984375, 6.60888671875, 7.028564453125, 7.4482421875, 7.867919921875, 8.28759765625, 8.707275390625, 9.126953125, 9.546630859375, 9.96630859375, 10.385986328125, 10.8056640625, 11.225341796875, 11.64501953125, 12.064697265625, 12.484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 12.0, 18.0, 20.0, 19.0, 33.0, 63.0, 141.0, 244.0, 188.0, 90.0, 40.0, 34.0, 20.0, 11.0, 10.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013523101806640625, -0.0013173818588256836, -0.0012824535369873047, -0.0012475252151489258, -0.0012125968933105469, -0.001177668571472168, -0.001142740249633789, -0.0011078119277954102, -0.0010728836059570312, -0.0010379552841186523, -0.0010030269622802734, -0.0009680986404418945, -0.0009331703186035156, -0.0008982419967651367, -0.0008633136749267578, -0.0008283853530883789, -0.00079345703125, -0.0007585287094116211, -0.0007236003875732422, -0.0006886720657348633, -0.0006537437438964844, -0.0006188154220581055, -0.0005838871002197266, -0.0005489587783813477, -0.0005140304565429688, -0.00047910213470458984, -0.00044417381286621094, -0.00040924549102783203, -0.0003743171691894531, -0.0003393888473510742, -0.0003044605255126953, -0.0002695322036743164, -0.0002346038818359375, -0.0001996755599975586, -0.0001647472381591797, -0.00012981891632080078, -9.489059448242188e-05, -5.996227264404297e-05, -2.5033950805664062e-05, 9.894371032714844e-06, 4.482269287109375e-05, 7.975101470947266e-05, 0.00011467933654785156, 0.00014960765838623047, 0.00018453598022460938, 0.00021946430206298828, 0.0002543926239013672, 0.0002893209457397461, 0.000324249267578125, 0.0003591775894165039, 0.0003941059112548828, 0.0004290342330932617, 0.0004639625549316406, 0.0004988908767700195, 0.0005338191986083984, 0.0005687475204467773, 0.0006036758422851562, 0.0006386041641235352, 0.0006735324859619141, 0.000708460807800293, 0.0007433891296386719, 0.0007783174514770508, 0.0008132457733154297, 0.0008481740951538086, 0.0008831024169921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 13.0, 7.0, 21.0, 29.0, 59.0, 78.0, 130.0, 249.0, 547.0, 1396.0, 4498.0, 19591.0, 298699.0, 689480.0, 25189.0, 5664.0, 1638.0, 618.0, 253.0, 135.0, 91.0, 43.0, 42.0, 21.0, 8.0, 11.0, 12.0, 9.0, 9.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.859375, -15.431640625, -15.00390625, -14.576171875, -14.1484375, -13.720703125, -13.29296875, -12.865234375, -12.4375, -12.009765625, -11.58203125, -11.154296875, -10.7265625, -10.298828125, -9.87109375, -9.443359375, -9.015625, -8.587890625, -8.16015625, -7.732421875, -7.3046875, -6.876953125, -6.44921875, -6.021484375, -5.59375, -5.166015625, -4.73828125, -4.310546875, -3.8828125, -3.455078125, -3.02734375, -2.599609375, -2.171875, -1.744140625, -1.31640625, -0.888671875, -0.4609375, -0.033203125, 0.39453125, 0.822265625, 1.25, 1.677734375, 2.10546875, 2.533203125, 2.9609375, 3.388671875, 3.81640625, 4.244140625, 4.671875, 5.099609375, 5.52734375, 5.955078125, 6.3828125, 6.810546875, 7.23828125, 7.666015625, 8.09375, 8.521484375, 8.94921875, 9.376953125, 9.8046875, 10.232421875, 10.66015625, 11.087890625, 11.515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 14.0, 13.0, 15.0, 25.0, 43.0, 103.0, 243.0, 281.0, 115.0, 49.0, 22.0, 18.0, 14.0, 6.0, 7.0, 4.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-13.96875, -13.6654052734375, -13.362060546875, -13.0587158203125, -12.75537109375, -12.4520263671875, -12.148681640625, -11.8453369140625, -11.5419921875, -11.2386474609375, -10.935302734375, -10.6319580078125, -10.32861328125, -10.0252685546875, -9.721923828125, -9.4185791015625, -9.115234375, -8.8118896484375, -8.508544921875, -8.2052001953125, -7.90185546875, -7.5985107421875, -7.295166015625, -6.9918212890625, -6.6884765625, -6.3851318359375, -6.081787109375, -5.7784423828125, -5.47509765625, -5.1717529296875, -4.868408203125, -4.5650634765625, -4.26171875, -3.9583740234375, -3.655029296875, -3.3516845703125, -3.04833984375, -2.7449951171875, -2.441650390625, -2.1383056640625, -1.8349609375, -1.5316162109375, -1.228271484375, -0.9249267578125, -0.62158203125, -0.3182373046875, -0.014892578125, 0.2884521484375, 0.591796875, 0.8951416015625, 1.198486328125, 1.5018310546875, 1.80517578125, 2.1085205078125, 2.411865234375, 2.7152099609375, 3.0185546875, 3.3218994140625, 3.625244140625, 3.9285888671875, 4.23193359375, 4.5352783203125, 4.838623046875, 5.1419677734375, 5.4453125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 9.0, 15.0, 24.0, 50.0, 61.0, 118.0, 154.0, 149.0, 141.0, 116.0, 88.0, 30.0, 19.0, 10.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.24507141113281, -61.54106140136719, -58.8370475769043, -56.13303756713867, -53.42902374267578, -50.725013732910156, -48.02100372314453, -45.316993713378906, -42.612979888916016, -39.90896987915039, -37.2049560546875, -34.500946044921875, -31.796934127807617, -29.09292221069336, -26.388912200927734, -23.684900283813477, -20.98088836669922, -18.27687644958496, -15.57286548614502, -12.868854522705078, -10.16484260559082, -7.4608306884765625, -4.7568206787109375, -2.0528087615966797, 0.6512031555175781, 3.3552145957946777, 6.059226036071777, 8.763236999511719, 11.467248916625977, 14.171260833740234, 16.87527084350586, 19.579282760620117, 22.283287048339844, 24.9872989654541, 27.69131088256836, 30.395320892333984, 33.099334716796875, 35.8033447265625, 38.507354736328125, 41.21136474609375, 43.91537857055664, 46.619388580322266, 49.323402404785156, 52.02741241455078, 54.731422424316406, 57.4354362487793, 60.13944625854492, 62.84346008300781, 65.54747009277344, 68.25148010253906, 70.95549011230469, 73.65950012207031, 76.36351776123047, 79.0675277709961, 81.77153778076172, 84.47554779052734, 87.1795654296875, 89.88357543945312, 92.58758544921875, 95.29159545898438, 97.99561309814453, 100.69962310791016, 103.40363311767578, 106.1076431274414, 108.81165313720703]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 11.0, 7.0, 11.0, 11.0, 17.0, 9.0, 21.0, 14.0, 24.0, 30.0, 20.0, 26.0, 31.0, 37.0, 26.0, 45.0, 40.0, 46.0, 41.0, 51.0, 38.0, 44.0, 34.0, 47.0, 43.0, 38.0, 35.0, 30.0, 27.0, 24.0, 26.0, 13.0, 15.0, 19.0, 13.0, 14.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-45.95240783691406, -44.49048614501953, -43.028564453125, -41.56664276123047, -40.10472106933594, -38.642799377441406, -37.180877685546875, -35.718955993652344, -34.25703430175781, -32.79511260986328, -31.33319091796875, -29.87126922607422, -28.409347534179688, -26.947425842285156, -25.485502243041992, -24.02358055114746, -22.561656951904297, -21.099735260009766, -19.637813568115234, -18.175891876220703, -16.713970184326172, -15.252047538757324, -13.790124893188477, -12.328203201293945, -10.866281509399414, -9.404359817504883, -7.942437648773193, -6.480515480041504, -5.018593788146973, -3.5566720962524414, -2.0947494506835938, -0.6328277587890625, 0.8290939331054688, 2.291015863418579, 3.7529377937316895, 5.214859962463379, 6.67678165435791, 8.138703346252441, 9.600625991821289, 11.06254768371582, 12.524469375610352, 13.986391067504883, 15.448312759399414, 16.910236358642578, 18.37215805053711, 19.83407974243164, 21.296001434326172, 22.757923126220703, 24.219844818115234, 25.681766510009766, 27.143688201904297, 28.605609893798828, 30.06753158569336, 31.52945327758789, 32.99137878417969, 34.45330047607422, 35.91522216796875, 37.37714385986328, 38.83906555175781, 40.300987243652344, 41.762908935546875, 43.224830627441406, 44.68675231933594, 46.14867401123047, 47.610595703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 16.0, 19.0, 13.0, 21.0, 38.0, 53.0, 97.0, 128.0, 231.0, 448.0, 816.0, 1871.0, 4566.0, 13702.0, 59008.0, 1347766.0, 2677360.0, 64570.0, 14760.0, 4771.0, 2019.0, 890.0, 419.0, 243.0, 132.0, 78.0, 60.0, 34.0, 33.0, 16.0, 18.0, 14.0, 14.0, 11.0, 5.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.8203125, -11.3480224609375, -10.875732421875, -10.4034423828125, -9.93115234375, -9.4588623046875, -8.986572265625, -8.5142822265625, -8.0419921875, -7.5697021484375, -7.097412109375, -6.6251220703125, -6.15283203125, -5.6805419921875, -5.208251953125, -4.7359619140625, -4.263671875, -3.7913818359375, -3.319091796875, -2.8468017578125, -2.37451171875, -1.9022216796875, -1.429931640625, -0.9576416015625, -0.4853515625, -0.0130615234375, 0.459228515625, 0.9315185546875, 1.40380859375, 1.8760986328125, 2.348388671875, 2.8206787109375, 3.29296875, 3.7652587890625, 4.237548828125, 4.7098388671875, 5.18212890625, 5.6544189453125, 6.126708984375, 6.5989990234375, 7.0712890625, 7.5435791015625, 8.015869140625, 8.4881591796875, 8.96044921875, 9.4327392578125, 9.905029296875, 10.3773193359375, 10.849609375, 11.3218994140625, 11.794189453125, 12.2664794921875, 12.73876953125, 13.2110595703125, 13.683349609375, 14.1556396484375, 14.6279296875, 15.1002197265625, 15.572509765625, 16.0447998046875, 16.51708984375, 16.9893798828125, 17.461669921875, 17.9339599609375, 18.40625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 18.0, 16.0, 21.0, 29.0, 27.0, 43.0, 52.0, 65.0, 60.0, 61.0, 93.0, 88.0, 87.0, 57.0, 54.0, 54.0, 49.0, 36.0, 25.0, 15.0, 18.0, 5.0, 10.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.98046875, -1.87030029296875, -1.7601318359375, -1.64996337890625, -1.539794921875, -1.42962646484375, -1.3194580078125, -1.20928955078125, -1.09912109375, -0.98895263671875, -0.8787841796875, -0.76861572265625, -0.658447265625, -0.54827880859375, -0.4381103515625, -0.32794189453125, -0.2177734375, -0.10760498046875, 0.0025634765625, 0.11273193359375, 0.222900390625, 0.33306884765625, 0.4432373046875, 0.55340576171875, 0.66357421875, 0.77374267578125, 0.8839111328125, 0.99407958984375, 1.104248046875, 1.21441650390625, 1.3245849609375, 1.43475341796875, 1.544921875, 1.65509033203125, 1.7652587890625, 1.87542724609375, 1.985595703125, 2.09576416015625, 2.2059326171875, 2.31610107421875, 2.42626953125, 2.53643798828125, 2.6466064453125, 2.75677490234375, 2.866943359375, 2.97711181640625, 3.0872802734375, 3.19744873046875, 3.3076171875, 3.41778564453125, 3.5279541015625, 3.63812255859375, 3.748291015625, 3.85845947265625, 3.9686279296875, 4.07879638671875, 4.18896484375, 4.29913330078125, 4.4093017578125, 4.51947021484375, 4.629638671875, 4.73980712890625, 4.8499755859375, 4.96014404296875, 5.0703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 1.0, 11.0, 14.0, 11.0, 17.0, 12.0, 18.0, 30.0, 29.0, 41.0, 41.0, 49.0, 70.0, 119.0, 243.0, 763.0, 6085.0, 159809.0, 3991105.0, 32452.0, 2382.0, 438.0, 154.0, 87.0, 78.0, 45.0, 37.0, 20.0, 22.0, 13.0, 20.0, 13.0, 12.0, 5.0, 8.0, 3.0, 3.0, 4.0, 0.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.46875, -26.498046875, -25.52734375, -24.556640625, -23.5859375, -22.615234375, -21.64453125, -20.673828125, -19.703125, -18.732421875, -17.76171875, -16.791015625, -15.8203125, -14.849609375, -13.87890625, -12.908203125, -11.9375, -10.966796875, -9.99609375, -9.025390625, -8.0546875, -7.083984375, -6.11328125, -5.142578125, -4.171875, -3.201171875, -2.23046875, -1.259765625, -0.2890625, 0.681640625, 1.65234375, 2.623046875, 3.59375, 4.564453125, 5.53515625, 6.505859375, 7.4765625, 8.447265625, 9.41796875, 10.388671875, 11.359375, 12.330078125, 13.30078125, 14.271484375, 15.2421875, 16.212890625, 17.18359375, 18.154296875, 19.125, 20.095703125, 21.06640625, 22.037109375, 23.0078125, 23.978515625, 24.94921875, 25.919921875, 26.890625, 27.861328125, 28.83203125, 29.802734375, 30.7734375, 31.744140625, 32.71484375, 33.685546875, 34.65625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 8.0, 16.0, 44.0, 124.0, 600.0, 2758.0, 369.0, 99.0, 37.0, 14.0, 7.0, 4.0, 1.0, 2.0, 1.0], "bins": [-22.046875, -21.641204833984375, -21.23553466796875, -20.829864501953125, -20.4241943359375, -20.018524169921875, -19.61285400390625, -19.207183837890625, -18.801513671875, -18.395843505859375, -17.99017333984375, -17.584503173828125, -17.1788330078125, -16.773162841796875, -16.36749267578125, -15.961822509765625, -15.55615234375, -15.150482177734375, -14.74481201171875, -14.339141845703125, -13.9334716796875, -13.527801513671875, -13.12213134765625, -12.716461181640625, -12.310791015625, -11.905120849609375, -11.49945068359375, -11.093780517578125, -10.6881103515625, -10.282440185546875, -9.87677001953125, -9.471099853515625, -9.0654296875, -8.659759521484375, -8.25408935546875, -7.848419189453125, -7.4427490234375, -7.037078857421875, -6.63140869140625, -6.225738525390625, -5.820068359375, -5.414398193359375, -5.00872802734375, -4.603057861328125, -4.1973876953125, -3.791717529296875, -3.38604736328125, -2.980377197265625, -2.57470703125, -2.169036865234375, -1.76336669921875, -1.357696533203125, -0.9520263671875, -0.546356201171875, -0.14068603515625, 0.264984130859375, 0.670654296875, 1.076324462890625, 1.48199462890625, 1.887664794921875, 2.2933349609375, 2.699005126953125, 3.10467529296875, 3.510345458984375, 3.916015625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 10.0, 7.0, 17.0, 22.0, 45.0, 58.0, 111.0, 137.0, 166.0, 126.0, 114.0, 69.0, 49.0, 20.0, 21.0, 8.0, 5.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-34.04656982421875, -33.05360794067383, -32.06064987182617, -31.067689895629883, -30.074729919433594, -29.081769943237305, -28.088809967041016, -27.095848083496094, -26.102890014648438, -25.10993003845215, -24.11697006225586, -23.12401008605957, -22.13105010986328, -21.138090133666992, -20.145130157470703, -19.15216827392578, -18.159208297729492, -17.166248321533203, -16.173288345336914, -15.180328369140625, -14.187368392944336, -13.194408416748047, -12.201447486877441, -11.208487510681152, -10.215527534484863, -9.222567558288574, -8.229607582092285, -7.236647129058838, -6.243687152862549, -5.25072717666626, -4.2577667236328125, -3.2648067474365234, -2.2718467712402344, -1.2788866758346558, -0.28592658042907715, 0.707033634185791, 1.69999361038208, 2.692953586578369, 3.6859140396118164, 4.6788740158081055, 5.6718339920043945, 6.664793968200684, 7.657753944396973, 8.650714874267578, 9.643674850463867, 10.636634826660156, 11.629594802856445, 12.622554779052734, 13.615514755249023, 14.608474731445312, 15.601434707641602, 16.59439468383789, 17.58735466003418, 18.58031463623047, 19.57327651977539, 20.566234588623047, 21.55919647216797, 22.552156448364258, 23.545116424560547, 24.538076400756836, 25.531036376953125, 26.523996353149414, 27.516956329345703, 28.509918212890625, 29.50287628173828]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 10.0, 10.0, 22.0, 23.0, 46.0, 47.0, 59.0, 59.0, 74.0, 85.0, 80.0, 81.0, 71.0, 72.0, 53.0, 58.0, 38.0, 25.0, 27.0, 18.0, 17.0, 11.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.086515426635742, -20.235530853271484, -19.38454818725586, -18.5335636138916, -17.682579040527344, -16.831594467163086, -15.980610847473145, -15.129627227783203, -14.278642654418945, -13.427658081054688, -12.576674461364746, -11.725690841674805, -10.874706268310547, -10.023721694946289, -9.172738075256348, -8.321754455566406, -7.470769882202148, -6.619785785675049, -5.768801689147949, -4.91781759262085, -4.06683349609375, -3.2158493995666504, -2.364865303039551, -1.5138812065124512, -0.6628971099853516, 0.18808698654174805, 1.0390710830688477, 1.8900551795959473, 2.741039276123047, 3.5920233726501465, 4.443007469177246, 5.293991565704346, 6.144977569580078, 6.995961666107178, 7.846945762634277, 8.697929382324219, 9.548913955688477, 10.399898529052734, 11.250882148742676, 12.101865768432617, 12.952850341796875, 13.803834915161133, 14.654818534851074, 15.505802154541016, 16.356786727905273, 17.20777130126953, 18.058753967285156, 18.909738540649414, 19.760723114013672, 20.61170768737793, 21.462692260742188, 22.313674926757812, 23.16465950012207, 24.015644073486328, 24.866626739501953, 25.71761131286621, 26.56859588623047, 27.419580459594727, 28.270565032958984, 29.12154769897461, 29.972532272338867, 30.823516845703125, 31.67449951171875, 32.52548599243164, 33.376468658447266]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 11.0, 12.0, 9.0, 13.0, 20.0, 23.0, 26.0, 42.0, 73.0, 115.0, 208.0, 377.0, 705.0, 1495.0, 4150.0, 12972.0, 49136.0, 229694.0, 558365.0, 143388.0, 32947.0, 9144.0, 3045.0, 1181.0, 552.0, 324.0, 153.0, 100.0, 91.0, 54.0, 36.0, 23.0, 18.0, 16.0, 12.0, 1.0, 4.0, 0.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-12.9375, -12.52490234375, -12.1123046875, -11.69970703125, -11.287109375, -10.87451171875, -10.4619140625, -10.04931640625, -9.63671875, -9.22412109375, -8.8115234375, -8.39892578125, -7.986328125, -7.57373046875, -7.1611328125, -6.74853515625, -6.3359375, -5.92333984375, -5.5107421875, -5.09814453125, -4.685546875, -4.27294921875, -3.8603515625, -3.44775390625, -3.03515625, -2.62255859375, -2.2099609375, -1.79736328125, -1.384765625, -0.97216796875, -0.5595703125, -0.14697265625, 0.265625, 0.67822265625, 1.0908203125, 1.50341796875, 1.916015625, 2.32861328125, 2.7412109375, 3.15380859375, 3.56640625, 3.97900390625, 4.3916015625, 4.80419921875, 5.216796875, 5.62939453125, 6.0419921875, 6.45458984375, 6.8671875, 7.27978515625, 7.6923828125, 8.10498046875, 8.517578125, 8.93017578125, 9.3427734375, 9.75537109375, 10.16796875, 10.58056640625, 10.9931640625, 11.40576171875, 11.818359375, 12.23095703125, 12.6435546875, 13.05615234375, 13.46875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 4.0, 9.0, 8.0, 9.0, 6.0, 23.0, 20.0, 32.0, 25.0, 39.0, 46.0, 59.0, 45.0, 63.0, 77.0, 69.0, 74.0, 62.0, 50.0, 54.0, 50.0, 43.0, 29.0, 27.0, 17.0, 17.0, 17.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.96875, -1.8675537109375, -1.766357421875, -1.6651611328125, -1.56396484375, -1.4627685546875, -1.361572265625, -1.2603759765625, -1.1591796875, -1.0579833984375, -0.956787109375, -0.8555908203125, -0.75439453125, -0.6531982421875, -0.552001953125, -0.4508056640625, -0.349609375, -0.2484130859375, -0.147216796875, -0.0460205078125, 0.05517578125, 0.1563720703125, 0.257568359375, 0.3587646484375, 0.4599609375, 0.5611572265625, 0.662353515625, 0.7635498046875, 0.86474609375, 0.9659423828125, 1.067138671875, 1.1683349609375, 1.26953125, 1.3707275390625, 1.471923828125, 1.5731201171875, 1.67431640625, 1.7755126953125, 1.876708984375, 1.9779052734375, 2.0791015625, 2.1802978515625, 2.281494140625, 2.3826904296875, 2.48388671875, 2.5850830078125, 2.686279296875, 2.7874755859375, 2.888671875, 2.9898681640625, 3.091064453125, 3.1922607421875, 3.29345703125, 3.3946533203125, 3.495849609375, 3.5970458984375, 3.6982421875, 3.7994384765625, 3.900634765625, 4.0018310546875, 4.10302734375, 4.2042236328125, 4.305419921875, 4.4066162109375, 4.5078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 9.0, 16.0, 23.0, 29.0, 24.0, 44.0, 50.0, 76.0, 105.0, 199.0, 325.0, 548.0, 1049.0, 2437.0, 7120.0, 23413.0, 89766.0, 408219.0, 393734.0, 86800.0, 22787.0, 6856.0, 2443.0, 1117.0, 510.0, 272.0, 184.0, 114.0, 85.0, 62.0, 39.0, 24.0, 17.0, 13.0, 8.0, 5.0, 1.0, 4.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.0380859375, -7.740234375, -7.4423828125, -7.14453125, -6.8466796875, -6.548828125, -6.2509765625, -5.953125, -5.6552734375, -5.357421875, -5.0595703125, -4.76171875, -4.4638671875, -4.166015625, -3.8681640625, -3.5703125, -3.2724609375, -2.974609375, -2.6767578125, -2.37890625, -2.0810546875, -1.783203125, -1.4853515625, -1.1875, -0.8896484375, -0.591796875, -0.2939453125, 0.00390625, 0.3017578125, 0.599609375, 0.8974609375, 1.1953125, 1.4931640625, 1.791015625, 2.0888671875, 2.38671875, 2.6845703125, 2.982421875, 3.2802734375, 3.578125, 3.8759765625, 4.173828125, 4.4716796875, 4.76953125, 5.0673828125, 5.365234375, 5.6630859375, 5.9609375, 6.2587890625, 6.556640625, 6.8544921875, 7.15234375, 7.4501953125, 7.748046875, 8.0458984375, 8.34375, 8.6416015625, 8.939453125, 9.2373046875, 9.53515625, 9.8330078125, 10.130859375, 10.4287109375, 10.7265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 1.0, 1.0, 7.0, 7.0, 15.0, 10.0, 7.0, 12.0, 20.0, 20.0, 30.0, 44.0, 40.0, 43.0, 39.0, 45.0, 44.0, 53.0, 53.0, 47.0, 55.0, 52.0, 38.0, 44.0, 35.0, 42.0, 44.0, 27.0, 22.0, 25.0, 22.0, 16.0, 9.0, 5.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.9140625, -9.60888671875, -9.3037109375, -8.99853515625, -8.693359375, -8.38818359375, -8.0830078125, -7.77783203125, -7.47265625, -7.16748046875, -6.8623046875, -6.55712890625, -6.251953125, -5.94677734375, -5.6416015625, -5.33642578125, -5.03125, -4.72607421875, -4.4208984375, -4.11572265625, -3.810546875, -3.50537109375, -3.2001953125, -2.89501953125, -2.58984375, -2.28466796875, -1.9794921875, -1.67431640625, -1.369140625, -1.06396484375, -0.7587890625, -0.45361328125, -0.1484375, 0.15673828125, 0.4619140625, 0.76708984375, 1.072265625, 1.37744140625, 1.6826171875, 1.98779296875, 2.29296875, 2.59814453125, 2.9033203125, 3.20849609375, 3.513671875, 3.81884765625, 4.1240234375, 4.42919921875, 4.734375, 5.03955078125, 5.3447265625, 5.64990234375, 5.955078125, 6.26025390625, 6.5654296875, 6.87060546875, 7.17578125, 7.48095703125, 7.7861328125, 8.09130859375, 8.396484375, 8.70166015625, 9.0068359375, 9.31201171875, 9.6171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 10.0, 26.0, 21.0, 41.0, 53.0, 86.0, 144.0, 296.0, 523.0, 1095.0, 2378.0, 5932.0, 18359.0, 99352.0, 764959.0, 123043.0, 20880.0, 6298.0, 2545.0, 1185.0, 547.0, 344.0, 164.0, 103.0, 63.0, 33.0, 26.0, 14.0, 8.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.62890625, -4.45452880859375, -4.2801513671875, -4.10577392578125, -3.931396484375, -3.75701904296875, -3.5826416015625, -3.40826416015625, -3.23388671875, -3.05950927734375, -2.8851318359375, -2.71075439453125, -2.536376953125, -2.36199951171875, -2.1876220703125, -2.01324462890625, -1.8388671875, -1.66448974609375, -1.4901123046875, -1.31573486328125, -1.141357421875, -0.96697998046875, -0.7926025390625, -0.61822509765625, -0.44384765625, -0.26947021484375, -0.0950927734375, 0.07928466796875, 0.253662109375, 0.42803955078125, 0.6024169921875, 0.77679443359375, 0.951171875, 1.12554931640625, 1.2999267578125, 1.47430419921875, 1.648681640625, 1.82305908203125, 1.9974365234375, 2.17181396484375, 2.34619140625, 2.52056884765625, 2.6949462890625, 2.86932373046875, 3.043701171875, 3.21807861328125, 3.3924560546875, 3.56683349609375, 3.7412109375, 3.91558837890625, 4.0899658203125, 4.26434326171875, 4.438720703125, 4.61309814453125, 4.7874755859375, 4.96185302734375, 5.13623046875, 5.31060791015625, 5.4849853515625, 5.65936279296875, 5.833740234375, 6.00811767578125, 6.1824951171875, 6.35687255859375, 6.53125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 12.0, 17.0, 22.0, 23.0, 60.0, 187.0, 419.0, 120.0, 46.0, 19.0, 25.0, 13.0, 15.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017833709716796875, -0.001738041639328003, -0.0016927123069763184, -0.0016473829746246338, -0.0016020536422729492, -0.0015567243099212646, -0.00151139497756958, -0.0014660656452178955, -0.001420736312866211, -0.0013754069805145264, -0.0013300776481628418, -0.0012847483158111572, -0.0012394189834594727, -0.001194089651107788, -0.0011487603187561035, -0.001103430986404419, -0.0010581016540527344, -0.0010127723217010498, -0.0009674429893493652, -0.0009221136569976807, -0.0008767843246459961, -0.0008314549922943115, -0.000786125659942627, -0.0007407963275909424, -0.0006954669952392578, -0.0006501376628875732, -0.0006048083305358887, -0.0005594789981842041, -0.0005141496658325195, -0.00046882033348083496, -0.0004234910011291504, -0.0003781616687774658, -0.00033283233642578125, -0.0002875030040740967, -0.0002421736717224121, -0.00019684433937072754, -0.00015151500701904297, -0.0001061856746673584, -6.085634231567383e-05, -1.5527009963989258e-05, 2.9802322387695312e-05, 7.513165473937988e-05, 0.00012046098709106445, 0.00016579031944274902, 0.0002111196517944336, 0.00025644898414611816, 0.00030177831649780273, 0.0003471076488494873, 0.0003924369812011719, 0.00043776631355285645, 0.000483095645904541, 0.0005284249782562256, 0.0005737543106079102, 0.0006190836429595947, 0.0006644129753112793, 0.0007097423076629639, 0.0007550716400146484, 0.000800400972366333, 0.0008457303047180176, 0.0008910596370697021, 0.0009363889694213867, 0.0009817183017730713, 0.0010270476341247559, 0.0010723769664764404, 0.001117706298828125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 14.0, 16.0, 13.0, 21.0, 63.0, 88.0, 144.0, 247.0, 434.0, 892.0, 2063.0, 5182.0, 18525.0, 156393.0, 797410.0, 50790.0, 10037.0, 3300.0, 1417.0, 652.0, 350.0, 192.0, 113.0, 63.0, 48.0, 29.0, 20.0, 5.0, 7.0, 8.0, 8.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.68359375, -7.4658203125, -7.248046875, -7.0302734375, -6.8125, -6.5947265625, -6.376953125, -6.1591796875, -5.94140625, -5.7236328125, -5.505859375, -5.2880859375, -5.0703125, -4.8525390625, -4.634765625, -4.4169921875, -4.19921875, -3.9814453125, -3.763671875, -3.5458984375, -3.328125, -3.1103515625, -2.892578125, -2.6748046875, -2.45703125, -2.2392578125, -2.021484375, -1.8037109375, -1.5859375, -1.3681640625, -1.150390625, -0.9326171875, -0.71484375, -0.4970703125, -0.279296875, -0.0615234375, 0.15625, 0.3740234375, 0.591796875, 0.8095703125, 1.02734375, 1.2451171875, 1.462890625, 1.6806640625, 1.8984375, 2.1162109375, 2.333984375, 2.5517578125, 2.76953125, 2.9873046875, 3.205078125, 3.4228515625, 3.640625, 3.8583984375, 4.076171875, 4.2939453125, 4.51171875, 4.7294921875, 4.947265625, 5.1650390625, 5.3828125, 5.6005859375, 5.818359375, 6.0361328125, 6.25390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 7.0, 7.0, 18.0, 20.0, 35.0, 55.0, 99.0, 200.0, 224.0, 137.0, 78.0, 39.0, 25.0, 15.0, 11.0, 5.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.703125, -6.488037109375, -6.27294921875, -6.057861328125, -5.8427734375, -5.627685546875, -5.41259765625, -5.197509765625, -4.982421875, -4.767333984375, -4.55224609375, -4.337158203125, -4.1220703125, -3.906982421875, -3.69189453125, -3.476806640625, -3.26171875, -3.046630859375, -2.83154296875, -2.616455078125, -2.4013671875, -2.186279296875, -1.97119140625, -1.756103515625, -1.541015625, -1.325927734375, -1.11083984375, -0.895751953125, -0.6806640625, -0.465576171875, -0.25048828125, -0.035400390625, 0.1796875, 0.394775390625, 0.60986328125, 0.824951171875, 1.0400390625, 1.255126953125, 1.47021484375, 1.685302734375, 1.900390625, 2.115478515625, 2.33056640625, 2.545654296875, 2.7607421875, 2.975830078125, 3.19091796875, 3.406005859375, 3.62109375, 3.836181640625, 4.05126953125, 4.266357421875, 4.4814453125, 4.696533203125, 4.91162109375, 5.126708984375, 5.341796875, 5.556884765625, 5.77197265625, 5.987060546875, 6.2021484375, 6.417236328125, 6.63232421875, 6.847412109375, 7.0625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 11.0, 31.0, 66.0, 103.0, 186.0, 211.0, 189.0, 102.0, 50.0, 27.0, 16.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.35700607299805, -56.31415939331055, -53.27131271362305, -50.22846603393555, -47.18561935424805, -44.14277267456055, -41.09992218017578, -38.05707550048828, -35.01422882080078, -31.97138214111328, -28.92853546142578, -25.88568878173828, -22.84284210205078, -19.79999542236328, -16.75714683532715, -13.714300155639648, -10.671455383300781, -7.628608703613281, -4.585761547088623, -1.5429143905639648, 1.4999322891235352, 4.542778968811035, 7.585626602172852, 10.628473281860352, 13.671319961547852, 16.71416664123535, 19.75701332092285, 22.799861907958984, 25.842708587646484, 28.885555267333984, 31.928401947021484, 34.971248626708984, 38.01409149169922, 41.05693817138672, 44.09978485107422, 47.14263153076172, 50.18547821044922, 53.22832489013672, 56.27117156982422, 59.31401824951172, 62.35686492919922, 65.39971160888672, 68.44255828857422, 71.48540496826172, 74.52825164794922, 77.57109832763672, 80.61394500732422, 83.65679168701172, 86.69964599609375, 89.74249267578125, 92.78533935546875, 95.82818603515625, 98.87103271484375, 101.91387939453125, 104.95672607421875, 107.99957275390625, 111.04241943359375, 114.08526611328125, 117.12811279296875, 120.17095947265625, 123.21380615234375, 126.25665283203125, 129.29949951171875, 132.34234619140625, 135.38519287109375]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 5.0, 5.0, 11.0, 15.0, 13.0, 13.0, 17.0, 16.0, 22.0, 21.0, 27.0, 29.0, 29.0, 25.0, 33.0, 35.0, 35.0, 50.0, 38.0, 37.0, 48.0, 34.0, 46.0, 39.0, 36.0, 39.0, 27.0, 28.0, 22.0, 18.0, 23.0, 19.0, 19.0, 14.0, 17.0, 17.0, 14.0, 9.0, 14.0, 8.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.96068572998047, -34.733070373535156, -33.505455017089844, -32.27783966064453, -31.05022430419922, -29.822608947753906, -28.594995498657227, -27.367380142211914, -26.1397647857666, -24.91214942932129, -23.684534072875977, -22.456918716430664, -21.229305267333984, -20.001689910888672, -18.77407455444336, -17.546459197998047, -16.318843841552734, -15.091228485107422, -13.86361312866211, -12.635998725891113, -11.4083833694458, -10.180768013000488, -8.953153610229492, -7.72553825378418, -6.497922897338867, -5.270307540893555, -4.0426926612854, -2.815077543258667, -1.5874624252319336, -0.3598470687866211, 0.8677678108215332, 2.0953826904296875, 3.3229942321777344, 4.550609588623047, 5.778224468231201, 7.0058393478393555, 8.233454704284668, 9.46107006072998, 10.688684463500977, 11.916299819946289, 13.143915176391602, 14.371530532836914, 15.599145889282227, 16.82676124572754, 18.05437469482422, 19.28199005126953, 20.509605407714844, 21.737220764160156, 22.96483612060547, 24.19245147705078, 25.420066833496094, 26.647682189941406, 27.87529754638672, 29.10291290283203, 30.33052635192871, 31.558141708374023, 32.78575897216797, 34.01337432861328, 35.240989685058594, 36.468605041503906, 37.69622039794922, 38.92383575439453, 40.151451110839844, 41.379066467285156, 42.6066780090332]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 20.0, 24.0, 29.0, 57.0, 104.0, 157.0, 250.0, 496.0, 1110.0, 2851.0, 8522.0, 38186.0, 2360029.0, 1731258.0, 37887.0, 8419.0, 2705.0, 1029.0, 475.0, 241.0, 134.0, 92.0, 49.0, 47.0, 28.0, 21.0, 11.0, 18.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.244140625, -18.50390625, -17.763671875, -17.0234375, -16.283203125, -15.54296875, -14.802734375, -14.0625, -13.322265625, -12.58203125, -11.841796875, -11.1015625, -10.361328125, -9.62109375, -8.880859375, -8.140625, -7.400390625, -6.66015625, -5.919921875, -5.1796875, -4.439453125, -3.69921875, -2.958984375, -2.21875, -1.478515625, -0.73828125, 0.001953125, 0.7421875, 1.482421875, 2.22265625, 2.962890625, 3.703125, 4.443359375, 5.18359375, 5.923828125, 6.6640625, 7.404296875, 8.14453125, 8.884765625, 9.625, 10.365234375, 11.10546875, 11.845703125, 12.5859375, 13.326171875, 14.06640625, 14.806640625, 15.546875, 16.287109375, 17.02734375, 17.767578125, 18.5078125, 19.248046875, 19.98828125, 20.728515625, 21.46875, 22.208984375, 22.94921875, 23.689453125, 24.4296875, 25.169921875, 25.91015625, 26.650390625, 27.390625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 6.0, 3.0, 4.0, 7.0, 10.0, 11.0, 11.0, 19.0, 21.0, 28.0, 21.0, 31.0, 43.0, 54.0, 59.0, 69.0, 72.0, 54.0, 50.0, 63.0, 55.0, 61.0, 58.0, 45.0, 29.0, 26.0, 31.0, 13.0, 12.0, 15.0, 13.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0703125, -1.9703369140625, -1.870361328125, -1.7703857421875, -1.67041015625, -1.5704345703125, -1.470458984375, -1.3704833984375, -1.2705078125, -1.1705322265625, -1.070556640625, -0.9705810546875, -0.87060546875, -0.7706298828125, -0.670654296875, -0.5706787109375, -0.470703125, -0.3707275390625, -0.270751953125, -0.1707763671875, -0.07080078125, 0.0291748046875, 0.129150390625, 0.2291259765625, 0.3291015625, 0.4290771484375, 0.529052734375, 0.6290283203125, 0.72900390625, 0.8289794921875, 0.928955078125, 1.0289306640625, 1.12890625, 1.2288818359375, 1.328857421875, 1.4288330078125, 1.52880859375, 1.6287841796875, 1.728759765625, 1.8287353515625, 1.9287109375, 2.0286865234375, 2.128662109375, 2.2286376953125, 2.32861328125, 2.4285888671875, 2.528564453125, 2.6285400390625, 2.728515625, 2.8284912109375, 2.928466796875, 3.0284423828125, 3.12841796875, 3.2283935546875, 3.328369140625, 3.4283447265625, 3.5283203125, 3.6282958984375, 3.728271484375, 3.8282470703125, 3.92822265625, 4.0281982421875, 4.128173828125, 4.2281494140625, 4.328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 12.0, 4.0, 7.0, 11.0, 24.0, 22.0, 28.0, 50.0, 74.0, 92.0, 142.0, 229.0, 376.0, 578.0, 1150.0, 2455.0, 5499.0, 14449.0, 44892.0, 226370.0, 3574632.0, 249919.0, 47442.0, 14829.0, 5799.0, 2453.0, 1111.0, 580.0, 393.0, 219.0, 124.0, 95.0, 52.0, 49.0, 33.0, 24.0, 24.0, 14.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796875, -10.4183349609375, -10.039794921875, -9.6612548828125, -9.28271484375, -8.9041748046875, -8.525634765625, -8.1470947265625, -7.7685546875, -7.3900146484375, -7.011474609375, -6.6329345703125, -6.25439453125, -5.8758544921875, -5.497314453125, -5.1187744140625, -4.740234375, -4.3616943359375, -3.983154296875, -3.6046142578125, -3.22607421875, -2.8475341796875, -2.468994140625, -2.0904541015625, -1.7119140625, -1.3333740234375, -0.954833984375, -0.5762939453125, -0.19775390625, 0.1807861328125, 0.559326171875, 0.9378662109375, 1.31640625, 1.6949462890625, 2.073486328125, 2.4520263671875, 2.83056640625, 3.2091064453125, 3.587646484375, 3.9661865234375, 4.3447265625, 4.7232666015625, 5.101806640625, 5.4803466796875, 5.85888671875, 6.2374267578125, 6.615966796875, 6.9945068359375, 7.373046875, 7.7515869140625, 8.130126953125, 8.5086669921875, 8.88720703125, 9.2657470703125, 9.644287109375, 10.0228271484375, 10.4013671875, 10.7799072265625, 11.158447265625, 11.5369873046875, 11.91552734375, 12.2940673828125, 12.672607421875, 13.0511474609375, 13.4296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 4.0, 3.0, 7.0, 4.0, 11.0, 7.0, 13.0, 19.0, 25.0, 29.0, 36.0, 64.0, 120.0, 206.0, 581.0, 2133.0, 402.0, 141.0, 83.0, 56.0, 37.0, 25.0, 29.0, 11.0, 4.0, 3.0, 8.0, 3.0, 6.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.37298583984375, -4.2069091796875, -4.04083251953125, -3.874755859375, -3.70867919921875, -3.5426025390625, -3.37652587890625, -3.21044921875, -3.04437255859375, -2.8782958984375, -2.71221923828125, -2.546142578125, -2.38006591796875, -2.2139892578125, -2.04791259765625, -1.8818359375, -1.71575927734375, -1.5496826171875, -1.38360595703125, -1.217529296875, -1.05145263671875, -0.8853759765625, -0.71929931640625, -0.55322265625, -0.38714599609375, -0.2210693359375, -0.05499267578125, 0.111083984375, 0.27716064453125, 0.4432373046875, 0.60931396484375, 0.775390625, 0.94146728515625, 1.1075439453125, 1.27362060546875, 1.439697265625, 1.60577392578125, 1.7718505859375, 1.93792724609375, 2.10400390625, 2.27008056640625, 2.4361572265625, 2.60223388671875, 2.768310546875, 2.93438720703125, 3.1004638671875, 3.26654052734375, 3.4326171875, 3.59869384765625, 3.7647705078125, 3.93084716796875, 4.096923828125, 4.26300048828125, 4.4290771484375, 4.59515380859375, 4.76123046875, 4.92730712890625, 5.0933837890625, 5.25946044921875, 5.425537109375, 5.59161376953125, 5.7576904296875, 5.92376708984375, 6.08984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 9.0, 4.0, 19.0, 26.0, 82.0, 164.0, 226.0, 182.0, 153.0, 69.0, 29.0, 17.0, 8.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.158531188964844, -52.764747619628906, -51.37096405029297, -49.977176666259766, -48.58339309692383, -47.18960952758789, -45.79582595825195, -44.40203857421875, -43.00825500488281, -41.614471435546875, -40.22068786621094, -38.826900482177734, -37.4331169128418, -36.03933334350586, -34.64554977416992, -33.25176239013672, -31.857980728149414, -30.464197158813477, -29.070411682128906, -27.67662811279297, -26.2828426361084, -24.88905906677246, -23.49527359008789, -22.101490020751953, -20.707706451416016, -19.313922882080078, -17.920137405395508, -16.52635383605957, -15.132568359375, -13.738784790039062, -12.345000267028809, -10.951215744018555, -9.557430267333984, -8.16364574432373, -6.769861221313477, -5.376077175140381, -3.982292652130127, -2.588508129119873, -1.1947240829467773, 0.19906044006347656, 1.5928449630737305, 2.9866294860839844, 4.380414009094238, 5.774198055267334, 7.167982578277588, 8.561767578125, 9.955551147460938, 11.349335670471191, 12.743120193481445, 14.1369047164917, 15.530689239501953, 16.92447280883789, 18.31825828552246, 19.7120418548584, 21.10582733154297, 22.499610900878906, 23.893394470214844, 25.28717803955078, 26.68096351623535, 28.07474708557129, 29.46853256225586, 30.862316131591797, 32.256099700927734, 33.64988708496094, 35.043670654296875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 7.0, 10.0, 18.0, 20.0, 25.0, 38.0, 40.0, 49.0, 62.0, 60.0, 69.0, 84.0, 78.0, 79.0, 73.0, 67.0, 49.0, 33.0, 42.0, 29.0, 25.0, 21.0, 11.0, 8.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.885009765625, -23.145307540893555, -22.40560531616211, -21.665904998779297, -20.92620277404785, -20.186500549316406, -19.44679832458496, -18.707096099853516, -17.967395782470703, -17.227693557739258, -16.487991333007812, -15.748290061950684, -15.008588790893555, -14.26888656616211, -13.529184341430664, -12.789482116699219, -12.049779891967773, -11.310077667236328, -10.5703763961792, -9.830674171447754, -9.090972900390625, -8.35127067565918, -7.611568450927734, -6.871866703033447, -6.13216495513916, -5.392463207244873, -4.652761459350586, -3.9130592346191406, -3.1733574867248535, -2.4336557388305664, -1.693953514099121, -0.954251766204834, -0.2145519256591797, 0.525149941444397, 1.2648518085479736, 2.00455379486084, 2.744255542755127, 3.483957290649414, 4.223659515380859, 4.9633612632751465, 5.703063011169434, 6.442764759063721, 7.182466506958008, 7.922168731689453, 8.661870956420898, 9.401572227478027, 10.141274452209473, 10.880975723266602, 11.620677947998047, 12.360380172729492, 13.100081443786621, 13.839783668518066, 14.579484939575195, 15.31918716430664, 16.058889389038086, 16.79859161376953, 17.538291931152344, 18.27799415588379, 19.017696380615234, 19.757396697998047, 20.497098922729492, 21.236801147460938, 21.976503372192383, 22.716205596923828, 23.455907821655273]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 12.0, 18.0, 20.0, 36.0, 52.0, 80.0, 228.0, 350.0, 746.0, 1685.0, 4679.0, 14670.0, 56988.0, 235418.0, 499125.0, 174690.0, 41671.0, 11463.0, 3769.0, 1440.0, 616.0, 336.0, 192.0, 104.0, 38.0, 38.0, 21.0, 16.0, 6.0, 7.0, 7.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.3125, -16.861572265625, -16.41064453125, -15.959716796875, -15.5087890625, -15.057861328125, -14.60693359375, -14.156005859375, -13.705078125, -13.254150390625, -12.80322265625, -12.352294921875, -11.9013671875, -11.450439453125, -10.99951171875, -10.548583984375, -10.09765625, -9.646728515625, -9.19580078125, -8.744873046875, -8.2939453125, -7.843017578125, -7.39208984375, -6.941162109375, -6.490234375, -6.039306640625, -5.58837890625, -5.137451171875, -4.6865234375, -4.235595703125, -3.78466796875, -3.333740234375, -2.8828125, -2.431884765625, -1.98095703125, -1.530029296875, -1.0791015625, -0.628173828125, -0.17724609375, 0.273681640625, 0.724609375, 1.175537109375, 1.62646484375, 2.077392578125, 2.5283203125, 2.979248046875, 3.43017578125, 3.881103515625, 4.33203125, 4.782958984375, 5.23388671875, 5.684814453125, 6.1357421875, 6.586669921875, 7.03759765625, 7.488525390625, 7.939453125, 8.390380859375, 8.84130859375, 9.292236328125, 9.7431640625, 10.194091796875, 10.64501953125, 11.095947265625, 11.546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 7.0, 11.0, 8.0, 13.0, 9.0, 8.0, 23.0, 23.0, 25.0, 33.0, 36.0, 34.0, 56.0, 64.0, 59.0, 57.0, 71.0, 51.0, 60.0, 60.0, 41.0, 55.0, 35.0, 32.0, 39.0, 22.0, 25.0, 11.0, 11.0, 6.0, 12.0, 3.0, 8.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.9215087890625, -1.823486328125, -1.7254638671875, -1.62744140625, -1.5294189453125, -1.431396484375, -1.3333740234375, -1.2353515625, -1.1373291015625, -1.039306640625, -0.9412841796875, -0.84326171875, -0.7452392578125, -0.647216796875, -0.5491943359375, -0.451171875, -0.3531494140625, -0.255126953125, -0.1571044921875, -0.05908203125, 0.0389404296875, 0.136962890625, 0.2349853515625, 0.3330078125, 0.4310302734375, 0.529052734375, 0.6270751953125, 0.72509765625, 0.8231201171875, 0.921142578125, 1.0191650390625, 1.1171875, 1.2152099609375, 1.313232421875, 1.4112548828125, 1.50927734375, 1.6072998046875, 1.705322265625, 1.8033447265625, 1.9013671875, 1.9993896484375, 2.097412109375, 2.1954345703125, 2.29345703125, 2.3914794921875, 2.489501953125, 2.5875244140625, 2.685546875, 2.7835693359375, 2.881591796875, 2.9796142578125, 3.07763671875, 3.1756591796875, 3.273681640625, 3.3717041015625, 3.4697265625, 3.5677490234375, 3.665771484375, 3.7637939453125, 3.86181640625, 3.9598388671875, 4.057861328125, 4.1558837890625, 4.25390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 1.0, 5.0, 6.0, 11.0, 15.0, 11.0, 22.0, 34.0, 38.0, 44.0, 70.0, 99.0, 149.0, 197.0, 302.0, 525.0, 870.0, 2011.0, 6559.0, 31023.0, 202904.0, 620667.0, 150272.0, 23587.0, 5200.0, 1744.0, 810.0, 445.0, 285.0, 194.0, 108.0, 94.0, 75.0, 43.0, 36.0, 31.0, 19.0, 11.0, 10.0, 11.0, 8.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.9609375, -14.5133056640625, -14.065673828125, -13.6180419921875, -13.17041015625, -12.7227783203125, -12.275146484375, -11.8275146484375, -11.3798828125, -10.9322509765625, -10.484619140625, -10.0369873046875, -9.58935546875, -9.1417236328125, -8.694091796875, -8.2464599609375, -7.798828125, -7.3511962890625, -6.903564453125, -6.4559326171875, -6.00830078125, -5.5606689453125, -5.113037109375, -4.6654052734375, -4.2177734375, -3.7701416015625, -3.322509765625, -2.8748779296875, -2.42724609375, -1.9796142578125, -1.531982421875, -1.0843505859375, -0.63671875, -0.1890869140625, 0.258544921875, 0.7061767578125, 1.15380859375, 1.6014404296875, 2.049072265625, 2.4967041015625, 2.9443359375, 3.3919677734375, 3.839599609375, 4.2872314453125, 4.73486328125, 5.1824951171875, 5.630126953125, 6.0777587890625, 6.525390625, 6.9730224609375, 7.420654296875, 7.8682861328125, 8.31591796875, 8.7635498046875, 9.211181640625, 9.6588134765625, 10.1064453125, 10.5540771484375, 11.001708984375, 11.4493408203125, 11.89697265625, 12.3446044921875, 12.792236328125, 13.2398681640625, 13.6875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 5.0, 4.0, 3.0, 8.0, 7.0, 6.0, 14.0, 13.0, 19.0, 23.0, 37.0, 32.0, 35.0, 24.0, 42.0, 44.0, 36.0, 45.0, 54.0, 46.0, 52.0, 52.0, 42.0, 42.0, 38.0, 45.0, 40.0, 30.0, 27.0, 23.0, 17.0, 14.0, 15.0, 15.0, 9.0, 5.0, 8.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.5390625, -11.2000732421875, -10.861083984375, -10.5220947265625, -10.18310546875, -9.8441162109375, -9.505126953125, -9.1661376953125, -8.8271484375, -8.4881591796875, -8.149169921875, -7.8101806640625, -7.47119140625, -7.1322021484375, -6.793212890625, -6.4542236328125, -6.115234375, -5.7762451171875, -5.437255859375, -5.0982666015625, -4.75927734375, -4.4202880859375, -4.081298828125, -3.7423095703125, -3.4033203125, -3.0643310546875, -2.725341796875, -2.3863525390625, -2.04736328125, -1.7083740234375, -1.369384765625, -1.0303955078125, -0.69140625, -0.3524169921875, -0.013427734375, 0.3255615234375, 0.66455078125, 1.0035400390625, 1.342529296875, 1.6815185546875, 2.0205078125, 2.3594970703125, 2.698486328125, 3.0374755859375, 3.37646484375, 3.7154541015625, 4.054443359375, 4.3934326171875, 4.732421875, 5.0714111328125, 5.410400390625, 5.7493896484375, 6.08837890625, 6.4273681640625, 6.766357421875, 7.1053466796875, 7.4443359375, 7.7833251953125, 8.122314453125, 8.4613037109375, 8.80029296875, 9.1392822265625, 9.478271484375, 9.8172607421875, 10.15625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 11.0, 13.0, 12.0, 18.0, 25.0, 37.0, 79.0, 105.0, 229.0, 325.0, 641.0, 1327.0, 2778.0, 6948.0, 20828.0, 78485.0, 514494.0, 332399.0, 61835.0, 17144.0, 5970.0, 2388.0, 1105.0, 564.0, 297.0, 199.0, 100.0, 66.0, 42.0, 27.0, 25.0, 7.0, 8.0, 11.0, 8.0, 6.0, 1.0, 3.0, 2.0, 1.0], "bins": [-8.4453125, -8.2388916015625, -8.032470703125, -7.8260498046875, -7.61962890625, -7.4132080078125, -7.206787109375, -7.0003662109375, -6.7939453125, -6.5875244140625, -6.381103515625, -6.1746826171875, -5.96826171875, -5.7618408203125, -5.555419921875, -5.3489990234375, -5.142578125, -4.9361572265625, -4.729736328125, -4.5233154296875, -4.31689453125, -4.1104736328125, -3.904052734375, -3.6976318359375, -3.4912109375, -3.2847900390625, -3.078369140625, -2.8719482421875, -2.66552734375, -2.4591064453125, -2.252685546875, -2.0462646484375, -1.83984375, -1.6334228515625, -1.427001953125, -1.2205810546875, -1.01416015625, -0.8077392578125, -0.601318359375, -0.3948974609375, -0.1884765625, 0.0179443359375, 0.224365234375, 0.4307861328125, 0.63720703125, 0.8436279296875, 1.050048828125, 1.2564697265625, 1.462890625, 1.6693115234375, 1.875732421875, 2.0821533203125, 2.28857421875, 2.4949951171875, 2.701416015625, 2.9078369140625, 3.1142578125, 3.3206787109375, 3.527099609375, 3.7335205078125, 3.93994140625, 4.1463623046875, 4.352783203125, 4.5592041015625, 4.765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 8.0, 10.0, 17.0, 19.0, 31.0, 40.0, 50.0, 78.0, 132.0, 268.0, 109.0, 65.0, 48.0, 42.0, 28.0, 18.0, 11.0, 9.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0014829635620117188, -0.0014371275901794434, -0.001391291618347168, -0.0013454556465148926, -0.0012996196746826172, -0.0012537837028503418, -0.0012079477310180664, -0.001162111759185791, -0.0011162757873535156, -0.0010704398155212402, -0.0010246038436889648, -0.0009787678718566895, -0.0009329319000244141, -0.0008870959281921387, -0.0008412599563598633, -0.0007954239845275879, -0.0007495880126953125, -0.0007037520408630371, -0.0006579160690307617, -0.0006120800971984863, -0.0005662441253662109, -0.0005204081535339355, -0.00047457218170166016, -0.00042873620986938477, -0.0003829002380371094, -0.000337064266204834, -0.0002912282943725586, -0.0002453923225402832, -0.0001995563507080078, -0.00015372037887573242, -0.00010788440704345703, -6.204843521118164e-05, -1.621246337890625e-05, 2.962350845336914e-05, 7.545948028564453e-05, 0.00012129545211791992, 0.0001671314239501953, 0.0002129673957824707, 0.0002588033676147461, 0.0003046393394470215, 0.0003504753112792969, 0.00039631128311157227, 0.00044214725494384766, 0.00048798322677612305, 0.0005338191986083984, 0.0005796551704406738, 0.0006254911422729492, 0.0006713271141052246, 0.0007171630859375, 0.0007629990577697754, 0.0008088350296020508, 0.0008546710014343262, 0.0009005069732666016, 0.000946342945098877, 0.0009921789169311523, 0.0010380148887634277, 0.0010838508605957031, 0.0011296868324279785, 0.001175522804260254, 0.0012213587760925293, 0.0012671947479248047, 0.00131303071975708, 0.0013588666915893555, 0.0014047026634216309, 0.0014505386352539062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 11.0, 21.0, 31.0, 50.0, 124.0, 279.0, 675.0, 2999.0, 35194.0, 930220.0, 72858.0, 4503.0, 947.0, 340.0, 134.0, 82.0, 34.0, 20.0, 11.0, 12.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.23095703125, -18.6025390625, -17.97412109375, -17.345703125, -16.71728515625, -16.0888671875, -15.46044921875, -14.83203125, -14.20361328125, -13.5751953125, -12.94677734375, -12.318359375, -11.68994140625, -11.0615234375, -10.43310546875, -9.8046875, -9.17626953125, -8.5478515625, -7.91943359375, -7.291015625, -6.66259765625, -6.0341796875, -5.40576171875, -4.77734375, -4.14892578125, -3.5205078125, -2.89208984375, -2.263671875, -1.63525390625, -1.0068359375, -0.37841796875, 0.25, 0.87841796875, 1.5068359375, 2.13525390625, 2.763671875, 3.39208984375, 4.0205078125, 4.64892578125, 5.27734375, 5.90576171875, 6.5341796875, 7.16259765625, 7.791015625, 8.41943359375, 9.0478515625, 9.67626953125, 10.3046875, 10.93310546875, 11.5615234375, 12.18994140625, 12.818359375, 13.44677734375, 14.0751953125, 14.70361328125, 15.33203125, 15.96044921875, 16.5888671875, 17.21728515625, 17.845703125, 18.47412109375, 19.1025390625, 19.73095703125, 20.359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 6.0, 9.0, 9.0, 8.0, 14.0, 31.0, 25.0, 42.0, 58.0, 105.0, 115.0, 189.0, 125.0, 74.0, 40.0, 42.0, 23.0, 20.0, 14.0, 10.0, 16.0, 6.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.8602294921875, -4.595458984375, -4.3306884765625, -4.06591796875, -3.8011474609375, -3.536376953125, -3.2716064453125, -3.0068359375, -2.7420654296875, -2.477294921875, -2.2125244140625, -1.94775390625, -1.6829833984375, -1.418212890625, -1.1534423828125, -0.888671875, -0.6239013671875, -0.359130859375, -0.0943603515625, 0.17041015625, 0.4351806640625, 0.699951171875, 0.9647216796875, 1.2294921875, 1.4942626953125, 1.759033203125, 2.0238037109375, 2.28857421875, 2.5533447265625, 2.818115234375, 3.0828857421875, 3.34765625, 3.6124267578125, 3.877197265625, 4.1419677734375, 4.40673828125, 4.6715087890625, 4.936279296875, 5.2010498046875, 5.4658203125, 5.7305908203125, 5.995361328125, 6.2601318359375, 6.52490234375, 6.7896728515625, 7.054443359375, 7.3192138671875, 7.583984375, 7.8487548828125, 8.113525390625, 8.3782958984375, 8.64306640625, 8.9078369140625, 9.172607421875, 9.4373779296875, 9.7021484375, 9.9669189453125, 10.231689453125, 10.4964599609375, 10.76123046875, 11.0260009765625, 11.290771484375, 11.5555419921875, 11.8203125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 23.0, 37.0, 74.0, 133.0, 173.0, 197.0, 144.0, 96.0, 59.0, 32.0, 14.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-92.31546020507812, -88.49166107177734, -84.66786193847656, -80.84406280517578, -77.020263671875, -73.19647216796875, -69.37266540527344, -65.54887390136719, -61.725074768066406, -57.901275634765625, -54.077476501464844, -50.25367736816406, -46.42988204956055, -42.606082916259766, -38.782283782958984, -34.95848846435547, -31.134685516357422, -27.31088638305664, -23.487089157104492, -19.66329002380371, -15.839491844177246, -12.015693664550781, -8.19189453125, -4.368097305297852, -0.5442981719970703, 3.2795002460479736, 7.103298664093018, 10.92709732055664, 14.750895500183105, 18.57469367980957, 22.39849281311035, 26.2222900390625, 30.04608917236328, 33.86988830566406, 37.693687438964844, 41.517486572265625, 45.34128189086914, 49.16508102416992, 52.9888801574707, 56.81267547607422, 60.636474609375, 64.46027374267578, 68.28407287597656, 72.10787200927734, 75.93167114257812, 79.75546264648438, 83.57926940917969, 87.40306091308594, 91.22686767578125, 95.05066680908203, 98.87446594238281, 102.6982650756836, 106.52206420898438, 110.34585571289062, 114.16966247558594, 117.99345397949219, 121.81725311279297, 125.64105224609375, 129.46484375, 133.2886505126953, 137.11244201660156, 140.93624877929688, 144.76004028320312, 148.58384704589844, 152.4076385498047]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 7.0, 14.0, 7.0, 7.0, 16.0, 14.0, 19.0, 28.0, 22.0, 37.0, 29.0, 34.0, 40.0, 48.0, 37.0, 39.0, 35.0, 47.0, 47.0, 56.0, 46.0, 44.0, 40.0, 24.0, 36.0, 26.0, 31.0, 25.0, 16.0, 27.0, 19.0, 19.0, 10.0, 9.0, 10.0, 7.0, 7.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.81776428222656, -43.98305892944336, -42.148353576660156, -40.31365203857422, -38.478946685791016, -36.64424133300781, -34.80953598022461, -32.974830627441406, -31.140125274658203, -29.305419921875, -27.47071647644043, -25.636011123657227, -23.801305770874023, -21.966602325439453, -20.13189697265625, -18.297191619873047, -16.462488174438477, -14.62778377532959, -12.793078422546387, -10.9583740234375, -9.123668670654297, -7.28896427154541, -5.454259872436523, -3.6195545196533203, -1.7848501205444336, 0.04985463619232178, 1.8845593929290771, 3.719264030456543, 5.553968906402588, 7.388673782348633, 9.22337818145752, 11.058083534240723, 12.89278793334961, 14.727492332458496, 16.562196731567383, 18.396902084350586, 20.23160743713379, 22.06631088256836, 23.901016235351562, 25.735721588134766, 27.57042694091797, 29.405132293701172, 31.239835739135742, 33.07453918457031, 34.909244537353516, 36.74394989013672, 38.57865524291992, 40.413360595703125, 42.24806213378906, 44.082767486572266, 45.91747283935547, 47.752174377441406, 49.58687973022461, 51.42158508300781, 53.256290435791016, 55.09099578857422, 56.92570114135742, 58.760406494140625, 60.59511184692383, 62.42981719970703, 64.26451873779297, 66.09922790527344, 67.93392944335938, 69.76863098144531, 71.60334014892578]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 17.0, 13.0, 15.0, 11.0, 25.0, 29.0, 38.0, 48.0, 69.0, 94.0, 125.0, 223.0, 329.0, 493.0, 834.0, 1625.0, 3732.0, 9203.0, 28820.0, 158980.0, 3685427.0, 247322.0, 37037.0, 10887.0, 4337.0, 1918.0, 959.0, 521.0, 337.0, 218.0, 151.0, 108.0, 82.0, 60.0, 42.0, 31.0, 20.0, 21.0, 17.0, 12.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-14.703125, -14.2376708984375, -13.772216796875, -13.3067626953125, -12.84130859375, -12.3758544921875, -11.910400390625, -11.4449462890625, -10.9794921875, -10.5140380859375, -10.048583984375, -9.5831298828125, -9.11767578125, -8.6522216796875, -8.186767578125, -7.7213134765625, -7.255859375, -6.7904052734375, -6.324951171875, -5.8594970703125, -5.39404296875, -4.9285888671875, -4.463134765625, -3.9976806640625, -3.5322265625, -3.0667724609375, -2.601318359375, -2.1358642578125, -1.67041015625, -1.2049560546875, -0.739501953125, -0.2740478515625, 0.19140625, 0.6568603515625, 1.122314453125, 1.5877685546875, 2.05322265625, 2.5186767578125, 2.984130859375, 3.4495849609375, 3.9150390625, 4.3804931640625, 4.845947265625, 5.3114013671875, 5.77685546875, 6.2423095703125, 6.707763671875, 7.1732177734375, 7.638671875, 8.1041259765625, 8.569580078125, 9.0350341796875, 9.50048828125, 9.9659423828125, 10.431396484375, 10.8968505859375, 11.3623046875, 11.8277587890625, 12.293212890625, 12.7586669921875, 13.22412109375, 13.6895751953125, 14.155029296875, 14.6204833984375, 15.0859375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 10.0, 5.0, 9.0, 9.0, 10.0, 17.0, 27.0, 27.0, 40.0, 50.0, 57.0, 42.0, 64.0, 57.0, 45.0, 57.0, 51.0, 63.0, 53.0, 59.0, 53.0, 50.0, 30.0, 15.0, 26.0, 13.0, 14.0, 7.0, 16.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5078125, -2.4007568359375, -2.293701171875, -2.1866455078125, -2.07958984375, -1.9725341796875, -1.865478515625, -1.7584228515625, -1.6513671875, -1.5443115234375, -1.437255859375, -1.3302001953125, -1.22314453125, -1.1160888671875, -1.009033203125, -0.9019775390625, -0.794921875, -0.6878662109375, -0.580810546875, -0.4737548828125, -0.36669921875, -0.2596435546875, -0.152587890625, -0.0455322265625, 0.0615234375, 0.1685791015625, 0.275634765625, 0.3826904296875, 0.48974609375, 0.5968017578125, 0.703857421875, 0.8109130859375, 0.91796875, 1.0250244140625, 1.132080078125, 1.2391357421875, 1.34619140625, 1.4532470703125, 1.560302734375, 1.6673583984375, 1.7744140625, 1.8814697265625, 1.988525390625, 2.0955810546875, 2.20263671875, 2.3096923828125, 2.416748046875, 2.5238037109375, 2.630859375, 2.7379150390625, 2.844970703125, 2.9520263671875, 3.05908203125, 3.1661376953125, 3.273193359375, 3.3802490234375, 3.4873046875, 3.5943603515625, 3.701416015625, 3.8084716796875, 3.91552734375, 4.0225830078125, 4.129638671875, 4.2366943359375, 4.34375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 10.0, 13.0, 31.0, 26.0, 62.0, 104.0, 140.0, 256.0, 455.0, 738.0, 1367.0, 2757.0, 5982.0, 15041.0, 43407.0, 180008.0, 3110396.0, 692319.0, 94627.0, 27337.0, 10133.0, 4473.0, 2092.0, 1084.0, 594.0, 308.0, 205.0, 114.0, 58.0, 49.0, 35.0, 18.0, 15.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.453125, -10.1343994140625, -9.815673828125, -9.4969482421875, -9.17822265625, -8.8594970703125, -8.540771484375, -8.2220458984375, -7.9033203125, -7.5845947265625, -7.265869140625, -6.9471435546875, -6.62841796875, -6.3096923828125, -5.990966796875, -5.6722412109375, -5.353515625, -5.0347900390625, -4.716064453125, -4.3973388671875, -4.07861328125, -3.7598876953125, -3.441162109375, -3.1224365234375, -2.8037109375, -2.4849853515625, -2.166259765625, -1.8475341796875, -1.52880859375, -1.2100830078125, -0.891357421875, -0.5726318359375, -0.25390625, 0.0648193359375, 0.383544921875, 0.7022705078125, 1.02099609375, 1.3397216796875, 1.658447265625, 1.9771728515625, 2.2958984375, 2.6146240234375, 2.933349609375, 3.2520751953125, 3.57080078125, 3.8895263671875, 4.208251953125, 4.5269775390625, 4.845703125, 5.1644287109375, 5.483154296875, 5.8018798828125, 6.12060546875, 6.4393310546875, 6.758056640625, 7.0767822265625, 7.3955078125, 7.7142333984375, 8.032958984375, 8.3516845703125, 8.67041015625, 8.9891357421875, 9.307861328125, 9.6265869140625, 9.9453125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 6.0, 2.0, 8.0, 10.0, 13.0, 20.0, 24.0, 27.0, 54.0, 84.0, 168.0, 277.0, 1177.0, 1505.0, 307.0, 143.0, 71.0, 53.0, 39.0, 28.0, 11.0, 12.0, 11.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8046875, -7.58209228515625, -7.3594970703125, -7.13690185546875, -6.914306640625, -6.69171142578125, -6.4691162109375, -6.24652099609375, -6.02392578125, -5.80133056640625, -5.5787353515625, -5.35614013671875, -5.133544921875, -4.91094970703125, -4.6883544921875, -4.46575927734375, -4.2431640625, -4.02056884765625, -3.7979736328125, -3.57537841796875, -3.352783203125, -3.13018798828125, -2.9075927734375, -2.68499755859375, -2.46240234375, -2.23980712890625, -2.0172119140625, -1.79461669921875, -1.572021484375, -1.34942626953125, -1.1268310546875, -0.90423583984375, -0.681640625, -0.45904541015625, -0.2364501953125, -0.01385498046875, 0.208740234375, 0.43133544921875, 0.6539306640625, 0.87652587890625, 1.09912109375, 1.32171630859375, 1.5443115234375, 1.76690673828125, 1.989501953125, 2.21209716796875, 2.4346923828125, 2.65728759765625, 2.8798828125, 3.10247802734375, 3.3250732421875, 3.54766845703125, 3.770263671875, 3.99285888671875, 4.2154541015625, 4.43804931640625, 4.66064453125, 4.88323974609375, 5.1058349609375, 5.32843017578125, 5.551025390625, 5.77362060546875, 5.9962158203125, 6.21881103515625, 6.44140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 11.0, 11.0, 30.0, 81.0, 166.0, 234.0, 246.0, 137.0, 48.0, 21.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-87.59194946289062, -85.3626480102539, -83.13334655761719, -80.904052734375, -78.67475128173828, -76.44544982910156, -74.21615600585938, -71.98685455322266, -69.75755310058594, -67.52825164794922, -65.2989501953125, -63.06965637207031, -60.840354919433594, -58.611053466796875, -56.38175582885742, -54.15245819091797, -51.92315673828125, -49.69385528564453, -47.46455764770508, -45.235260009765625, -43.005958557128906, -40.77665710449219, -38.547359466552734, -36.31806182861328, -34.08876037597656, -31.859460830688477, -29.63016128540039, -27.400861740112305, -25.17156219482422, -22.942262649536133, -20.712963104248047, -18.48366355895996, -16.254371643066406, -14.02507209777832, -11.795772552490234, -9.566473007202148, -7.3371734619140625, -5.107873916625977, -2.8785743713378906, -0.6492748260498047, 1.5800247192382812, 3.809324264526367, 6.038623809814453, 8.267923355102539, 10.497222900390625, 12.726522445678711, 14.955821990966797, 17.185121536254883, 19.41442108154297, 21.643720626831055, 23.87302017211914, 26.102319717407227, 28.331619262695312, 30.5609188079834, 32.790218353271484, 35.01951599121094, 37.248817443847656, 39.478118896484375, 41.70741653442383, 43.93671417236328, 46.166015625, 48.39531707763672, 50.62461471557617, 52.853912353515625, 55.083213806152344]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 8.0, 10.0, 16.0, 22.0, 23.0, 22.0, 19.0, 37.0, 34.0, 43.0, 43.0, 39.0, 46.0, 52.0, 51.0, 52.0, 49.0, 49.0, 46.0, 50.0, 41.0, 44.0, 27.0, 27.0, 30.0, 22.0, 21.0, 12.0, 17.0, 12.0, 4.0, 4.0, 5.0, 4.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.367141723632812, -17.653270721435547, -16.93939781188965, -16.225526809692383, -15.5116548538208, -14.797782897949219, -14.083910942077637, -13.370038986206055, -12.656167984008789, -11.942296028137207, -11.228424072265625, -10.51455307006836, -9.800681114196777, -9.086809158325195, -8.372937202453613, -7.6590657234191895, -6.945193290710449, -6.231321334838867, -5.517449855804443, -4.803577899932861, -4.0897064208984375, -3.3758344650268555, -2.6619625091552734, -1.9480910301208496, -1.2342190742492676, -0.5203472971916199, 0.19352447986602783, 0.9073963165283203, 1.6212680339813232, 2.335139751434326, 3.049011707305908, 3.762883186340332, 4.476755142211914, 5.190627098083496, 5.90449857711792, 6.618370532989502, 7.332242012023926, 8.046113967895508, 8.75998592376709, 9.473857879638672, 10.187728881835938, 10.90160083770752, 11.615472793579102, 12.329343795776367, 13.04321575164795, 13.757087707519531, 14.470959663391113, 15.184831619262695, 15.898703575134277, 16.61257553100586, 17.326446533203125, 18.040319442749023, 18.75419044494629, 19.468063354492188, 20.181934356689453, 20.89580535888672, 21.609678268432617, 22.323549270629883, 23.03742218017578, 23.751293182373047, 24.465166091918945, 25.17903709411621, 25.89291000366211, 26.606781005859375, 27.32065200805664]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 9.0, 12.0, 17.0, 23.0, 28.0, 67.0, 98.0, 183.0, 285.0, 670.0, 1728.0, 4277.0, 11914.0, 39637.0, 145219.0, 389481.0, 315630.0, 97978.0, 27095.0, 8520.0, 3151.0, 1349.0, 553.0, 262.0, 133.0, 84.0, 45.0, 37.0, 24.0, 13.0, 10.0, 1.0, 2.0, 6.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.2421875, -13.8214111328125, -13.400634765625, -12.9798583984375, -12.55908203125, -12.1383056640625, -11.717529296875, -11.2967529296875, -10.8759765625, -10.4552001953125, -10.034423828125, -9.6136474609375, -9.19287109375, -8.7720947265625, -8.351318359375, -7.9305419921875, -7.509765625, -7.0889892578125, -6.668212890625, -6.2474365234375, -5.82666015625, -5.4058837890625, -4.985107421875, -4.5643310546875, -4.1435546875, -3.7227783203125, -3.302001953125, -2.8812255859375, -2.46044921875, -2.0396728515625, -1.618896484375, -1.1981201171875, -0.77734375, -0.3565673828125, 0.064208984375, 0.4849853515625, 0.90576171875, 1.3265380859375, 1.747314453125, 2.1680908203125, 2.5888671875, 3.0096435546875, 3.430419921875, 3.8511962890625, 4.27197265625, 4.6927490234375, 5.113525390625, 5.5343017578125, 5.955078125, 6.3758544921875, 6.796630859375, 7.2174072265625, 7.63818359375, 8.0589599609375, 8.479736328125, 8.9005126953125, 9.3212890625, 9.7420654296875, 10.162841796875, 10.5836181640625, 11.00439453125, 11.4251708984375, 11.845947265625, 12.2667236328125, 12.6875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 8.0, 5.0, 7.0, 5.0, 8.0, 18.0, 21.0, 34.0, 29.0, 23.0, 44.0, 33.0, 49.0, 54.0, 54.0, 56.0, 57.0, 59.0, 44.0, 59.0, 58.0, 53.0, 37.0, 29.0, 30.0, 24.0, 20.0, 12.0, 21.0, 10.0, 13.0, 10.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.29296875, -2.19219970703125, -2.0914306640625, -1.99066162109375, -1.889892578125, -1.78912353515625, -1.6883544921875, -1.58758544921875, -1.48681640625, -1.38604736328125, -1.2852783203125, -1.18450927734375, -1.083740234375, -0.98297119140625, -0.8822021484375, -0.78143310546875, -0.6806640625, -0.57989501953125, -0.4791259765625, -0.37835693359375, -0.277587890625, -0.17681884765625, -0.0760498046875, 0.02471923828125, 0.12548828125, 0.22625732421875, 0.3270263671875, 0.42779541015625, 0.528564453125, 0.62933349609375, 0.7301025390625, 0.83087158203125, 0.931640625, 1.03240966796875, 1.1331787109375, 1.23394775390625, 1.334716796875, 1.43548583984375, 1.5362548828125, 1.63702392578125, 1.73779296875, 1.83856201171875, 1.9393310546875, 2.04010009765625, 2.140869140625, 2.24163818359375, 2.3424072265625, 2.44317626953125, 2.5439453125, 2.64471435546875, 2.7454833984375, 2.84625244140625, 2.947021484375, 3.04779052734375, 3.1485595703125, 3.24932861328125, 3.35009765625, 3.45086669921875, 3.5516357421875, 3.65240478515625, 3.753173828125, 3.85394287109375, 3.9547119140625, 4.05548095703125, 4.15625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 5.0, 7.0, 11.0, 22.0, 38.0, 48.0, 59.0, 89.0, 129.0, 204.0, 309.0, 533.0, 1051.0, 2974.0, 18484.0, 256275.0, 686177.0, 71685.0, 6651.0, 1752.0, 791.0, 446.0, 238.0, 184.0, 118.0, 72.0, 45.0, 37.0, 33.0, 20.0, 10.0, 15.0, 4.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.09375, -23.390625, -22.6875, -21.984375, -21.28125, -20.578125, -19.875, -19.171875, -18.46875, -17.765625, -17.0625, -16.359375, -15.65625, -14.953125, -14.25, -13.546875, -12.84375, -12.140625, -11.4375, -10.734375, -10.03125, -9.328125, -8.625, -7.921875, -7.21875, -6.515625, -5.8125, -5.109375, -4.40625, -3.703125, -3.0, -2.296875, -1.59375, -0.890625, -0.1875, 0.515625, 1.21875, 1.921875, 2.625, 3.328125, 4.03125, 4.734375, 5.4375, 6.140625, 6.84375, 7.546875, 8.25, 8.953125, 9.65625, 10.359375, 11.0625, 11.765625, 12.46875, 13.171875, 13.875, 14.578125, 15.28125, 15.984375, 16.6875, 17.390625, 18.09375, 18.796875, 19.5, 20.203125, 20.90625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 8.0, 9.0, 15.0, 10.0, 12.0, 30.0, 20.0, 26.0, 32.0, 27.0, 43.0, 31.0, 39.0, 42.0, 57.0, 38.0, 48.0, 54.0, 37.0, 47.0, 41.0, 36.0, 38.0, 34.0, 30.0, 41.0, 25.0, 22.0, 19.0, 13.0, 24.0, 13.0, 5.0, 7.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.71875, -12.3065185546875, -11.894287109375, -11.4820556640625, -11.06982421875, -10.6575927734375, -10.245361328125, -9.8331298828125, -9.4208984375, -9.0086669921875, -8.596435546875, -8.1842041015625, -7.77197265625, -7.3597412109375, -6.947509765625, -6.5352783203125, -6.123046875, -5.7108154296875, -5.298583984375, -4.8863525390625, -4.47412109375, -4.0618896484375, -3.649658203125, -3.2374267578125, -2.8251953125, -2.4129638671875, -2.000732421875, -1.5885009765625, -1.17626953125, -0.7640380859375, -0.351806640625, 0.0604248046875, 0.47265625, 0.8848876953125, 1.297119140625, 1.7093505859375, 2.12158203125, 2.5338134765625, 2.946044921875, 3.3582763671875, 3.7705078125, 4.1827392578125, 4.594970703125, 5.0072021484375, 5.41943359375, 5.8316650390625, 6.243896484375, 6.6561279296875, 7.068359375, 7.4805908203125, 7.892822265625, 8.3050537109375, 8.71728515625, 9.1295166015625, 9.541748046875, 9.9539794921875, 10.3662109375, 10.7784423828125, 11.190673828125, 11.6029052734375, 12.01513671875, 12.4273681640625, 12.839599609375, 13.2518310546875, 13.6640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 16.0, 8.0, 12.0, 20.0, 54.0, 74.0, 135.0, 217.0, 470.0, 1094.0, 2316.0, 6199.0, 19571.0, 90472.0, 498600.0, 348243.0, 58664.0, 14149.0, 4669.0, 1831.0, 852.0, 386.0, 214.0, 116.0, 72.0, 33.0, 25.0, 18.0, 12.0, 8.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.625, -9.356689453125, -9.08837890625, -8.820068359375, -8.5517578125, -8.283447265625, -8.01513671875, -7.746826171875, -7.478515625, -7.210205078125, -6.94189453125, -6.673583984375, -6.4052734375, -6.136962890625, -5.86865234375, -5.600341796875, -5.33203125, -5.063720703125, -4.79541015625, -4.527099609375, -4.2587890625, -3.990478515625, -3.72216796875, -3.453857421875, -3.185546875, -2.917236328125, -2.64892578125, -2.380615234375, -2.1123046875, -1.843994140625, -1.57568359375, -1.307373046875, -1.0390625, -0.770751953125, -0.50244140625, -0.234130859375, 0.0341796875, 0.302490234375, 0.57080078125, 0.839111328125, 1.107421875, 1.375732421875, 1.64404296875, 1.912353515625, 2.1806640625, 2.448974609375, 2.71728515625, 2.985595703125, 3.25390625, 3.522216796875, 3.79052734375, 4.058837890625, 4.3271484375, 4.595458984375, 4.86376953125, 5.132080078125, 5.400390625, 5.668701171875, 5.93701171875, 6.205322265625, 6.4736328125, 6.741943359375, 7.01025390625, 7.278564453125, 7.546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 5.0, 16.0, 15.0, 34.0, 33.0, 70.0, 103.0, 110.0, 138.0, 141.0, 112.0, 77.0, 56.0, 32.0, 14.0, 7.0, 14.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008945465087890625, -0.0008466839790344238, -0.0007988214492797852, -0.0007509589195251465, -0.0007030963897705078, -0.0006552338600158691, -0.0006073713302612305, -0.0005595088005065918, -0.0005116462707519531, -0.00046378374099731445, -0.0004159212112426758, -0.0003680586814880371, -0.00032019615173339844, -0.00027233362197875977, -0.0002244710922241211, -0.00017660856246948242, -0.00012874603271484375, -8.088350296020508e-05, -3.3020973205566406e-05, 1.4841556549072266e-05, 6.270408630371094e-05, 0.00011056661605834961, 0.00015842914581298828, 0.00020629167556762695, 0.0002541542053222656, 0.0003020167350769043, 0.00034987926483154297, 0.00039774179458618164, 0.0004456043243408203, 0.000493466854095459, 0.0005413293838500977, 0.0005891919136047363, 0.000637054443359375, 0.0006849169731140137, 0.0007327795028686523, 0.000780642032623291, 0.0008285045623779297, 0.0008763670921325684, 0.000924229621887207, 0.0009720921516418457, 0.0010199546813964844, 0.001067817211151123, 0.0011156797409057617, 0.0011635422706604004, 0.001211404800415039, 0.0012592673301696777, 0.0013071298599243164, 0.001354992389678955, 0.0014028549194335938, 0.0014507174491882324, 0.001498579978942871, 0.0015464425086975098, 0.0015943050384521484, 0.0016421675682067871, 0.0016900300979614258, 0.0017378926277160645, 0.0017857551574707031, 0.0018336176872253418, 0.0018814802169799805, 0.0019293427467346191, 0.001977205276489258, 0.0020250678062438965, 0.002072930335998535, 0.002120792865753174, 0.0021686553955078125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 11.0, 14.0, 21.0, 30.0, 44.0, 65.0, 85.0, 145.0, 252.0, 498.0, 1228.0, 4272.0, 30741.0, 595820.0, 390018.0, 19828.0, 3319.0, 1083.0, 443.0, 244.0, 137.0, 85.0, 51.0, 34.0, 22.0, 10.0, 15.0, 6.0, 6.0, 4.0, 7.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.2890625, -14.8382568359375, -14.387451171875, -13.9366455078125, -13.48583984375, -13.0350341796875, -12.584228515625, -12.1334228515625, -11.6826171875, -11.2318115234375, -10.781005859375, -10.3302001953125, -9.87939453125, -9.4285888671875, -8.977783203125, -8.5269775390625, -8.076171875, -7.6253662109375, -7.174560546875, -6.7237548828125, -6.27294921875, -5.8221435546875, -5.371337890625, -4.9205322265625, -4.4697265625, -4.0189208984375, -3.568115234375, -3.1173095703125, -2.66650390625, -2.2156982421875, -1.764892578125, -1.3140869140625, -0.86328125, -0.4124755859375, 0.038330078125, 0.4891357421875, 0.93994140625, 1.3907470703125, 1.841552734375, 2.2923583984375, 2.7431640625, 3.1939697265625, 3.644775390625, 4.0955810546875, 4.54638671875, 4.9971923828125, 5.447998046875, 5.8988037109375, 6.349609375, 6.8004150390625, 7.251220703125, 7.7020263671875, 8.15283203125, 8.6036376953125, 9.054443359375, 9.5052490234375, 9.9560546875, 10.4068603515625, 10.857666015625, 11.3084716796875, 11.75927734375, 12.2100830078125, 12.660888671875, 13.1116943359375, 13.5625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 6.0, 15.0, 16.0, 19.0, 33.0, 38.0, 56.0, 58.0, 62.0, 87.0, 94.0, 113.0, 91.0, 77.0, 69.0, 37.0, 31.0, 29.0, 18.0, 16.0, 8.0, 11.0, 2.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2578125, -8.0, -7.7421875, -7.484375, -7.2265625, -6.96875, -6.7109375, -6.453125, -6.1953125, -5.9375, -5.6796875, -5.421875, -5.1640625, -4.90625, -4.6484375, -4.390625, -4.1328125, -3.875, -3.6171875, -3.359375, -3.1015625, -2.84375, -2.5859375, -2.328125, -2.0703125, -1.8125, -1.5546875, -1.296875, -1.0390625, -0.78125, -0.5234375, -0.265625, -0.0078125, 0.25, 0.5078125, 0.765625, 1.0234375, 1.28125, 1.5390625, 1.796875, 2.0546875, 2.3125, 2.5703125, 2.828125, 3.0859375, 3.34375, 3.6015625, 3.859375, 4.1171875, 4.375, 4.6328125, 4.890625, 5.1484375, 5.40625, 5.6640625, 5.921875, 6.1796875, 6.4375, 6.6953125, 6.953125, 7.2109375, 7.46875, 7.7265625, 7.984375, 8.2421875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 12.0, 21.0, 66.0, 138.0, 272.0, 247.0, 149.0, 62.0, 16.0, 12.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.19776916503906, -128.11488342285156, -122.03199005126953, -115.94910430908203, -109.86621856689453, -103.7833251953125, -97.700439453125, -91.6175537109375, -85.53466796875, -79.4517822265625, -73.36888885498047, -67.28600311279297, -61.20311737060547, -55.1202278137207, -49.03733825683594, -42.95445251464844, -36.871559143066406, -30.788671493530273, -24.70578384399414, -18.622894287109375, -12.540006637573242, -6.457118988037109, -0.37422943115234375, 5.708656311035156, 11.791545867919922, 17.874433517456055, 23.957321166992188, 30.040210723876953, 36.12310028076172, 42.20598602294922, 48.288875579833984, 54.371761322021484, 60.45465087890625, 66.53753662109375, 72.62042999267578, 78.70331573486328, 84.78620147705078, 90.86909484863281, 96.95198059082031, 103.03486633300781, 109.11775207519531, 115.20063781738281, 121.28353118896484, 127.36641693115234, 133.44931030273438, 139.53219604492188, 145.61508178710938, 151.69796752929688, 157.78085327148438, 163.86373901367188, 169.94662475585938, 176.02951049804688, 182.11241149902344, 188.19529724121094, 194.27818298339844, 200.36106872558594, 206.4439697265625, 212.52685546875, 218.6097412109375, 224.692626953125, 230.77552795410156, 236.85841369628906, 242.94129943847656, 249.02418518066406, 255.10707092285156]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 7.0, 11.0, 4.0, 9.0, 6.0, 11.0, 13.0, 25.0, 24.0, 23.0, 27.0, 32.0, 41.0, 28.0, 52.0, 34.0, 42.0, 40.0, 49.0, 46.0, 56.0, 43.0, 51.0, 39.0, 33.0, 32.0, 27.0, 29.0, 31.0, 18.0, 27.0, 17.0, 15.0, 20.0, 15.0, 4.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.36685180664062, -69.21539306640625, -67.06392669677734, -64.91246795654297, -62.761009216308594, -60.60954666137695, -58.45808410644531, -56.30662536621094, -54.15516662597656, -52.00370407104492, -49.85224533081055, -47.700782775878906, -45.54932403564453, -43.39786148071289, -41.24639892578125, -39.094940185546875, -36.943477630615234, -34.792015075683594, -32.64055633544922, -30.489093780517578, -28.337635040283203, -26.186172485351562, -24.034711837768555, -21.883251190185547, -19.73179054260254, -17.58032989501953, -15.428869247436523, -13.2774076461792, -11.125946998596191, -8.974486351013184, -6.823024749755859, -4.671564102172852, -2.5201034545898438, -0.36864256858825684, 1.78281831741333, 3.934279441833496, 6.085740089416504, 8.237200736999512, 10.388662338256836, 12.540122985839844, 14.691583633422852, 16.84304428100586, 18.994504928588867, 21.145965576171875, 23.297428131103516, 25.44888687133789, 27.60034942626953, 29.75181007385254, 31.903270721435547, 34.05473327636719, 36.20619201660156, 38.3576545715332, 40.50911331176758, 42.66057586669922, 44.812034606933594, 46.963497161865234, 49.114959716796875, 51.266422271728516, 53.41788101196289, 55.56934356689453, 57.720802307128906, 59.87226486206055, 62.02372741699219, 64.17518615722656, 66.32664489746094]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 9.0, 12.0, 22.0, 29.0, 23.0, 44.0, 51.0, 84.0, 100.0, 164.0, 325.0, 567.0, 1160.0, 2693.0, 9175.0, 70480.0, 4046148.0, 50471.0, 7889.0, 2431.0, 1066.0, 531.0, 267.0, 170.0, 89.0, 67.0, 52.0, 38.0, 25.0, 21.0, 22.0, 11.0, 6.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.75, -20.1103515625, -19.470703125, -18.8310546875, -18.19140625, -17.5517578125, -16.912109375, -16.2724609375, -15.6328125, -14.9931640625, -14.353515625, -13.7138671875, -13.07421875, -12.4345703125, -11.794921875, -11.1552734375, -10.515625, -9.8759765625, -9.236328125, -8.5966796875, -7.95703125, -7.3173828125, -6.677734375, -6.0380859375, -5.3984375, -4.7587890625, -4.119140625, -3.4794921875, -2.83984375, -2.2001953125, -1.560546875, -0.9208984375, -0.28125, 0.3583984375, 0.998046875, 1.6376953125, 2.27734375, 2.9169921875, 3.556640625, 4.1962890625, 4.8359375, 5.4755859375, 6.115234375, 6.7548828125, 7.39453125, 8.0341796875, 8.673828125, 9.3134765625, 9.953125, 10.5927734375, 11.232421875, 11.8720703125, 12.51171875, 13.1513671875, 13.791015625, 14.4306640625, 15.0703125, 15.7099609375, 16.349609375, 16.9892578125, 17.62890625, 18.2685546875, 18.908203125, 19.5478515625, 20.1875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 13.0, 3.0, 15.0, 16.0, 12.0, 16.0, 30.0, 23.0, 29.0, 33.0, 29.0, 46.0, 42.0, 46.0, 49.0, 57.0, 66.0, 60.0, 52.0, 45.0, 44.0, 47.0, 40.0, 34.0, 20.0, 31.0, 15.0, 17.0, 13.0, 12.0, 5.0, 9.0, 6.0, 8.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.69366455078125, -2.5826416015625, -2.47161865234375, -2.360595703125, -2.24957275390625, -2.1385498046875, -2.02752685546875, -1.91650390625, -1.80548095703125, -1.6944580078125, -1.58343505859375, -1.472412109375, -1.36138916015625, -1.2503662109375, -1.13934326171875, -1.0283203125, -0.91729736328125, -0.8062744140625, -0.69525146484375, -0.584228515625, -0.47320556640625, -0.3621826171875, -0.25115966796875, -0.14013671875, -0.02911376953125, 0.0819091796875, 0.19293212890625, 0.303955078125, 0.41497802734375, 0.5260009765625, 0.63702392578125, 0.748046875, 0.85906982421875, 0.9700927734375, 1.08111572265625, 1.192138671875, 1.30316162109375, 1.4141845703125, 1.52520751953125, 1.63623046875, 1.74725341796875, 1.8582763671875, 1.96929931640625, 2.080322265625, 2.19134521484375, 2.3023681640625, 2.41339111328125, 2.5244140625, 2.63543701171875, 2.7464599609375, 2.85748291015625, 2.968505859375, 3.07952880859375, 3.1905517578125, 3.30157470703125, 3.41259765625, 3.52362060546875, 3.6346435546875, 3.74566650390625, 3.856689453125, 3.96771240234375, 4.0787353515625, 4.18975830078125, 4.30078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 2.0, 11.0, 10.0, 11.0, 20.0, 17.0, 28.0, 37.0, 61.0, 78.0, 120.0, 146.0, 225.0, 364.0, 545.0, 827.0, 1431.0, 2630.0, 5311.0, 12445.0, 37601.0, 343632.0, 3701229.0, 57105.0, 16174.0, 6573.0, 3082.0, 1725.0, 967.0, 566.0, 355.0, 287.0, 177.0, 129.0, 91.0, 70.0, 50.0, 44.0, 23.0, 19.0, 19.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.5546875, -10.2156982421875, -9.876708984375, -9.5377197265625, -9.19873046875, -8.8597412109375, -8.520751953125, -8.1817626953125, -7.8427734375, -7.5037841796875, -7.164794921875, -6.8258056640625, -6.48681640625, -6.1478271484375, -5.808837890625, -5.4698486328125, -5.130859375, -4.7918701171875, -4.452880859375, -4.1138916015625, -3.77490234375, -3.4359130859375, -3.096923828125, -2.7579345703125, -2.4189453125, -2.0799560546875, -1.740966796875, -1.4019775390625, -1.06298828125, -0.7239990234375, -0.385009765625, -0.0460205078125, 0.29296875, 0.6319580078125, 0.970947265625, 1.3099365234375, 1.64892578125, 1.9879150390625, 2.326904296875, 2.6658935546875, 3.0048828125, 3.3438720703125, 3.682861328125, 4.0218505859375, 4.36083984375, 4.6998291015625, 5.038818359375, 5.3778076171875, 5.716796875, 6.0557861328125, 6.394775390625, 6.7337646484375, 7.07275390625, 7.4117431640625, 7.750732421875, 8.0897216796875, 8.4287109375, 8.7677001953125, 9.106689453125, 9.4456787109375, 9.78466796875, 10.1236572265625, 10.462646484375, 10.8016357421875, 11.140625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 6.0, 9.0, 10.0, 14.0, 22.0, 33.0, 65.0, 189.0, 3251.0, 269.0, 85.0, 32.0, 26.0, 18.0, 13.0, 4.0, 8.0, 5.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.28082275390625, -3.1768798828125, -3.07293701171875, -2.968994140625, -2.86505126953125, -2.7611083984375, -2.65716552734375, -2.55322265625, -2.44927978515625, -2.3453369140625, -2.24139404296875, -2.137451171875, -2.03350830078125, -1.9295654296875, -1.82562255859375, -1.7216796875, -1.61773681640625, -1.5137939453125, -1.40985107421875, -1.305908203125, -1.20196533203125, -1.0980224609375, -0.99407958984375, -0.89013671875, -0.78619384765625, -0.6822509765625, -0.57830810546875, -0.474365234375, -0.37042236328125, -0.2664794921875, -0.16253662109375, -0.05859375, 0.04534912109375, 0.1492919921875, 0.25323486328125, 0.357177734375, 0.46112060546875, 0.5650634765625, 0.66900634765625, 0.77294921875, 0.87689208984375, 0.9808349609375, 1.08477783203125, 1.188720703125, 1.29266357421875, 1.3966064453125, 1.50054931640625, 1.6044921875, 1.70843505859375, 1.8123779296875, 1.91632080078125, 2.020263671875, 2.12420654296875, 2.2281494140625, 2.33209228515625, 2.43603515625, 2.53997802734375, 2.6439208984375, 2.74786376953125, 2.851806640625, 2.95574951171875, 3.0596923828125, 3.16363525390625, 3.267578125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 23.0, 64.0, 134.0, 234.0, 227.0, 176.0, 82.0, 31.0, 15.0, 10.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.442170143127441, -9.732256889343262, -9.022343635559082, -8.312431335449219, -7.602517604827881, -6.892604351043701, -6.18269157409668, -5.4727783203125, -4.76286506652832, -4.052951812744141, -3.34303879737854, -2.6331257820129395, -1.9232125282287598, -1.21329927444458, -0.5033864974975586, 0.2065267562866211, 0.9164400100708008, 1.626353144645691, 2.336266279220581, 3.0461792945861816, 3.7560925483703613, 4.466005802154541, 5.1759185791015625, 5.885831832885742, 6.595745086669922, 7.305658340454102, 8.015571594238281, 8.725484848022461, 9.43539810180664, 10.14531135559082, 10.855223655700684, 11.565136909484863, 12.27505111694336, 12.984964370727539, 13.694877624511719, 14.404790878295898, 15.114704132080078, 15.824617385864258, 16.534530639648438, 17.244441986083984, 17.954357147216797, 18.664270401000977, 19.374183654785156, 20.084096908569336, 20.794010162353516, 21.503923416137695, 22.213836669921875, 22.923748016357422, 23.6336612701416, 24.34357452392578, 25.05348777770996, 25.76340103149414, 26.47331428527832, 27.1832275390625, 27.893138885498047, 28.60305404663086, 29.312965393066406, 30.022878646850586, 30.732791900634766, 31.442705154418945, 32.152618408203125, 32.86252975463867, 33.572444915771484, 34.28235626220703, 34.992271423339844]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 10.0, 10.0, 15.0, 15.0, 18.0, 29.0, 13.0, 44.0, 35.0, 41.0, 43.0, 42.0, 52.0, 51.0, 52.0, 45.0, 43.0, 49.0, 47.0, 40.0, 41.0, 32.0, 34.0, 37.0, 25.0, 28.0, 23.0, 14.0, 14.0, 11.0, 8.0, 6.0, 7.0, 5.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.110553741455078, -6.887495040893555, -6.664436340332031, -6.441377639770508, -6.218318939208984, -5.995260238647461, -5.7722015380859375, -5.549143314361572, -5.326084613800049, -5.103025913238525, -4.879967212677002, -4.6569085121154785, -4.433849811553955, -4.21079158782959, -3.9877326488494873, -3.764674186706543, -3.5416152477264404, -3.318556547164917, -3.0954978466033936, -2.872439384460449, -2.649380683898926, -2.4263219833374023, -2.203263282775879, -1.980204701423645, -1.7571460008621216, -1.5340873003005981, -1.3110287189483643, -1.0879700183868408, -0.8649113774299622, -0.6418527364730835, -0.41879403591156006, -0.19573545455932617, 0.027323246002197266, 0.2503818869590759, 0.473440557718277, 0.696499228477478, 0.9195578694343567, 1.1426165103912354, 1.3656752109527588, 1.5887337923049927, 1.8117924928665161, 2.03485107421875, 2.2579097747802734, 2.480968475341797, 2.7040271759033203, 2.9270858764648438, 3.150144577026367, 3.3732030391693115, 3.596261739730835, 3.8193204402923584, 4.042378902435303, 4.265437602996826, 4.48849630355835, 4.711555004119873, 4.9346137046813965, 5.15767240524292, 5.380731105804443, 5.603789806365967, 5.82684850692749, 6.049907207489014, 6.272965908050537, 6.496024131774902, 6.719082832336426, 6.942141532897949, 7.165200233459473]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 9.0, 20.0, 14.0, 34.0, 44.0, 64.0, 79.0, 135.0, 198.0, 371.0, 729.0, 1486.0, 3286.0, 7648.0, 19240.0, 51064.0, 135236.0, 289760.0, 301820.0, 146174.0, 55427.0, 20767.0, 8254.0, 3455.0, 1465.0, 731.0, 377.0, 237.0, 138.0, 93.0, 50.0, 39.0, 28.0, 23.0, 17.0, 12.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.2421875, -8.9537353515625, -8.665283203125, -8.3768310546875, -8.08837890625, -7.7999267578125, -7.511474609375, -7.2230224609375, -6.9345703125, -6.6461181640625, -6.357666015625, -6.0692138671875, -5.78076171875, -5.4923095703125, -5.203857421875, -4.9154052734375, -4.626953125, -4.3385009765625, -4.050048828125, -3.7615966796875, -3.47314453125, -3.1846923828125, -2.896240234375, -2.6077880859375, -2.3193359375, -2.0308837890625, -1.742431640625, -1.4539794921875, -1.16552734375, -0.8770751953125, -0.588623046875, -0.3001708984375, -0.01171875, 0.2767333984375, 0.565185546875, 0.8536376953125, 1.14208984375, 1.4305419921875, 1.718994140625, 2.0074462890625, 2.2958984375, 2.5843505859375, 2.872802734375, 3.1612548828125, 3.44970703125, 3.7381591796875, 4.026611328125, 4.3150634765625, 4.603515625, 4.8919677734375, 5.180419921875, 5.4688720703125, 5.75732421875, 6.0457763671875, 6.334228515625, 6.6226806640625, 6.9111328125, 7.1995849609375, 7.488037109375, 7.7764892578125, 8.06494140625, 8.3533935546875, 8.641845703125, 8.9302978515625, 9.21875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 7.0, 3.0, 5.0, 9.0, 10.0, 9.0, 10.0, 18.0, 19.0, 27.0, 30.0, 30.0, 25.0, 37.0, 36.0, 52.0, 51.0, 55.0, 53.0, 54.0, 58.0, 49.0, 46.0, 44.0, 36.0, 42.0, 43.0, 31.0, 26.0, 14.0, 20.0, 7.0, 11.0, 12.0, 7.0, 6.0, 5.0, 9.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.103515625, -2.989471435546875, -2.87542724609375, -2.761383056640625, -2.6473388671875, -2.533294677734375, -2.41925048828125, -2.305206298828125, -2.191162109375, -2.077117919921875, -1.96307373046875, -1.849029541015625, -1.7349853515625, -1.620941162109375, -1.50689697265625, -1.392852783203125, -1.27880859375, -1.164764404296875, -1.05072021484375, -0.936676025390625, -0.8226318359375, -0.708587646484375, -0.59454345703125, -0.480499267578125, -0.366455078125, -0.252410888671875, -0.13836669921875, -0.024322509765625, 0.0897216796875, 0.203765869140625, 0.31781005859375, 0.431854248046875, 0.5458984375, 0.659942626953125, 0.77398681640625, 0.888031005859375, 1.0020751953125, 1.116119384765625, 1.23016357421875, 1.344207763671875, 1.458251953125, 1.572296142578125, 1.68634033203125, 1.800384521484375, 1.9144287109375, 2.028472900390625, 2.14251708984375, 2.256561279296875, 2.37060546875, 2.484649658203125, 2.59869384765625, 2.712738037109375, 2.8267822265625, 2.940826416015625, 3.05487060546875, 3.168914794921875, 3.282958984375, 3.397003173828125, 3.51104736328125, 3.625091552734375, 3.7391357421875, 3.853179931640625, 3.96722412109375, 4.081268310546875, 4.1953125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 7.0, 3.0, 2.0, 10.0, 4.0, 7.0, 18.0, 19.0, 24.0, 38.0, 39.0, 76.0, 88.0, 117.0, 182.0, 252.0, 328.0, 608.0, 1109.0, 2791.0, 21093.0, 482720.0, 510574.0, 22644.0, 2830.0, 1097.0, 580.0, 432.0, 235.0, 162.0, 112.0, 91.0, 76.0, 30.0, 39.0, 27.0, 23.0, 16.0, 12.0, 12.0, 8.0, 2.0, 4.0, 4.0, 6.0, 1.0, 4.0, 2.0, 4.0, 2.0], "bins": [-30.3125, -29.470703125, -28.62890625, -27.787109375, -26.9453125, -26.103515625, -25.26171875, -24.419921875, -23.578125, -22.736328125, -21.89453125, -21.052734375, -20.2109375, -19.369140625, -18.52734375, -17.685546875, -16.84375, -16.001953125, -15.16015625, -14.318359375, -13.4765625, -12.634765625, -11.79296875, -10.951171875, -10.109375, -9.267578125, -8.42578125, -7.583984375, -6.7421875, -5.900390625, -5.05859375, -4.216796875, -3.375, -2.533203125, -1.69140625, -0.849609375, -0.0078125, 0.833984375, 1.67578125, 2.517578125, 3.359375, 4.201171875, 5.04296875, 5.884765625, 6.7265625, 7.568359375, 8.41015625, 9.251953125, 10.09375, 10.935546875, 11.77734375, 12.619140625, 13.4609375, 14.302734375, 15.14453125, 15.986328125, 16.828125, 17.669921875, 18.51171875, 19.353515625, 20.1953125, 21.037109375, 21.87890625, 22.720703125, 23.5625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 8.0, 16.0, 13.0, 14.0, 15.0, 18.0, 24.0, 31.0, 30.0, 38.0, 32.0, 54.0, 39.0, 54.0, 54.0, 66.0, 55.0, 54.0, 49.0, 41.0, 42.0, 38.0, 34.0, 29.0, 28.0, 14.0, 26.0, 23.0, 11.0, 9.0, 5.0, 10.0, 4.0, 2.0, 2.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.21875, -19.680419921875, -19.14208984375, -18.603759765625, -18.0654296875, -17.527099609375, -16.98876953125, -16.450439453125, -15.912109375, -15.373779296875, -14.83544921875, -14.297119140625, -13.7587890625, -13.220458984375, -12.68212890625, -12.143798828125, -11.60546875, -11.067138671875, -10.52880859375, -9.990478515625, -9.4521484375, -8.913818359375, -8.37548828125, -7.837158203125, -7.298828125, -6.760498046875, -6.22216796875, -5.683837890625, -5.1455078125, -4.607177734375, -4.06884765625, -3.530517578125, -2.9921875, -2.453857421875, -1.91552734375, -1.377197265625, -0.8388671875, -0.300537109375, 0.23779296875, 0.776123046875, 1.314453125, 1.852783203125, 2.39111328125, 2.929443359375, 3.4677734375, 4.006103515625, 4.54443359375, 5.082763671875, 5.62109375, 6.159423828125, 6.69775390625, 7.236083984375, 7.7744140625, 8.312744140625, 8.85107421875, 9.389404296875, 9.927734375, 10.466064453125, 11.00439453125, 11.542724609375, 12.0810546875, 12.619384765625, 13.15771484375, 13.696044921875, 14.234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 8.0, 8.0, 13.0, 11.0, 15.0, 25.0, 29.0, 54.0, 69.0, 96.0, 188.0, 269.0, 570.0, 1054.0, 2378.0, 6253.0, 18906.0, 71003.0, 294916.0, 471942.0, 131065.0, 33246.0, 9650.0, 3588.0, 1476.0, 701.0, 420.0, 198.0, 119.0, 102.0, 53.0, 33.0, 25.0, 22.0, 10.0, 11.0, 8.0, 10.0, 2.0, 3.0, 0.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.71356201171875, -4.5716552734375, -4.42974853515625, -4.287841796875, -4.14593505859375, -4.0040283203125, -3.86212158203125, -3.72021484375, -3.57830810546875, -3.4364013671875, -3.29449462890625, -3.152587890625, -3.01068115234375, -2.8687744140625, -2.72686767578125, -2.5849609375, -2.44305419921875, -2.3011474609375, -2.15924072265625, -2.017333984375, -1.87542724609375, -1.7335205078125, -1.59161376953125, -1.44970703125, -1.30780029296875, -1.1658935546875, -1.02398681640625, -0.882080078125, -0.74017333984375, -0.5982666015625, -0.45635986328125, -0.314453125, -0.17254638671875, -0.0306396484375, 0.11126708984375, 0.253173828125, 0.39508056640625, 0.5369873046875, 0.67889404296875, 0.82080078125, 0.96270751953125, 1.1046142578125, 1.24652099609375, 1.388427734375, 1.53033447265625, 1.6722412109375, 1.81414794921875, 1.9560546875, 2.09796142578125, 2.2398681640625, 2.38177490234375, 2.523681640625, 2.66558837890625, 2.8074951171875, 2.94940185546875, 3.09130859375, 3.23321533203125, 3.3751220703125, 3.51702880859375, 3.658935546875, 3.80084228515625, 3.9427490234375, 4.08465576171875, 4.2265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 10.0, 9.0, 8.0, 17.0, 20.0, 31.0, 28.0, 47.0, 42.0, 59.0, 67.0, 73.0, 69.0, 76.0, 78.0, 67.0, 53.0, 38.0, 35.0, 35.0, 26.0, 28.0, 13.0, 14.0, 9.0, 8.0, 8.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006303787231445312, -0.0006095021963119507, -0.0005886256694793701, -0.0005677491426467896, -0.000546872615814209, -0.0005259960889816284, -0.0005051195621490479, -0.0004842430353164673, -0.0004633665084838867, -0.00044248998165130615, -0.0004216134548187256, -0.000400736927986145, -0.00037986040115356445, -0.0003589838743209839, -0.0003381073474884033, -0.00031723082065582275, -0.0002963542938232422, -0.0002754777669906616, -0.00025460124015808105, -0.0002337247133255005, -0.00021284818649291992, -0.00019197165966033936, -0.0001710951328277588, -0.00015021860599517822, -0.00012934207916259766, -0.00010846555233001709, -8.758902549743652e-05, -6.671249866485596e-05, -4.583597183227539e-05, -2.4959444999694824e-05, -4.082918167114258e-06, 1.679360866546631e-05, 3.7670135498046875e-05, 5.854666233062744e-05, 7.942318916320801e-05, 0.00010029971599578857, 0.00012117624282836914, 0.0001420527696609497, 0.00016292929649353027, 0.00018380582332611084, 0.0002046823501586914, 0.00022555887699127197, 0.00024643540382385254, 0.0002673119306564331, 0.00028818845748901367, 0.00030906498432159424, 0.0003299415111541748, 0.00035081803798675537, 0.00037169456481933594, 0.0003925710916519165, 0.00041344761848449707, 0.00043432414531707764, 0.0004552006721496582, 0.00047607719898223877, 0.0004969537258148193, 0.0005178302526473999, 0.0005387067794799805, 0.000559583306312561, 0.0005804598331451416, 0.0006013363599777222, 0.0006222128868103027, 0.0006430894136428833, 0.0006639659404754639, 0.0006848424673080444, 0.000705718994140625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 10.0, 13.0, 12.0, 26.0, 28.0, 50.0, 89.0, 142.0, 331.0, 726.0, 1820.0, 7355.0, 102189.0, 845431.0, 80888.0, 6459.0, 1691.0, 629.0, 293.0, 147.0, 86.0, 35.0, 31.0, 23.0, 13.0, 8.0, 7.0, 4.0, 5.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3203125, -9.9923095703125, -9.664306640625, -9.3363037109375, -9.00830078125, -8.6802978515625, -8.352294921875, -8.0242919921875, -7.6962890625, -7.3682861328125, -7.040283203125, -6.7122802734375, -6.38427734375, -6.0562744140625, -5.728271484375, -5.4002685546875, -5.072265625, -4.7442626953125, -4.416259765625, -4.0882568359375, -3.76025390625, -3.4322509765625, -3.104248046875, -2.7762451171875, -2.4482421875, -2.1202392578125, -1.792236328125, -1.4642333984375, -1.13623046875, -0.8082275390625, -0.480224609375, -0.1522216796875, 0.17578125, 0.5037841796875, 0.831787109375, 1.1597900390625, 1.48779296875, 1.8157958984375, 2.143798828125, 2.4718017578125, 2.7998046875, 3.1278076171875, 3.455810546875, 3.7838134765625, 4.11181640625, 4.4398193359375, 4.767822265625, 5.0958251953125, 5.423828125, 5.7518310546875, 6.079833984375, 6.4078369140625, 6.73583984375, 7.0638427734375, 7.391845703125, 7.7198486328125, 8.0478515625, 8.3758544921875, 8.703857421875, 9.0318603515625, 9.35986328125, 9.6878662109375, 10.015869140625, 10.3438720703125, 10.671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 3.0, 10.0, 10.0, 15.0, 10.0, 23.0, 26.0, 32.0, 48.0, 66.0, 83.0, 95.0, 85.0, 99.0, 97.0, 61.0, 69.0, 34.0, 32.0, 34.0, 19.0, 17.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.578125, -6.37738037109375, -6.1766357421875, -5.97589111328125, -5.775146484375, -5.57440185546875, -5.3736572265625, -5.17291259765625, -4.97216796875, -4.77142333984375, -4.5706787109375, -4.36993408203125, -4.169189453125, -3.96844482421875, -3.7677001953125, -3.56695556640625, -3.3662109375, -3.16546630859375, -2.9647216796875, -2.76397705078125, -2.563232421875, -2.36248779296875, -2.1617431640625, -1.96099853515625, -1.76025390625, -1.55950927734375, -1.3587646484375, -1.15802001953125, -0.957275390625, -0.75653076171875, -0.5557861328125, -0.35504150390625, -0.154296875, 0.04644775390625, 0.2471923828125, 0.44793701171875, 0.648681640625, 0.84942626953125, 1.0501708984375, 1.25091552734375, 1.45166015625, 1.65240478515625, 1.8531494140625, 2.05389404296875, 2.254638671875, 2.45538330078125, 2.6561279296875, 2.85687255859375, 3.0576171875, 3.25836181640625, 3.4591064453125, 3.65985107421875, 3.860595703125, 4.06134033203125, 4.2620849609375, 4.46282958984375, 4.66357421875, 4.86431884765625, 5.0650634765625, 5.26580810546875, 5.466552734375, 5.66729736328125, 5.8680419921875, 6.06878662109375, 6.26953125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 11.0, 22.0, 38.0, 116.0, 173.0, 227.0, 190.0, 128.0, 58.0, 22.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.9042205810547, -130.0378875732422, -125.17153930664062, -120.30520629882812, -115.4388656616211, -110.57252502441406, -105.70619201660156, -100.83985137939453, -95.9735107421875, -91.10717010498047, -86.24082946777344, -81.37449645996094, -76.5081558227539, -71.64181518554688, -66.77548217773438, -61.909141540527344, -57.04280090332031, -52.17646026611328, -47.310123443603516, -42.44378662109375, -37.57744598388672, -32.71110534667969, -27.844768524169922, -22.978431701660156, -18.112091064453125, -13.245752334594727, -8.379413604736328, -3.5130748748779297, 1.3532638549804688, 6.219602584838867, 11.085941314697266, 15.952278137207031, 20.818634033203125, 25.684972763061523, 30.551311492919922, 35.41764831542969, 40.28398895263672, 45.15032958984375, 50.016666412353516, 54.88300323486328, 59.74934387207031, 64.61568450927734, 69.48202514648438, 74.34835815429688, 79.2146987915039, 84.08103942871094, 88.94737243652344, 93.81371307373047, 98.6800537109375, 103.54639434814453, 108.41273498535156, 113.27906799316406, 118.1454086303711, 123.01174926757812, 127.87808227539062, 132.74441528320312, 137.6107635498047, 142.4770965576172, 147.34344482421875, 152.20977783203125, 157.07611083984375, 161.9424591064453, 166.8087921142578, 171.67514038085938, 176.54147338867188]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 7.0, 2.0, 12.0, 13.0, 18.0, 19.0, 18.0, 22.0, 24.0, 29.0, 34.0, 45.0, 37.0, 48.0, 46.0, 43.0, 49.0, 51.0, 56.0, 50.0, 48.0, 37.0, 51.0, 27.0, 34.0, 28.0, 26.0, 20.0, 22.0, 9.0, 11.0, 10.0, 6.0, 7.0, 10.0, 7.0, 2.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.21461486816406, -63.956398010253906, -61.698184967041016, -59.43996810913086, -57.18175506591797, -54.92353820800781, -52.665321350097656, -50.407108306884766, -48.148895263671875, -45.89067840576172, -43.63246536254883, -41.37424850463867, -39.11603546142578, -36.857818603515625, -34.59960174560547, -32.34138870239258, -30.083171844482422, -27.8249568939209, -25.566741943359375, -23.30852508544922, -21.050312042236328, -18.792095184326172, -16.53388023376465, -14.275665283203125, -12.017450332641602, -9.759235382080078, -7.5010199546813965, -5.242804527282715, -2.9845895767211914, -0.726374626159668, 1.5318412780761719, 3.7900562286376953, 6.048271179199219, 8.306486129760742, 10.564701080322266, 12.822916984558105, 15.081131935119629, 17.33934783935547, 19.597562789916992, 21.855777740478516, 24.11399269104004, 26.372207641601562, 28.630422592163086, 30.88863754272461, 33.146854400634766, 35.405067443847656, 37.66328430175781, 39.92150115966797, 42.17971420288086, 44.437931060791016, 46.696144104003906, 48.95436096191406, 51.21257400512695, 53.47079086303711, 55.72900390625, 57.987220764160156, 60.24543762207031, 62.50365447998047, 64.76187133789062, 67.02008056640625, 69.2782974243164, 71.53651428222656, 73.79473114013672, 76.05294799804688, 78.3111572265625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 16.0, 12.0, 30.0, 56.0, 83.0, 170.0, 340.0, 728.0, 1566.0, 3964.0, 16386.0, 548464.0, 3596820.0, 18250.0, 4330.0, 1622.0, 694.0, 310.0, 197.0, 106.0, 57.0, 32.0, 13.0, 13.0, 6.0, 4.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.875, -12.339111328125, -11.80322265625, -11.267333984375, -10.7314453125, -10.195556640625, -9.65966796875, -9.123779296875, -8.587890625, -8.052001953125, -7.51611328125, -6.980224609375, -6.4443359375, -5.908447265625, -5.37255859375, -4.836669921875, -4.30078125, -3.764892578125, -3.22900390625, -2.693115234375, -2.1572265625, -1.621337890625, -1.08544921875, -0.549560546875, -0.013671875, 0.522216796875, 1.05810546875, 1.593994140625, 2.1298828125, 2.665771484375, 3.20166015625, 3.737548828125, 4.2734375, 4.809326171875, 5.34521484375, 5.881103515625, 6.4169921875, 6.952880859375, 7.48876953125, 8.024658203125, 8.560546875, 9.096435546875, 9.63232421875, 10.168212890625, 10.7041015625, 11.239990234375, 11.77587890625, 12.311767578125, 12.84765625, 13.383544921875, 13.91943359375, 14.455322265625, 14.9912109375, 15.527099609375, 16.06298828125, 16.598876953125, 17.134765625, 17.670654296875, 18.20654296875, 18.742431640625, 19.2783203125, 19.814208984375, 20.35009765625, 20.885986328125, 21.421875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 9.0, 8.0, 13.0, 12.0, 15.0, 20.0, 15.0, 29.0, 27.0, 26.0, 27.0, 36.0, 48.0, 41.0, 41.0, 50.0, 60.0, 64.0, 34.0, 52.0, 39.0, 39.0, 44.0, 32.0, 31.0, 24.0, 23.0, 21.0, 15.0, 20.0, 19.0, 16.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.734375, -2.630126953125, -2.52587890625, -2.421630859375, -2.3173828125, -2.213134765625, -2.10888671875, -2.004638671875, -1.900390625, -1.796142578125, -1.69189453125, -1.587646484375, -1.4833984375, -1.379150390625, -1.27490234375, -1.170654296875, -1.06640625, -0.962158203125, -0.85791015625, -0.753662109375, -0.6494140625, -0.545166015625, -0.44091796875, -0.336669921875, -0.232421875, -0.128173828125, -0.02392578125, 0.080322265625, 0.1845703125, 0.288818359375, 0.39306640625, 0.497314453125, 0.6015625, 0.705810546875, 0.81005859375, 0.914306640625, 1.0185546875, 1.122802734375, 1.22705078125, 1.331298828125, 1.435546875, 1.539794921875, 1.64404296875, 1.748291015625, 1.8525390625, 1.956787109375, 2.06103515625, 2.165283203125, 2.26953125, 2.373779296875, 2.47802734375, 2.582275390625, 2.6865234375, 2.790771484375, 2.89501953125, 2.999267578125, 3.103515625, 3.207763671875, 3.31201171875, 3.416259765625, 3.5205078125, 3.624755859375, 3.72900390625, 3.833251953125, 3.9375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 11.0, 14.0, 19.0, 31.0, 36.0, 63.0, 78.0, 110.0, 156.0, 218.0, 284.0, 408.0, 653.0, 963.0, 1655.0, 2723.0, 5212.0, 10269.0, 25563.0, 91621.0, 3667187.0, 307375.0, 46262.0, 16330.0, 7348.0, 3750.0, 2059.0, 1287.0, 816.0, 551.0, 374.0, 257.0, 146.0, 123.0, 89.0, 72.0, 45.0, 34.0, 26.0, 17.0, 15.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.3167724609375, -6.117919921875, -5.9190673828125, -5.72021484375, -5.5213623046875, -5.322509765625, -5.1236572265625, -4.9248046875, -4.7259521484375, -4.527099609375, -4.3282470703125, -4.12939453125, -3.9305419921875, -3.731689453125, -3.5328369140625, -3.333984375, -3.1351318359375, -2.936279296875, -2.7374267578125, -2.53857421875, -2.3397216796875, -2.140869140625, -1.9420166015625, -1.7431640625, -1.5443115234375, -1.345458984375, -1.1466064453125, -0.94775390625, -0.7489013671875, -0.550048828125, -0.3511962890625, -0.15234375, 0.0465087890625, 0.245361328125, 0.4442138671875, 0.64306640625, 0.8419189453125, 1.040771484375, 1.2396240234375, 1.4384765625, 1.6373291015625, 1.836181640625, 2.0350341796875, 2.23388671875, 2.4327392578125, 2.631591796875, 2.8304443359375, 3.029296875, 3.2281494140625, 3.427001953125, 3.6258544921875, 3.82470703125, 4.0235595703125, 4.222412109375, 4.4212646484375, 4.6201171875, 4.8189697265625, 5.017822265625, 5.2166748046875, 5.41552734375, 5.6143798828125, 5.813232421875, 6.0120849609375, 6.2109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 7.0, 10.0, 10.0, 17.0, 21.0, 42.0, 93.0, 204.0, 2930.0, 429.0, 118.0, 64.0, 28.0, 29.0, 19.0, 15.0, 6.0, 4.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.63671875, -2.56292724609375, -2.4891357421875, -2.41534423828125, -2.341552734375, -2.26776123046875, -2.1939697265625, -2.12017822265625, -2.04638671875, -1.97259521484375, -1.8988037109375, -1.82501220703125, -1.751220703125, -1.67742919921875, -1.6036376953125, -1.52984619140625, -1.4560546875, -1.38226318359375, -1.3084716796875, -1.23468017578125, -1.160888671875, -1.08709716796875, -1.0133056640625, -0.93951416015625, -0.86572265625, -0.79193115234375, -0.7181396484375, -0.64434814453125, -0.570556640625, -0.49676513671875, -0.4229736328125, -0.34918212890625, -0.275390625, -0.20159912109375, -0.1278076171875, -0.05401611328125, 0.019775390625, 0.09356689453125, 0.1673583984375, 0.24114990234375, 0.31494140625, 0.38873291015625, 0.4625244140625, 0.53631591796875, 0.610107421875, 0.68389892578125, 0.7576904296875, 0.83148193359375, 0.9052734375, 0.97906494140625, 1.0528564453125, 1.12664794921875, 1.200439453125, 1.27423095703125, 1.3480224609375, 1.42181396484375, 1.49560546875, 1.56939697265625, 1.6431884765625, 1.71697998046875, 1.790771484375, 1.86456298828125, 1.9383544921875, 2.01214599609375, 2.0859375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 20.0, 56.0, 147.0, 222.0, 228.0, 163.0, 88.0, 42.0, 13.0, 6.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.771703720092773, -15.156792640686035, -14.541881561279297, -13.926971435546875, -13.312060356140137, -12.697149276733398, -12.082239151000977, -11.467328071594238, -10.8524169921875, -10.237505912780762, -9.622594833374023, -9.007684707641602, -8.392773628234863, -7.777862548828125, -7.162951946258545, -6.548041343688965, -5.933130264282227, -5.318219184875488, -4.703308582305908, -4.088397979736328, -3.47348690032959, -2.8585760593414307, -2.2436652183532715, -1.6287546157836914, -1.0138435363769531, -0.39893269538879395, 0.21597814559936523, 0.8308889865875244, 1.4457998275756836, 2.0607106685638428, 2.675621509552002, 3.290532112121582, 3.9054431915283203, 4.520354270935059, 5.135264873504639, 5.750175476074219, 6.365086555480957, 6.979997634887695, 7.594908237457275, 8.209818840026855, 8.824729919433594, 9.439640998840332, 10.05455207824707, 10.669462203979492, 11.28437328338623, 11.899284362792969, 12.51419448852539, 13.129105567932129, 13.744016647338867, 14.358927726745605, 14.973838806152344, 15.588748931884766, 16.203659057617188, 16.818571090698242, 17.433481216430664, 18.04839324951172, 18.66330337524414, 19.278213500976562, 19.893125534057617, 20.50803565979004, 21.122947692871094, 21.737857818603516, 22.352767944335938, 22.96767807006836, 23.582590103149414]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 9.0, 5.0, 5.0, 10.0, 11.0, 11.0, 9.0, 18.0, 21.0, 26.0, 24.0, 22.0, 26.0, 31.0, 30.0, 28.0, 29.0, 29.0, 28.0, 46.0, 38.0, 20.0, 36.0, 45.0, 42.0, 32.0, 30.0, 37.0, 31.0, 29.0, 30.0, 27.0, 24.0, 14.0, 30.0, 16.0, 12.0, 16.0, 13.0, 11.0, 13.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.286715984344482, -5.130557060241699, -4.974398612976074, -4.818239688873291, -4.662080764770508, -4.505921840667725, -4.349762916564941, -4.193604469299316, -4.037445545196533, -3.88128662109375, -3.725127935409546, -3.568969249725342, -3.4128103256225586, -3.2566514015197754, -3.1004927158355713, -2.944334030151367, -2.788175106048584, -2.632016181945801, -2.4758574962615967, -2.3196988105773926, -2.1635398864746094, -2.007380962371826, -1.851222276687622, -1.6950634717941284, -1.5389046669006348, -1.3827458620071411, -1.2265870571136475, -1.0704282522201538, -0.9142694473266602, -0.7581106424331665, -0.6019518375396729, -0.4457930326461792, -0.28963375091552734, -0.1334749460220337, 0.02268385887145996, 0.1788426637649536, 0.33500146865844727, 0.4911602735519409, 0.6473190784454346, 0.8034778833389282, 0.9596366882324219, 1.1157954931259155, 1.2719542980194092, 1.4281131029129028, 1.5842719078063965, 1.7404307126998901, 1.8965895175933838, 2.052748203277588, 2.208907127380371, 2.3650660514831543, 2.5212247371673584, 2.6773834228515625, 2.8335423469543457, 2.989701271057129, 3.145859956741333, 3.302018642425537, 3.4581775665283203, 3.6143364906311035, 3.7704951763153076, 3.9266538619995117, 4.082812786102295, 4.238971710205078, 4.395130157470703, 4.551289081573486, 4.7074480056762695]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 11.0, 15.0, 22.0, 35.0, 46.0, 64.0, 114.0, 179.0, 305.0, 508.0, 949.0, 1699.0, 3422.0, 7060.0, 16197.0, 38124.0, 94369.0, 214263.0, 308842.0, 207022.0, 89741.0, 36180.0, 15232.0, 6846.0, 3344.0, 1715.0, 887.0, 524.0, 285.0, 192.0, 124.0, 70.0, 48.0, 39.0, 27.0, 16.0, 15.0, 7.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.6328125, -7.40478515625, -7.1767578125, -6.94873046875, -6.720703125, -6.49267578125, -6.2646484375, -6.03662109375, -5.80859375, -5.58056640625, -5.3525390625, -5.12451171875, -4.896484375, -4.66845703125, -4.4404296875, -4.21240234375, -3.984375, -3.75634765625, -3.5283203125, -3.30029296875, -3.072265625, -2.84423828125, -2.6162109375, -2.38818359375, -2.16015625, -1.93212890625, -1.7041015625, -1.47607421875, -1.248046875, -1.02001953125, -0.7919921875, -0.56396484375, -0.3359375, -0.10791015625, 0.1201171875, 0.34814453125, 0.576171875, 0.80419921875, 1.0322265625, 1.26025390625, 1.48828125, 1.71630859375, 1.9443359375, 2.17236328125, 2.400390625, 2.62841796875, 2.8564453125, 3.08447265625, 3.3125, 3.54052734375, 3.7685546875, 3.99658203125, 4.224609375, 4.45263671875, 4.6806640625, 4.90869140625, 5.13671875, 5.36474609375, 5.5927734375, 5.82080078125, 6.048828125, 6.27685546875, 6.5048828125, 6.73291015625, 6.9609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 11.0, 13.0, 27.0, 17.0, 19.0, 24.0, 38.0, 30.0, 35.0, 41.0, 50.0, 49.0, 50.0, 36.0, 53.0, 58.0, 50.0, 45.0, 53.0, 41.0, 35.0, 32.0, 24.0, 23.0, 25.0, 18.0, 16.0, 14.0, 16.0, 8.0, 7.0, 2.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.275390625, -3.163818359375, -3.05224609375, -2.940673828125, -2.8291015625, -2.717529296875, -2.60595703125, -2.494384765625, -2.3828125, -2.271240234375, -2.15966796875, -2.048095703125, -1.9365234375, -1.824951171875, -1.71337890625, -1.601806640625, -1.490234375, -1.378662109375, -1.26708984375, -1.155517578125, -1.0439453125, -0.932373046875, -0.82080078125, -0.709228515625, -0.59765625, -0.486083984375, -0.37451171875, -0.262939453125, -0.1513671875, -0.039794921875, 0.07177734375, 0.183349609375, 0.294921875, 0.406494140625, 0.51806640625, 0.629638671875, 0.7412109375, 0.852783203125, 0.96435546875, 1.075927734375, 1.1875, 1.299072265625, 1.41064453125, 1.522216796875, 1.6337890625, 1.745361328125, 1.85693359375, 1.968505859375, 2.080078125, 2.191650390625, 2.30322265625, 2.414794921875, 2.5263671875, 2.637939453125, 2.74951171875, 2.861083984375, 2.97265625, 3.084228515625, 3.19580078125, 3.307373046875, 3.4189453125, 3.530517578125, 3.64208984375, 3.753662109375, 3.865234375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 8.0, 10.0, 15.0, 24.0, 35.0, 31.0, 43.0, 81.0, 116.0, 155.0, 254.0, 435.0, 673.0, 1405.0, 4415.0, 59669.0, 906110.0, 67083.0, 4620.0, 1439.0, 733.0, 431.0, 264.0, 158.0, 101.0, 70.0, 55.0, 30.0, 21.0, 14.0, 10.0, 10.0, 6.0, 6.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.90625, -26.052490234375, -25.19873046875, -24.344970703125, -23.4912109375, -22.637451171875, -21.78369140625, -20.929931640625, -20.076171875, -19.222412109375, -18.36865234375, -17.514892578125, -16.6611328125, -15.807373046875, -14.95361328125, -14.099853515625, -13.24609375, -12.392333984375, -11.53857421875, -10.684814453125, -9.8310546875, -8.977294921875, -8.12353515625, -7.269775390625, -6.416015625, -5.562255859375, -4.70849609375, -3.854736328125, -3.0009765625, -2.147216796875, -1.29345703125, -0.439697265625, 0.4140625, 1.267822265625, 2.12158203125, 2.975341796875, 3.8291015625, 4.682861328125, 5.53662109375, 6.390380859375, 7.244140625, 8.097900390625, 8.95166015625, 9.805419921875, 10.6591796875, 11.512939453125, 12.36669921875, 13.220458984375, 14.07421875, 14.927978515625, 15.78173828125, 16.635498046875, 17.4892578125, 18.343017578125, 19.19677734375, 20.050537109375, 20.904296875, 21.758056640625, 22.61181640625, 23.465576171875, 24.3193359375, 25.173095703125, 26.02685546875, 26.880615234375, 27.734375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 11.0, 4.0, 7.0, 9.0, 17.0, 12.0, 14.0, 27.0, 32.0, 37.0, 36.0, 35.0, 50.0, 43.0, 60.0, 48.0, 53.0, 61.0, 60.0, 64.0, 56.0, 36.0, 36.0, 31.0, 35.0, 25.0, 19.0, 15.0, 16.0, 17.0, 10.0, 5.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.71875, -18.201904296875, -17.68505859375, -17.168212890625, -16.6513671875, -16.134521484375, -15.61767578125, -15.100830078125, -14.583984375, -14.067138671875, -13.55029296875, -13.033447265625, -12.5166015625, -11.999755859375, -11.48291015625, -10.966064453125, -10.44921875, -9.932373046875, -9.41552734375, -8.898681640625, -8.3818359375, -7.864990234375, -7.34814453125, -6.831298828125, -6.314453125, -5.797607421875, -5.28076171875, -4.763916015625, -4.2470703125, -3.730224609375, -3.21337890625, -2.696533203125, -2.1796875, -1.662841796875, -1.14599609375, -0.629150390625, -0.1123046875, 0.404541015625, 0.92138671875, 1.438232421875, 1.955078125, 2.471923828125, 2.98876953125, 3.505615234375, 4.0224609375, 4.539306640625, 5.05615234375, 5.572998046875, 6.08984375, 6.606689453125, 7.12353515625, 7.640380859375, 8.1572265625, 8.674072265625, 9.19091796875, 9.707763671875, 10.224609375, 10.741455078125, 11.25830078125, 11.775146484375, 12.2919921875, 12.808837890625, 13.32568359375, 13.842529296875, 14.359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 8.0, 7.0, 10.0, 14.0, 18.0, 38.0, 51.0, 93.0, 146.0, 292.0, 658.0, 2088.0, 10974.0, 197219.0, 797648.0, 33006.0, 4224.0, 1086.0, 411.0, 193.0, 109.0, 83.0, 40.0, 37.0, 28.0, 15.0, 6.0, 11.0, 7.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.296875, -9.956298828125, -9.61572265625, -9.275146484375, -8.9345703125, -8.593994140625, -8.25341796875, -7.912841796875, -7.572265625, -7.231689453125, -6.89111328125, -6.550537109375, -6.2099609375, -5.869384765625, -5.52880859375, -5.188232421875, -4.84765625, -4.507080078125, -4.16650390625, -3.825927734375, -3.4853515625, -3.144775390625, -2.80419921875, -2.463623046875, -2.123046875, -1.782470703125, -1.44189453125, -1.101318359375, -0.7607421875, -0.420166015625, -0.07958984375, 0.260986328125, 0.6015625, 0.942138671875, 1.28271484375, 1.623291015625, 1.9638671875, 2.304443359375, 2.64501953125, 2.985595703125, 3.326171875, 3.666748046875, 4.00732421875, 4.347900390625, 4.6884765625, 5.029052734375, 5.36962890625, 5.710205078125, 6.05078125, 6.391357421875, 6.73193359375, 7.072509765625, 7.4130859375, 7.753662109375, 8.09423828125, 8.434814453125, 8.775390625, 9.115966796875, 9.45654296875, 9.797119140625, 10.1376953125, 10.478271484375, 10.81884765625, 11.159423828125, 11.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 4.0, 15.0, 5.0, 12.0, 9.0, 34.0, 33.0, 32.0, 52.0, 46.0, 79.0, 100.0, 116.0, 113.0, 81.0, 64.0, 44.0, 46.0, 27.0, 23.0, 20.0, 11.0, 7.0, 6.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.0009746551513671875, -0.0009464919567108154, -0.0009183287620544434, -0.0008901655673980713, -0.0008620023727416992, -0.0008338391780853271, -0.0008056759834289551, -0.000777512788772583, -0.0007493495941162109, -0.0007211863994598389, -0.0006930232048034668, -0.0006648600101470947, -0.0006366968154907227, -0.0006085336208343506, -0.0005803704261779785, -0.0005522072315216064, -0.0005240440368652344, -0.0004958808422088623, -0.00046771764755249023, -0.00043955445289611816, -0.0004113912582397461, -0.000383228063583374, -0.00035506486892700195, -0.0003269016742706299, -0.0002987384796142578, -0.00027057528495788574, -0.00024241209030151367, -0.0002142488956451416, -0.00018608570098876953, -0.00015792250633239746, -0.0001297593116760254, -0.00010159611701965332, -7.343292236328125e-05, -4.526972770690918e-05, -1.710653305053711e-05, 1.1056661605834961e-05, 3.921985626220703e-05, 6.73830509185791e-05, 9.554624557495117e-05, 0.00012370944023132324, 0.0001518726348876953, 0.00018003582954406738, 0.00020819902420043945, 0.00023636221885681152, 0.0002645254135131836, 0.00029268860816955566, 0.00032085180282592773, 0.0003490149974822998, 0.0003771781921386719, 0.00040534138679504395, 0.000433504581451416, 0.0004616677761077881, 0.0004898309707641602, 0.0005179941654205322, 0.0005461573600769043, 0.0005743205547332764, 0.0006024837493896484, 0.0006306469440460205, 0.0006588101387023926, 0.0006869733333587646, 0.0007151365280151367, 0.0007432997226715088, 0.0007714629173278809, 0.0007996261119842529, 0.000827789306640625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 6.0, 14.0, 23.0, 32.0, 39.0, 90.0, 171.0, 319.0, 826.0, 3657.0, 58202.0, 950042.0, 31086.0, 2693.0, 724.0, 295.0, 127.0, 72.0, 52.0, 23.0, 19.0, 10.0, 11.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.96875, -18.487548828125, -18.00634765625, -17.525146484375, -17.0439453125, -16.562744140625, -16.08154296875, -15.600341796875, -15.119140625, -14.637939453125, -14.15673828125, -13.675537109375, -13.1943359375, -12.713134765625, -12.23193359375, -11.750732421875, -11.26953125, -10.788330078125, -10.30712890625, -9.825927734375, -9.3447265625, -8.863525390625, -8.38232421875, -7.901123046875, -7.419921875, -6.938720703125, -6.45751953125, -5.976318359375, -5.4951171875, -5.013916015625, -4.53271484375, -4.051513671875, -3.5703125, -3.089111328125, -2.60791015625, -2.126708984375, -1.6455078125, -1.164306640625, -0.68310546875, -0.201904296875, 0.279296875, 0.760498046875, 1.24169921875, 1.722900390625, 2.2041015625, 2.685302734375, 3.16650390625, 3.647705078125, 4.12890625, 4.610107421875, 5.09130859375, 5.572509765625, 6.0537109375, 6.534912109375, 7.01611328125, 7.497314453125, 7.978515625, 8.459716796875, 8.94091796875, 9.422119140625, 9.9033203125, 10.384521484375, 10.86572265625, 11.346923828125, 11.828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 11.0, 12.0, 26.0, 50.0, 118.0, 186.0, 233.0, 163.0, 90.0, 38.0, 25.0, 13.0, 6.0, 9.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.1875, -19.75213623046875, -19.3167724609375, -18.88140869140625, -18.446044921875, -18.01068115234375, -17.5753173828125, -17.13995361328125, -16.70458984375, -16.26922607421875, -15.8338623046875, -15.39849853515625, -14.963134765625, -14.52777099609375, -14.0924072265625, -13.65704345703125, -13.2216796875, -12.78631591796875, -12.3509521484375, -11.91558837890625, -11.480224609375, -11.04486083984375, -10.6094970703125, -10.17413330078125, -9.73876953125, -9.30340576171875, -8.8680419921875, -8.43267822265625, -7.997314453125, -7.56195068359375, -7.1265869140625, -6.69122314453125, -6.255859375, -5.82049560546875, -5.3851318359375, -4.94976806640625, -4.514404296875, -4.07904052734375, -3.6436767578125, -3.20831298828125, -2.77294921875, -2.33758544921875, -1.9022216796875, -1.46685791015625, -1.031494140625, -0.59613037109375, -0.1607666015625, 0.27459716796875, 0.7099609375, 1.14532470703125, 1.5806884765625, 2.01605224609375, 2.451416015625, 2.88677978515625, 3.3221435546875, 3.75750732421875, 4.19287109375, 4.62823486328125, 5.0635986328125, 5.49896240234375, 5.934326171875, 6.36968994140625, 6.8050537109375, 7.24041748046875, 7.67578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 8.0, 23.0, 64.0, 200.0, 299.0, 243.0, 112.0, 35.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.58305358886719, -113.18986511230469, -106.79667663574219, -100.40348815917969, -94.01029968261719, -87.61711120605469, -81.22393035888672, -74.83074188232422, -68.43755340576172, -62.04436492919922, -55.65117645263672, -49.257991790771484, -42.864803314208984, -36.471614837646484, -30.07843017578125, -23.68524169921875, -17.29205322265625, -10.898865699768066, -4.505678176879883, 1.8875083923339844, 8.280696868896484, 14.673885345458984, 21.06707000732422, 27.46025848388672, 33.85344696044922, 40.24663543701172, 46.63982391357422, 53.03300857543945, 59.42619705200195, 65.81938171386719, 72.21257019042969, 78.60575866699219, 84.99893188476562, 91.39212036132812, 97.78530883789062, 104.17849731445312, 110.57168579101562, 116.96487426757812, 123.3580551147461, 129.75125122070312, 136.14443969726562, 142.53762817382812, 148.93081665039062, 155.32400512695312, 161.71719360351562, 168.11038208007812, 174.50357055664062, 180.89675903320312, 187.28993225097656, 193.68312072753906, 200.07630920410156, 206.46949768066406, 212.86268615722656, 219.25587463378906, 225.6490478515625, 232.042236328125, 238.4354248046875, 244.82861328125, 251.2218017578125, 257.614990234375, 264.0081787109375, 270.4013671875, 276.7945556640625, 283.187744140625, 289.5809326171875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 10.0, 8.0, 8.0, 9.0, 17.0, 25.0, 25.0, 17.0, 28.0, 30.0, 34.0, 31.0, 55.0, 48.0, 55.0, 68.0, 47.0, 46.0, 58.0, 51.0, 44.0, 49.0, 32.0, 33.0, 30.0, 21.0, 20.0, 17.0, 11.0, 8.0, 10.0, 11.0, 4.0, 4.0, 6.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-73.61265563964844, -71.26774597167969, -68.92284393310547, -66.57794189453125, -64.2330322265625, -61.888126373291016, -59.54322052001953, -57.19831466674805, -54.85340881347656, -52.50850296020508, -50.163597106933594, -47.81869125366211, -45.473785400390625, -43.12887954711914, -40.783973693847656, -38.43906784057617, -36.09416198730469, -33.7492561340332, -31.40435028076172, -29.059444427490234, -26.71453857421875, -24.369632720947266, -22.02472686767578, -19.679821014404297, -17.334915161132812, -14.990009307861328, -12.645103454589844, -10.30019760131836, -7.955291748046875, -5.610385894775391, -3.2654800415039062, -0.9205741882324219, 1.4243316650390625, 3.769237518310547, 6.114143371582031, 8.459049224853516, 10.803955078125, 13.148860931396484, 15.493766784667969, 17.838672637939453, 20.183578491210938, 22.528484344482422, 24.873390197753906, 27.21829605102539, 29.563201904296875, 31.90810775756836, 34.253013610839844, 36.59791946411133, 38.94282531738281, 41.2877311706543, 43.63263702392578, 45.977542877197266, 48.32244873046875, 50.667354583740234, 53.01226043701172, 55.3571662902832, 57.70207214355469, 60.04697799682617, 62.391883850097656, 64.73678588867188, 67.08169555664062, 69.42660522460938, 71.7715072631836, 74.11640930175781, 76.46131896972656]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 11.0, 14.0, 29.0, 43.0, 71.0, 170.0, 300.0, 559.0, 1296.0, 3561.0, 14275.0, 251870.0, 3895637.0, 19314.0, 4297.0, 1469.0, 665.0, 279.0, 165.0, 90.0, 61.0, 42.0, 16.0, 13.0, 8.0, 2.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-24.671875, -24.0712890625, -23.470703125, -22.8701171875, -22.26953125, -21.6689453125, -21.068359375, -20.4677734375, -19.8671875, -19.2666015625, -18.666015625, -18.0654296875, -17.46484375, -16.8642578125, -16.263671875, -15.6630859375, -15.0625, -14.4619140625, -13.861328125, -13.2607421875, -12.66015625, -12.0595703125, -11.458984375, -10.8583984375, -10.2578125, -9.6572265625, -9.056640625, -8.4560546875, -7.85546875, -7.2548828125, -6.654296875, -6.0537109375, -5.453125, -4.8525390625, -4.251953125, -3.6513671875, -3.05078125, -2.4501953125, -1.849609375, -1.2490234375, -0.6484375, -0.0478515625, 0.552734375, 1.1533203125, 1.75390625, 2.3544921875, 2.955078125, 3.5556640625, 4.15625, 4.7568359375, 5.357421875, 5.9580078125, 6.55859375, 7.1591796875, 7.759765625, 8.3603515625, 8.9609375, 9.5615234375, 10.162109375, 10.7626953125, 11.36328125, 11.9638671875, 12.564453125, 13.1650390625, 13.765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 11.0, 11.0, 11.0, 19.0, 18.0, 16.0, 30.0, 37.0, 35.0, 29.0, 30.0, 40.0, 43.0, 49.0, 54.0, 45.0, 39.0, 64.0, 57.0, 50.0, 50.0, 39.0, 34.0, 30.0, 23.0, 17.0, 19.0, 15.0, 22.0, 8.0, 8.0, 8.0, 16.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.259765625, -3.1474609375, -3.03515625, -2.9228515625, -2.810546875, -2.6982421875, -2.5859375, -2.4736328125, -2.361328125, -2.2490234375, -2.13671875, -2.0244140625, -1.912109375, -1.7998046875, -1.6875, -1.5751953125, -1.462890625, -1.3505859375, -1.23828125, -1.1259765625, -1.013671875, -0.9013671875, -0.7890625, -0.6767578125, -0.564453125, -0.4521484375, -0.33984375, -0.2275390625, -0.115234375, -0.0029296875, 0.109375, 0.2216796875, 0.333984375, 0.4462890625, 0.55859375, 0.6708984375, 0.783203125, 0.8955078125, 1.0078125, 1.1201171875, 1.232421875, 1.3447265625, 1.45703125, 1.5693359375, 1.681640625, 1.7939453125, 1.90625, 2.0185546875, 2.130859375, 2.2431640625, 2.35546875, 2.4677734375, 2.580078125, 2.6923828125, 2.8046875, 2.9169921875, 3.029296875, 3.1416015625, 3.25390625, 3.3662109375, 3.478515625, 3.5908203125, 3.703125, 3.8154296875, 3.927734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 3.0, 4.0, 3.0, 4.0, 10.0, 20.0, 15.0, 28.0, 25.0, 26.0, 61.0, 69.0, 105.0, 181.0, 324.0, 491.0, 762.0, 1209.0, 2081.0, 4094.0, 9554.0, 35581.0, 3737015.0, 360445.0, 25861.0, 7830.0, 3525.0, 1931.0, 1133.0, 710.0, 408.0, 243.0, 160.0, 105.0, 77.0, 47.0, 31.0, 20.0, 23.0, 12.0, 13.0, 11.0, 2.0, 3.0, 9.0, 7.0, 3.0, 7.0, 0.0, 3.0, 0.0, 1.0], "bins": [-12.6953125, -12.33154296875, -11.9677734375, -11.60400390625, -11.240234375, -10.87646484375, -10.5126953125, -10.14892578125, -9.78515625, -9.42138671875, -9.0576171875, -8.69384765625, -8.330078125, -7.96630859375, -7.6025390625, -7.23876953125, -6.875, -6.51123046875, -6.1474609375, -5.78369140625, -5.419921875, -5.05615234375, -4.6923828125, -4.32861328125, -3.96484375, -3.60107421875, -3.2373046875, -2.87353515625, -2.509765625, -2.14599609375, -1.7822265625, -1.41845703125, -1.0546875, -0.69091796875, -0.3271484375, 0.03662109375, 0.400390625, 0.76416015625, 1.1279296875, 1.49169921875, 1.85546875, 2.21923828125, 2.5830078125, 2.94677734375, 3.310546875, 3.67431640625, 4.0380859375, 4.40185546875, 4.765625, 5.12939453125, 5.4931640625, 5.85693359375, 6.220703125, 6.58447265625, 6.9482421875, 7.31201171875, 7.67578125, 8.03955078125, 8.4033203125, 8.76708984375, 9.130859375, 9.49462890625, 9.8583984375, 10.22216796875, 10.5859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 13.0, 32.0, 44.0, 163.0, 3377.0, 281.0, 67.0, 27.0, 15.0, 14.0, 5.0, 3.0, 5.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.335235595703125, -4.21343994140625, -4.091644287109375, -3.9698486328125, -3.848052978515625, -3.72625732421875, -3.604461669921875, -3.482666015625, -3.360870361328125, -3.23907470703125, -3.117279052734375, -2.9954833984375, -2.873687744140625, -2.75189208984375, -2.630096435546875, -2.50830078125, -2.386505126953125, -2.26470947265625, -2.142913818359375, -2.0211181640625, -1.899322509765625, -1.77752685546875, -1.655731201171875, -1.533935546875, -1.412139892578125, -1.29034423828125, -1.168548583984375, -1.0467529296875, -0.924957275390625, -0.80316162109375, -0.681365966796875, -0.5595703125, -0.437774658203125, -0.31597900390625, -0.194183349609375, -0.0723876953125, 0.049407958984375, 0.17120361328125, 0.292999267578125, 0.414794921875, 0.536590576171875, 0.65838623046875, 0.780181884765625, 0.9019775390625, 1.023773193359375, 1.14556884765625, 1.267364501953125, 1.38916015625, 1.510955810546875, 1.63275146484375, 1.754547119140625, 1.8763427734375, 1.998138427734375, 2.11993408203125, 2.241729736328125, 2.363525390625, 2.485321044921875, 2.60711669921875, 2.728912353515625, 2.8507080078125, 2.972503662109375, 3.09429931640625, 3.216094970703125, 3.337890625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 16.0, 36.0, 129.0, 244.0, 284.0, 182.0, 51.0, 27.0, 10.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.323989868164062, -20.35895347595215, -19.393917083740234, -18.428882598876953, -17.46384620666504, -16.498809814453125, -15.533773422241211, -14.568737030029297, -13.603700637817383, -12.638664245605469, -11.673628807067871, -10.708592414855957, -9.743556022644043, -8.778520584106445, -7.813484191894531, -6.848447799682617, -5.8834123611450195, -4.918376445770264, -3.9533400535583496, -2.9883041381835938, -2.023267984390259, -1.0582318305969238, -0.09319591522216797, 0.8718404769897461, 1.836876392364502, 2.801912546157837, 3.766948699951172, 4.731984615325928, 5.697020530700684, 6.662056922912598, 7.6270928382873535, 8.59212875366211, 9.557165145874023, 10.522201538085938, 11.487236976623535, 12.45227336883545, 13.417309761047363, 14.382345199584961, 15.347381591796875, 16.31241798400879, 17.277454376220703, 18.242490768432617, 19.20752716064453, 20.172561645507812, 21.137598037719727, 22.10263442993164, 23.067670822143555, 24.03270721435547, 24.99774169921875, 25.962778091430664, 26.927814483642578, 27.89284896850586, 28.857885360717773, 29.822921752929688, 30.7879581451416, 31.752994537353516, 32.71803283691406, 33.683067321777344, 34.64810562133789, 35.61314010620117, 36.57817840576172, 37.543212890625, 38.50824737548828, 39.47328567504883, 40.43832015991211]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 13.0, 11.0, 19.0, 11.0, 26.0, 22.0, 38.0, 35.0, 40.0, 53.0, 53.0, 45.0, 60.0, 58.0, 48.0, 48.0, 51.0, 37.0, 53.0, 46.0, 34.0, 37.0, 19.0, 22.0, 23.0, 15.0, 16.0, 12.0, 7.0, 8.0, 10.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.228087425231934, -7.016045570373535, -6.804003715515137, -6.591961860656738, -6.37992000579834, -6.167878150939941, -5.955835819244385, -5.743793964385986, -5.531752109527588, -5.3197102546691895, -5.107668399810791, -4.895626544952393, -4.683584213256836, -4.4715423583984375, -4.259500503540039, -4.047458648681641, -3.835416793823242, -3.6233749389648438, -3.4113330841064453, -3.1992909908294678, -2.9872491359710693, -2.775207281112671, -2.5631651878356934, -2.351123332977295, -2.1390814781188965, -1.927039623260498, -1.71499764919281, -1.502955675125122, -1.2909138202667236, -1.0788719654083252, -0.8668299913406372, -0.6547880172729492, -0.4427461624145508, -0.23070424795150757, -0.018662333488464355, 0.19337958097457886, 0.40542149543762207, 0.6174633502960205, 0.8295053243637085, 1.0415472984313965, 1.253589153289795, 1.4656310081481934, 1.6776729822158813, 1.8897149562835693, 2.1017568111419678, 2.313798666000366, 2.5258407592773438, 2.737882614135742, 2.9499244689941406, 3.161966323852539, 3.3740081787109375, 3.586050271987915, 3.7980921268463135, 4.010133743286133, 4.2221760749816895, 4.434217929840088, 4.646259784698486, 4.858301639556885, 5.070343494415283, 5.282385349273682, 5.494427680969238, 5.706469535827637, 5.918511390686035, 6.130553245544434, 6.342595100402832]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 5.0, 19.0, 16.0, 29.0, 33.0, 32.0, 39.0, 67.0, 114.0, 204.0, 319.0, 599.0, 1308.0, 2914.0, 7624.0, 23067.0, 75801.0, 242272.0, 413725.0, 192198.0, 58942.0, 18086.0, 6313.0, 2400.0, 1068.0, 530.0, 287.0, 181.0, 102.0, 84.0, 44.0, 32.0, 11.0, 27.0, 17.0, 8.0, 5.0, 8.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.072509765625, -7.77783203125, -7.483154296875, -7.1884765625, -6.893798828125, -6.59912109375, -6.304443359375, -6.009765625, -5.715087890625, -5.42041015625, -5.125732421875, -4.8310546875, -4.536376953125, -4.24169921875, -3.947021484375, -3.65234375, -3.357666015625, -3.06298828125, -2.768310546875, -2.4736328125, -2.178955078125, -1.88427734375, -1.589599609375, -1.294921875, -1.000244140625, -0.70556640625, -0.410888671875, -0.1162109375, 0.178466796875, 0.47314453125, 0.767822265625, 1.0625, 1.357177734375, 1.65185546875, 1.946533203125, 2.2412109375, 2.535888671875, 2.83056640625, 3.125244140625, 3.419921875, 3.714599609375, 4.00927734375, 4.303955078125, 4.5986328125, 4.893310546875, 5.18798828125, 5.482666015625, 5.77734375, 6.072021484375, 6.36669921875, 6.661376953125, 6.9560546875, 7.250732421875, 7.54541015625, 7.840087890625, 8.134765625, 8.429443359375, 8.72412109375, 9.018798828125, 9.3134765625, 9.608154296875, 9.90283203125, 10.197509765625, 10.4921875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 3.0, 6.0, 3.0, 10.0, 14.0, 12.0, 14.0, 19.0, 26.0, 23.0, 30.0, 41.0, 44.0, 25.0, 36.0, 38.0, 41.0, 40.0, 48.0, 50.0, 50.0, 49.0, 52.0, 56.0, 50.0, 21.0, 32.0, 24.0, 21.0, 15.0, 18.0, 15.0, 11.0, 12.0, 14.0, 7.0, 12.0, 9.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.248046875, -3.13677978515625, -3.0255126953125, -2.91424560546875, -2.802978515625, -2.69171142578125, -2.5804443359375, -2.46917724609375, -2.35791015625, -2.24664306640625, -2.1353759765625, -2.02410888671875, -1.912841796875, -1.80157470703125, -1.6903076171875, -1.57904052734375, -1.4677734375, -1.35650634765625, -1.2452392578125, -1.13397216796875, -1.022705078125, -0.91143798828125, -0.8001708984375, -0.68890380859375, -0.57763671875, -0.46636962890625, -0.3551025390625, -0.24383544921875, -0.132568359375, -0.02130126953125, 0.0899658203125, 0.20123291015625, 0.3125, 0.42376708984375, 0.5350341796875, 0.64630126953125, 0.757568359375, 0.86883544921875, 0.9801025390625, 1.09136962890625, 1.20263671875, 1.31390380859375, 1.4251708984375, 1.53643798828125, 1.647705078125, 1.75897216796875, 1.8702392578125, 1.98150634765625, 2.0927734375, 2.20404052734375, 2.3153076171875, 2.42657470703125, 2.537841796875, 2.64910888671875, 2.7603759765625, 2.87164306640625, 2.98291015625, 3.09417724609375, 3.2054443359375, 3.31671142578125, 3.427978515625, 3.53924560546875, 3.6505126953125, 3.76177978515625, 3.873046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 12.0, 15.0, 12.0, 24.0, 44.0, 67.0, 116.0, 245.0, 468.0, 1198.0, 4648.0, 248473.0, 781856.0, 8550.0, 1593.0, 611.0, 256.0, 147.0, 76.0, 40.0, 26.0, 18.0, 13.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.89697265625, -31.6376953125, -30.37841796875, -29.119140625, -27.85986328125, -26.6005859375, -25.34130859375, -24.08203125, -22.82275390625, -21.5634765625, -20.30419921875, -19.044921875, -17.78564453125, -16.5263671875, -15.26708984375, -14.0078125, -12.74853515625, -11.4892578125, -10.22998046875, -8.970703125, -7.71142578125, -6.4521484375, -5.19287109375, -3.93359375, -2.67431640625, -1.4150390625, -0.15576171875, 1.103515625, 2.36279296875, 3.6220703125, 4.88134765625, 6.140625, 7.39990234375, 8.6591796875, 9.91845703125, 11.177734375, 12.43701171875, 13.6962890625, 14.95556640625, 16.21484375, 17.47412109375, 18.7333984375, 19.99267578125, 21.251953125, 22.51123046875, 23.7705078125, 25.02978515625, 26.2890625, 27.54833984375, 28.8076171875, 30.06689453125, 31.326171875, 32.58544921875, 33.8447265625, 35.10400390625, 36.36328125, 37.62255859375, 38.8818359375, 40.14111328125, 41.400390625, 42.65966796875, 43.9189453125, 45.17822265625, 46.4375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 9.0, 11.0, 21.0, 28.0, 34.0, 31.0, 53.0, 51.0, 62.0, 77.0, 76.0, 79.0, 78.0, 81.0, 60.0, 58.0, 43.0, 30.0, 34.0, 27.0, 19.0, 12.0, 9.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.28125, -25.32421875, -24.3671875, -23.41015625, -22.453125, -21.49609375, -20.5390625, -19.58203125, -18.625, -17.66796875, -16.7109375, -15.75390625, -14.796875, -13.83984375, -12.8828125, -11.92578125, -10.96875, -10.01171875, -9.0546875, -8.09765625, -7.140625, -6.18359375, -5.2265625, -4.26953125, -3.3125, -2.35546875, -1.3984375, -0.44140625, 0.515625, 1.47265625, 2.4296875, 3.38671875, 4.34375, 5.30078125, 6.2578125, 7.21484375, 8.171875, 9.12890625, 10.0859375, 11.04296875, 12.0, 12.95703125, 13.9140625, 14.87109375, 15.828125, 16.78515625, 17.7421875, 18.69921875, 19.65625, 20.61328125, 21.5703125, 22.52734375, 23.484375, 24.44140625, 25.3984375, 26.35546875, 27.3125, 28.26953125, 29.2265625, 30.18359375, 31.140625, 32.09765625, 33.0546875, 34.01171875, 34.96875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 4.0, 7.0, 9.0, 6.0, 14.0, 23.0, 18.0, 38.0, 54.0, 57.0, 109.0, 142.0, 277.0, 575.0, 1969.0, 31236.0, 986545.0, 24380.0, 1787.0, 572.0, 240.0, 134.0, 94.0, 61.0, 39.0, 35.0, 26.0, 18.0, 10.0, 16.0, 12.0, 6.0, 6.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.328125, -20.69091796875, -20.0537109375, -19.41650390625, -18.779296875, -18.14208984375, -17.5048828125, -16.86767578125, -16.23046875, -15.59326171875, -14.9560546875, -14.31884765625, -13.681640625, -13.04443359375, -12.4072265625, -11.77001953125, -11.1328125, -10.49560546875, -9.8583984375, -9.22119140625, -8.583984375, -7.94677734375, -7.3095703125, -6.67236328125, -6.03515625, -5.39794921875, -4.7607421875, -4.12353515625, -3.486328125, -2.84912109375, -2.2119140625, -1.57470703125, -0.9375, -0.30029296875, 0.3369140625, 0.97412109375, 1.611328125, 2.24853515625, 2.8857421875, 3.52294921875, 4.16015625, 4.79736328125, 5.4345703125, 6.07177734375, 6.708984375, 7.34619140625, 7.9833984375, 8.62060546875, 9.2578125, 9.89501953125, 10.5322265625, 11.16943359375, 11.806640625, 12.44384765625, 13.0810546875, 13.71826171875, 14.35546875, 14.99267578125, 15.6298828125, 16.26708984375, 16.904296875, 17.54150390625, 18.1787109375, 18.81591796875, 19.453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 6.0, 2.0, 5.0, 5.0, 8.0, 10.0, 20.0, 27.0, 31.0, 23.0, 42.0, 44.0, 49.0, 68.0, 98.0, 81.0, 96.0, 72.0, 52.0, 42.0, 33.0, 29.0, 19.0, 28.0, 24.0, 14.0, 20.0, 8.0, 6.0, 7.0, 5.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006337165832519531, -0.0006136447191238403, -0.0005935728549957275, -0.0005735009908676147, -0.000553429126739502, -0.0005333572626113892, -0.0005132853984832764, -0.0004932135343551636, -0.0004731416702270508, -0.000453069806098938, -0.0004329979419708252, -0.0004129260778427124, -0.0003928542137145996, -0.0003727823495864868, -0.000352710485458374, -0.00033263862133026123, -0.00031256675720214844, -0.00029249489307403564, -0.00027242302894592285, -0.00025235116481781006, -0.00023227930068969727, -0.00021220743656158447, -0.00019213557243347168, -0.0001720637083053589, -0.0001519918441772461, -0.0001319199800491333, -0.00011184811592102051, -9.177625179290771e-05, -7.170438766479492e-05, -5.163252353668213e-05, -3.1560659408569336e-05, -1.1488795280456543e-05, 8.58306884765625e-06, 2.8654932975769043e-05, 4.8726797103881836e-05, 6.879866123199463e-05, 8.887052536010742e-05, 0.00010894238948822021, 0.000129014253616333, 0.0001490861177444458, 0.0001691579818725586, 0.0001892298460006714, 0.00020930171012878418, 0.00022937357425689697, 0.00024944543838500977, 0.00026951730251312256, 0.00028958916664123535, 0.00030966103076934814, 0.00032973289489746094, 0.00034980475902557373, 0.0003698766231536865, 0.0003899484872817993, 0.0004100203514099121, 0.0004300922155380249, 0.0004501640796661377, 0.0004702359437942505, 0.0004903078079223633, 0.0005103796720504761, 0.0005304515361785889, 0.0005505234003067017, 0.0005705952644348145, 0.0005906671285629272, 0.00061073899269104, 0.0006308108568191528, 0.0006508827209472656]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 6.0, 5.0, 6.0, 8.0, 10.0, 16.0, 18.0, 18.0, 35.0, 41.0, 63.0, 123.0, 169.0, 334.0, 771.0, 2232.0, 11623.0, 514221.0, 503431.0, 11530.0, 2223.0, 771.0, 364.0, 187.0, 96.0, 64.0, 41.0, 38.0, 34.0, 16.0, 11.0, 7.0, 13.0, 4.0, 11.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-19.078125, -18.5760498046875, -18.073974609375, -17.5718994140625, -17.06982421875, -16.5677490234375, -16.065673828125, -15.5635986328125, -15.0615234375, -14.5594482421875, -14.057373046875, -13.5552978515625, -13.05322265625, -12.5511474609375, -12.049072265625, -11.5469970703125, -11.044921875, -10.5428466796875, -10.040771484375, -9.5386962890625, -9.03662109375, -8.5345458984375, -8.032470703125, -7.5303955078125, -7.0283203125, -6.5262451171875, -6.024169921875, -5.5220947265625, -5.02001953125, -4.5179443359375, -4.015869140625, -3.5137939453125, -3.01171875, -2.5096435546875, -2.007568359375, -1.5054931640625, -1.00341796875, -0.5013427734375, 0.000732421875, 0.5028076171875, 1.0048828125, 1.5069580078125, 2.009033203125, 2.5111083984375, 3.01318359375, 3.5152587890625, 4.017333984375, 4.5194091796875, 5.021484375, 5.5235595703125, 6.025634765625, 6.5277099609375, 7.02978515625, 7.5318603515625, 8.033935546875, 8.5360107421875, 9.0380859375, 9.5401611328125, 10.042236328125, 10.5443115234375, 11.04638671875, 11.5484619140625, 12.050537109375, 12.5526123046875, 13.0546875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 12.0, 19.0, 20.0, 68.0, 170.0, 310.0, 238.0, 90.0, 27.0, 23.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.829833984375, -31.06591796875, -30.302001953125, -29.5380859375, -28.774169921875, -28.01025390625, -27.246337890625, -26.482421875, -25.718505859375, -24.95458984375, -24.190673828125, -23.4267578125, -22.662841796875, -21.89892578125, -21.135009765625, -20.37109375, -19.607177734375, -18.84326171875, -18.079345703125, -17.3154296875, -16.551513671875, -15.78759765625, -15.023681640625, -14.259765625, -13.495849609375, -12.73193359375, -11.968017578125, -11.2041015625, -10.440185546875, -9.67626953125, -8.912353515625, -8.1484375, -7.384521484375, -6.62060546875, -5.856689453125, -5.0927734375, -4.328857421875, -3.56494140625, -2.801025390625, -2.037109375, -1.273193359375, -0.50927734375, 0.254638671875, 1.0185546875, 1.782470703125, 2.54638671875, 3.310302734375, 4.07421875, 4.838134765625, 5.60205078125, 6.365966796875, 7.1298828125, 7.893798828125, 8.65771484375, 9.421630859375, 10.185546875, 10.949462890625, 11.71337890625, 12.477294921875, 13.2412109375, 14.005126953125, 14.76904296875, 15.532958984375, 16.296875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 20.0, 113.0, 356.0, 381.0, 92.0, 25.0, 5.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.3914794921875, -358.4256896972656, -348.45989990234375, -338.4941101074219, -328.5283203125, -318.56256103515625, -308.59674072265625, -298.6309814453125, -288.6651916503906, -278.69940185546875, -268.7336120605469, -258.767822265625, -248.8020477294922, -238.8362579345703, -228.87046813964844, -218.90469360351562, -208.9388885498047, -198.9730987548828, -189.00730895996094, -179.04153442382812, -169.07574462890625, -159.10995483398438, -149.1441650390625, -139.17837524414062, -129.21258544921875, -119.24679565429688, -109.28101348876953, -99.31522369384766, -89.34944152832031, -79.38365173339844, -69.41786193847656, -59.45207977294922, -49.486297607421875, -39.520511627197266, -29.554723739624023, -19.58893585205078, -9.623149871826172, 0.3426361083984375, 10.308425903320312, 20.274208068847656, 30.23999786376953, 40.20578384399414, 50.17156982421875, 60.137359619140625, 70.1031494140625, 80.06893157958984, 90.03472137451172, 100.00050354003906, 109.96629333496094, 119.93208312988281, 129.8978729248047, 139.8636474609375, 149.82943725585938, 159.79522705078125, 169.76101684570312, 179.726806640625, 189.69259643554688, 199.65838623046875, 209.62417602539062, 219.5899658203125, 229.5557403564453, 239.5215301513672, 249.48731994628906, 259.4530944824219, 269.41888427734375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 7.0, 3.0, 5.0, 5.0, 8.0, 9.0, 5.0, 11.0, 15.0, 17.0, 21.0, 24.0, 25.0, 21.0, 28.0, 36.0, 40.0, 33.0, 42.0, 41.0, 42.0, 53.0, 34.0, 46.0, 37.0, 42.0, 48.0, 38.0, 34.0, 31.0, 23.0, 28.0, 23.0, 18.0, 17.0, 19.0, 12.0, 15.0, 11.0, 6.0, 3.0, 6.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-68.46610260009766, -65.87213897705078, -63.278175354003906, -60.684207916259766, -58.09024429321289, -55.496280670166016, -52.902313232421875, -50.308349609375, -47.714385986328125, -45.12042236328125, -42.526458740234375, -39.932491302490234, -37.33852767944336, -34.744564056396484, -32.150596618652344, -29.55663299560547, -26.962669372558594, -24.36870574951172, -21.77474021911621, -19.180774688720703, -16.586811065673828, -13.992846488952637, -11.398881912231445, -8.804916381835938, -6.2109527587890625, -3.616988182067871, -1.0230236053466797, 1.5709409713745117, 4.164905548095703, 6.7588701248168945, 9.352834701538086, 11.946800231933594, 14.540763854980469, 17.134727478027344, 19.72869300842285, 22.32265853881836, 24.916622161865234, 27.51058578491211, 30.104551315307617, 32.698516845703125, 35.29248046875, 37.886444091796875, 40.48040771484375, 43.07437515258789, 45.668338775634766, 48.26230239868164, 50.85626983642578, 53.450233459472656, 56.04419708251953, 58.638160705566406, 61.23212432861328, 63.82609176635742, 66.42005920410156, 69.01402282714844, 71.60798645019531, 74.20195007324219, 76.79591369628906, 79.38987731933594, 81.98384094238281, 84.57780456542969, 87.17176818847656, 89.76573944091797, 92.35970306396484, 94.95366668701172, 97.5476303100586]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 11.0, 8.0, 21.0, 19.0, 47.0, 98.0, 189.0, 352.0, 714.0, 1482.0, 3904.0, 13913.0, 129452.0, 3988222.0, 42953.0, 8051.0, 2525.0, 1122.0, 552.0, 262.0, 154.0, 82.0, 44.0, 32.0, 24.0, 15.0, 8.0, 7.0, 5.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8828125, -14.48388671875, -14.0849609375, -13.68603515625, -13.287109375, -12.88818359375, -12.4892578125, -12.09033203125, -11.69140625, -11.29248046875, -10.8935546875, -10.49462890625, -10.095703125, -9.69677734375, -9.2978515625, -8.89892578125, -8.5, -8.10107421875, -7.7021484375, -7.30322265625, -6.904296875, -6.50537109375, -6.1064453125, -5.70751953125, -5.30859375, -4.90966796875, -4.5107421875, -4.11181640625, -3.712890625, -3.31396484375, -2.9150390625, -2.51611328125, -2.1171875, -1.71826171875, -1.3193359375, -0.92041015625, -0.521484375, -0.12255859375, 0.2763671875, 0.67529296875, 1.07421875, 1.47314453125, 1.8720703125, 2.27099609375, 2.669921875, 3.06884765625, 3.4677734375, 3.86669921875, 4.265625, 4.66455078125, 5.0634765625, 5.46240234375, 5.861328125, 6.26025390625, 6.6591796875, 7.05810546875, 7.45703125, 7.85595703125, 8.2548828125, 8.65380859375, 9.052734375, 9.45166015625, 9.8505859375, 10.24951171875, 10.6484375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 5.0, 4.0, 6.0, 8.0, 22.0, 32.0, 25.0, 29.0, 48.0, 54.0, 64.0, 61.0, 82.0, 78.0, 74.0, 66.0, 58.0, 56.0, 44.0, 32.0, 45.0, 19.0, 26.0, 17.0, 12.0, 8.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.71527099609375, -4.5399169921875, -4.36456298828125, -4.189208984375, -4.01385498046875, -3.8385009765625, -3.66314697265625, -3.48779296875, -3.31243896484375, -3.1370849609375, -2.96173095703125, -2.786376953125, -2.61102294921875, -2.4356689453125, -2.26031494140625, -2.0849609375, -1.90960693359375, -1.7342529296875, -1.55889892578125, -1.383544921875, -1.20819091796875, -1.0328369140625, -0.85748291015625, -0.68212890625, -0.50677490234375, -0.3314208984375, -0.15606689453125, 0.019287109375, 0.19464111328125, 0.3699951171875, 0.54534912109375, 0.720703125, 0.89605712890625, 1.0714111328125, 1.24676513671875, 1.422119140625, 1.59747314453125, 1.7728271484375, 1.94818115234375, 2.12353515625, 2.29888916015625, 2.4742431640625, 2.64959716796875, 2.824951171875, 3.00030517578125, 3.1756591796875, 3.35101318359375, 3.5263671875, 3.70172119140625, 3.8770751953125, 4.05242919921875, 4.227783203125, 4.40313720703125, 4.5784912109375, 4.75384521484375, 4.92919921875, 5.10455322265625, 5.2799072265625, 5.45526123046875, 5.630615234375, 5.80596923828125, 5.9813232421875, 6.15667724609375, 6.33203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 9.0, 12.0, 18.0, 14.0, 34.0, 46.0, 61.0, 76.0, 103.0, 172.0, 290.0, 637.0, 1255.0, 3640.0, 11730.0, 60540.0, 3907328.0, 178265.0, 20724.0, 5593.0, 1912.0, 795.0, 409.0, 197.0, 125.0, 69.0, 67.0, 36.0, 33.0, 22.0, 13.0, 18.0, 11.0, 8.0, 7.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.23681640625, -8.9033203125, -8.56982421875, -8.236328125, -7.90283203125, -7.5693359375, -7.23583984375, -6.90234375, -6.56884765625, -6.2353515625, -5.90185546875, -5.568359375, -5.23486328125, -4.9013671875, -4.56787109375, -4.234375, -3.90087890625, -3.5673828125, -3.23388671875, -2.900390625, -2.56689453125, -2.2333984375, -1.89990234375, -1.56640625, -1.23291015625, -0.8994140625, -0.56591796875, -0.232421875, 0.10107421875, 0.4345703125, 0.76806640625, 1.1015625, 1.43505859375, 1.7685546875, 2.10205078125, 2.435546875, 2.76904296875, 3.1025390625, 3.43603515625, 3.76953125, 4.10302734375, 4.4365234375, 4.77001953125, 5.103515625, 5.43701171875, 5.7705078125, 6.10400390625, 6.4375, 6.77099609375, 7.1044921875, 7.43798828125, 7.771484375, 8.10498046875, 8.4384765625, 8.77197265625, 9.10546875, 9.43896484375, 9.7724609375, 10.10595703125, 10.439453125, 10.77294921875, 11.1064453125, 11.43994140625, 11.7734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 1.0, 4.0, 18.0, 23.0, 45.0, 72.0, 263.0, 3083.0, 363.0, 86.0, 38.0, 25.0, 14.0, 12.0, 13.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.5625, -7.3804931640625, -7.198486328125, -7.0164794921875, -6.83447265625, -6.6524658203125, -6.470458984375, -6.2884521484375, -6.1064453125, -5.9244384765625, -5.742431640625, -5.5604248046875, -5.37841796875, -5.1964111328125, -5.014404296875, -4.8323974609375, -4.650390625, -4.4683837890625, -4.286376953125, -4.1043701171875, -3.92236328125, -3.7403564453125, -3.558349609375, -3.3763427734375, -3.1943359375, -3.0123291015625, -2.830322265625, -2.6483154296875, -2.46630859375, -2.2843017578125, -2.102294921875, -1.9202880859375, -1.73828125, -1.5562744140625, -1.374267578125, -1.1922607421875, -1.01025390625, -0.8282470703125, -0.646240234375, -0.4642333984375, -0.2822265625, -0.1002197265625, 0.081787109375, 0.2637939453125, 0.44580078125, 0.6278076171875, 0.809814453125, 0.9918212890625, 1.173828125, 1.3558349609375, 1.537841796875, 1.7198486328125, 1.90185546875, 2.0838623046875, 2.265869140625, 2.4478759765625, 2.6298828125, 2.8118896484375, 2.993896484375, 3.1759033203125, 3.35791015625, 3.5399169921875, 3.721923828125, 3.9039306640625, 4.0859375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 18.0, 68.0, 204.0, 333.0, 245.0, 81.0, 27.0, 14.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.069486618041992, -17.6395263671875, -16.209566116333008, -14.7796049118042, -13.349644660949707, -11.919684410095215, -10.489723205566406, -9.059762954711914, -7.629802703857422, -6.19984245300293, -4.769881725311279, -3.339920997619629, -1.9099607467651367, -0.48000049591064453, 0.9499607086181641, 2.3799209594726562, 3.8098812103271484, 5.239841461181641, 6.669802188873291, 8.099762916564941, 9.529723167419434, 10.959683418273926, 12.389644622802734, 13.819604873657227, 15.249565124511719, 16.67952537536621, 18.109485626220703, 19.539447784423828, 20.969406127929688, 22.399368286132812, 23.829328536987305, 25.259288787841797, 26.689247131347656, 28.11920738220215, 29.54916763305664, 30.979129791259766, 32.409088134765625, 33.83905029296875, 35.269012451171875, 36.698970794677734, 38.128929138183594, 39.55889129638672, 40.98884963989258, 42.4188117980957, 43.84877014160156, 45.27873229980469, 46.70869445800781, 48.13865280151367, 49.5686149597168, 50.99857711791992, 52.42853546142578, 53.858497619628906, 55.288455963134766, 56.71841812133789, 58.14837646484375, 59.578338623046875, 61.00830078125, 62.438262939453125, 63.868221282958984, 65.29817962646484, 66.72814178466797, 68.1581039428711, 69.58806610107422, 71.01802062988281, 72.44798278808594]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 10.0, 15.0, 13.0, 15.0, 18.0, 21.0, 31.0, 28.0, 39.0, 38.0, 37.0, 43.0, 44.0, 41.0, 56.0, 53.0, 51.0, 48.0, 48.0, 36.0, 48.0, 42.0, 33.0, 34.0, 28.0, 19.0, 20.0, 14.0, 12.0, 9.0, 8.0, 9.0, 11.0, 2.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-13.741985321044922, -13.377677917480469, -13.013370513916016, -12.649063110351562, -12.28475570678711, -11.92044734954834, -11.556139945983887, -11.191832542419434, -10.82752513885498, -10.463217735290527, -10.098910331726074, -9.734602928161621, -9.370294570922852, -9.005987167358398, -8.641679763793945, -8.277372360229492, -7.913064956665039, -7.548757553100586, -7.184450149536133, -6.8201422691345215, -6.455834865570068, -6.091527462005615, -5.727219581604004, -5.362912178039551, -4.998604774475098, -4.6342973709106445, -4.269989967346191, -3.90568208694458, -3.541374683380127, -3.177067279815674, -2.8127596378326416, -2.4484519958496094, -2.0841445922851562, -1.7198370695114136, -1.355529546737671, -0.9912220239639282, -0.6269145011901855, -0.26260697841644287, 0.1017005443572998, 0.46600818634033203, 0.8303155899047852, 1.1946231126785278, 1.5589306354522705, 1.9232381582260132, 2.287545680999756, 2.651853084564209, 3.016160726547241, 3.3804683685302734, 3.7447757720947266, 4.10908317565918, 4.473390579223633, 4.837698459625244, 5.202005863189697, 5.56631326675415, 5.930621147155762, 6.294928550720215, 6.659235954284668, 7.023543357849121, 7.387850761413574, 7.7521586418151855, 8.116466522216797, 8.48077392578125, 8.845081329345703, 9.209388732910156, 9.57369613647461]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 19.0, 7.0, 27.0, 20.0, 50.0, 54.0, 79.0, 130.0, 224.0, 359.0, 596.0, 1234.0, 2665.0, 6502.0, 20424.0, 87081.0, 415017.0, 399824.0, 82964.0, 19636.0, 6421.0, 2480.0, 1221.0, 564.0, 342.0, 211.0, 135.0, 76.0, 59.0, 40.0, 21.0, 24.0, 14.0, 5.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.515625, -13.117919921875, -12.72021484375, -12.322509765625, -11.9248046875, -11.527099609375, -11.12939453125, -10.731689453125, -10.333984375, -9.936279296875, -9.53857421875, -9.140869140625, -8.7431640625, -8.345458984375, -7.94775390625, -7.550048828125, -7.15234375, -6.754638671875, -6.35693359375, -5.959228515625, -5.5615234375, -5.163818359375, -4.76611328125, -4.368408203125, -3.970703125, -3.572998046875, -3.17529296875, -2.777587890625, -2.3798828125, -1.982177734375, -1.58447265625, -1.186767578125, -0.7890625, -0.391357421875, 0.00634765625, 0.404052734375, 0.8017578125, 1.199462890625, 1.59716796875, 1.994873046875, 2.392578125, 2.790283203125, 3.18798828125, 3.585693359375, 3.9833984375, 4.381103515625, 4.77880859375, 5.176513671875, 5.57421875, 5.971923828125, 6.36962890625, 6.767333984375, 7.1650390625, 7.562744140625, 7.96044921875, 8.358154296875, 8.755859375, 9.153564453125, 9.55126953125, 9.948974609375, 10.3466796875, 10.744384765625, 11.14208984375, 11.539794921875, 11.9375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 8.0, 15.0, 14.0, 29.0, 17.0, 33.0, 39.0, 35.0, 61.0, 67.0, 69.0, 66.0, 69.0, 80.0, 57.0, 55.0, 58.0, 45.0, 36.0, 27.0, 25.0, 25.0, 23.0, 5.0, 7.0, 5.0, 3.0, 6.0, 2.0, 5.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.515625, -4.34613037109375, -4.1766357421875, -4.00714111328125, -3.837646484375, -3.66815185546875, -3.4986572265625, -3.32916259765625, -3.15966796875, -2.99017333984375, -2.8206787109375, -2.65118408203125, -2.481689453125, -2.31219482421875, -2.1427001953125, -1.97320556640625, -1.8037109375, -1.63421630859375, -1.4647216796875, -1.29522705078125, -1.125732421875, -0.95623779296875, -0.7867431640625, -0.61724853515625, -0.44775390625, -0.27825927734375, -0.1087646484375, 0.06072998046875, 0.230224609375, 0.39971923828125, 0.5692138671875, 0.73870849609375, 0.908203125, 1.07769775390625, 1.2471923828125, 1.41668701171875, 1.586181640625, 1.75567626953125, 1.9251708984375, 2.09466552734375, 2.26416015625, 2.43365478515625, 2.6031494140625, 2.77264404296875, 2.942138671875, 3.11163330078125, 3.2811279296875, 3.45062255859375, 3.6201171875, 3.78961181640625, 3.9591064453125, 4.12860107421875, 4.298095703125, 4.46759033203125, 4.6370849609375, 4.80657958984375, 4.97607421875, 5.14556884765625, 5.3150634765625, 5.48455810546875, 5.654052734375, 5.82354736328125, 5.9930419921875, 6.16253662109375, 6.33203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 16.0, 7.0, 21.0, 39.0, 30.0, 55.0, 84.0, 147.0, 246.0, 469.0, 1016.0, 3047.0, 17824.0, 634230.0, 374049.0, 12877.0, 2422.0, 895.0, 450.0, 251.0, 125.0, 77.0, 54.0, 36.0, 20.0, 17.0, 14.0, 8.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.4375, -29.51318359375, -28.5888671875, -27.66455078125, -26.740234375, -25.81591796875, -24.8916015625, -23.96728515625, -23.04296875, -22.11865234375, -21.1943359375, -20.27001953125, -19.345703125, -18.42138671875, -17.4970703125, -16.57275390625, -15.6484375, -14.72412109375, -13.7998046875, -12.87548828125, -11.951171875, -11.02685546875, -10.1025390625, -9.17822265625, -8.25390625, -7.32958984375, -6.4052734375, -5.48095703125, -4.556640625, -3.63232421875, -2.7080078125, -1.78369140625, -0.859375, 0.06494140625, 0.9892578125, 1.91357421875, 2.837890625, 3.76220703125, 4.6865234375, 5.61083984375, 6.53515625, 7.45947265625, 8.3837890625, 9.30810546875, 10.232421875, 11.15673828125, 12.0810546875, 13.00537109375, 13.9296875, 14.85400390625, 15.7783203125, 16.70263671875, 17.626953125, 18.55126953125, 19.4755859375, 20.39990234375, 21.32421875, 22.24853515625, 23.1728515625, 24.09716796875, 25.021484375, 25.94580078125, 26.8701171875, 27.79443359375, 28.71875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 3.0, 2.0, 13.0, 14.0, 12.0, 18.0, 16.0, 24.0, 21.0, 30.0, 37.0, 34.0, 39.0, 45.0, 44.0, 56.0, 52.0, 49.0, 53.0, 67.0, 52.0, 42.0, 35.0, 38.0, 37.0, 27.0, 26.0, 17.0, 22.0, 16.0, 11.0, 8.0, 9.0, 5.0, 3.0, 4.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.875, -18.23388671875, -17.5927734375, -16.95166015625, -16.310546875, -15.66943359375, -15.0283203125, -14.38720703125, -13.74609375, -13.10498046875, -12.4638671875, -11.82275390625, -11.181640625, -10.54052734375, -9.8994140625, -9.25830078125, -8.6171875, -7.97607421875, -7.3349609375, -6.69384765625, -6.052734375, -5.41162109375, -4.7705078125, -4.12939453125, -3.48828125, -2.84716796875, -2.2060546875, -1.56494140625, -0.923828125, -0.28271484375, 0.3583984375, 0.99951171875, 1.640625, 2.28173828125, 2.9228515625, 3.56396484375, 4.205078125, 4.84619140625, 5.4873046875, 6.12841796875, 6.76953125, 7.41064453125, 8.0517578125, 8.69287109375, 9.333984375, 9.97509765625, 10.6162109375, 11.25732421875, 11.8984375, 12.53955078125, 13.1806640625, 13.82177734375, 14.462890625, 15.10400390625, 15.7451171875, 16.38623046875, 17.02734375, 17.66845703125, 18.3095703125, 18.95068359375, 19.591796875, 20.23291015625, 20.8740234375, 21.51513671875, 22.15625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 6.0, 12.0, 18.0, 22.0, 30.0, 29.0, 48.0, 36.0, 62.0, 100.0, 143.0, 226.0, 331.0, 610.0, 1146.0, 2679.0, 7278.0, 31438.0, 294745.0, 633639.0, 57952.0, 10918.0, 3561.0, 1490.0, 753.0, 419.0, 236.0, 158.0, 112.0, 84.0, 75.0, 42.0, 35.0, 27.0, 18.0, 16.0, 11.0, 7.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53515625, -5.363037109375, -5.19091796875, -5.018798828125, -4.8466796875, -4.674560546875, -4.50244140625, -4.330322265625, -4.158203125, -3.986083984375, -3.81396484375, -3.641845703125, -3.4697265625, -3.297607421875, -3.12548828125, -2.953369140625, -2.78125, -2.609130859375, -2.43701171875, -2.264892578125, -2.0927734375, -1.920654296875, -1.74853515625, -1.576416015625, -1.404296875, -1.232177734375, -1.06005859375, -0.887939453125, -0.7158203125, -0.543701171875, -0.37158203125, -0.199462890625, -0.02734375, 0.144775390625, 0.31689453125, 0.489013671875, 0.6611328125, 0.833251953125, 1.00537109375, 1.177490234375, 1.349609375, 1.521728515625, 1.69384765625, 1.865966796875, 2.0380859375, 2.210205078125, 2.38232421875, 2.554443359375, 2.7265625, 2.898681640625, 3.07080078125, 3.242919921875, 3.4150390625, 3.587158203125, 3.75927734375, 3.931396484375, 4.103515625, 4.275634765625, 4.44775390625, 4.619873046875, 4.7919921875, 4.964111328125, 5.13623046875, 5.308349609375, 5.48046875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 7.0, 13.0, 10.0, 17.0, 56.0, 46.0, 78.0, 176.0, 223.0, 119.0, 68.0, 68.0, 49.0, 19.0, 17.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011196136474609375, -0.0010787397623062134, -0.0010378658771514893, -0.0009969919919967651, -0.000956118106842041, -0.0009152442216873169, -0.0008743703365325928, -0.0008334964513778687, -0.0007926225662231445, -0.0007517486810684204, -0.0007108747959136963, -0.0006700009107589722, -0.000629127025604248, -0.0005882531404495239, -0.0005473792552947998, -0.0005065053701400757, -0.00046563148498535156, -0.00042475759983062744, -0.0003838837146759033, -0.0003430098295211792, -0.0003021359443664551, -0.00026126205921173096, -0.00022038817405700684, -0.00017951428890228271, -0.0001386404037475586, -9.776651859283447e-05, -5.689263343811035e-05, -1.601874828338623e-05, 2.485513687133789e-05, 6.572902202606201e-05, 0.00010660290718078613, 0.00014747679233551025, 0.00018835067749023438, 0.0002292245626449585, 0.0002700984477996826, 0.00031097233295440674, 0.00035184621810913086, 0.000392720103263855, 0.0004335939884185791, 0.0004744678735733032, 0.0005153417587280273, 0.0005562156438827515, 0.0005970895290374756, 0.0006379634141921997, 0.0006788372993469238, 0.000719711184501648, 0.0007605850696563721, 0.0008014589548110962, 0.0008423328399658203, 0.0008832067251205444, 0.0009240806102752686, 0.0009649544954299927, 0.0010058283805847168, 0.001046702265739441, 0.001087576150894165, 0.0011284500360488892, 0.0011693239212036133, 0.0012101978063583374, 0.0012510716915130615, 0.0012919455766677856, 0.0013328194618225098, 0.0013736933469772339, 0.001414567232131958, 0.0014554411172866821, 0.0014963150024414062]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 15.0, 18.0, 14.0, 50.0, 86.0, 145.0, 333.0, 791.0, 2705.0, 15011.0, 395512.0, 610513.0, 18650.0, 3110.0, 915.0, 347.0, 160.0, 91.0, 41.0, 28.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.8021240234375, -7.463623046875, -7.1251220703125, -6.78662109375, -6.4481201171875, -6.109619140625, -5.7711181640625, -5.4326171875, -5.0941162109375, -4.755615234375, -4.4171142578125, -4.07861328125, -3.7401123046875, -3.401611328125, -3.0631103515625, -2.724609375, -2.3861083984375, -2.047607421875, -1.7091064453125, -1.37060546875, -1.0321044921875, -0.693603515625, -0.3551025390625, -0.0166015625, 0.3218994140625, 0.660400390625, 0.9989013671875, 1.33740234375, 1.6759033203125, 2.014404296875, 2.3529052734375, 2.69140625, 3.0299072265625, 3.368408203125, 3.7069091796875, 4.04541015625, 4.3839111328125, 4.722412109375, 5.0609130859375, 5.3994140625, 5.7379150390625, 6.076416015625, 6.4149169921875, 6.75341796875, 7.0919189453125, 7.430419921875, 7.7689208984375, 8.107421875, 8.4459228515625, 8.784423828125, 9.1229248046875, 9.46142578125, 9.7999267578125, 10.138427734375, 10.4769287109375, 10.8154296875, 11.1539306640625, 11.492431640625, 11.8309326171875, 12.16943359375, 12.5079345703125, 12.846435546875, 13.1849365234375, 13.5234375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 12.0, 12.0, 23.0, 23.0, 36.0, 44.0, 59.0, 85.0, 102.0, 92.0, 84.0, 88.0, 83.0, 67.0, 45.0, 30.0, 25.0, 17.0, 18.0, 10.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25, -6.0555419921875, -5.861083984375, -5.6666259765625, -5.47216796875, -5.2777099609375, -5.083251953125, -4.8887939453125, -4.6943359375, -4.4998779296875, -4.305419921875, -4.1109619140625, -3.91650390625, -3.7220458984375, -3.527587890625, -3.3331298828125, -3.138671875, -2.9442138671875, -2.749755859375, -2.5552978515625, -2.36083984375, -2.1663818359375, -1.971923828125, -1.7774658203125, -1.5830078125, -1.3885498046875, -1.194091796875, -0.9996337890625, -0.80517578125, -0.6107177734375, -0.416259765625, -0.2218017578125, -0.02734375, 0.1671142578125, 0.361572265625, 0.5560302734375, 0.75048828125, 0.9449462890625, 1.139404296875, 1.3338623046875, 1.5283203125, 1.7227783203125, 1.917236328125, 2.1116943359375, 2.30615234375, 2.5006103515625, 2.695068359375, 2.8895263671875, 3.083984375, 3.2784423828125, 3.472900390625, 3.6673583984375, 3.86181640625, 4.0562744140625, 4.250732421875, 4.4451904296875, 4.6396484375, 4.8341064453125, 5.028564453125, 5.2230224609375, 5.41748046875, 5.6119384765625, 5.806396484375, 6.0008544921875, 6.1953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 13.0, 20.0, 100.0, 251.0, 324.0, 199.0, 65.0, 17.0, 8.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.46377563476562, -172.42108154296875, -165.3783721923828, -158.33567810058594, -151.29296875, -144.25027465820312, -137.2075653076172, -130.1648712158203, -123.12216186523438, -116.07946014404297, -109.03675842285156, -101.99405670166016, -94.95135498046875, -87.90866088867188, -80.86595153808594, -73.82325744628906, -66.78055572509766, -59.73785400390625, -52.695152282714844, -45.65245056152344, -38.60974884033203, -31.56705093383789, -24.524349212646484, -17.481647491455078, -10.438945770263672, -3.396244525909424, 3.646456718444824, 10.689157485961914, 17.73185920715332, 24.774559020996094, 31.8172607421875, 38.859962463378906, 45.90266418457031, 52.94536590576172, 59.988067626953125, 67.03076934814453, 74.07347106933594, 81.11616516113281, 88.15887451171875, 95.20156860351562, 102.24427795410156, 109.28697967529297, 116.32968139648438, 123.37238311767578, 130.4150848388672, 137.45777893066406, 144.50048828125, 151.54318237304688, 158.58587646484375, 165.62857055664062, 172.67127990722656, 179.71397399902344, 186.75668334960938, 193.79937744140625, 200.8420867919922, 207.88478088378906, 214.927490234375, 221.97018432617188, 229.0128936767578, 236.0555877685547, 243.09829711914062, 250.1409912109375, 257.1836853027344, 264.2264099121094, 271.26910400390625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 1.0, 5.0, 9.0, 10.0, 20.0, 10.0, 30.0, 31.0, 32.0, 25.0, 29.0, 43.0, 51.0, 51.0, 45.0, 63.0, 46.0, 49.0, 60.0, 47.0, 50.0, 46.0, 38.0, 37.0, 23.0, 26.0, 25.0, 12.0, 14.0, 19.0, 18.0, 7.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-99.14460754394531, -96.17861938476562, -93.21263122558594, -90.24664306640625, -87.28065490722656, -84.31466674804688, -81.34867858886719, -78.3826904296875, -75.41670227050781, -72.45071411132812, -69.48472595214844, -66.51873779296875, -63.55274963378906, -60.586761474609375, -57.62077331542969, -54.65478515625, -51.68879699707031, -48.722808837890625, -45.75682067871094, -42.79083251953125, -39.82484436035156, -36.858856201171875, -33.89286804199219, -30.9268798828125, -27.960891723632812, -24.994903564453125, -22.028915405273438, -19.06292724609375, -16.096939086914062, -13.130950927734375, -10.164962768554688, -7.198974609375, -4.232978820800781, -1.2669906616210938, 1.6989974975585938, 4.664985656738281, 7.630973815917969, 10.596961975097656, 13.562950134277344, 16.52893829345703, 19.49492645263672, 22.460914611816406, 25.426902770996094, 28.39289093017578, 31.35887908935547, 34.324867248535156, 37.290855407714844, 40.25684356689453, 43.22283172607422, 46.188819885253906, 49.154808044433594, 52.12079620361328, 55.08678436279297, 58.052772521972656, 61.018760681152344, 63.98474884033203, 66.95073699951172, 69.9167251586914, 72.8827133178711, 75.84870147705078, 78.81468963623047, 81.78067779541016, 84.74666595458984, 87.71265411376953, 90.67864227294922]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 11.0, 3.0, 5.0, 17.0, 15.0, 16.0, 24.0, 47.0, 58.0, 84.0, 142.0, 196.0, 325.0, 605.0, 1217.0, 2624.0, 6176.0, 17359.0, 65469.0, 1302807.0, 2676417.0, 86217.0, 21314.0, 7265.0, 2975.0, 1355.0, 656.0, 351.0, 172.0, 125.0, 66.0, 54.0, 30.0, 24.0, 20.0, 12.0, 9.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.53125, -9.2430419921875, -8.954833984375, -8.6666259765625, -8.37841796875, -8.0902099609375, -7.802001953125, -7.5137939453125, -7.2255859375, -6.9373779296875, -6.649169921875, -6.3609619140625, -6.07275390625, -5.7845458984375, -5.496337890625, -5.2081298828125, -4.919921875, -4.6317138671875, -4.343505859375, -4.0552978515625, -3.76708984375, -3.4788818359375, -3.190673828125, -2.9024658203125, -2.6142578125, -2.3260498046875, -2.037841796875, -1.7496337890625, -1.46142578125, -1.1732177734375, -0.885009765625, -0.5968017578125, -0.30859375, -0.0203857421875, 0.267822265625, 0.5560302734375, 0.84423828125, 1.1324462890625, 1.420654296875, 1.7088623046875, 1.9970703125, 2.2852783203125, 2.573486328125, 2.8616943359375, 3.14990234375, 3.4381103515625, 3.726318359375, 4.0145263671875, 4.302734375, 4.5909423828125, 4.879150390625, 5.1673583984375, 5.45556640625, 5.7437744140625, 6.031982421875, 6.3201904296875, 6.6083984375, 6.8966064453125, 7.184814453125, 7.4730224609375, 7.76123046875, 8.0494384765625, 8.337646484375, 8.6258544921875, 8.9140625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 5.0, 10.0, 14.0, 23.0, 33.0, 43.0, 48.0, 72.0, 97.0, 93.0, 101.0, 87.0, 97.0, 73.0, 59.0, 40.0, 33.0, 24.0, 18.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-10.015625, -9.7958984375, -9.576171875, -9.3564453125, -9.13671875, -8.9169921875, -8.697265625, -8.4775390625, -8.2578125, -8.0380859375, -7.818359375, -7.5986328125, -7.37890625, -7.1591796875, -6.939453125, -6.7197265625, -6.5, -6.2802734375, -6.060546875, -5.8408203125, -5.62109375, -5.4013671875, -5.181640625, -4.9619140625, -4.7421875, -4.5224609375, -4.302734375, -4.0830078125, -3.86328125, -3.6435546875, -3.423828125, -3.2041015625, -2.984375, -2.7646484375, -2.544921875, -2.3251953125, -2.10546875, -1.8857421875, -1.666015625, -1.4462890625, -1.2265625, -1.0068359375, -0.787109375, -0.5673828125, -0.34765625, -0.1279296875, 0.091796875, 0.3115234375, 0.53125, 0.7509765625, 0.970703125, 1.1904296875, 1.41015625, 1.6298828125, 1.849609375, 2.0693359375, 2.2890625, 2.5087890625, 2.728515625, 2.9482421875, 3.16796875, 3.3876953125, 3.607421875, 3.8271484375, 4.046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 4.0, 14.0, 10.0, 13.0, 40.0, 82.0, 139.0, 430.0, 3027.0, 72810.0, 4089587.0, 26145.0, 1540.0, 236.0, 108.0, 41.0, 20.0, 17.0, 6.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -36.2880859375, -35.232421875, -34.1767578125, -33.12109375, -32.0654296875, -31.009765625, -29.9541015625, -28.8984375, -27.8427734375, -26.787109375, -25.7314453125, -24.67578125, -23.6201171875, -22.564453125, -21.5087890625, -20.453125, -19.3974609375, -18.341796875, -17.2861328125, -16.23046875, -15.1748046875, -14.119140625, -13.0634765625, -12.0078125, -10.9521484375, -9.896484375, -8.8408203125, -7.78515625, -6.7294921875, -5.673828125, -4.6181640625, -3.5625, -2.5068359375, -1.451171875, -0.3955078125, 0.66015625, 1.7158203125, 2.771484375, 3.8271484375, 4.8828125, 5.9384765625, 6.994140625, 8.0498046875, 9.10546875, 10.1611328125, 11.216796875, 12.2724609375, 13.328125, 14.3837890625, 15.439453125, 16.4951171875, 17.55078125, 18.6064453125, 19.662109375, 20.7177734375, 21.7734375, 22.8291015625, 23.884765625, 24.9404296875, 25.99609375, 27.0517578125, 28.107421875, 29.1630859375, 30.21875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 7.0, 4.0, 9.0, 15.0, 14.0, 29.0, 62.0, 100.0, 218.0, 1170.0, 1877.0, 339.0, 107.0, 45.0, 23.0, 18.0, 11.0, 9.0, 9.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-27.59375, -27.0084228515625, -26.423095703125, -25.8377685546875, -25.25244140625, -24.6671142578125, -24.081787109375, -23.4964599609375, -22.9111328125, -22.3258056640625, -21.740478515625, -21.1551513671875, -20.56982421875, -19.9844970703125, -19.399169921875, -18.8138427734375, -18.228515625, -17.6431884765625, -17.057861328125, -16.4725341796875, -15.88720703125, -15.3018798828125, -14.716552734375, -14.1312255859375, -13.5458984375, -12.9605712890625, -12.375244140625, -11.7899169921875, -11.20458984375, -10.6192626953125, -10.033935546875, -9.4486083984375, -8.86328125, -8.2779541015625, -7.692626953125, -7.1072998046875, -6.52197265625, -5.9366455078125, -5.351318359375, -4.7659912109375, -4.1806640625, -3.5953369140625, -3.010009765625, -2.4246826171875, -1.83935546875, -1.2540283203125, -0.668701171875, -0.0833740234375, 0.501953125, 1.0872802734375, 1.672607421875, 2.2579345703125, 2.84326171875, 3.4285888671875, 4.013916015625, 4.5992431640625, 5.1845703125, 5.7698974609375, 6.355224609375, 6.9405517578125, 7.52587890625, 8.1112060546875, 8.696533203125, 9.2818603515625, 9.8671875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 10.0, 25.0, 44.0, 95.0, 155.0, 238.0, 207.0, 133.0, 50.0, 15.0, 11.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.86087036132812, -150.78329467773438, -146.7057342529297, -142.62815856933594, -138.5505828857422, -134.4730224609375, -130.39544677734375, -126.31787872314453, -122.24031066894531, -118.1627426147461, -114.08516693115234, -110.00759887695312, -105.9300308227539, -101.85246276855469, -97.77488708496094, -93.69731903076172, -89.61974334716797, -85.54217529296875, -81.464599609375, -77.38703155517578, -73.30946350097656, -69.23188781738281, -65.1543197631836, -61.076751708984375, -56.99917984008789, -52.921607971191406, -48.84403991699219, -44.7664680480957, -40.68889617919922, -36.611328125, -32.533756256103516, -28.456186294555664, -24.378623962402344, -20.301054000854492, -16.22348403930664, -12.145912170410156, -8.068342208862305, -3.990772247314453, 0.08679962158203125, 4.164369583129883, 8.241939544677734, 12.319509506225586, 16.397079467773438, 20.474651336669922, 24.552221298217773, 28.629791259765625, 32.70736312866211, 36.784934997558594, 40.86250305175781, 44.9400749206543, 49.017642974853516, 53.09521484375, 57.17278289794922, 61.2503547668457, 65.32792663574219, 69.4054946899414, 73.48306274414062, 77.56063079833984, 81.6382064819336, 85.71577453613281, 89.79334259033203, 93.87091064453125, 97.948486328125, 102.02605438232422, 106.10363006591797]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 3.0, 7.0, 11.0, 4.0, 11.0, 14.0, 17.0, 24.0, 25.0, 28.0, 29.0, 35.0, 37.0, 52.0, 49.0, 54.0, 55.0, 61.0, 55.0, 67.0, 49.0, 47.0, 39.0, 37.0, 35.0, 40.0, 23.0, 23.0, 19.0, 8.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.24712371826172, -46.44053649902344, -44.633949279785156, -42.827362060546875, -41.020774841308594, -39.21418762207031, -37.40760040283203, -35.601009368896484, -33.7944221496582, -31.987834930419922, -30.18124771118164, -28.37466049194336, -26.568071365356445, -24.761484146118164, -22.954896926879883, -21.14830780029297, -19.34172248840332, -17.53513526916504, -15.728547096252441, -13.92195987701416, -12.115371704101562, -10.308784484863281, -8.502197265625, -6.695609092712402, -4.889021873474121, -3.0824341773986816, -1.2758467197418213, 0.5307407379150391, 2.3373284339904785, 4.143916130065918, 5.950503349304199, 7.757091522216797, 9.563678741455078, 11.37026596069336, 13.176854133605957, 14.983441352844238, 16.790029525756836, 18.596616744995117, 20.4032039642334, 22.209793090820312, 24.016380310058594, 25.822967529296875, 27.629554748535156, 29.436141967773438, 31.24273109436035, 33.04931640625, 34.85590362548828, 36.66249465942383, 38.469078063964844, 40.275665283203125, 42.082252502441406, 43.88883972167969, 45.69542694091797, 47.50201416015625, 49.30860137939453, 51.11519241333008, 52.92177963256836, 54.72836685180664, 56.53495407104492, 58.3415412902832, 60.148128509521484, 61.95471954345703, 63.76130676269531, 65.5678939819336, 67.37448120117188]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 4.0, 12.0, 9.0, 14.0, 25.0, 38.0, 70.0, 99.0, 161.0, 268.0, 609.0, 1213.0, 2875.0, 7884.0, 26713.0, 109189.0, 482872.0, 321087.0, 67673.0, 17979.0, 5785.0, 1990.0, 892.0, 460.0, 237.0, 150.0, 87.0, 43.0, 47.0, 25.0, 12.0, 7.0, 5.0, 5.0, 7.0, 1.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7109375, -11.3648681640625, -11.018798828125, -10.6727294921875, -10.32666015625, -9.9805908203125, -9.634521484375, -9.2884521484375, -8.9423828125, -8.5963134765625, -8.250244140625, -7.9041748046875, -7.55810546875, -7.2120361328125, -6.865966796875, -6.5198974609375, -6.173828125, -5.8277587890625, -5.481689453125, -5.1356201171875, -4.78955078125, -4.4434814453125, -4.097412109375, -3.7513427734375, -3.4052734375, -3.0592041015625, -2.713134765625, -2.3670654296875, -2.02099609375, -1.6749267578125, -1.328857421875, -0.9827880859375, -0.63671875, -0.2906494140625, 0.055419921875, 0.4014892578125, 0.74755859375, 1.0936279296875, 1.439697265625, 1.7857666015625, 2.1318359375, 2.4779052734375, 2.823974609375, 3.1700439453125, 3.51611328125, 3.8621826171875, 4.208251953125, 4.5543212890625, 4.900390625, 5.2464599609375, 5.592529296875, 5.9385986328125, 6.28466796875, 6.6307373046875, 6.976806640625, 7.3228759765625, 7.6689453125, 8.0150146484375, 8.361083984375, 8.7071533203125, 9.05322265625, 9.3992919921875, 9.745361328125, 10.0914306640625, 10.4375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 12.0, 10.0, 17.0, 27.0, 31.0, 32.0, 30.0, 46.0, 52.0, 48.0, 61.0, 67.0, 71.0, 66.0, 58.0, 54.0, 61.0, 51.0, 29.0, 37.0, 30.0, 22.0, 27.0, 11.0, 12.0, 1.0, 9.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.977294921875, -4.83349609375, -4.689697265625, -4.5458984375, -4.402099609375, -4.25830078125, -4.114501953125, -3.970703125, -3.826904296875, -3.68310546875, -3.539306640625, -3.3955078125, -3.251708984375, -3.10791015625, -2.964111328125, -2.8203125, -2.676513671875, -2.53271484375, -2.388916015625, -2.2451171875, -2.101318359375, -1.95751953125, -1.813720703125, -1.669921875, -1.526123046875, -1.38232421875, -1.238525390625, -1.0947265625, -0.950927734375, -0.80712890625, -0.663330078125, -0.51953125, -0.375732421875, -0.23193359375, -0.088134765625, 0.0556640625, 0.199462890625, 0.34326171875, 0.487060546875, 0.630859375, 0.774658203125, 0.91845703125, 1.062255859375, 1.2060546875, 1.349853515625, 1.49365234375, 1.637451171875, 1.78125, 1.925048828125, 2.06884765625, 2.212646484375, 2.3564453125, 2.500244140625, 2.64404296875, 2.787841796875, 2.931640625, 3.075439453125, 3.21923828125, 3.363037109375, 3.5068359375, 3.650634765625, 3.79443359375, 3.938232421875, 4.08203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 12.0, 13.0, 17.0, 15.0, 28.0, 41.0, 65.0, 72.0, 114.0, 165.0, 231.0, 454.0, 931.0, 1954.0, 5627.0, 26725.0, 521581.0, 455048.0, 26094.0, 5410.0, 1832.0, 864.0, 490.0, 239.0, 151.0, 101.0, 71.0, 50.0, 25.0, 30.0, 22.0, 10.0, 10.0, 12.0, 6.0, 5.0, 4.0, 9.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-20.484375, -19.843994140625, -19.20361328125, -18.563232421875, -17.9228515625, -17.282470703125, -16.64208984375, -16.001708984375, -15.361328125, -14.720947265625, -14.08056640625, -13.440185546875, -12.7998046875, -12.159423828125, -11.51904296875, -10.878662109375, -10.23828125, -9.597900390625, -8.95751953125, -8.317138671875, -7.6767578125, -7.036376953125, -6.39599609375, -5.755615234375, -5.115234375, -4.474853515625, -3.83447265625, -3.194091796875, -2.5537109375, -1.913330078125, -1.27294921875, -0.632568359375, 0.0078125, 0.648193359375, 1.28857421875, 1.928955078125, 2.5693359375, 3.209716796875, 3.85009765625, 4.490478515625, 5.130859375, 5.771240234375, 6.41162109375, 7.052001953125, 7.6923828125, 8.332763671875, 8.97314453125, 9.613525390625, 10.25390625, 10.894287109375, 11.53466796875, 12.175048828125, 12.8154296875, 13.455810546875, 14.09619140625, 14.736572265625, 15.376953125, 16.017333984375, 16.65771484375, 17.298095703125, 17.9384765625, 18.578857421875, 19.21923828125, 19.859619140625, 20.5]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 3.0, 7.0, 15.0, 18.0, 26.0, 24.0, 23.0, 41.0, 46.0, 48.0, 51.0, 68.0, 69.0, 70.0, 62.0, 74.0, 53.0, 58.0, 36.0, 37.0, 40.0, 31.0, 21.0, 18.0, 8.0, 9.0, 8.0, 4.0, 7.0, 5.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.078125, -23.36181640625, -22.6455078125, -21.92919921875, -21.212890625, -20.49658203125, -19.7802734375, -19.06396484375, -18.34765625, -17.63134765625, -16.9150390625, -16.19873046875, -15.482421875, -14.76611328125, -14.0498046875, -13.33349609375, -12.6171875, -11.90087890625, -11.1845703125, -10.46826171875, -9.751953125, -9.03564453125, -8.3193359375, -7.60302734375, -6.88671875, -6.17041015625, -5.4541015625, -4.73779296875, -4.021484375, -3.30517578125, -2.5888671875, -1.87255859375, -1.15625, -0.43994140625, 0.2763671875, 0.99267578125, 1.708984375, 2.42529296875, 3.1416015625, 3.85791015625, 4.57421875, 5.29052734375, 6.0068359375, 6.72314453125, 7.439453125, 8.15576171875, 8.8720703125, 9.58837890625, 10.3046875, 11.02099609375, 11.7373046875, 12.45361328125, 13.169921875, 13.88623046875, 14.6025390625, 15.31884765625, 16.03515625, 16.75146484375, 17.4677734375, 18.18408203125, 18.900390625, 19.61669921875, 20.3330078125, 21.04931640625, 21.765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 11.0, 10.0, 20.0, 24.0, 32.0, 58.0, 119.0, 316.0, 959.0, 7699.0, 878127.0, 156349.0, 3659.0, 652.0, 247.0, 105.0, 61.0, 35.0, 18.0, 12.0, 7.0, 8.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.5146484375, -17.951171875, -17.3876953125, -16.82421875, -16.2607421875, -15.697265625, -15.1337890625, -14.5703125, -14.0068359375, -13.443359375, -12.8798828125, -12.31640625, -11.7529296875, -11.189453125, -10.6259765625, -10.0625, -9.4990234375, -8.935546875, -8.3720703125, -7.80859375, -7.2451171875, -6.681640625, -6.1181640625, -5.5546875, -4.9912109375, -4.427734375, -3.8642578125, -3.30078125, -2.7373046875, -2.173828125, -1.6103515625, -1.046875, -0.4833984375, 0.080078125, 0.6435546875, 1.20703125, 1.7705078125, 2.333984375, 2.8974609375, 3.4609375, 4.0244140625, 4.587890625, 5.1513671875, 5.71484375, 6.2783203125, 6.841796875, 7.4052734375, 7.96875, 8.5322265625, 9.095703125, 9.6591796875, 10.22265625, 10.7861328125, 11.349609375, 11.9130859375, 12.4765625, 13.0400390625, 13.603515625, 14.1669921875, 14.73046875, 15.2939453125, 15.857421875, 16.4208984375, 16.984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 7.0, 3.0, 11.0, 10.0, 21.0, 23.0, 43.0, 66.0, 130.0, 210.0, 172.0, 95.0, 59.0, 29.0, 20.0, 27.0, 24.0, 7.0, 8.0, 5.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011930465698242188, -0.0011500567197799683, -0.0011070668697357178, -0.0010640770196914673, -0.0010210871696472168, -0.0009780973196029663, -0.0009351074695587158, -0.0008921176195144653, -0.0008491277694702148, -0.0008061379194259644, -0.0007631480693817139, -0.0007201582193374634, -0.0006771683692932129, -0.0006341785192489624, -0.0005911886692047119, -0.0005481988191604614, -0.0005052089691162109, -0.00046221911907196045, -0.00041922926902770996, -0.00037623941898345947, -0.000333249568939209, -0.0002902597188949585, -0.000247269868850708, -0.00020428001880645752, -0.00016129016876220703, -0.00011830031871795654, -7.531046867370605e-05, -3.2320618629455566e-05, 1.0669231414794922e-05, 5.365908145904541e-05, 9.66489315032959e-05, 0.0001396387815475464, 0.00018262863159179688, 0.00022561848163604736, 0.00026860833168029785, 0.00031159818172454834, 0.00035458803176879883, 0.0003975778818130493, 0.0004405677318572998, 0.0004835575819015503, 0.0005265474319458008, 0.0005695372819900513, 0.0006125271320343018, 0.0006555169820785522, 0.0006985068321228027, 0.0007414966821670532, 0.0007844865322113037, 0.0008274763822555542, 0.0008704662322998047, 0.0009134560823440552, 0.0009564459323883057, 0.0009994357824325562, 0.0010424256324768066, 0.0010854154825210571, 0.0011284053325653076, 0.001171395182609558, 0.0012143850326538086, 0.001257374882698059, 0.0013003647327423096, 0.00134335458278656, 0.0013863444328308105, 0.001429334282875061, 0.0014723241329193115, 0.001515313982963562, 0.0015583038330078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 13.0, 10.0, 14.0, 20.0, 22.0, 41.0, 52.0, 79.0, 136.0, 220.0, 495.0, 1023.0, 2635.0, 10880.0, 109924.0, 861633.0, 50493.0, 7138.0, 1974.0, 796.0, 370.0, 197.0, 119.0, 76.0, 48.0, 40.0, 28.0, 20.0, 15.0, 7.0, 12.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.828125, -11.51983642578125, -11.2115478515625, -10.90325927734375, -10.594970703125, -10.28668212890625, -9.9783935546875, -9.67010498046875, -9.36181640625, -9.05352783203125, -8.7452392578125, -8.43695068359375, -8.128662109375, -7.82037353515625, -7.5120849609375, -7.20379638671875, -6.8955078125, -6.58721923828125, -6.2789306640625, -5.97064208984375, -5.662353515625, -5.35406494140625, -5.0457763671875, -4.73748779296875, -4.42919921875, -4.12091064453125, -3.8126220703125, -3.50433349609375, -3.196044921875, -2.88775634765625, -2.5794677734375, -2.27117919921875, -1.962890625, -1.65460205078125, -1.3463134765625, -1.03802490234375, -0.729736328125, -0.42144775390625, -0.1131591796875, 0.19512939453125, 0.50341796875, 0.81170654296875, 1.1199951171875, 1.42828369140625, 1.736572265625, 2.04486083984375, 2.3531494140625, 2.66143798828125, 2.9697265625, 3.27801513671875, 3.5863037109375, 3.89459228515625, 4.202880859375, 4.51116943359375, 4.8194580078125, 5.12774658203125, 5.43603515625, 5.74432373046875, 6.0526123046875, 6.36090087890625, 6.669189453125, 6.97747802734375, 7.2857666015625, 7.59405517578125, 7.90234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 10.0, 9.0, 8.0, 15.0, 18.0, 30.0, 59.0, 46.0, 97.0, 151.0, 165.0, 124.0, 81.0, 59.0, 46.0, 18.0, 19.0, 15.0, 16.0, 10.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.4765625, -14.16424560546875, -13.8519287109375, -13.53961181640625, -13.227294921875, -12.91497802734375, -12.6026611328125, -12.29034423828125, -11.97802734375, -11.66571044921875, -11.3533935546875, -11.04107666015625, -10.728759765625, -10.41644287109375, -10.1041259765625, -9.79180908203125, -9.4794921875, -9.16717529296875, -8.8548583984375, -8.54254150390625, -8.230224609375, -7.91790771484375, -7.6055908203125, -7.29327392578125, -6.98095703125, -6.66864013671875, -6.3563232421875, -6.04400634765625, -5.731689453125, -5.41937255859375, -5.1070556640625, -4.79473876953125, -4.482421875, -4.17010498046875, -3.8577880859375, -3.54547119140625, -3.233154296875, -2.92083740234375, -2.6085205078125, -2.29620361328125, -1.98388671875, -1.67156982421875, -1.3592529296875, -1.04693603515625, -0.734619140625, -0.42230224609375, -0.1099853515625, 0.20233154296875, 0.5146484375, 0.82696533203125, 1.1392822265625, 1.45159912109375, 1.763916015625, 2.07623291015625, 2.3885498046875, 2.70086669921875, 3.01318359375, 3.32550048828125, 3.6378173828125, 3.95013427734375, 4.262451171875, 4.57476806640625, 4.8870849609375, 5.19940185546875, 5.51171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 21.0, 176.0, 426.0, 276.0, 69.0, 18.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-465.4208068847656, -456.759521484375, -448.09820556640625, -439.4369201660156, -430.775634765625, -422.11431884765625, -413.4530334472656, -404.7917175292969, -396.13043212890625, -387.4691467285156, -378.8078308105469, -370.14654541015625, -361.4852294921875, -352.8239440917969, -344.16265869140625, -335.5013427734375, -326.8400573730469, -318.17877197265625, -309.5174560546875, -300.8561706542969, -292.19488525390625, -283.5335693359375, -274.8722839355469, -266.2109680175781, -257.5496826171875, -248.8883819580078, -240.22708129882812, -231.5657958984375, -222.9044952392578, -214.24319458007812, -205.5819091796875, -196.9206085205078, -188.25927734375, -179.5979766845703, -170.93667602539062, -162.275390625, -153.6140899658203, -144.95278930664062, -136.29150390625, -127.63020324707031, -118.96890258789062, -110.30760192871094, -101.64630889892578, -92.98501586914062, -84.32371520996094, -75.66241455078125, -67.0011215209961, -58.33982467651367, -49.67852783203125, -41.01723098754883, -32.355934143066406, -23.694637298583984, -15.033340454101562, -6.372043609619141, 2.2892532348632812, 10.950550079345703, 19.611846923828125, 28.273143768310547, 36.93444061279297, 45.59573745727539, 54.25703430175781, 62.918331146240234, 71.57962799072266, 80.24092102050781, 88.9022216796875]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 13.0, 20.0, 31.0, 34.0, 43.0, 65.0, 52.0, 76.0, 99.0, 108.0, 126.0, 77.0, 52.0, 60.0, 34.0, 32.0, 23.0, 14.0, 12.0, 5.0, 6.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.25932312011719, -105.12742614746094, -100.99553680419922, -96.86363983154297, -92.73175048828125, -88.599853515625, -84.46795654296875, -80.3360595703125, -76.20417022705078, -72.07227325439453, -67.94038391113281, -63.80848693847656, -59.67659378051758, -55.544700622558594, -51.412803649902344, -47.28091049194336, -43.149017333984375, -39.01712417602539, -34.885231018066406, -30.753334045410156, -26.621440887451172, -22.489547729492188, -18.35765266418457, -14.225757598876953, -10.093864440917969, -5.961970329284668, -1.8300762176513672, 2.3018178939819336, 6.433712005615234, 10.565605163574219, 14.697500228881836, 18.829395294189453, 22.9613037109375, 27.093196868896484, 31.2250919342041, 35.35698699951172, 39.4888801574707, 43.62077331542969, 47.75267028808594, 51.88456344604492, 56.016456604003906, 60.14834976196289, 64.28024291992188, 68.41213989257812, 72.54403686523438, 76.6759262084961, 80.80782318115234, 84.93971252441406, 89.07160949707031, 93.20350646972656, 97.33539581298828, 101.46729278564453, 105.59918212890625, 109.7310791015625, 113.86297607421875, 117.994873046875, 122.12676239013672, 126.25865936279297, 130.3905487060547, 134.52244567871094, 138.6543426513672, 142.78622436523438, 146.91812133789062, 151.05001831054688, 155.18191528320312]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 5.0, 8.0, 11.0, 11.0, 23.0, 41.0, 75.0, 120.0, 357.0, 1109.0, 4344.0, 26079.0, 1727802.0, 2400565.0, 27539.0, 4238.0, 1141.0, 352.0, 164.0, 100.0, 73.0, 29.0, 21.0, 17.0, 15.0, 10.0, 8.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3359375, -9.8665771484375, -9.397216796875, -8.9278564453125, -8.45849609375, -7.9891357421875, -7.519775390625, -7.0504150390625, -6.5810546875, -6.1116943359375, -5.642333984375, -5.1729736328125, -4.70361328125, -4.2342529296875, -3.764892578125, -3.2955322265625, -2.826171875, -2.3568115234375, -1.887451171875, -1.4180908203125, -0.94873046875, -0.4793701171875, -0.010009765625, 0.4593505859375, 0.9287109375, 1.3980712890625, 1.867431640625, 2.3367919921875, 2.80615234375, 3.2755126953125, 3.744873046875, 4.2142333984375, 4.68359375, 5.1529541015625, 5.622314453125, 6.0916748046875, 6.56103515625, 7.0303955078125, 7.499755859375, 7.9691162109375, 8.4384765625, 8.9078369140625, 9.377197265625, 9.8465576171875, 10.31591796875, 10.7852783203125, 11.254638671875, 11.7239990234375, 12.193359375, 12.6627197265625, 13.132080078125, 13.6014404296875, 14.07080078125, 14.5401611328125, 15.009521484375, 15.4788818359375, 15.9482421875, 16.4176025390625, 16.886962890625, 17.3563232421875, 17.82568359375, 18.2950439453125, 18.764404296875, 19.2337646484375, 19.703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 7.0, 30.0, 45.0, 79.0, 116.0, 182.0, 187.0, 133.0, 105.0, 63.0, 31.0, 15.0, 9.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.484619140625, -9.09423828125, -8.703857421875, -8.3134765625, -7.923095703125, -7.53271484375, -7.142333984375, -6.751953125, -6.361572265625, -5.97119140625, -5.580810546875, -5.1904296875, -4.800048828125, -4.40966796875, -4.019287109375, -3.62890625, -3.238525390625, -2.84814453125, -2.457763671875, -2.0673828125, -1.677001953125, -1.28662109375, -0.896240234375, -0.505859375, -0.115478515625, 0.27490234375, 0.665283203125, 1.0556640625, 1.446044921875, 1.83642578125, 2.226806640625, 2.6171875, 3.007568359375, 3.39794921875, 3.788330078125, 4.1787109375, 4.569091796875, 4.95947265625, 5.349853515625, 5.740234375, 6.130615234375, 6.52099609375, 6.911376953125, 7.3017578125, 7.692138671875, 8.08251953125, 8.472900390625, 8.86328125, 9.253662109375, 9.64404296875, 10.034423828125, 10.4248046875, 10.815185546875, 11.20556640625, 11.595947265625, 11.986328125, 12.376708984375, 12.76708984375, 13.157470703125, 13.5478515625, 13.938232421875, 14.32861328125, 14.718994140625, 15.109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 9.0, 8.0, 13.0, 19.0, 36.0, 51.0, 89.0, 182.0, 381.0, 647.0, 1252.0, 2699.0, 6021.0, 15641.0, 54405.0, 488446.0, 3374239.0, 195980.0, 34424.0, 11279.0, 4432.0, 1946.0, 954.0, 510.0, 258.0, 152.0, 85.0, 47.0, 22.0, 22.0, 11.0, 2.0, 9.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -5.973388671875, -5.72802734375, -5.482666015625, -5.2373046875, -4.991943359375, -4.74658203125, -4.501220703125, -4.255859375, -4.010498046875, -3.76513671875, -3.519775390625, -3.2744140625, -3.029052734375, -2.78369140625, -2.538330078125, -2.29296875, -2.047607421875, -1.80224609375, -1.556884765625, -1.3115234375, -1.066162109375, -0.82080078125, -0.575439453125, -0.330078125, -0.084716796875, 0.16064453125, 0.406005859375, 0.6513671875, 0.896728515625, 1.14208984375, 1.387451171875, 1.6328125, 1.878173828125, 2.12353515625, 2.368896484375, 2.6142578125, 2.859619140625, 3.10498046875, 3.350341796875, 3.595703125, 3.841064453125, 4.08642578125, 4.331787109375, 4.5771484375, 4.822509765625, 5.06787109375, 5.313232421875, 5.55859375, 5.803955078125, 6.04931640625, 6.294677734375, 6.5400390625, 6.785400390625, 7.03076171875, 7.276123046875, 7.521484375, 7.766845703125, 8.01220703125, 8.257568359375, 8.5029296875, 8.748291015625, 8.99365234375, 9.239013671875, 9.484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 10.0, 10.0, 16.0, 23.0, 37.0, 59.0, 110.0, 212.0, 556.0, 1210.0, 1003.0, 433.0, 163.0, 82.0, 44.0, 30.0, 15.0, 15.0, 9.0, 7.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.0384521484375, -8.725341796875, -8.4122314453125, -8.09912109375, -7.7860107421875, -7.472900390625, -7.1597900390625, -6.8466796875, -6.5335693359375, -6.220458984375, -5.9073486328125, -5.59423828125, -5.2811279296875, -4.968017578125, -4.6549072265625, -4.341796875, -4.0286865234375, -3.715576171875, -3.4024658203125, -3.08935546875, -2.7762451171875, -2.463134765625, -2.1500244140625, -1.8369140625, -1.5238037109375, -1.210693359375, -0.8975830078125, -0.58447265625, -0.2713623046875, 0.041748046875, 0.3548583984375, 0.66796875, 0.9810791015625, 1.294189453125, 1.6072998046875, 1.92041015625, 2.2335205078125, 2.546630859375, 2.8597412109375, 3.1728515625, 3.4859619140625, 3.799072265625, 4.1121826171875, 4.42529296875, 4.7384033203125, 5.051513671875, 5.3646240234375, 5.677734375, 5.9908447265625, 6.303955078125, 6.6170654296875, 6.93017578125, 7.2432861328125, 7.556396484375, 7.8695068359375, 8.1826171875, 8.4957275390625, 8.808837890625, 9.1219482421875, 9.43505859375, 9.7481689453125, 10.061279296875, 10.3743896484375, 10.6875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 53.0, 293.0, 449.0, 152.0, 28.0, 7.0, 5.0, 5.0, 1.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.9993438720703, -205.33248901367188, -199.6656494140625, -193.99879455566406, -188.33193969726562, -182.6650848388672, -176.99822998046875, -171.33139038085938, -165.66453552246094, -159.9976806640625, -154.33084106445312, -148.6639862060547, -142.99713134765625, -137.3302764892578, -131.66342163085938, -125.99658203125, -120.32972717285156, -114.66287231445312, -108.99602508544922, -103.32917785644531, -97.66232299804688, -91.99546813964844, -86.32862091064453, -80.66177368164062, -74.99491882324219, -69.32806396484375, -63.661216735839844, -57.99436569213867, -52.3275146484375, -46.66066360473633, -40.993812561035156, -35.326961517333984, -29.660125732421875, -23.993274688720703, -18.32642364501953, -12.65957260131836, -6.9927215576171875, -1.3258705139160156, 4.340980529785156, 10.007831573486328, 15.6746826171875, 21.341533660888672, 27.008384704589844, 32.675235748291016, 38.34208679199219, 44.00893783569336, 49.67578887939453, 55.3426399230957, 61.009490966796875, 66.67634582519531, 72.34319305419922, 78.01004028320312, 83.67689514160156, 89.34375, 95.0105972290039, 100.67744445800781, 106.34429931640625, 112.01115417480469, 117.6780014038086, 123.3448486328125, 129.01170349121094, 134.67855834960938, 140.34539794921875, 146.0122528076172, 151.67910766601562]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 7.0, 11.0, 14.0, 13.0, 21.0, 31.0, 34.0, 53.0, 57.0, 75.0, 67.0, 90.0, 89.0, 82.0, 76.0, 59.0, 53.0, 36.0, 28.0, 39.0, 21.0, 13.0, 12.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-69.08695983886719, -67.37101745605469, -65.65508270263672, -63.939144134521484, -62.22320556640625, -60.50726318359375, -58.79132843017578, -57.07538604736328, -55.35944747924805, -53.64350891113281, -51.92757034301758, -50.211631774902344, -48.49569320678711, -46.779754638671875, -45.063812255859375, -43.34787368774414, -41.631935119628906, -39.91599655151367, -38.20005798339844, -36.4841194152832, -34.76818084716797, -33.05223846435547, -31.336301803588867, -29.620361328125, -27.90442657470703, -26.188488006591797, -24.472549438476562, -22.756610870361328, -21.04067039489746, -19.324731826782227, -17.608793258666992, -15.892853736877441, -14.17691421508789, -12.460975646972656, -10.745036125183105, -9.029097557067871, -7.3131585121154785, -5.597219467163086, -3.8812808990478516, -2.165341377258301, -0.4494028091430664, 1.2665361166000366, 2.9824750423431396, 4.698413848876953, 6.414352893829346, 8.130291938781738, 9.846230506896973, 11.562170028686523, 13.278108596801758, 14.994047164916992, 16.709985733032227, 18.425926208496094, 20.141864776611328, 21.857803344726562, 23.573741912841797, 25.28968048095703, 27.005619049072266, 28.7215576171875, 30.437496185302734, 32.15343475341797, 33.8693733215332, 35.58531188964844, 37.30125427246094, 39.01719284057617, 40.733131408691406]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 10.0, 10.0, 23.0, 24.0, 23.0, 41.0, 73.0, 106.0, 157.0, 248.0, 470.0, 785.0, 1596.0, 3195.0, 7329.0, 17936.0, 50265.0, 153266.0, 419247.0, 263075.0, 82114.0, 28408.0, 10757.0, 4667.0, 2121.0, 1083.0, 598.0, 357.0, 196.0, 112.0, 64.0, 65.0, 36.0, 21.0, 21.0, 11.0, 7.0, 11.0, 11.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-7.93359375, -7.70513916015625, -7.4766845703125, -7.24822998046875, -7.019775390625, -6.79132080078125, -6.5628662109375, -6.33441162109375, -6.10595703125, -5.87750244140625, -5.6490478515625, -5.42059326171875, -5.192138671875, -4.96368408203125, -4.7352294921875, -4.50677490234375, -4.2783203125, -4.04986572265625, -3.8214111328125, -3.59295654296875, -3.364501953125, -3.13604736328125, -2.9075927734375, -2.67913818359375, -2.45068359375, -2.22222900390625, -1.9937744140625, -1.76531982421875, -1.536865234375, -1.30841064453125, -1.0799560546875, -0.85150146484375, -0.623046875, -0.39459228515625, -0.1661376953125, 0.06231689453125, 0.290771484375, 0.51922607421875, 0.7476806640625, 0.97613525390625, 1.20458984375, 1.43304443359375, 1.6614990234375, 1.88995361328125, 2.118408203125, 2.34686279296875, 2.5753173828125, 2.80377197265625, 3.0322265625, 3.26068115234375, 3.4891357421875, 3.71759033203125, 3.946044921875, 4.17449951171875, 4.4029541015625, 4.63140869140625, 4.85986328125, 5.08831787109375, 5.3167724609375, 5.54522705078125, 5.773681640625, 6.00213623046875, 6.2305908203125, 6.45904541015625, 6.6875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 10.0, 9.0, 9.0, 23.0, 25.0, 22.0, 40.0, 39.0, 48.0, 70.0, 77.0, 72.0, 61.0, 71.0, 67.0, 73.0, 54.0, 54.0, 49.0, 38.0, 20.0, 16.0, 18.0, 15.0, 3.0, 8.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.66351318359375, -4.5028076171875, -4.34210205078125, -4.181396484375, -4.02069091796875, -3.8599853515625, -3.69927978515625, -3.53857421875, -3.37786865234375, -3.2171630859375, -3.05645751953125, -2.895751953125, -2.73504638671875, -2.5743408203125, -2.41363525390625, -2.2529296875, -2.09222412109375, -1.9315185546875, -1.77081298828125, -1.610107421875, -1.44940185546875, -1.2886962890625, -1.12799072265625, -0.96728515625, -0.80657958984375, -0.6458740234375, -0.48516845703125, -0.324462890625, -0.16375732421875, -0.0030517578125, 0.15765380859375, 0.318359375, 0.47906494140625, 0.6397705078125, 0.80047607421875, 0.961181640625, 1.12188720703125, 1.2825927734375, 1.44329833984375, 1.60400390625, 1.76470947265625, 1.9254150390625, 2.08612060546875, 2.246826171875, 2.40753173828125, 2.5682373046875, 2.72894287109375, 2.8896484375, 3.05035400390625, 3.2110595703125, 3.37176513671875, 3.532470703125, 3.69317626953125, 3.8538818359375, 4.01458740234375, 4.17529296875, 4.33599853515625, 4.4967041015625, 4.65740966796875, 4.818115234375, 4.97882080078125, 5.1395263671875, 5.30023193359375, 5.4609375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 7.0, 5.0, 9.0, 10.0, 13.0, 21.0, 33.0, 42.0, 55.0, 79.0, 130.0, 230.0, 382.0, 662.0, 1323.0, 3324.0, 11113.0, 58962.0, 540829.0, 369881.0, 46468.0, 9365.0, 2869.0, 1152.0, 617.0, 339.0, 203.0, 126.0, 91.0, 63.0, 39.0, 26.0, 22.0, 13.0, 18.0, 6.0, 13.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.3515625, -12.9581298828125, -12.564697265625, -12.1712646484375, -11.77783203125, -11.3843994140625, -10.990966796875, -10.5975341796875, -10.2041015625, -9.8106689453125, -9.417236328125, -9.0238037109375, -8.63037109375, -8.2369384765625, -7.843505859375, -7.4500732421875, -7.056640625, -6.6632080078125, -6.269775390625, -5.8763427734375, -5.48291015625, -5.0894775390625, -4.696044921875, -4.3026123046875, -3.9091796875, -3.5157470703125, -3.122314453125, -2.7288818359375, -2.33544921875, -1.9420166015625, -1.548583984375, -1.1551513671875, -0.76171875, -0.3682861328125, 0.025146484375, 0.4185791015625, 0.81201171875, 1.2054443359375, 1.598876953125, 1.9923095703125, 2.3857421875, 2.7791748046875, 3.172607421875, 3.5660400390625, 3.95947265625, 4.3529052734375, 4.746337890625, 5.1397705078125, 5.533203125, 5.9266357421875, 6.320068359375, 6.7135009765625, 7.10693359375, 7.5003662109375, 7.893798828125, 8.2872314453125, 8.6806640625, 9.0740966796875, 9.467529296875, 9.8609619140625, 10.25439453125, 10.6478271484375, 11.041259765625, 11.4346923828125, 11.828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 5.0, 11.0, 11.0, 12.0, 13.0, 15.0, 30.0, 31.0, 43.0, 37.0, 33.0, 46.0, 44.0, 51.0, 51.0, 46.0, 51.0, 47.0, 46.0, 42.0, 48.0, 43.0, 46.0, 40.0, 27.0, 28.0, 24.0, 13.0, 13.0, 14.0, 13.0, 7.0, 2.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-15.421875, -14.972412109375, -14.52294921875, -14.073486328125, -13.6240234375, -13.174560546875, -12.72509765625, -12.275634765625, -11.826171875, -11.376708984375, -10.92724609375, -10.477783203125, -10.0283203125, -9.578857421875, -9.12939453125, -8.679931640625, -8.23046875, -7.781005859375, -7.33154296875, -6.882080078125, -6.4326171875, -5.983154296875, -5.53369140625, -5.084228515625, -4.634765625, -4.185302734375, -3.73583984375, -3.286376953125, -2.8369140625, -2.387451171875, -1.93798828125, -1.488525390625, -1.0390625, -0.589599609375, -0.14013671875, 0.309326171875, 0.7587890625, 1.208251953125, 1.65771484375, 2.107177734375, 2.556640625, 3.006103515625, 3.45556640625, 3.905029296875, 4.3544921875, 4.803955078125, 5.25341796875, 5.702880859375, 6.15234375, 6.601806640625, 7.05126953125, 7.500732421875, 7.9501953125, 8.399658203125, 8.84912109375, 9.298583984375, 9.748046875, 10.197509765625, 10.64697265625, 11.096435546875, 11.5458984375, 11.995361328125, 12.44482421875, 12.894287109375, 13.34375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 8.0, 4.0, 17.0, 19.0, 26.0, 49.0, 110.0, 290.0, 1075.0, 8770.0, 923849.0, 110114.0, 3199.0, 604.0, 194.0, 92.0, 48.0, 22.0, 13.0, 12.0, 10.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.609375, -14.163818359375, -13.71826171875, -13.272705078125, -12.8271484375, -12.381591796875, -11.93603515625, -11.490478515625, -11.044921875, -10.599365234375, -10.15380859375, -9.708251953125, -9.2626953125, -8.817138671875, -8.37158203125, -7.926025390625, -7.48046875, -7.034912109375, -6.58935546875, -6.143798828125, -5.6982421875, -5.252685546875, -4.80712890625, -4.361572265625, -3.916015625, -3.470458984375, -3.02490234375, -2.579345703125, -2.1337890625, -1.688232421875, -1.24267578125, -0.797119140625, -0.3515625, 0.093994140625, 0.53955078125, 0.985107421875, 1.4306640625, 1.876220703125, 2.32177734375, 2.767333984375, 3.212890625, 3.658447265625, 4.10400390625, 4.549560546875, 4.9951171875, 5.440673828125, 5.88623046875, 6.331787109375, 6.77734375, 7.222900390625, 7.66845703125, 8.114013671875, 8.5595703125, 9.005126953125, 9.45068359375, 9.896240234375, 10.341796875, 10.787353515625, 11.23291015625, 11.678466796875, 12.1240234375, 12.569580078125, 13.01513671875, 13.460693359375, 13.90625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 15.0, 12.0, 14.0, 19.0, 27.0, 33.0, 48.0, 75.0, 93.0, 110.0, 121.0, 103.0, 70.0, 63.0, 43.0, 24.0, 20.0, 15.0, 11.0, 17.0, 9.0, 8.0, 7.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0008258819580078125, -0.0008036792278289795, -0.0007814764976501465, -0.0007592737674713135, -0.0007370710372924805, -0.0007148683071136475, -0.0006926655769348145, -0.0006704628467559814, -0.0006482601165771484, -0.0006260573863983154, -0.0006038546562194824, -0.0005816519260406494, -0.0005594491958618164, -0.0005372464656829834, -0.0005150437355041504, -0.0004928410053253174, -0.0004706382751464844, -0.00044843554496765137, -0.00042623281478881836, -0.00040403008460998535, -0.00038182735443115234, -0.00035962462425231934, -0.00033742189407348633, -0.0003152191638946533, -0.0002930164337158203, -0.0002708137035369873, -0.0002486109733581543, -0.0002264082431793213, -0.00020420551300048828, -0.00018200278282165527, -0.00015980005264282227, -0.00013759732246398926, -0.00011539459228515625, -9.319186210632324e-05, -7.098913192749023e-05, -4.8786401748657227e-05, -2.658367156982422e-05, -4.380941390991211e-06, 1.7821788787841797e-05, 4.0024518966674805e-05, 6.222724914550781e-05, 8.442997932434082e-05, 0.00010663270950317383, 0.00012883543968200684, 0.00015103816986083984, 0.00017324090003967285, 0.00019544363021850586, 0.00021764636039733887, 0.00023984909057617188, 0.0002620518207550049, 0.0002842545509338379, 0.0003064572811126709, 0.0003286600112915039, 0.0003508627414703369, 0.0003730654716491699, 0.00039526820182800293, 0.00041747093200683594, 0.00043967366218566895, 0.00046187639236450195, 0.00048407912254333496, 0.000506281852722168, 0.000528484582901001, 0.000550687313079834, 0.000572890043258667, 0.0005950927734375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 7.0, 4.0, 12.0, 15.0, 23.0, 36.0, 42.0, 67.0, 129.0, 218.0, 415.0, 1034.0, 3033.0, 12271.0, 100604.0, 802271.0, 110040.0, 13012.0, 3129.0, 1133.0, 463.0, 219.0, 132.0, 72.0, 53.0, 41.0, 22.0, 10.0, 7.0, 10.0, 10.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.64453125, -5.45330810546875, -5.2620849609375, -5.07086181640625, -4.879638671875, -4.68841552734375, -4.4971923828125, -4.30596923828125, -4.11474609375, -3.92352294921875, -3.7322998046875, -3.54107666015625, -3.349853515625, -3.15863037109375, -2.9674072265625, -2.77618408203125, -2.5849609375, -2.39373779296875, -2.2025146484375, -2.01129150390625, -1.820068359375, -1.62884521484375, -1.4376220703125, -1.24639892578125, -1.05517578125, -0.86395263671875, -0.6727294921875, -0.48150634765625, -0.290283203125, -0.09906005859375, 0.0921630859375, 0.28338623046875, 0.474609375, 0.66583251953125, 0.8570556640625, 1.04827880859375, 1.239501953125, 1.43072509765625, 1.6219482421875, 1.81317138671875, 2.00439453125, 2.19561767578125, 2.3868408203125, 2.57806396484375, 2.769287109375, 2.96051025390625, 3.1517333984375, 3.34295654296875, 3.5341796875, 3.72540283203125, 3.9166259765625, 4.10784912109375, 4.299072265625, 4.49029541015625, 4.6815185546875, 4.87274169921875, 5.06396484375, 5.25518798828125, 5.4464111328125, 5.63763427734375, 5.828857421875, 6.02008056640625, 6.2113037109375, 6.40252685546875, 6.59375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 8.0, 4.0, 8.0, 14.0, 18.0, 21.0, 29.0, 40.0, 53.0, 96.0, 116.0, 136.0, 121.0, 108.0, 60.0, 52.0, 38.0, 14.0, 15.0, 17.0, 14.0, 7.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -3.9573974609375, -3.781982421875, -3.6065673828125, -3.43115234375, -3.2557373046875, -3.080322265625, -2.9049072265625, -2.7294921875, -2.5540771484375, -2.378662109375, -2.2032470703125, -2.02783203125, -1.8524169921875, -1.677001953125, -1.5015869140625, -1.326171875, -1.1507568359375, -0.975341796875, -0.7999267578125, -0.62451171875, -0.4490966796875, -0.273681640625, -0.0982666015625, 0.0771484375, 0.2525634765625, 0.427978515625, 0.6033935546875, 0.77880859375, 0.9542236328125, 1.129638671875, 1.3050537109375, 1.48046875, 1.6558837890625, 1.831298828125, 2.0067138671875, 2.18212890625, 2.3575439453125, 2.532958984375, 2.7083740234375, 2.8837890625, 3.0592041015625, 3.234619140625, 3.4100341796875, 3.58544921875, 3.7608642578125, 3.936279296875, 4.1116943359375, 4.287109375, 4.4625244140625, 4.637939453125, 4.8133544921875, 4.98876953125, 5.1641845703125, 5.339599609375, 5.5150146484375, 5.6904296875, 5.8658447265625, 6.041259765625, 6.2166748046875, 6.39208984375, 6.5675048828125, 6.742919921875, 6.9183349609375, 7.09375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 6.0, 5.0, 14.0, 33.0, 116.0, 252.0, 309.0, 157.0, 54.0, 29.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.46949768066406, -97.07816314697266, -92.68682861328125, -88.29549407958984, -83.90415954589844, -79.51282501220703, -75.12149047851562, -70.73015594482422, -66.33882141113281, -61.947486877441406, -57.55615234375, -53.164817810058594, -48.77348327636719, -44.38214874267578, -39.990814208984375, -35.59947967529297, -31.208145141601562, -26.816810607910156, -22.42547607421875, -18.034141540527344, -13.642807006835938, -9.251472473144531, -4.860137939453125, -0.46880340576171875, 3.9225311279296875, 8.313865661621094, 12.7052001953125, 17.096534729003906, 21.487869262695312, 25.87920379638672, 30.270538330078125, 34.66187286376953, 39.05320739746094, 43.444541931152344, 47.83587646484375, 52.227210998535156, 56.61854553222656, 61.00988006591797, 65.40121459960938, 69.79254913330078, 74.18388366699219, 78.5752182006836, 82.966552734375, 87.3578872680664, 91.74922180175781, 96.14055633544922, 100.53189086914062, 104.92322540283203, 109.31455993652344, 113.70589447021484, 118.09722900390625, 122.48856353759766, 126.87989807128906, 131.271240234375, 135.66256713867188, 140.05389404296875, 144.4452362060547, 148.83657836914062, 153.2279052734375, 157.61923217773438, 162.0105743408203, 166.40191650390625, 170.79324340820312, 175.1845703125, 179.57591247558594]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 10.0, 4.0, 8.0, 10.0, 16.0, 27.0, 18.0, 32.0, 31.0, 33.0, 57.0, 52.0, 55.0, 80.0, 100.0, 75.0, 69.0, 59.0, 67.0, 50.0, 51.0, 25.0, 17.0, 23.0, 13.0, 11.0, 8.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.40533447265625, -49.729209899902344, -47.05308532714844, -44.37696075439453, -41.700836181640625, -39.02471160888672, -36.34858703613281, -33.672462463378906, -30.996335983276367, -28.32021141052246, -25.644086837768555, -22.967960357666016, -20.29183578491211, -17.615711212158203, -14.939586639404297, -12.26346206665039, -9.587337493896484, -6.911212921142578, -4.235087871551514, -1.5589628219604492, 1.117161750793457, 3.7932863235473633, 6.469411849975586, 9.145536422729492, 11.821660995483398, 14.497785568237305, 17.17391014099121, 19.85003662109375, 22.526161193847656, 25.202285766601562, 27.87841033935547, 30.554534912109375, 33.23065948486328, 35.90678405761719, 38.582908630371094, 41.259033203125, 43.935157775878906, 46.61128234863281, 49.28740692138672, 51.963531494140625, 54.63965606689453, 57.31578063964844, 59.991905212402344, 62.66802978515625, 65.34415435791016, 68.02027893066406, 70.69640350341797, 73.37252807617188, 76.04866027832031, 78.72478485107422, 81.40090942382812, 84.07703399658203, 86.75315856933594, 89.42928314208984, 92.10540771484375, 94.78153228759766, 97.45765686035156, 100.13378143310547, 102.80990600585938, 105.48603057861328, 108.16215515136719, 110.8382797241211, 113.514404296875, 116.1905288696289, 118.86665344238281]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 8.0, 19.0, 27.0, 50.0, 90.0, 201.0, 483.0, 1310.0, 4768.0, 25171.0, 383160.0, 3637214.0, 124415.0, 12608.0, 2821.0, 970.0, 447.0, 200.0, 110.0, 68.0, 36.0, 34.0, 19.0, 10.0, 14.0, 13.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.95703125, -7.60089111328125, -7.2447509765625, -6.88861083984375, -6.532470703125, -6.17633056640625, -5.8201904296875, -5.46405029296875, -5.10791015625, -4.75177001953125, -4.3956298828125, -4.03948974609375, -3.683349609375, -3.32720947265625, -2.9710693359375, -2.61492919921875, -2.2587890625, -1.90264892578125, -1.5465087890625, -1.19036865234375, -0.834228515625, -0.47808837890625, -0.1219482421875, 0.23419189453125, 0.59033203125, 0.94647216796875, 1.3026123046875, 1.65875244140625, 2.014892578125, 2.37103271484375, 2.7271728515625, 3.08331298828125, 3.439453125, 3.79559326171875, 4.1517333984375, 4.50787353515625, 4.864013671875, 5.22015380859375, 5.5762939453125, 5.93243408203125, 6.28857421875, 6.64471435546875, 7.0008544921875, 7.35699462890625, 7.713134765625, 8.06927490234375, 8.4254150390625, 8.78155517578125, 9.1376953125, 9.49383544921875, 9.8499755859375, 10.20611572265625, 10.562255859375, 10.91839599609375, 11.2745361328125, 11.63067626953125, 11.98681640625, 12.34295654296875, 12.6990966796875, 13.05523681640625, 13.411376953125, 13.76751708984375, 14.1236572265625, 14.47979736328125, 14.8359375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 6.0, 5.0, 21.0, 24.0, 32.0, 48.0, 81.0, 80.0, 104.0, 80.0, 106.0, 95.0, 90.0, 67.0, 72.0, 40.0, 27.0, 16.0, 6.0, 10.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.0147705078125, -1.818603515625, -1.6224365234375, -1.42626953125, -1.2301025390625, -1.033935546875, -0.8377685546875, -0.6416015625, -0.4454345703125, -0.249267578125, -0.0531005859375, 0.14306640625, 0.3392333984375, 0.535400390625, 0.7315673828125, 0.927734375, 1.1239013671875, 1.320068359375, 1.5162353515625, 1.71240234375, 1.9085693359375, 2.104736328125, 2.3009033203125, 2.4970703125, 2.6932373046875, 2.889404296875, 3.0855712890625, 3.28173828125, 3.4779052734375, 3.674072265625, 3.8702392578125, 4.06640625, 4.2625732421875, 4.458740234375, 4.6549072265625, 4.85107421875, 5.0472412109375, 5.243408203125, 5.4395751953125, 5.6357421875, 5.8319091796875, 6.028076171875, 6.2242431640625, 6.42041015625, 6.6165771484375, 6.812744140625, 7.0089111328125, 7.205078125, 7.4012451171875, 7.597412109375, 7.7935791015625, 7.98974609375, 8.1859130859375, 8.382080078125, 8.5782470703125, 8.7744140625, 8.9705810546875, 9.166748046875, 9.3629150390625, 9.55908203125, 9.7552490234375, 9.951416015625, 10.1475830078125, 10.34375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 15.0, 16.0, 28.0, 45.0, 112.0, 208.0, 471.0, 1439.0, 5171.0, 23208.0, 173148.0, 3487647.0, 452691.0, 39261.0, 7469.0, 2068.0, 650.0, 279.0, 149.0, 84.0, 41.0, 29.0, 14.0, 11.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9375, -8.625732421875, -8.31396484375, -8.002197265625, -7.6904296875, -7.378662109375, -7.06689453125, -6.755126953125, -6.443359375, -6.131591796875, -5.81982421875, -5.508056640625, -5.1962890625, -4.884521484375, -4.57275390625, -4.260986328125, -3.94921875, -3.637451171875, -3.32568359375, -3.013916015625, -2.7021484375, -2.390380859375, -2.07861328125, -1.766845703125, -1.455078125, -1.143310546875, -0.83154296875, -0.519775390625, -0.2080078125, 0.103759765625, 0.41552734375, 0.727294921875, 1.0390625, 1.350830078125, 1.66259765625, 1.974365234375, 2.2861328125, 2.597900390625, 2.90966796875, 3.221435546875, 3.533203125, 3.844970703125, 4.15673828125, 4.468505859375, 4.7802734375, 5.092041015625, 5.40380859375, 5.715576171875, 6.02734375, 6.339111328125, 6.65087890625, 6.962646484375, 7.2744140625, 7.586181640625, 7.89794921875, 8.209716796875, 8.521484375, 8.833251953125, 9.14501953125, 9.456787109375, 9.7685546875, 10.080322265625, 10.39208984375, 10.703857421875, 11.015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 3.0, 6.0, 9.0, 3.0, 12.0, 16.0, 17.0, 20.0, 30.0, 36.0, 37.0, 54.0, 73.0, 111.0, 180.0, 218.0, 390.0, 591.0, 735.0, 543.0, 335.0, 195.0, 114.0, 103.0, 44.0, 49.0, 34.0, 35.0, 20.0, 8.0, 15.0, 10.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5, -5.29058837890625, -5.0811767578125, -4.87176513671875, -4.662353515625, -4.45294189453125, -4.2435302734375, -4.03411865234375, -3.82470703125, -3.61529541015625, -3.4058837890625, -3.19647216796875, -2.987060546875, -2.77764892578125, -2.5682373046875, -2.35882568359375, -2.1494140625, -1.94000244140625, -1.7305908203125, -1.52117919921875, -1.311767578125, -1.10235595703125, -0.8929443359375, -0.68353271484375, -0.47412109375, -0.26470947265625, -0.0552978515625, 0.15411376953125, 0.363525390625, 0.57293701171875, 0.7823486328125, 0.99176025390625, 1.201171875, 1.41058349609375, 1.6199951171875, 1.82940673828125, 2.038818359375, 2.24822998046875, 2.4576416015625, 2.66705322265625, 2.87646484375, 3.08587646484375, 3.2952880859375, 3.50469970703125, 3.714111328125, 3.92352294921875, 4.1329345703125, 4.34234619140625, 4.5517578125, 4.76116943359375, 4.9705810546875, 5.17999267578125, 5.389404296875, 5.59881591796875, 5.8082275390625, 6.01763916015625, 6.22705078125, 6.43646240234375, 6.6458740234375, 6.85528564453125, 7.064697265625, 7.27410888671875, 7.4835205078125, 7.69293212890625, 7.90234375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 10.0, 22.0, 36.0, 77.0, 150.0, 189.0, 192.0, 140.0, 91.0, 40.0, 15.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.53693389892578, -55.8853874206543, -53.23383712768555, -50.58229064941406, -47.93074035644531, -45.27919387817383, -42.627647399902344, -39.976097106933594, -37.32455062866211, -34.673004150390625, -32.021453857421875, -29.36990737915039, -26.718358993530273, -24.066810607910156, -21.415264129638672, -18.763715744018555, -16.112167358398438, -13.46061897277832, -10.80907154083252, -8.157524108886719, -5.505975723266602, -2.8544273376464844, -0.2028799057006836, 2.448667526245117, 5.100215911865234, 7.751763820648193, 10.403311729431152, 13.054859161376953, 15.70640754699707, 18.357955932617188, 21.009502410888672, 23.66105079650879, 26.312591552734375, 28.964139938354492, 31.61568832397461, 34.267234802246094, 36.918785095214844, 39.57033157348633, 42.22187805175781, 44.87342834472656, 47.52497482299805, 50.17652130126953, 52.82807159423828, 55.479618072509766, 58.13116455078125, 60.78271484375, 63.434261322021484, 66.08580780029297, 68.73735809326172, 71.38890838623047, 74.04045104980469, 76.69200134277344, 79.34355163574219, 81.99510192871094, 84.64664459228516, 87.2981948852539, 89.94973754882812, 92.60128784179688, 95.2528305053711, 97.90438079833984, 100.5559310913086, 103.20747375488281, 105.85902404785156, 108.51057434082031, 111.16212463378906]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 12.0, 20.0, 16.0, 20.0, 26.0, 37.0, 36.0, 38.0, 50.0, 49.0, 62.0, 65.0, 67.0, 53.0, 65.0, 59.0, 57.0, 50.0, 38.0, 52.0, 35.0, 19.0, 15.0, 12.0, 8.0, 12.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-61.19279861450195, -59.783447265625, -58.37409973144531, -56.96474838256836, -55.55540084838867, -54.14604949951172, -52.73670196533203, -51.32735061645508, -49.917999267578125, -48.50864791870117, -47.099300384521484, -45.68994903564453, -44.280601501464844, -42.87125015258789, -41.46189880371094, -40.05255126953125, -38.64320373535156, -37.23385238647461, -35.82450485229492, -34.41515350341797, -33.00580596923828, -31.596454620361328, -30.187105178833008, -28.777755737304688, -27.368404388427734, -25.959054946899414, -24.549705505371094, -23.14035415649414, -21.73100471496582, -20.3216552734375, -18.91230583190918, -17.50295639038086, -16.093603134155273, -14.684253692626953, -13.274903297424316, -11.865553855895996, -10.45620346069336, -9.046854019165039, -7.637504577636719, -6.228154182434082, -4.818804740905762, -3.409454822540283, -2.000105142593384, -0.5907554626464844, 0.8185944557189941, 2.2279443740844727, 3.637293815612793, 5.04664421081543, 6.45599365234375, 7.8653435707092285, 9.274693489074707, 10.684042930603027, 12.093393325805664, 13.502742767333984, 14.912092208862305, 16.321441650390625, 17.730792999267578, 19.1401424407959, 20.54949188232422, 21.958843231201172, 23.368192672729492, 24.777542114257812, 26.186891555786133, 27.596240997314453, 29.005590438842773]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 8.0, 11.0, 10.0, 7.0, 20.0, 24.0, 35.0, 55.0, 89.0, 140.0, 216.0, 346.0, 629.0, 1209.0, 2336.0, 5190.0, 13430.0, 37627.0, 111258.0, 314854.0, 357309.0, 131611.0, 44888.0, 15658.0, 6080.0, 2627.0, 1189.0, 671.0, 345.0, 228.0, 137.0, 89.0, 69.0, 46.0, 32.0, 20.0, 17.0, 8.0, 8.0, 9.0, 4.0, 0.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.9765625, -6.7520751953125, -6.527587890625, -6.3031005859375, -6.07861328125, -5.8541259765625, -5.629638671875, -5.4051513671875, -5.1806640625, -4.9561767578125, -4.731689453125, -4.5072021484375, -4.28271484375, -4.0582275390625, -3.833740234375, -3.6092529296875, -3.384765625, -3.1602783203125, -2.935791015625, -2.7113037109375, -2.48681640625, -2.2623291015625, -2.037841796875, -1.8133544921875, -1.5888671875, -1.3643798828125, -1.139892578125, -0.9154052734375, -0.69091796875, -0.4664306640625, -0.241943359375, -0.0174560546875, 0.20703125, 0.4315185546875, 0.656005859375, 0.8804931640625, 1.10498046875, 1.3294677734375, 1.553955078125, 1.7784423828125, 2.0029296875, 2.2274169921875, 2.451904296875, 2.6763916015625, 2.90087890625, 3.1253662109375, 3.349853515625, 3.5743408203125, 3.798828125, 4.0233154296875, 4.247802734375, 4.4722900390625, 4.69677734375, 4.9212646484375, 5.145751953125, 5.3702392578125, 5.5947265625, 5.8192138671875, 6.043701171875, 6.2681884765625, 6.49267578125, 6.7171630859375, 6.941650390625, 7.1661376953125, 7.390625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 7.0, 10.0, 6.0, 10.0, 12.0, 14.0, 21.0, 21.0, 23.0, 42.0, 43.0, 47.0, 35.0, 43.0, 48.0, 47.0, 59.0, 57.0, 57.0, 53.0, 42.0, 58.0, 37.0, 29.0, 30.0, 32.0, 41.0, 21.0, 19.0, 11.0, 12.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.108856201171875, -2.00482177734375, -1.900787353515625, -1.7967529296875, -1.692718505859375, -1.58868408203125, -1.484649658203125, -1.380615234375, -1.276580810546875, -1.17254638671875, -1.068511962890625, -0.9644775390625, -0.860443115234375, -0.75640869140625, -0.652374267578125, -0.54833984375, -0.444305419921875, -0.34027099609375, -0.236236572265625, -0.1322021484375, -0.028167724609375, 0.07586669921875, 0.179901123046875, 0.283935546875, 0.387969970703125, 0.49200439453125, 0.596038818359375, 0.7000732421875, 0.804107666015625, 0.90814208984375, 1.012176513671875, 1.1162109375, 1.220245361328125, 1.32427978515625, 1.428314208984375, 1.5323486328125, 1.636383056640625, 1.74041748046875, 1.844451904296875, 1.948486328125, 2.052520751953125, 2.15655517578125, 2.260589599609375, 2.3646240234375, 2.468658447265625, 2.57269287109375, 2.676727294921875, 2.78076171875, 2.884796142578125, 2.98883056640625, 3.092864990234375, 3.1968994140625, 3.300933837890625, 3.40496826171875, 3.509002685546875, 3.613037109375, 3.717071533203125, 3.82110595703125, 3.925140380859375, 4.0291748046875, 4.133209228515625, 4.23724365234375, 4.341278076171875, 4.4453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 12.0, 8.0, 8.0, 13.0, 20.0, 38.0, 58.0, 54.0, 85.0, 110.0, 164.0, 293.0, 383.0, 543.0, 988.0, 1726.0, 3460.0, 11015.0, 66188.0, 671748.0, 249412.0, 29451.0, 6501.0, 2570.0, 1322.0, 829.0, 514.0, 323.0, 222.0, 165.0, 95.0, 46.0, 51.0, 44.0, 21.0, 16.0, 11.0, 9.0, 8.0, 9.0, 4.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-13.203125, -12.800537109375, -12.39794921875, -11.995361328125, -11.5927734375, -11.190185546875, -10.78759765625, -10.385009765625, -9.982421875, -9.579833984375, -9.17724609375, -8.774658203125, -8.3720703125, -7.969482421875, -7.56689453125, -7.164306640625, -6.76171875, -6.359130859375, -5.95654296875, -5.553955078125, -5.1513671875, -4.748779296875, -4.34619140625, -3.943603515625, -3.541015625, -3.138427734375, -2.73583984375, -2.333251953125, -1.9306640625, -1.528076171875, -1.12548828125, -0.722900390625, -0.3203125, 0.082275390625, 0.48486328125, 0.887451171875, 1.2900390625, 1.692626953125, 2.09521484375, 2.497802734375, 2.900390625, 3.302978515625, 3.70556640625, 4.108154296875, 4.5107421875, 4.913330078125, 5.31591796875, 5.718505859375, 6.12109375, 6.523681640625, 6.92626953125, 7.328857421875, 7.7314453125, 8.134033203125, 8.53662109375, 8.939208984375, 9.341796875, 9.744384765625, 10.14697265625, 10.549560546875, 10.9521484375, 11.354736328125, 11.75732421875, 12.159912109375, 12.5625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 7.0, 10.0, 18.0, 29.0, 34.0, 32.0, 43.0, 58.0, 60.0, 59.0, 60.0, 77.0, 82.0, 73.0, 68.0, 55.0, 47.0, 39.0, 37.0, 33.0, 29.0, 23.0, 14.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.21875, -15.65625, -15.09375, -14.53125, -13.96875, -13.40625, -12.84375, -12.28125, -11.71875, -11.15625, -10.59375, -10.03125, -9.46875, -8.90625, -8.34375, -7.78125, -7.21875, -6.65625, -6.09375, -5.53125, -4.96875, -4.40625, -3.84375, -3.28125, -2.71875, -2.15625, -1.59375, -1.03125, -0.46875, 0.09375, 0.65625, 1.21875, 1.78125, 2.34375, 2.90625, 3.46875, 4.03125, 4.59375, 5.15625, 5.71875, 6.28125, 6.84375, 7.40625, 7.96875, 8.53125, 9.09375, 9.65625, 10.21875, 10.78125, 11.34375, 11.90625, 12.46875, 13.03125, 13.59375, 14.15625, 14.71875, 15.28125, 15.84375, 16.40625, 16.96875, 17.53125, 18.09375, 18.65625, 19.21875, 19.78125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 7.0, 17.0, 28.0, 36.0, 33.0, 41.0, 93.0, 163.0, 257.0, 553.0, 1539.0, 7152.0, 111656.0, 885566.0, 35513.0, 3873.0, 1043.0, 419.0, 172.0, 145.0, 89.0, 40.0, 30.0, 21.0, 18.0, 11.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.1484375, -8.8966064453125, -8.644775390625, -8.3929443359375, -8.14111328125, -7.8892822265625, -7.637451171875, -7.3856201171875, -7.1337890625, -6.8819580078125, -6.630126953125, -6.3782958984375, -6.12646484375, -5.8746337890625, -5.622802734375, -5.3709716796875, -5.119140625, -4.8673095703125, -4.615478515625, -4.3636474609375, -4.11181640625, -3.8599853515625, -3.608154296875, -3.3563232421875, -3.1044921875, -2.8526611328125, -2.600830078125, -2.3489990234375, -2.09716796875, -1.8453369140625, -1.593505859375, -1.3416748046875, -1.08984375, -0.8380126953125, -0.586181640625, -0.3343505859375, -0.08251953125, 0.1693115234375, 0.421142578125, 0.6729736328125, 0.9248046875, 1.1766357421875, 1.428466796875, 1.6802978515625, 1.93212890625, 2.1839599609375, 2.435791015625, 2.6876220703125, 2.939453125, 3.1912841796875, 3.443115234375, 3.6949462890625, 3.94677734375, 4.1986083984375, 4.450439453125, 4.7022705078125, 4.9541015625, 5.2059326171875, 5.457763671875, 5.7095947265625, 5.96142578125, 6.2132568359375, 6.465087890625, 6.7169189453125, 6.96875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 14.0, 15.0, 22.0, 29.0, 26.0, 52.0, 69.0, 94.0, 182.0, 182.0, 91.0, 71.0, 39.0, 34.0, 23.0, 18.0, 10.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016040802001953125, -0.0015568435192108154, -0.0015096068382263184, -0.0014623701572418213, -0.0014151334762573242, -0.0013678967952728271, -0.00132066011428833, -0.001273423433303833, -0.001226186752319336, -0.0011789500713348389, -0.0011317133903503418, -0.0010844767093658447, -0.0010372400283813477, -0.0009900033473968506, -0.0009427666664123535, -0.0008955299854278564, -0.0008482933044433594, -0.0008010566234588623, -0.0007538199424743652, -0.0007065832614898682, -0.0006593465805053711, -0.000612109899520874, -0.000564873218536377, -0.0005176365375518799, -0.0004703998565673828, -0.00042316317558288574, -0.00037592649459838867, -0.0003286898136138916, -0.00028145313262939453, -0.00023421645164489746, -0.0001869797706604004, -0.00013974308967590332, -9.250640869140625e-05, -4.526972770690918e-05, 1.9669532775878906e-06, 4.920363426208496e-05, 9.644031524658203e-05, 0.0001436769962310791, 0.00019091367721557617, 0.00023815035820007324, 0.0002853870391845703, 0.0003326237201690674, 0.00037986040115356445, 0.0004270970821380615, 0.0004743337631225586, 0.0005215704441070557, 0.0005688071250915527, 0.0006160438060760498, 0.0006632804870605469, 0.0007105171680450439, 0.000757753849029541, 0.0008049905300140381, 0.0008522272109985352, 0.0008994638919830322, 0.0009467005729675293, 0.0009939372539520264, 0.0010411739349365234, 0.0010884106159210205, 0.0011356472969055176, 0.0011828839778900146, 0.0012301206588745117, 0.0012773573398590088, 0.0013245940208435059, 0.001371830701828003, 0.0014190673828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 8.0, 6.0, 6.0, 5.0, 8.0, 13.0, 23.0, 32.0, 62.0, 83.0, 134.0, 188.0, 382.0, 742.0, 1736.0, 4700.0, 20458.0, 824685.0, 178046.0, 11351.0, 3312.0, 1240.0, 585.0, 277.0, 154.0, 107.0, 61.0, 52.0, 14.0, 22.0, 14.0, 7.0, 7.0, 10.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1171875, -7.802978515625, -7.48876953125, -7.174560546875, -6.8603515625, -6.546142578125, -6.23193359375, -5.917724609375, -5.603515625, -5.289306640625, -4.97509765625, -4.660888671875, -4.3466796875, -4.032470703125, -3.71826171875, -3.404052734375, -3.08984375, -2.775634765625, -2.46142578125, -2.147216796875, -1.8330078125, -1.518798828125, -1.20458984375, -0.890380859375, -0.576171875, -0.261962890625, 0.05224609375, 0.366455078125, 0.6806640625, 0.994873046875, 1.30908203125, 1.623291015625, 1.9375, 2.251708984375, 2.56591796875, 2.880126953125, 3.1943359375, 3.508544921875, 3.82275390625, 4.136962890625, 4.451171875, 4.765380859375, 5.07958984375, 5.393798828125, 5.7080078125, 6.022216796875, 6.33642578125, 6.650634765625, 6.96484375, 7.279052734375, 7.59326171875, 7.907470703125, 8.2216796875, 8.535888671875, 8.85009765625, 9.164306640625, 9.478515625, 9.792724609375, 10.10693359375, 10.421142578125, 10.7353515625, 11.049560546875, 11.36376953125, 11.677978515625, 11.9921875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 13.0, 33.0, 60.0, 68.0, 141.0, 211.0, 194.0, 108.0, 66.0, 43.0, 19.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.07989501953125, -5.8121337890625, -5.54437255859375, -5.276611328125, -5.00885009765625, -4.7410888671875, -4.47332763671875, -4.20556640625, -3.93780517578125, -3.6700439453125, -3.40228271484375, -3.134521484375, -2.86676025390625, -2.5989990234375, -2.33123779296875, -2.0634765625, -1.79571533203125, -1.5279541015625, -1.26019287109375, -0.992431640625, -0.72467041015625, -0.4569091796875, -0.18914794921875, 0.07861328125, 0.34637451171875, 0.6141357421875, 0.88189697265625, 1.149658203125, 1.41741943359375, 1.6851806640625, 1.95294189453125, 2.220703125, 2.48846435546875, 2.7562255859375, 3.02398681640625, 3.291748046875, 3.55950927734375, 3.8272705078125, 4.09503173828125, 4.36279296875, 4.63055419921875, 4.8983154296875, 5.16607666015625, 5.433837890625, 5.70159912109375, 5.9693603515625, 6.23712158203125, 6.5048828125, 6.77264404296875, 7.0404052734375, 7.30816650390625, 7.575927734375, 7.84368896484375, 8.1114501953125, 8.37921142578125, 8.64697265625, 8.91473388671875, 9.1824951171875, 9.45025634765625, 9.718017578125, 9.98577880859375, 10.2535400390625, 10.52130126953125, 10.7890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 17.0, 60.0, 134.0, 219.0, 314.0, 136.0, 72.0, 16.0, 11.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.084014892578125, -58.00503158569336, -53.92605209350586, -49.847068786621094, -45.768089294433594, -41.68910598754883, -37.61012268066406, -33.53114318847656, -29.452159881591797, -25.373178482055664, -21.29419708251953, -17.215213775634766, -13.136232376098633, -9.0572509765625, -4.978267669677734, -0.8992862701416016, 3.1796951293945312, 7.258677005767822, 11.337658882141113, 15.416641235351562, 19.495622634887695, 23.574604034423828, 27.653587341308594, 31.732568740844727, 35.81155014038086, 39.890533447265625, 43.969512939453125, 48.04849624633789, 52.127479553222656, 56.206459045410156, 60.28544235229492, 64.36442565917969, 68.44340515136719, 72.52238464355469, 76.60137176513672, 80.68035125732422, 84.75933074951172, 88.83831787109375, 92.91729736328125, 96.99627685546875, 101.07525634765625, 105.15423583984375, 109.23322296142578, 113.31220245361328, 117.39118194580078, 121.47016906738281, 125.54914855957031, 129.6281280517578, 133.70712280273438, 137.78610229492188, 141.86508178710938, 145.94406127929688, 150.02305603027344, 154.10203552246094, 158.18101501464844, 162.25999450683594, 166.33897399902344, 170.41795349121094, 174.49693298339844, 178.575927734375, 182.6549072265625, 186.73388671875, 190.8128662109375, 194.891845703125, 198.9708251953125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 15.0, 10.0, 15.0, 20.0, 27.0, 17.0, 31.0, 31.0, 39.0, 53.0, 39.0, 45.0, 49.0, 73.0, 92.0, 72.0, 46.0, 51.0, 48.0, 35.0, 26.0, 22.0, 27.0, 21.0, 23.0, 16.0, 6.0, 9.0, 8.0, 11.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-64.31729125976562, -62.577415466308594, -60.83753967285156, -59.097660064697266, -57.357784271240234, -55.6179084777832, -53.878028869628906, -52.138153076171875, -50.398277282714844, -48.65840148925781, -46.91852569580078, -45.178646087646484, -43.43877029418945, -41.69889450073242, -39.959014892578125, -38.219139099121094, -36.47926330566406, -34.73938751220703, -32.99951171875, -31.259632110595703, -29.519756317138672, -27.77988052368164, -26.040002822875977, -24.300125122070312, -22.56024932861328, -20.82037353515625, -19.080495834350586, -17.340618133544922, -15.60074234008789, -13.860865592956543, -12.120988845825195, -10.381112098693848, -8.641231536865234, -6.901354789733887, -5.161478042602539, -3.4216012954711914, -1.6817245483398438, 0.058152198791503906, 1.7980289459228516, 3.537905693054199, 5.277782440185547, 7.0176591873168945, 8.757535934448242, 10.49741268157959, 12.237289428710938, 13.977166175842285, 15.717042922973633, 17.456920623779297, 19.196796417236328, 20.93667221069336, 22.676549911499023, 24.416427612304688, 26.15630340576172, 27.89617919921875, 29.636056900024414, 31.375934600830078, 33.11581039428711, 34.85568618774414, 36.59556579589844, 38.33544158935547, 40.0753173828125, 41.81519317626953, 43.55506896972656, 45.29494857788086, 47.03482437133789]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 23.0, 52.0, 189.0, 870.0, 8200.0, 2887857.0, 1290259.0, 5680.0, 767.0, 217.0, 88.0, 36.0, 15.0, 10.0, 7.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.2862548828125, -9.549072265625, -8.8118896484375, -8.07470703125, -7.3375244140625, -6.600341796875, -5.8631591796875, -5.1259765625, -4.3887939453125, -3.651611328125, -2.9144287109375, -2.17724609375, -1.4400634765625, -0.702880859375, 0.0343017578125, 0.771484375, 1.5086669921875, 2.245849609375, 2.9830322265625, 3.72021484375, 4.4573974609375, 5.194580078125, 5.9317626953125, 6.6689453125, 7.4061279296875, 8.143310546875, 8.8804931640625, 9.61767578125, 10.3548583984375, 11.092041015625, 11.8292236328125, 12.56640625, 13.3035888671875, 14.040771484375, 14.7779541015625, 15.51513671875, 16.2523193359375, 16.989501953125, 17.7266845703125, 18.4638671875, 19.2010498046875, 19.938232421875, 20.6754150390625, 21.41259765625, 22.1497802734375, 22.886962890625, 23.6241455078125, 24.361328125, 25.0985107421875, 25.835693359375, 26.5728759765625, 27.31005859375, 28.0472412109375, 28.784423828125, 29.5216064453125, 30.2587890625, 30.9959716796875, 31.733154296875, 32.4703369140625, 33.20751953125, 33.9447021484375, 34.681884765625, 35.4190673828125, 36.15625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 14.0, 15.0, 17.0, 24.0, 41.0, 43.0, 57.0, 70.0, 50.0, 65.0, 58.0, 67.0, 79.0, 70.0, 59.0, 57.0, 47.0, 44.0, 34.0, 34.0, 17.0, 11.0, 13.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.2586669921875, -4.118896484375, -3.9791259765625, -3.83935546875, -3.6995849609375, -3.559814453125, -3.4200439453125, -3.2802734375, -3.1405029296875, -3.000732421875, -2.8609619140625, -2.72119140625, -2.5814208984375, -2.441650390625, -2.3018798828125, -2.162109375, -2.0223388671875, -1.882568359375, -1.7427978515625, -1.60302734375, -1.4632568359375, -1.323486328125, -1.1837158203125, -1.0439453125, -0.9041748046875, -0.764404296875, -0.6246337890625, -0.48486328125, -0.3450927734375, -0.205322265625, -0.0655517578125, 0.07421875, 0.2139892578125, 0.353759765625, 0.4935302734375, 0.63330078125, 0.7730712890625, 0.912841796875, 1.0526123046875, 1.1923828125, 1.3321533203125, 1.471923828125, 1.6116943359375, 1.75146484375, 1.8912353515625, 2.031005859375, 2.1707763671875, 2.310546875, 2.4503173828125, 2.590087890625, 2.7298583984375, 2.86962890625, 3.0093994140625, 3.149169921875, 3.2889404296875, 3.4287109375, 3.5684814453125, 3.708251953125, 3.8480224609375, 3.98779296875, 4.1275634765625, 4.267333984375, 4.4071044921875, 4.546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 6.0, 19.0, 27.0, 48.0, 74.0, 106.0, 207.0, 363.0, 668.0, 1496.0, 4711.0, 27448.0, 449512.0, 3593924.0, 99971.0, 11490.0, 2556.0, 936.0, 363.0, 170.0, 58.0, 57.0, 26.0, 13.0, 6.0, 4.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.171875, -12.808837890625, -12.44580078125, -12.082763671875, -11.7197265625, -11.356689453125, -10.99365234375, -10.630615234375, -10.267578125, -9.904541015625, -9.54150390625, -9.178466796875, -8.8154296875, -8.452392578125, -8.08935546875, -7.726318359375, -7.36328125, -7.000244140625, -6.63720703125, -6.274169921875, -5.9111328125, -5.548095703125, -5.18505859375, -4.822021484375, -4.458984375, -4.095947265625, -3.73291015625, -3.369873046875, -3.0068359375, -2.643798828125, -2.28076171875, -1.917724609375, -1.5546875, -1.191650390625, -0.82861328125, -0.465576171875, -0.1025390625, 0.260498046875, 0.62353515625, 0.986572265625, 1.349609375, 1.712646484375, 2.07568359375, 2.438720703125, 2.8017578125, 3.164794921875, 3.52783203125, 3.890869140625, 4.25390625, 4.616943359375, 4.97998046875, 5.343017578125, 5.7060546875, 6.069091796875, 6.43212890625, 6.795166015625, 7.158203125, 7.521240234375, 7.88427734375, 8.247314453125, 8.6103515625, 8.973388671875, 9.33642578125, 9.699462890625, 10.0625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 14.0, 16.0, 15.0, 35.0, 48.0, 90.0, 142.0, 285.0, 668.0, 1264.0, 770.0, 364.0, 138.0, 93.0, 40.0, 25.0, 14.0, 16.0, 14.0, 12.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.3170166015625, -10.969970703125, -10.6229248046875, -10.27587890625, -9.9288330078125, -9.581787109375, -9.2347412109375, -8.8876953125, -8.5406494140625, -8.193603515625, -7.8465576171875, -7.49951171875, -7.1524658203125, -6.805419921875, -6.4583740234375, -6.111328125, -5.7642822265625, -5.417236328125, -5.0701904296875, -4.72314453125, -4.3760986328125, -4.029052734375, -3.6820068359375, -3.3349609375, -2.9879150390625, -2.640869140625, -2.2938232421875, -1.94677734375, -1.5997314453125, -1.252685546875, -0.9056396484375, -0.55859375, -0.2115478515625, 0.135498046875, 0.4825439453125, 0.82958984375, 1.1766357421875, 1.523681640625, 1.8707275390625, 2.2177734375, 2.5648193359375, 2.911865234375, 3.2589111328125, 3.60595703125, 3.9530029296875, 4.300048828125, 4.6470947265625, 4.994140625, 5.3411865234375, 5.688232421875, 6.0352783203125, 6.38232421875, 6.7293701171875, 7.076416015625, 7.4234619140625, 7.7705078125, 8.1175537109375, 8.464599609375, 8.8116455078125, 9.15869140625, 9.5057373046875, 9.852783203125, 10.1998291015625, 10.546875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 28.0, 46.0, 125.0, 226.0, 272.0, 169.0, 62.0, 27.0, 11.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.40232849121094, -106.89427947998047, -103.38623046875, -99.87818908691406, -96.3701400756836, -92.86209106445312, -89.35404205322266, -85.84599304199219, -82.33794403076172, -78.82989501953125, -75.32184600830078, -71.81379699707031, -68.30575561523438, -64.7977066040039, -61.28965759277344, -57.78160858154297, -54.273563385009766, -50.7655143737793, -47.257469177246094, -43.749420166015625, -40.241371154785156, -36.73332214355469, -33.225276947021484, -29.717227935791016, -26.20918083190918, -22.701133728027344, -19.193084716796875, -15.685037612915039, -12.176989555358887, -8.668941497802734, -5.160894393920898, -1.6528453826904297, 1.8552017211914062, 5.363249778747559, 8.871297836303711, 12.379344940185547, 15.8873929977417, 19.39544105529785, 22.903488159179688, 26.411537170410156, 29.919584274291992, 33.42763137817383, 36.9356803894043, 40.4437255859375, 43.95177459716797, 47.45982360839844, 50.967872619628906, 54.475921630859375, 57.98396682739258, 61.49201583862305, 65.00006103515625, 68.50811004638672, 72.01615905761719, 75.52420806884766, 79.03225708007812, 82.54029846191406, 86.04834747314453, 89.556396484375, 93.06444549560547, 96.57249450683594, 100.08053588867188, 103.58858489990234, 107.09663391113281, 110.60468292236328, 114.11273193359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 10.0, 5.0, 12.0, 16.0, 11.0, 22.0, 23.0, 29.0, 42.0, 50.0, 37.0, 49.0, 53.0, 48.0, 50.0, 64.0, 54.0, 39.0, 56.0, 42.0, 41.0, 40.0, 44.0, 30.0, 30.0, 23.0, 19.0, 16.0, 13.0, 10.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.35072708129883, -36.03185272216797, -34.712982177734375, -33.394107818603516, -32.075233459472656, -30.756362915039062, -29.437488555908203, -28.118616104125977, -26.79974365234375, -25.480871200561523, -24.161998748779297, -22.843124389648438, -21.52425193786621, -20.205379486083984, -18.886505126953125, -17.5676326751709, -16.248760223388672, -14.929887771606445, -13.611014366149902, -12.29214096069336, -10.973268508911133, -9.654396057128906, -8.335522651672363, -7.01664924621582, -5.697776794433594, -4.378903865814209, -3.060030937194824, -1.7411580085754395, -0.4222850799560547, 0.8965878486633301, 2.215460777282715, 3.534334182739258, 4.85321044921875, 6.172083377838135, 7.4909563064575195, 8.809829711914062, 10.128702163696289, 11.447574615478516, 12.766448020935059, 14.085321426391602, 15.404193878173828, 16.723066329956055, 18.04193878173828, 19.36081314086914, 20.679685592651367, 21.998558044433594, 23.317432403564453, 24.63630485534668, 25.955177307128906, 27.274049758911133, 28.59292221069336, 29.91179656982422, 31.230669021606445, 32.54954147338867, 33.86841583251953, 35.187286376953125, 36.506160736083984, 37.825035095214844, 39.14390563964844, 40.4627799987793, 41.781654357910156, 43.10052490234375, 44.41939926147461, 45.73827362060547, 47.05714416503906]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 2.0, 15.0, 15.0, 8.0, 18.0, 42.0, 55.0, 87.0, 153.0, 340.0, 680.0, 1544.0, 4604.0, 16641.0, 79175.0, 444593.0, 406171.0, 71845.0, 15331.0, 4303.0, 1533.0, 672.0, 306.0, 159.0, 81.0, 60.0, 28.0, 28.0, 15.0, 11.0, 6.0, 6.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3203125, -11.987060546875, -11.65380859375, -11.320556640625, -10.9873046875, -10.654052734375, -10.32080078125, -9.987548828125, -9.654296875, -9.321044921875, -8.98779296875, -8.654541015625, -8.3212890625, -7.988037109375, -7.65478515625, -7.321533203125, -6.98828125, -6.655029296875, -6.32177734375, -5.988525390625, -5.6552734375, -5.322021484375, -4.98876953125, -4.655517578125, -4.322265625, -3.989013671875, -3.65576171875, -3.322509765625, -2.9892578125, -2.656005859375, -2.32275390625, -1.989501953125, -1.65625, -1.322998046875, -0.98974609375, -0.656494140625, -0.3232421875, 0.010009765625, 0.34326171875, 0.676513671875, 1.009765625, 1.343017578125, 1.67626953125, 2.009521484375, 2.3427734375, 2.676025390625, 3.00927734375, 3.342529296875, 3.67578125, 4.009033203125, 4.34228515625, 4.675537109375, 5.0087890625, 5.342041015625, 5.67529296875, 6.008544921875, 6.341796875, 6.675048828125, 7.00830078125, 7.341552734375, 7.6748046875, 8.008056640625, 8.34130859375, 8.674560546875, 9.0078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 14.0, 12.0, 14.0, 21.0, 24.0, 37.0, 39.0, 44.0, 60.0, 53.0, 55.0, 55.0, 78.0, 60.0, 58.0, 53.0, 47.0, 41.0, 48.0, 40.0, 31.0, 20.0, 28.0, 17.0, 11.0, 12.0, 5.0, 13.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.765625, -3.64019775390625, -3.5147705078125, -3.38934326171875, -3.263916015625, -3.13848876953125, -3.0130615234375, -2.88763427734375, -2.76220703125, -2.63677978515625, -2.5113525390625, -2.38592529296875, -2.260498046875, -2.13507080078125, -2.0096435546875, -1.88421630859375, -1.7587890625, -1.63336181640625, -1.5079345703125, -1.38250732421875, -1.257080078125, -1.13165283203125, -1.0062255859375, -0.88079833984375, -0.75537109375, -0.62994384765625, -0.5045166015625, -0.37908935546875, -0.253662109375, -0.12823486328125, -0.0028076171875, 0.12261962890625, 0.248046875, 0.37347412109375, 0.4989013671875, 0.62432861328125, 0.749755859375, 0.87518310546875, 1.0006103515625, 1.12603759765625, 1.25146484375, 1.37689208984375, 1.5023193359375, 1.62774658203125, 1.753173828125, 1.87860107421875, 2.0040283203125, 2.12945556640625, 2.2548828125, 2.38031005859375, 2.5057373046875, 2.63116455078125, 2.756591796875, 2.88201904296875, 3.0074462890625, 3.13287353515625, 3.25830078125, 3.38372802734375, 3.5091552734375, 3.63458251953125, 3.760009765625, 3.88543701171875, 4.0108642578125, 4.13629150390625, 4.26171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 5.0, 4.0, 7.0, 3.0, 13.0, 14.0, 24.0, 37.0, 52.0, 73.0, 113.0, 159.0, 192.0, 362.0, 588.0, 1260.0, 2924.0, 10891.0, 82201.0, 815294.0, 114487.0, 13306.0, 3313.0, 1404.0, 714.0, 407.0, 227.0, 142.0, 92.0, 76.0, 51.0, 36.0, 18.0, 22.0, 7.0, 9.0, 5.0, 6.0, 7.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.28125, -15.74853515625, -15.2158203125, -14.68310546875, -14.150390625, -13.61767578125, -13.0849609375, -12.55224609375, -12.01953125, -11.48681640625, -10.9541015625, -10.42138671875, -9.888671875, -9.35595703125, -8.8232421875, -8.29052734375, -7.7578125, -7.22509765625, -6.6923828125, -6.15966796875, -5.626953125, -5.09423828125, -4.5615234375, -4.02880859375, -3.49609375, -2.96337890625, -2.4306640625, -1.89794921875, -1.365234375, -0.83251953125, -0.2998046875, 0.23291015625, 0.765625, 1.29833984375, 1.8310546875, 2.36376953125, 2.896484375, 3.42919921875, 3.9619140625, 4.49462890625, 5.02734375, 5.56005859375, 6.0927734375, 6.62548828125, 7.158203125, 7.69091796875, 8.2236328125, 8.75634765625, 9.2890625, 9.82177734375, 10.3544921875, 10.88720703125, 11.419921875, 11.95263671875, 12.4853515625, 13.01806640625, 13.55078125, 14.08349609375, 14.6162109375, 15.14892578125, 15.681640625, 16.21435546875, 16.7470703125, 17.27978515625, 17.8125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 3.0, 6.0, 3.0, 7.0, 11.0, 16.0, 23.0, 24.0, 22.0, 23.0, 34.0, 49.0, 48.0, 57.0, 62.0, 55.0, 57.0, 62.0, 51.0, 61.0, 44.0, 51.0, 33.0, 24.0, 36.0, 23.0, 29.0, 24.0, 13.0, 13.0, 7.0, 11.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.109375, -14.649169921875, -14.18896484375, -13.728759765625, -13.2685546875, -12.808349609375, -12.34814453125, -11.887939453125, -11.427734375, -10.967529296875, -10.50732421875, -10.047119140625, -9.5869140625, -9.126708984375, -8.66650390625, -8.206298828125, -7.74609375, -7.285888671875, -6.82568359375, -6.365478515625, -5.9052734375, -5.445068359375, -4.98486328125, -4.524658203125, -4.064453125, -3.604248046875, -3.14404296875, -2.683837890625, -2.2236328125, -1.763427734375, -1.30322265625, -0.843017578125, -0.3828125, 0.077392578125, 0.53759765625, 0.997802734375, 1.4580078125, 1.918212890625, 2.37841796875, 2.838623046875, 3.298828125, 3.759033203125, 4.21923828125, 4.679443359375, 5.1396484375, 5.599853515625, 6.06005859375, 6.520263671875, 6.98046875, 7.440673828125, 7.90087890625, 8.361083984375, 8.8212890625, 9.281494140625, 9.74169921875, 10.201904296875, 10.662109375, 11.122314453125, 11.58251953125, 12.042724609375, 12.5029296875, 12.963134765625, 13.42333984375, 13.883544921875, 14.34375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 8.0, 5.0, 9.0, 7.0, 9.0, 17.0, 14.0, 27.0, 33.0, 43.0, 94.0, 187.0, 432.0, 993.0, 3116.0, 16610.0, 410730.0, 593615.0, 17460.0, 3149.0, 1044.0, 425.0, 198.0, 117.0, 70.0, 39.0, 23.0, 21.0, 15.0, 13.0, 8.0, 15.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.078125, -8.81884765625, -8.5595703125, -8.30029296875, -8.041015625, -7.78173828125, -7.5224609375, -7.26318359375, -7.00390625, -6.74462890625, -6.4853515625, -6.22607421875, -5.966796875, -5.70751953125, -5.4482421875, -5.18896484375, -4.9296875, -4.67041015625, -4.4111328125, -4.15185546875, -3.892578125, -3.63330078125, -3.3740234375, -3.11474609375, -2.85546875, -2.59619140625, -2.3369140625, -2.07763671875, -1.818359375, -1.55908203125, -1.2998046875, -1.04052734375, -0.78125, -0.52197265625, -0.2626953125, -0.00341796875, 0.255859375, 0.51513671875, 0.7744140625, 1.03369140625, 1.29296875, 1.55224609375, 1.8115234375, 2.07080078125, 2.330078125, 2.58935546875, 2.8486328125, 3.10791015625, 3.3671875, 3.62646484375, 3.8857421875, 4.14501953125, 4.404296875, 4.66357421875, 4.9228515625, 5.18212890625, 5.44140625, 5.70068359375, 5.9599609375, 6.21923828125, 6.478515625, 6.73779296875, 6.9970703125, 7.25634765625, 7.515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 2.0, 12.0, 13.0, 21.0, 23.0, 35.0, 46.0, 121.0, 193.0, 201.0, 120.0, 65.0, 38.0, 29.0, 19.0, 20.0, 10.0, 9.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0016641616821289062, -0.001613810658454895, -0.0015634596347808838, -0.0015131086111068726, -0.0014627575874328613, -0.00141240656375885, -0.0013620555400848389, -0.0013117045164108276, -0.0012613534927368164, -0.0012110024690628052, -0.001160651445388794, -0.0011103004217147827, -0.0010599493980407715, -0.0010095983743667603, -0.000959247350692749, -0.0009088963270187378, -0.0008585453033447266, -0.0008081942796707153, -0.0007578432559967041, -0.0007074922323226929, -0.0006571412086486816, -0.0006067901849746704, -0.0005564391613006592, -0.000506088137626648, -0.0004557371139526367, -0.0004053860902786255, -0.00035503506660461426, -0.00030468404293060303, -0.0002543330192565918, -0.00020398199558258057, -0.00015363097190856934, -0.0001032799482345581, -5.2928924560546875e-05, -2.5779008865356445e-06, 4.7773122787475586e-05, 9.812414646148682e-05, 0.00014847517013549805, 0.00019882619380950928, 0.0002491772174835205, 0.00029952824115753174, 0.00034987926483154297, 0.0004002302885055542, 0.00045058131217956543, 0.0005009323358535767, 0.0005512833595275879, 0.0006016343832015991, 0.0006519854068756104, 0.0007023364305496216, 0.0007526874542236328, 0.000803038477897644, 0.0008533895015716553, 0.0009037405252456665, 0.0009540915489196777, 0.001004442572593689, 0.0010547935962677002, 0.0011051446199417114, 0.0011554956436157227, 0.0012058466672897339, 0.0012561976909637451, 0.0013065487146377563, 0.0013568997383117676, 0.0014072507619857788, 0.00145760178565979, 0.0015079528093338013, 0.0015583038330078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 13.0, 24.0, 48.0, 67.0, 122.0, 232.0, 482.0, 1336.0, 5245.0, 41049.0, 878732.0, 109286.0, 8614.0, 2033.0, 644.0, 281.0, 136.0, 73.0, 38.0, 29.0, 12.0, 14.0, 8.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5078125, -9.2484130859375, -8.989013671875, -8.7296142578125, -8.47021484375, -8.2108154296875, -7.951416015625, -7.6920166015625, -7.4326171875, -7.1732177734375, -6.913818359375, -6.6544189453125, -6.39501953125, -6.1356201171875, -5.876220703125, -5.6168212890625, -5.357421875, -5.0980224609375, -4.838623046875, -4.5792236328125, -4.31982421875, -4.0604248046875, -3.801025390625, -3.5416259765625, -3.2822265625, -3.0228271484375, -2.763427734375, -2.5040283203125, -2.24462890625, -1.9852294921875, -1.725830078125, -1.4664306640625, -1.20703125, -0.9476318359375, -0.688232421875, -0.4288330078125, -0.16943359375, 0.0899658203125, 0.349365234375, 0.6087646484375, 0.8681640625, 1.1275634765625, 1.386962890625, 1.6463623046875, 1.90576171875, 2.1651611328125, 2.424560546875, 2.6839599609375, 2.943359375, 3.2027587890625, 3.462158203125, 3.7215576171875, 3.98095703125, 4.2403564453125, 4.499755859375, 4.7591552734375, 5.0185546875, 5.2779541015625, 5.537353515625, 5.7967529296875, 6.05615234375, 6.3155517578125, 6.574951171875, 6.8343505859375, 7.09375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 4.0, 9.0, 21.0, 18.0, 21.0, 28.0, 54.0, 56.0, 74.0, 113.0, 107.0, 117.0, 94.0, 69.0, 45.0, 58.0, 29.0, 16.0, 19.0, 14.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.11328125, -4.96636962890625, -4.8194580078125, -4.67254638671875, -4.525634765625, -4.37872314453125, -4.2318115234375, -4.08489990234375, -3.93798828125, -3.79107666015625, -3.6441650390625, -3.49725341796875, -3.350341796875, -3.20343017578125, -3.0565185546875, -2.90960693359375, -2.7626953125, -2.61578369140625, -2.4688720703125, -2.32196044921875, -2.175048828125, -2.02813720703125, -1.8812255859375, -1.73431396484375, -1.58740234375, -1.44049072265625, -1.2935791015625, -1.14666748046875, -0.999755859375, -0.85284423828125, -0.7059326171875, -0.55902099609375, -0.412109375, -0.26519775390625, -0.1182861328125, 0.02862548828125, 0.175537109375, 0.32244873046875, 0.4693603515625, 0.61627197265625, 0.76318359375, 0.91009521484375, 1.0570068359375, 1.20391845703125, 1.350830078125, 1.49774169921875, 1.6446533203125, 1.79156494140625, 1.9384765625, 2.08538818359375, 2.2322998046875, 2.37921142578125, 2.526123046875, 2.67303466796875, 2.8199462890625, 2.96685791015625, 3.11376953125, 3.26068115234375, 3.4075927734375, 3.55450439453125, 3.701416015625, 3.84832763671875, 3.9952392578125, 4.14215087890625, 4.2890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 15.0, 74.0, 343.0, 406.0, 108.0, 29.0, 15.0, 6.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-323.5304260253906, -316.3431091308594, -309.1557922363281, -301.96844482421875, -294.7811279296875, -287.59381103515625, -280.406494140625, -273.21917724609375, -266.0318603515625, -258.84454345703125, -251.65721130371094, -244.4698944091797, -237.28257751464844, -230.09524536132812, -222.90792846679688, -215.72061157226562, -208.5332794189453, -201.34596252441406, -194.15863037109375, -186.9713134765625, -179.78399658203125, -172.5966796875, -165.4093475341797, -158.22203063964844, -151.03469848632812, -143.84738159179688, -136.66004943847656, -129.4727325439453, -122.28541564941406, -115.09809112548828, -107.9107666015625, -100.72344970703125, -93.5361328125, -86.34880828857422, -79.16149139404297, -71.97416687011719, -64.78684997558594, -57.599525451660156, -50.412200927734375, -43.22488021850586, -36.037559509277344, -28.850238800048828, -21.66291618347168, -14.475593566894531, -7.288272857666016, -0.1009521484375, 7.086372375488281, 14.273693084716797, 21.461013793945312, 28.648334503173828, 35.835655212402344, 43.022979736328125, 50.21030044555664, 57.397621154785156, 64.58494567871094, 71.77226257324219, 78.95958709716797, 86.14691162109375, 93.334228515625, 100.52155303955078, 107.70887756347656, 114.89619445800781, 122.0835189819336, 129.27084350585938, 136.45816040039062]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 8.0, 14.0, 17.0, 14.0, 15.0, 15.0, 18.0, 27.0, 19.0, 28.0, 27.0, 27.0, 32.0, 36.0, 48.0, 81.0, 64.0, 69.0, 57.0, 46.0, 35.0, 31.0, 34.0, 33.0, 24.0, 34.0, 22.0, 11.0, 13.0, 12.0, 12.0, 13.0, 6.0, 5.0, 5.0, 7.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.30530548095703, -46.700382232666016, -45.095458984375, -43.49053955078125, -41.885616302490234, -40.28069305419922, -38.67577362060547, -37.07085037231445, -35.46592712402344, -33.86100387573242, -32.256080627441406, -30.651161193847656, -29.04623794555664, -27.441314697265625, -25.836393356323242, -24.23147201538086, -22.626548767089844, -21.021625518798828, -19.416704177856445, -17.811782836914062, -16.206859588623047, -14.601937294006348, -12.997014999389648, -11.39209270477295, -9.78717041015625, -8.18224811553955, -6.577325820922852, -4.972403526306152, -3.367481231689453, -1.762558937072754, -0.1576366424560547, 1.4472856521606445, 3.0522117614746094, 4.657134056091309, 6.262056350708008, 7.866978645324707, 9.471900939941406, 11.076823234558105, 12.681745529174805, 14.286667823791504, 15.891590118408203, 17.49651336669922, 19.1014347076416, 20.706356048583984, 22.311279296875, 23.916202545166016, 25.5211238861084, 27.12604522705078, 28.730968475341797, 30.335891723632812, 31.940813064575195, 33.54573440551758, 35.150657653808594, 36.75558090209961, 38.360504150390625, 39.965423583984375, 41.57034683227539, 43.175270080566406, 44.780189514160156, 46.38511276245117, 47.99003601074219, 49.5949592590332, 51.19988250732422, 52.80480194091797, 54.409725189208984]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 10.0, 21.0, 37.0, 53.0, 123.0, 277.0, 772.0, 3135.0, 24846.0, 3133235.0, 1014186.0, 14167.0, 2297.0, 630.0, 242.0, 123.0, 53.0, 34.0, 18.0, 10.0, 6.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.0396728515625, -5.571533203125, -5.1033935546875, -4.63525390625, -4.1671142578125, -3.698974609375, -3.2308349609375, -2.7626953125, -2.2945556640625, -1.826416015625, -1.3582763671875, -0.89013671875, -0.4219970703125, 0.046142578125, 0.5142822265625, 0.982421875, 1.4505615234375, 1.918701171875, 2.3868408203125, 2.85498046875, 3.3231201171875, 3.791259765625, 4.2593994140625, 4.7275390625, 5.1956787109375, 5.663818359375, 6.1319580078125, 6.60009765625, 7.0682373046875, 7.536376953125, 8.0045166015625, 8.47265625, 8.9407958984375, 9.408935546875, 9.8770751953125, 10.34521484375, 10.8133544921875, 11.281494140625, 11.7496337890625, 12.2177734375, 12.6859130859375, 13.154052734375, 13.6221923828125, 14.09033203125, 14.5584716796875, 15.026611328125, 15.4947509765625, 15.962890625, 16.4310302734375, 16.899169921875, 17.3673095703125, 17.83544921875, 18.3035888671875, 18.771728515625, 19.2398681640625, 19.7080078125, 20.1761474609375, 20.644287109375, 21.1124267578125, 21.58056640625, 22.0487060546875, 22.516845703125, 22.9849853515625, 23.453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 13.0, 9.0, 7.0, 12.0, 20.0, 20.0, 22.0, 30.0, 34.0, 52.0, 54.0, 52.0, 44.0, 61.0, 69.0, 57.0, 61.0, 53.0, 53.0, 50.0, 45.0, 35.0, 31.0, 20.0, 23.0, 17.0, 17.0, 15.0, 4.0, 8.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.12109375, -3.00640869140625, -2.8917236328125, -2.77703857421875, -2.662353515625, -2.54766845703125, -2.4329833984375, -2.31829833984375, -2.20361328125, -2.08892822265625, -1.9742431640625, -1.85955810546875, -1.744873046875, -1.63018798828125, -1.5155029296875, -1.40081787109375, -1.2861328125, -1.17144775390625, -1.0567626953125, -0.94207763671875, -0.827392578125, -0.71270751953125, -0.5980224609375, -0.48333740234375, -0.36865234375, -0.25396728515625, -0.1392822265625, -0.02459716796875, 0.090087890625, 0.20477294921875, 0.3194580078125, 0.43414306640625, 0.548828125, 0.66351318359375, 0.7781982421875, 0.89288330078125, 1.007568359375, 1.12225341796875, 1.2369384765625, 1.35162353515625, 1.46630859375, 1.58099365234375, 1.6956787109375, 1.81036376953125, 1.925048828125, 2.03973388671875, 2.1544189453125, 2.26910400390625, 2.3837890625, 2.49847412109375, 2.6131591796875, 2.72784423828125, 2.842529296875, 2.95721435546875, 3.0718994140625, 3.18658447265625, 3.30126953125, 3.41595458984375, 3.5306396484375, 3.64532470703125, 3.760009765625, 3.87469482421875, 3.9893798828125, 4.10406494140625, 4.21875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 11.0, 14.0, 27.0, 42.0, 78.0, 115.0, 242.0, 510.0, 1249.0, 3490.0, 14091.0, 142859.0, 3855230.0, 156047.0, 14432.0, 3482.0, 1258.0, 526.0, 264.0, 128.0, 72.0, 44.0, 20.0, 15.0, 8.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.390625, -12.009521484375, -11.62841796875, -11.247314453125, -10.8662109375, -10.485107421875, -10.10400390625, -9.722900390625, -9.341796875, -8.960693359375, -8.57958984375, -8.198486328125, -7.8173828125, -7.436279296875, -7.05517578125, -6.674072265625, -6.29296875, -5.911865234375, -5.53076171875, -5.149658203125, -4.7685546875, -4.387451171875, -4.00634765625, -3.625244140625, -3.244140625, -2.863037109375, -2.48193359375, -2.100830078125, -1.7197265625, -1.338623046875, -0.95751953125, -0.576416015625, -0.1953125, 0.185791015625, 0.56689453125, 0.947998046875, 1.3291015625, 1.710205078125, 2.09130859375, 2.472412109375, 2.853515625, 3.234619140625, 3.61572265625, 3.996826171875, 4.3779296875, 4.759033203125, 5.14013671875, 5.521240234375, 5.90234375, 6.283447265625, 6.66455078125, 7.045654296875, 7.4267578125, 7.807861328125, 8.18896484375, 8.570068359375, 8.951171875, 9.332275390625, 9.71337890625, 10.094482421875, 10.4755859375, 10.856689453125, 11.23779296875, 11.618896484375, 12.0]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 14.0, 10.0, 14.0, 28.0, 54.0, 86.0, 177.0, 425.0, 988.0, 1114.0, 620.0, 236.0, 115.0, 69.0, 32.0, 27.0, 23.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.7890625, -11.4638671875, -11.138671875, -10.8134765625, -10.48828125, -10.1630859375, -9.837890625, -9.5126953125, -9.1875, -8.8623046875, -8.537109375, -8.2119140625, -7.88671875, -7.5615234375, -7.236328125, -6.9111328125, -6.5859375, -6.2607421875, -5.935546875, -5.6103515625, -5.28515625, -4.9599609375, -4.634765625, -4.3095703125, -3.984375, -3.6591796875, -3.333984375, -3.0087890625, -2.68359375, -2.3583984375, -2.033203125, -1.7080078125, -1.3828125, -1.0576171875, -0.732421875, -0.4072265625, -0.08203125, 0.2431640625, 0.568359375, 0.8935546875, 1.21875, 1.5439453125, 1.869140625, 2.1943359375, 2.51953125, 2.8447265625, 3.169921875, 3.4951171875, 3.8203125, 4.1455078125, 4.470703125, 4.7958984375, 5.12109375, 5.4462890625, 5.771484375, 6.0966796875, 6.421875, 6.7470703125, 7.072265625, 7.3974609375, 7.72265625, 8.0478515625, 8.373046875, 8.6982421875, 9.0234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 3.0, 8.0, 11.0, 26.0, 104.0, 262.0, 328.0, 161.0, 58.0, 15.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.7662353515625, -137.62794494628906, -133.4896697998047, -129.35137939453125, -125.21310424804688, -121.07481384277344, -116.93653106689453, -112.79824829101562, -108.65996551513672, -104.52168273925781, -100.3833999633789, -96.2451171875, -92.10682678222656, -87.96855163574219, -83.83026123046875, -79.69197845458984, -75.55369567871094, -71.41541290283203, -67.27713012695312, -63.13884353637695, -59.00056076049805, -54.86227798461914, -50.72399139404297, -46.58570861816406, -42.447425842285156, -38.30914306640625, -34.170860290527344, -30.032573699951172, -25.894290924072266, -21.75600814819336, -17.61772346496582, -13.479438781738281, -9.341140747070312, -5.20285701751709, -1.0645732879638672, 3.0737104415893555, 7.211994171142578, 11.350276947021484, 15.488561630249023, 19.626846313476562, 23.76512908935547, 27.903411865234375, 32.04169464111328, 36.17998123168945, 40.31826400756836, 44.456546783447266, 48.59483337402344, 52.733116149902344, 56.87139892578125, 61.009681701660156, 65.14796447753906, 69.28624725341797, 73.42453002929688, 77.56282043457031, 81.70110321044922, 85.83938598632812, 89.97766876220703, 94.11595153808594, 98.25423431396484, 102.39251708984375, 106.53080749511719, 110.66908264160156, 114.807373046875, 118.9456558227539, 123.08393859863281]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 7.0, 15.0, 11.0, 15.0, 21.0, 23.0, 25.0, 24.0, 29.0, 34.0, 33.0, 42.0, 43.0, 37.0, 30.0, 42.0, 39.0, 39.0, 38.0, 49.0, 45.0, 49.0, 37.0, 39.0, 30.0, 20.0, 24.0, 21.0, 27.0, 24.0, 13.0, 16.0, 7.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.62697982788086, -24.703126907348633, -23.779273986816406, -22.85542106628418, -21.931568145751953, -21.007715225219727, -20.0838623046875, -19.160011291503906, -18.236156463623047, -17.31230354309082, -16.388450622558594, -15.464597702026367, -14.54074478149414, -13.616891860961914, -12.693039894104004, -11.769186973571777, -10.845335006713867, -9.92148208618164, -8.997629165649414, -8.073776245117188, -7.149923801422119, -6.226070880889893, -5.302218437194824, -4.378365516662598, -3.454512596130371, -2.5306596755981445, -1.606806993484497, -0.6829543113708496, 0.24089860916137695, 1.1647515296936035, 2.088603973388672, 3.0124568939208984, 3.936309814453125, 4.860162734985352, 5.784015655517578, 6.7078680992126465, 7.631721019744873, 8.555574417114258, 9.479426383972168, 10.403279304504395, 11.327132225036621, 12.250985145568848, 13.174838066101074, 14.098690032958984, 15.022542953491211, 15.946395874023438, 16.870248794555664, 17.79410171508789, 18.717954635620117, 19.641807556152344, 20.56566047668457, 21.489513397216797, 22.413366317749023, 23.33721923828125, 24.261070251464844, 25.184925079345703, 26.108776092529297, 27.032629013061523, 27.95648193359375, 28.880334854125977, 29.804187774658203, 30.72804069519043, 31.651893615722656, 32.57574462890625, 33.49959945678711]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 10.0, 6.0, 18.0, 24.0, 23.0, 36.0, 52.0, 86.0, 205.0, 327.0, 635.0, 1355.0, 3030.0, 7828.0, 23302.0, 87131.0, 355564.0, 415453.0, 109571.0, 28352.0, 8962.0, 3447.0, 1494.0, 742.0, 355.0, 192.0, 124.0, 56.0, 53.0, 32.0, 25.0, 11.0, 9.0, 12.0, 5.0, 8.0, 7.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.98614501953125, -6.7613525390625, -6.53656005859375, -6.311767578125, -6.08697509765625, -5.8621826171875, -5.63739013671875, -5.41259765625, -5.18780517578125, -4.9630126953125, -4.73822021484375, -4.513427734375, -4.28863525390625, -4.0638427734375, -3.83905029296875, -3.6142578125, -3.38946533203125, -3.1646728515625, -2.93988037109375, -2.715087890625, -2.49029541015625, -2.2655029296875, -2.04071044921875, -1.81591796875, -1.59112548828125, -1.3663330078125, -1.14154052734375, -0.916748046875, -0.69195556640625, -0.4671630859375, -0.24237060546875, -0.017578125, 0.20721435546875, 0.4320068359375, 0.65679931640625, 0.881591796875, 1.10638427734375, 1.3311767578125, 1.55596923828125, 1.78076171875, 2.00555419921875, 2.2303466796875, 2.45513916015625, 2.679931640625, 2.90472412109375, 3.1295166015625, 3.35430908203125, 3.5791015625, 3.80389404296875, 4.0286865234375, 4.25347900390625, 4.478271484375, 4.70306396484375, 4.9278564453125, 5.15264892578125, 5.37744140625, 5.60223388671875, 5.8270263671875, 6.05181884765625, 6.276611328125, 6.50140380859375, 6.7261962890625, 6.95098876953125, 7.17578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 6.0, 10.0, 5.0, 18.0, 20.0, 21.0, 20.0, 28.0, 36.0, 36.0, 42.0, 41.0, 47.0, 58.0, 47.0, 51.0, 63.0, 56.0, 53.0, 50.0, 39.0, 41.0, 32.0, 29.0, 29.0, 22.0, 19.0, 19.0, 12.0, 11.0, 6.0, 9.0, 7.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.61328125, -2.50567626953125, -2.3980712890625, -2.29046630859375, -2.182861328125, -2.07525634765625, -1.9676513671875, -1.86004638671875, -1.75244140625, -1.64483642578125, -1.5372314453125, -1.42962646484375, -1.322021484375, -1.21441650390625, -1.1068115234375, -0.99920654296875, -0.8916015625, -0.78399658203125, -0.6763916015625, -0.56878662109375, -0.461181640625, -0.35357666015625, -0.2459716796875, -0.13836669921875, -0.03076171875, 0.07684326171875, 0.1844482421875, 0.29205322265625, 0.399658203125, 0.50726318359375, 0.6148681640625, 0.72247314453125, 0.830078125, 0.93768310546875, 1.0452880859375, 1.15289306640625, 1.260498046875, 1.36810302734375, 1.4757080078125, 1.58331298828125, 1.69091796875, 1.79852294921875, 1.9061279296875, 2.01373291015625, 2.121337890625, 2.22894287109375, 2.3365478515625, 2.44415283203125, 2.5517578125, 2.65936279296875, 2.7669677734375, 2.87457275390625, 2.982177734375, 3.08978271484375, 3.1973876953125, 3.30499267578125, 3.41259765625, 3.52020263671875, 3.6278076171875, 3.73541259765625, 3.843017578125, 3.95062255859375, 4.0582275390625, 4.16583251953125, 4.2734375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 11.0, 14.0, 22.0, 32.0, 42.0, 75.0, 116.0, 158.0, 262.0, 548.0, 1230.0, 3208.0, 9535.0, 37639.0, 211320.0, 648317.0, 104590.0, 21177.0, 5986.0, 2263.0, 885.0, 438.0, 232.0, 146.0, 107.0, 49.0, 38.0, 29.0, 22.0, 15.0, 9.0, 9.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.155029296875, -8.88818359375, -8.621337890625, -8.3544921875, -8.087646484375, -7.82080078125, -7.553955078125, -7.287109375, -7.020263671875, -6.75341796875, -6.486572265625, -6.2197265625, -5.952880859375, -5.68603515625, -5.419189453125, -5.15234375, -4.885498046875, -4.61865234375, -4.351806640625, -4.0849609375, -3.818115234375, -3.55126953125, -3.284423828125, -3.017578125, -2.750732421875, -2.48388671875, -2.217041015625, -1.9501953125, -1.683349609375, -1.41650390625, -1.149658203125, -0.8828125, -0.615966796875, -0.34912109375, -0.082275390625, 0.1845703125, 0.451416015625, 0.71826171875, 0.985107421875, 1.251953125, 1.518798828125, 1.78564453125, 2.052490234375, 2.3193359375, 2.586181640625, 2.85302734375, 3.119873046875, 3.38671875, 3.653564453125, 3.92041015625, 4.187255859375, 4.4541015625, 4.720947265625, 4.98779296875, 5.254638671875, 5.521484375, 5.788330078125, 6.05517578125, 6.322021484375, 6.5888671875, 6.855712890625, 7.12255859375, 7.389404296875, 7.65625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 7.0, 13.0, 16.0, 8.0, 12.0, 18.0, 27.0, 27.0, 27.0, 23.0, 42.0, 50.0, 43.0, 38.0, 41.0, 52.0, 50.0, 49.0, 46.0, 51.0, 38.0, 52.0, 32.0, 36.0, 33.0, 34.0, 18.0, 24.0, 17.0, 12.0, 10.0, 11.0, 9.0, 4.0, 1.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7890625, -10.450927734375, -10.11279296875, -9.774658203125, -9.4365234375, -9.098388671875, -8.76025390625, -8.422119140625, -8.083984375, -7.745849609375, -7.40771484375, -7.069580078125, -6.7314453125, -6.393310546875, -6.05517578125, -5.717041015625, -5.37890625, -5.040771484375, -4.70263671875, -4.364501953125, -4.0263671875, -3.688232421875, -3.35009765625, -3.011962890625, -2.673828125, -2.335693359375, -1.99755859375, -1.659423828125, -1.3212890625, -0.983154296875, -0.64501953125, -0.306884765625, 0.03125, 0.369384765625, 0.70751953125, 1.045654296875, 1.3837890625, 1.721923828125, 2.06005859375, 2.398193359375, 2.736328125, 3.074462890625, 3.41259765625, 3.750732421875, 4.0888671875, 4.427001953125, 4.76513671875, 5.103271484375, 5.44140625, 5.779541015625, 6.11767578125, 6.455810546875, 6.7939453125, 7.132080078125, 7.47021484375, 7.808349609375, 8.146484375, 8.484619140625, 8.82275390625, 9.160888671875, 9.4990234375, 9.837158203125, 10.17529296875, 10.513427734375, 10.8515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 6.0, 14.0, 15.0, 27.0, 41.0, 70.0, 128.0, 149.0, 282.0, 497.0, 865.0, 1564.0, 3046.0, 6607.0, 16171.0, 47322.0, 218808.0, 617308.0, 90689.0, 25948.0, 9882.0, 4326.0, 2113.0, 1091.0, 637.0, 356.0, 202.0, 134.0, 78.0, 62.0, 36.0, 18.0, 17.0, 18.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.115234375, -3.026824951171875, -2.93841552734375, -2.850006103515625, -2.7615966796875, -2.673187255859375, -2.58477783203125, -2.496368408203125, -2.407958984375, -2.319549560546875, -2.23114013671875, -2.142730712890625, -2.0543212890625, -1.965911865234375, -1.87750244140625, -1.789093017578125, -1.70068359375, -1.612274169921875, -1.52386474609375, -1.435455322265625, -1.3470458984375, -1.258636474609375, -1.17022705078125, -1.081817626953125, -0.993408203125, -0.904998779296875, -0.81658935546875, -0.728179931640625, -0.6397705078125, -0.551361083984375, -0.46295166015625, -0.374542236328125, -0.2861328125, -0.197723388671875, -0.10931396484375, -0.020904541015625, 0.0675048828125, 0.155914306640625, 0.24432373046875, 0.332733154296875, 0.421142578125, 0.509552001953125, 0.59796142578125, 0.686370849609375, 0.7747802734375, 0.863189697265625, 0.95159912109375, 1.040008544921875, 1.12841796875, 1.216827392578125, 1.30523681640625, 1.393646240234375, 1.4820556640625, 1.570465087890625, 1.65887451171875, 1.747283935546875, 1.835693359375, 1.924102783203125, 2.01251220703125, 2.100921630859375, 2.1893310546875, 2.277740478515625, 2.36614990234375, 2.454559326171875, 2.54296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 7.0, 10.0, 18.0, 31.0, 61.0, 193.0, 313.0, 195.0, 67.0, 42.0, 22.0, 13.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00220489501953125, -0.0021348893642425537, -0.0020648837089538574, -0.001994878053665161, -0.0019248723983764648, -0.0018548667430877686, -0.0017848610877990723, -0.001714855432510376, -0.0016448497772216797, -0.0015748441219329834, -0.0015048384666442871, -0.0014348328113555908, -0.0013648271560668945, -0.0012948215007781982, -0.001224815845489502, -0.0011548101902008057, -0.0010848045349121094, -0.001014798879623413, -0.0009447932243347168, -0.0008747875690460205, -0.0008047819137573242, -0.0007347762584686279, -0.0006647706031799316, -0.0005947649478912354, -0.0005247592926025391, -0.0004547536373138428, -0.0003847479820251465, -0.0003147423267364502, -0.0002447366714477539, -0.00017473101615905762, -0.00010472536087036133, -3.471970558166504e-05, 3.528594970703125e-05, 0.00010529160499572754, 0.00017529726028442383, 0.0002453029155731201, 0.0003153085708618164, 0.0003853142261505127, 0.000455319881439209, 0.0005253255367279053, 0.0005953311920166016, 0.0006653368473052979, 0.0007353425025939941, 0.0008053481578826904, 0.0008753538131713867, 0.000945359468460083, 0.0010153651237487793, 0.0010853707790374756, 0.0011553764343261719, 0.0012253820896148682, 0.0012953877449035645, 0.0013653934001922607, 0.001435399055480957, 0.0015054047107696533, 0.0015754103660583496, 0.001645416021347046, 0.0017154216766357422, 0.0017854273319244385, 0.0018554329872131348, 0.001925438642501831, 0.0019954442977905273, 0.0020654499530792236, 0.00213545560836792, 0.002205461263656616, 0.0022754669189453125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 7.0, 3.0, 10.0, 10.0, 21.0, 21.0, 53.0, 48.0, 84.0, 135.0, 204.0, 337.0, 697.0, 1379.0, 2867.0, 6722.0, 18234.0, 61485.0, 287783.0, 548401.0, 82398.0, 22670.0, 8118.0, 3340.0, 1580.0, 809.0, 441.0, 235.0, 172.0, 87.0, 65.0, 50.0, 27.0, 12.0, 13.0, 12.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.103515625, -3.015106201171875, -2.92669677734375, -2.838287353515625, -2.7498779296875, -2.661468505859375, -2.57305908203125, -2.484649658203125, -2.396240234375, -2.307830810546875, -2.21942138671875, -2.131011962890625, -2.0426025390625, -1.954193115234375, -1.86578369140625, -1.777374267578125, -1.68896484375, -1.600555419921875, -1.51214599609375, -1.423736572265625, -1.3353271484375, -1.246917724609375, -1.15850830078125, -1.070098876953125, -0.981689453125, -0.893280029296875, -0.80487060546875, -0.716461181640625, -0.6280517578125, -0.539642333984375, -0.45123291015625, -0.362823486328125, -0.2744140625, -0.186004638671875, -0.09759521484375, -0.009185791015625, 0.0792236328125, 0.167633056640625, 0.25604248046875, 0.344451904296875, 0.432861328125, 0.521270751953125, 0.60968017578125, 0.698089599609375, 0.7864990234375, 0.874908447265625, 0.96331787109375, 1.051727294921875, 1.14013671875, 1.228546142578125, 1.31695556640625, 1.405364990234375, 1.4937744140625, 1.582183837890625, 1.67059326171875, 1.759002685546875, 1.847412109375, 1.935821533203125, 2.02423095703125, 2.112640380859375, 2.2010498046875, 2.289459228515625, 2.37786865234375, 2.466278076171875, 2.5546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 12.0, 7.0, 11.0, 9.0, 11.0, 22.0, 25.0, 20.0, 49.0, 56.0, 62.0, 79.0, 86.0, 81.0, 87.0, 84.0, 62.0, 45.0, 45.0, 37.0, 33.0, 7.0, 13.0, 10.0, 10.0, 5.0, 5.0, 5.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0703125, -1.985076904296875, -1.89984130859375, -1.814605712890625, -1.7293701171875, -1.644134521484375, -1.55889892578125, -1.473663330078125, -1.388427734375, -1.303192138671875, -1.21795654296875, -1.132720947265625, -1.0474853515625, -0.962249755859375, -0.87701416015625, -0.791778564453125, -0.70654296875, -0.621307373046875, -0.53607177734375, -0.450836181640625, -0.3656005859375, -0.280364990234375, -0.19512939453125, -0.109893798828125, -0.024658203125, 0.060577392578125, 0.14581298828125, 0.231048583984375, 0.3162841796875, 0.401519775390625, 0.48675537109375, 0.571990966796875, 0.6572265625, 0.742462158203125, 0.82769775390625, 0.912933349609375, 0.9981689453125, 1.083404541015625, 1.16864013671875, 1.253875732421875, 1.339111328125, 1.424346923828125, 1.50958251953125, 1.594818115234375, 1.6800537109375, 1.765289306640625, 1.85052490234375, 1.935760498046875, 2.02099609375, 2.106231689453125, 2.19146728515625, 2.276702880859375, 2.3619384765625, 2.447174072265625, 2.53240966796875, 2.617645263671875, 2.702880859375, 2.788116455078125, 2.87335205078125, 2.958587646484375, 3.0438232421875, 3.129058837890625, 3.21429443359375, 3.299530029296875, 3.384765625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 13.0, 22.0, 57.0, 113.0, 260.0, 259.0, 130.0, 61.0, 35.0, 17.0, 9.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.84793090820312, -86.06954193115234, -83.29115295410156, -80.51276397705078, -77.734375, -74.95597839355469, -72.17759704589844, -69.39920043945312, -66.62081146240234, -63.84242248535156, -61.06403350830078, -58.28564453125, -55.50725173950195, -52.72886276245117, -49.95047378540039, -47.172080993652344, -44.39369583129883, -41.61530685424805, -38.836917877197266, -36.05852508544922, -33.28013610839844, -30.501747131347656, -27.723358154296875, -24.94496726989746, -22.16657829284668, -19.3881893157959, -16.609798431396484, -13.831409454345703, -11.053019523620605, -8.274629592895508, -5.496240615844727, -2.7178497314453125, 0.06053924560546875, 2.8389289379119873, 5.617318630218506, 8.395708084106445, 11.174098014831543, 13.95248794555664, 16.730876922607422, 19.509267807006836, 22.287656784057617, 25.0660457611084, 27.844436645507812, 30.622825622558594, 33.401214599609375, 36.179603576660156, 38.95799255371094, 41.736385345458984, 44.514774322509766, 47.29316329956055, 50.07155227661133, 52.849945068359375, 55.628334045410156, 58.40672302246094, 61.18511199951172, 63.9635009765625, 66.74188995361328, 69.52027893066406, 72.29866790771484, 75.07705688476562, 77.8554458618164, 80.63383483886719, 83.4122314453125, 86.19062042236328, 88.96900939941406]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 4.0, 7.0, 10.0, 12.0, 16.0, 11.0, 28.0, 27.0, 29.0, 35.0, 33.0, 34.0, 44.0, 45.0, 67.0, 92.0, 87.0, 76.0, 59.0, 41.0, 36.0, 33.0, 31.0, 28.0, 21.0, 11.0, 12.0, 6.0, 14.0, 5.0, 13.0, 11.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.489017486572266, -44.936607360839844, -43.38419723510742, -41.831787109375, -40.279380798339844, -38.72697067260742, -37.174560546875, -35.62215042114258, -34.069740295410156, -32.517330169677734, -30.964920043945312, -29.412511825561523, -27.8601016998291, -26.30769157409668, -24.75528335571289, -23.20287322998047, -21.650463104248047, -20.098052978515625, -18.545642852783203, -16.993234634399414, -15.440824508666992, -13.88841438293457, -12.336005210876465, -10.78359603881836, -9.231185913085938, -7.678776264190674, -6.12636661529541, -4.5739569664001465, -3.021547317504883, -1.4691376686096191, 0.08327198028564453, 1.63568115234375, 3.1880874633789062, 4.74049711227417, 6.292906761169434, 7.845316410064697, 9.397726058959961, 10.950136184692383, 12.502545356750488, 14.054954528808594, 15.607364654541016, 17.159774780273438, 18.71218490600586, 20.26459312438965, 21.81700325012207, 23.369413375854492, 24.92182159423828, 26.474231719970703, 28.026641845703125, 29.579051971435547, 31.13146209716797, 32.68387222290039, 34.23628234863281, 35.78868865966797, 37.34109878540039, 38.89350891113281, 40.445919036865234, 41.998329162597656, 43.55073928833008, 45.1031494140625, 46.655555725097656, 48.20796585083008, 49.7603759765625, 51.31278610229492, 52.865196228027344]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 12.0, 14.0, 16.0, 31.0, 58.0, 120.0, 244.0, 540.0, 1256.0, 3888.0, 17216.0, 278647.0, 3756059.0, 119866.0, 11305.0, 2984.0, 1020.0, 454.0, 227.0, 114.0, 84.0, 44.0, 23.0, 23.0, 12.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.015625, -4.7098388671875, -4.404052734375, -4.0982666015625, -3.79248046875, -3.4866943359375, -3.180908203125, -2.8751220703125, -2.5693359375, -2.2635498046875, -1.957763671875, -1.6519775390625, -1.34619140625, -1.0404052734375, -0.734619140625, -0.4288330078125, -0.123046875, 0.1827392578125, 0.488525390625, 0.7943115234375, 1.10009765625, 1.4058837890625, 1.711669921875, 2.0174560546875, 2.3232421875, 2.6290283203125, 2.934814453125, 3.2406005859375, 3.54638671875, 3.8521728515625, 4.157958984375, 4.4637451171875, 4.76953125, 5.0753173828125, 5.381103515625, 5.6868896484375, 5.99267578125, 6.2984619140625, 6.604248046875, 6.9100341796875, 7.2158203125, 7.5216064453125, 7.827392578125, 8.1331787109375, 8.43896484375, 8.7447509765625, 9.050537109375, 9.3563232421875, 9.662109375, 9.9678955078125, 10.273681640625, 10.5794677734375, 10.88525390625, 11.1910400390625, 11.496826171875, 11.8026123046875, 12.1083984375, 12.4141845703125, 12.719970703125, 13.0257568359375, 13.33154296875, 13.6373291015625, 13.943115234375, 14.2489013671875, 14.5546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 7.0, 11.0, 11.0, 16.0, 21.0, 22.0, 31.0, 34.0, 37.0, 40.0, 31.0, 46.0, 49.0, 63.0, 43.0, 60.0, 53.0, 49.0, 67.0, 42.0, 39.0, 34.0, 28.0, 28.0, 22.0, 27.0, 20.0, 12.0, 22.0, 9.0, 3.0, 2.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23828125, -2.1395263671875, -2.040771484375, -1.9420166015625, -1.84326171875, -1.7445068359375, -1.645751953125, -1.5469970703125, -1.4482421875, -1.3494873046875, -1.250732421875, -1.1519775390625, -1.05322265625, -0.9544677734375, -0.855712890625, -0.7569580078125, -0.658203125, -0.5594482421875, -0.460693359375, -0.3619384765625, -0.26318359375, -0.1644287109375, -0.065673828125, 0.0330810546875, 0.1318359375, 0.2305908203125, 0.329345703125, 0.4281005859375, 0.52685546875, 0.6256103515625, 0.724365234375, 0.8231201171875, 0.921875, 1.0206298828125, 1.119384765625, 1.2181396484375, 1.31689453125, 1.4156494140625, 1.514404296875, 1.6131591796875, 1.7119140625, 1.8106689453125, 1.909423828125, 2.0081787109375, 2.10693359375, 2.2056884765625, 2.304443359375, 2.4031982421875, 2.501953125, 2.6007080078125, 2.699462890625, 2.7982177734375, 2.89697265625, 2.9957275390625, 3.094482421875, 3.1932373046875, 3.2919921875, 3.3907470703125, 3.489501953125, 3.5882568359375, 3.68701171875, 3.7857666015625, 3.884521484375, 3.9832763671875, 4.08203125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 14.0, 29.0, 64.0, 132.0, 361.0, 1287.0, 13190.0, 3315575.0, 854104.0, 7977.0, 1001.0, 323.0, 122.0, 47.0, 27.0, 10.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.21875, -20.6439208984375, -20.069091796875, -19.4942626953125, -18.91943359375, -18.3446044921875, -17.769775390625, -17.1949462890625, -16.6201171875, -16.0452880859375, -15.470458984375, -14.8956298828125, -14.32080078125, -13.7459716796875, -13.171142578125, -12.5963134765625, -12.021484375, -11.4466552734375, -10.871826171875, -10.2969970703125, -9.72216796875, -9.1473388671875, -8.572509765625, -7.9976806640625, -7.4228515625, -6.8480224609375, -6.273193359375, -5.6983642578125, -5.12353515625, -4.5487060546875, -3.973876953125, -3.3990478515625, -2.82421875, -2.2493896484375, -1.674560546875, -1.0997314453125, -0.52490234375, 0.0499267578125, 0.624755859375, 1.1995849609375, 1.7744140625, 2.3492431640625, 2.924072265625, 3.4989013671875, 4.07373046875, 4.6485595703125, 5.223388671875, 5.7982177734375, 6.373046875, 6.9478759765625, 7.522705078125, 8.0975341796875, 8.67236328125, 9.2471923828125, 9.822021484375, 10.3968505859375, 10.9716796875, 11.5465087890625, 12.121337890625, 12.6961669921875, 13.27099609375, 13.8458251953125, 14.420654296875, 14.9954833984375, 15.5703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 18.0, 24.0, 32.0, 42.0, 71.0, 135.0, 233.0, 481.0, 899.0, 937.0, 545.0, 253.0, 157.0, 83.0, 39.0, 35.0, 27.0, 13.0, 16.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5859375, -8.33416748046875, -8.0823974609375, -7.83062744140625, -7.578857421875, -7.32708740234375, -7.0753173828125, -6.82354736328125, -6.57177734375, -6.32000732421875, -6.0682373046875, -5.81646728515625, -5.564697265625, -5.31292724609375, -5.0611572265625, -4.80938720703125, -4.5576171875, -4.30584716796875, -4.0540771484375, -3.80230712890625, -3.550537109375, -3.29876708984375, -3.0469970703125, -2.79522705078125, -2.54345703125, -2.29168701171875, -2.0399169921875, -1.78814697265625, -1.536376953125, -1.28460693359375, -1.0328369140625, -0.78106689453125, -0.529296875, -0.27752685546875, -0.0257568359375, 0.22601318359375, 0.477783203125, 0.72955322265625, 0.9813232421875, 1.23309326171875, 1.48486328125, 1.73663330078125, 1.9884033203125, 2.24017333984375, 2.491943359375, 2.74371337890625, 2.9954833984375, 3.24725341796875, 3.4990234375, 3.75079345703125, 4.0025634765625, 4.25433349609375, 4.506103515625, 4.75787353515625, 5.0096435546875, 5.26141357421875, 5.51318359375, 5.76495361328125, 6.0167236328125, 6.26849365234375, 6.520263671875, 6.77203369140625, 7.0238037109375, 7.27557373046875, 7.52734375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 26.0, 46.0, 90.0, 148.0, 207.0, 175.0, 106.0, 67.0, 57.0, 20.0, 16.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.69213104248047, -60.71463394165039, -58.73713684082031, -56.7596435546875, -54.78214645385742, -52.804649353027344, -50.827152252197266, -48.84965515136719, -46.872161865234375, -44.8946647644043, -42.91716766357422, -40.939674377441406, -38.96217727661133, -36.98468017578125, -35.00718307495117, -33.029685974121094, -31.05219078063965, -29.07469367980957, -27.097198486328125, -25.119701385498047, -23.1422061920166, -21.164709091186523, -19.187213897705078, -17.209716796875, -15.232220649719238, -13.254724502563477, -11.277228355407715, -9.299732208251953, -7.322235584259033, -5.344738960266113, -3.3672428131103516, -1.3897466659545898, 0.5877494812011719, 2.5652456283569336, 4.542741775512695, 6.520238399505615, 8.497734069824219, 10.475231170654297, 12.452727317810059, 14.43022346496582, 16.407718658447266, 18.385215759277344, 20.36271095275879, 22.340208053588867, 24.317703247070312, 26.29520034790039, 28.27269744873047, 30.250192642211914, 32.227691650390625, 34.2051887512207, 36.18268585205078, 38.160179138183594, 40.13767623901367, 42.11517333984375, 44.09267044067383, 46.070167541503906, 48.04766082763672, 50.0251579284668, 52.002655029296875, 53.98014831542969, 55.957645416259766, 57.935142517089844, 59.91263961791992, 61.89013671875, 63.86763000488281]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 7.0, 4.0, 8.0, 11.0, 8.0, 7.0, 16.0, 15.0, 12.0, 21.0, 17.0, 16.0, 21.0, 24.0, 32.0, 48.0, 32.0, 29.0, 30.0, 51.0, 49.0, 47.0, 47.0, 48.0, 34.0, 30.0, 49.0, 30.0, 33.0, 24.0, 22.0, 21.0, 27.0, 27.0, 13.0, 13.0, 16.0, 12.0, 9.0, 8.0, 6.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.787128448486328, -21.075515747070312, -20.363903045654297, -19.65229034423828, -18.940677642822266, -18.22906494140625, -17.517452239990234, -16.80584144592285, -16.094228744506836, -15.38261604309082, -14.671003341674805, -13.959390640258789, -13.24777889251709, -12.536166191101074, -11.824553489685059, -11.11294174194336, -10.401328086853027, -9.689715385437012, -8.978102684020996, -8.266490936279297, -7.554878234863281, -6.843265533447266, -6.13165283203125, -5.420040607452393, -4.708427906036377, -3.9968154430389404, -3.285202980041504, -2.5735902786254883, -1.8619778156280518, -1.1503653526306152, -0.4387526512145996, 0.2728595733642578, 0.9844722747802734, 1.69608473777771, 2.4076972007751465, 3.119309902191162, 3.8309223651885986, 4.542534828186035, 5.254147529602051, 5.965759754180908, 6.677372455596924, 7.3889851570129395, 8.100597381591797, 8.812210083007812, 9.523822784423828, 10.235435485839844, 10.94704818725586, 11.658659934997559, 12.370272636413574, 13.08188533782959, 13.793498039245605, 14.505109786987305, 15.21672248840332, 15.928335189819336, 16.63994789123535, 17.351560592651367, 18.063173294067383, 18.7747859954834, 19.486398696899414, 20.19801139831543, 20.909624099731445, 21.621234893798828, 22.332847595214844, 23.04446029663086, 23.756072998046875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 11.0, 13.0, 30.0, 34.0, 75.0, 121.0, 263.0, 577.0, 1426.0, 3832.0, 12432.0, 48886.0, 236511.0, 548678.0, 149309.0, 32847.0, 8538.0, 2886.0, 1088.0, 499.0, 207.0, 115.0, 64.0, 37.0, 26.0, 15.0, 12.0, 8.0, 7.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.734375, -7.50927734375, -7.2841796875, -7.05908203125, -6.833984375, -6.60888671875, -6.3837890625, -6.15869140625, -5.93359375, -5.70849609375, -5.4833984375, -5.25830078125, -5.033203125, -4.80810546875, -4.5830078125, -4.35791015625, -4.1328125, -3.90771484375, -3.6826171875, -3.45751953125, -3.232421875, -3.00732421875, -2.7822265625, -2.55712890625, -2.33203125, -2.10693359375, -1.8818359375, -1.65673828125, -1.431640625, -1.20654296875, -0.9814453125, -0.75634765625, -0.53125, -0.30615234375, -0.0810546875, 0.14404296875, 0.369140625, 0.59423828125, 0.8193359375, 1.04443359375, 1.26953125, 1.49462890625, 1.7197265625, 1.94482421875, 2.169921875, 2.39501953125, 2.6201171875, 2.84521484375, 3.0703125, 3.29541015625, 3.5205078125, 3.74560546875, 3.970703125, 4.19580078125, 4.4208984375, 4.64599609375, 4.87109375, 5.09619140625, 5.3212890625, 5.54638671875, 5.771484375, 5.99658203125, 6.2216796875, 6.44677734375, 6.671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 4.0, 2.0, 10.0, 11.0, 15.0, 13.0, 14.0, 11.0, 20.0, 29.0, 35.0, 26.0, 40.0, 38.0, 51.0, 50.0, 51.0, 56.0, 53.0, 58.0, 51.0, 33.0, 57.0, 38.0, 39.0, 31.0, 21.0, 28.0, 22.0, 20.0, 19.0, 7.0, 12.0, 8.0, 7.0, 10.0, 5.0, 1.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.263671875, -2.164398193359375, -2.06512451171875, -1.965850830078125, -1.8665771484375, -1.767303466796875, -1.66802978515625, -1.568756103515625, -1.469482421875, -1.370208740234375, -1.27093505859375, -1.171661376953125, -1.0723876953125, -0.973114013671875, -0.87384033203125, -0.774566650390625, -0.67529296875, -0.576019287109375, -0.47674560546875, -0.377471923828125, -0.2781982421875, -0.178924560546875, -0.07965087890625, 0.019622802734375, 0.118896484375, 0.218170166015625, 0.31744384765625, 0.416717529296875, 0.5159912109375, 0.615264892578125, 0.71453857421875, 0.813812255859375, 0.9130859375, 1.012359619140625, 1.11163330078125, 1.210906982421875, 1.3101806640625, 1.409454345703125, 1.50872802734375, 1.608001708984375, 1.707275390625, 1.806549072265625, 1.90582275390625, 2.005096435546875, 2.1043701171875, 2.203643798828125, 2.30291748046875, 2.402191162109375, 2.50146484375, 2.600738525390625, 2.70001220703125, 2.799285888671875, 2.8985595703125, 2.997833251953125, 3.09710693359375, 3.196380615234375, 3.295654296875, 3.394927978515625, 3.49420166015625, 3.593475341796875, 3.6927490234375, 3.792022705078125, 3.89129638671875, 3.990570068359375, 4.08984375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 5.0, 9.0, 17.0, 19.0, 18.0, 28.0, 43.0, 49.0, 86.0, 104.0, 133.0, 166.0, 290.0, 446.0, 705.0, 1424.0, 3294.0, 10624.0, 46644.0, 298582.0, 602572.0, 62141.0, 13255.0, 3870.0, 1633.0, 798.0, 487.0, 345.0, 201.0, 158.0, 104.0, 77.0, 57.0, 42.0, 36.0, 27.0, 20.0, 14.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.98828125, -7.73931884765625, -7.4903564453125, -7.24139404296875, -6.992431640625, -6.74346923828125, -6.4945068359375, -6.24554443359375, -5.99658203125, -5.74761962890625, -5.4986572265625, -5.24969482421875, -5.000732421875, -4.75177001953125, -4.5028076171875, -4.25384521484375, -4.0048828125, -3.75592041015625, -3.5069580078125, -3.25799560546875, -3.009033203125, -2.76007080078125, -2.5111083984375, -2.26214599609375, -2.01318359375, -1.76422119140625, -1.5152587890625, -1.26629638671875, -1.017333984375, -0.76837158203125, -0.5194091796875, -0.27044677734375, -0.021484375, 0.22747802734375, 0.4764404296875, 0.72540283203125, 0.974365234375, 1.22332763671875, 1.4722900390625, 1.72125244140625, 1.97021484375, 2.21917724609375, 2.4681396484375, 2.71710205078125, 2.966064453125, 3.21502685546875, 3.4639892578125, 3.71295166015625, 3.9619140625, 4.21087646484375, 4.4598388671875, 4.70880126953125, 4.957763671875, 5.20672607421875, 5.4556884765625, 5.70465087890625, 5.95361328125, 6.20257568359375, 6.4515380859375, 6.70050048828125, 6.949462890625, 7.19842529296875, 7.4473876953125, 7.69635009765625, 7.9453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 7.0, 9.0, 9.0, 16.0, 11.0, 13.0, 18.0, 34.0, 17.0, 26.0, 38.0, 34.0, 43.0, 31.0, 51.0, 49.0, 49.0, 58.0, 39.0, 55.0, 48.0, 46.0, 45.0, 47.0, 33.0, 22.0, 26.0, 21.0, 19.0, 17.0, 15.0, 9.0, 7.0, 8.0, 5.0, 5.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-12.515625, -12.1728515625, -11.830078125, -11.4873046875, -11.14453125, -10.8017578125, -10.458984375, -10.1162109375, -9.7734375, -9.4306640625, -9.087890625, -8.7451171875, -8.40234375, -8.0595703125, -7.716796875, -7.3740234375, -7.03125, -6.6884765625, -6.345703125, -6.0029296875, -5.66015625, -5.3173828125, -4.974609375, -4.6318359375, -4.2890625, -3.9462890625, -3.603515625, -3.2607421875, -2.91796875, -2.5751953125, -2.232421875, -1.8896484375, -1.546875, -1.2041015625, -0.861328125, -0.5185546875, -0.17578125, 0.1669921875, 0.509765625, 0.8525390625, 1.1953125, 1.5380859375, 1.880859375, 2.2236328125, 2.56640625, 2.9091796875, 3.251953125, 3.5947265625, 3.9375, 4.2802734375, 4.623046875, 4.9658203125, 5.30859375, 5.6513671875, 5.994140625, 6.3369140625, 6.6796875, 7.0224609375, 7.365234375, 7.7080078125, 8.05078125, 8.3935546875, 8.736328125, 9.0791015625, 9.421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 10.0, 19.0, 18.0, 27.0, 51.0, 75.0, 118.0, 235.0, 445.0, 1003.0, 2935.0, 9421.0, 40114.0, 364303.0, 572908.0, 42025.0, 9769.0, 2948.0, 1036.0, 506.0, 222.0, 136.0, 61.0, 51.0, 33.0, 18.0, 17.0, 11.0, 8.0, 10.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5078125, -2.411407470703125, -2.31500244140625, -2.218597412109375, -2.1221923828125, -2.025787353515625, -1.92938232421875, -1.832977294921875, -1.736572265625, -1.640167236328125, -1.54376220703125, -1.447357177734375, -1.3509521484375, -1.254547119140625, -1.15814208984375, -1.061737060546875, -0.96533203125, -0.868927001953125, -0.77252197265625, -0.676116943359375, -0.5797119140625, -0.483306884765625, -0.38690185546875, -0.290496826171875, -0.194091796875, -0.097686767578125, -0.00128173828125, 0.095123291015625, 0.1915283203125, 0.287933349609375, 0.38433837890625, 0.480743408203125, 0.5771484375, 0.673553466796875, 0.76995849609375, 0.866363525390625, 0.9627685546875, 1.059173583984375, 1.15557861328125, 1.251983642578125, 1.348388671875, 1.444793701171875, 1.54119873046875, 1.637603759765625, 1.7340087890625, 1.830413818359375, 1.92681884765625, 2.023223876953125, 2.11962890625, 2.216033935546875, 2.31243896484375, 2.408843994140625, 2.5052490234375, 2.601654052734375, 2.69805908203125, 2.794464111328125, 2.890869140625, 2.987274169921875, 3.08367919921875, 3.180084228515625, 3.2764892578125, 3.372894287109375, 3.46929931640625, 3.565704345703125, 3.662109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 6.0, 6.0, 6.0, 9.0, 3.0, 12.0, 12.0, 16.0, 26.0, 30.0, 32.0, 46.0, 55.0, 80.0, 113.0, 132.0, 116.0, 71.0, 43.0, 28.0, 25.0, 32.0, 19.0, 10.0, 15.0, 10.0, 6.0, 7.0, 4.0, 2.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005016326904296875, -0.0004851818084716797, -0.0004687309265136719, -0.00045228004455566406, -0.00043582916259765625, -0.00041937828063964844, -0.0004029273986816406, -0.0003864765167236328, -0.000370025634765625, -0.0003535747528076172, -0.0003371238708496094, -0.00032067298889160156, -0.00030422210693359375, -0.00028777122497558594, -0.0002713203430175781, -0.0002548694610595703, -0.0002384185791015625, -0.0002219676971435547, -0.00020551681518554688, -0.00018906593322753906, -0.00017261505126953125, -0.00015616416931152344, -0.00013971328735351562, -0.0001232624053955078, -0.0001068115234375, -9.036064147949219e-05, -7.390975952148438e-05, -5.745887756347656e-05, -4.100799560546875e-05, -2.4557113647460938e-05, -8.106231689453125e-06, 8.344650268554688e-06, 2.47955322265625e-05, 4.124641418457031e-05, 5.7697296142578125e-05, 7.414817810058594e-05, 9.059906005859375e-05, 0.00010704994201660156, 0.00012350082397460938, 0.0001399517059326172, 0.000156402587890625, 0.0001728534698486328, 0.00018930435180664062, 0.00020575523376464844, 0.00022220611572265625, 0.00023865699768066406, 0.0002551078796386719, 0.0002715587615966797, 0.0002880096435546875, 0.0003044605255126953, 0.0003209114074707031, 0.00033736228942871094, 0.00035381317138671875, 0.00037026405334472656, 0.0003867149353027344, 0.0004031658172607422, 0.00041961669921875, 0.0004360675811767578, 0.0004525184631347656, 0.00046896934509277344, 0.00048542022705078125, 0.0005018711090087891, 0.0005183219909667969, 0.0005347728729248047, 0.0005512237548828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 6.0, 8.0, 9.0, 20.0, 43.0, 65.0, 115.0, 248.0, 503.0, 1360.0, 4553.0, 23177.0, 276276.0, 700423.0, 33088.0, 5861.0, 1596.0, 603.0, 287.0, 140.0, 62.0, 41.0, 27.0, 15.0, 11.0, 1.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.451416015625, -4.31689453125, -4.182373046875, -4.0478515625, -3.913330078125, -3.77880859375, -3.644287109375, -3.509765625, -3.375244140625, -3.24072265625, -3.106201171875, -2.9716796875, -2.837158203125, -2.70263671875, -2.568115234375, -2.43359375, -2.299072265625, -2.16455078125, -2.030029296875, -1.8955078125, -1.760986328125, -1.62646484375, -1.491943359375, -1.357421875, -1.222900390625, -1.08837890625, -0.953857421875, -0.8193359375, -0.684814453125, -0.55029296875, -0.415771484375, -0.28125, -0.146728515625, -0.01220703125, 0.122314453125, 0.2568359375, 0.391357421875, 0.52587890625, 0.660400390625, 0.794921875, 0.929443359375, 1.06396484375, 1.198486328125, 1.3330078125, 1.467529296875, 1.60205078125, 1.736572265625, 1.87109375, 2.005615234375, 2.14013671875, 2.274658203125, 2.4091796875, 2.543701171875, 2.67822265625, 2.812744140625, 2.947265625, 3.081787109375, 3.21630859375, 3.350830078125, 3.4853515625, 3.619873046875, 3.75439453125, 3.888916015625, 4.0234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 8.0, 10.0, 5.0, 11.0, 16.0, 18.0, 28.0, 41.0, 68.0, 107.0, 143.0, 170.0, 117.0, 85.0, 60.0, 29.0, 20.0, 14.0, 14.0, 8.0, 4.0, 1.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -4.0142822265625, -3.903564453125, -3.7928466796875, -3.68212890625, -3.5714111328125, -3.460693359375, -3.3499755859375, -3.2392578125, -3.1285400390625, -3.017822265625, -2.9071044921875, -2.79638671875, -2.6856689453125, -2.574951171875, -2.4642333984375, -2.353515625, -2.2427978515625, -2.132080078125, -2.0213623046875, -1.91064453125, -1.7999267578125, -1.689208984375, -1.5784912109375, -1.4677734375, -1.3570556640625, -1.246337890625, -1.1356201171875, -1.02490234375, -0.9141845703125, -0.803466796875, -0.6927490234375, -0.58203125, -0.4713134765625, -0.360595703125, -0.2498779296875, -0.13916015625, -0.0284423828125, 0.082275390625, 0.1929931640625, 0.3037109375, 0.4144287109375, 0.525146484375, 0.6358642578125, 0.74658203125, 0.8572998046875, 0.968017578125, 1.0787353515625, 1.189453125, 1.3001708984375, 1.410888671875, 1.5216064453125, 1.63232421875, 1.7430419921875, 1.853759765625, 1.9644775390625, 2.0751953125, 2.1859130859375, 2.296630859375, 2.4073486328125, 2.51806640625, 2.6287841796875, 2.739501953125, 2.8502197265625, 2.9609375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 8.0, 13.0, 19.0, 37.0, 65.0, 96.0, 145.0, 276.0, 153.0, 80.0, 39.0, 24.0, 10.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-74.74422454833984, -73.03071594238281, -71.31719970703125, -69.60369110107422, -67.89017486572266, -66.17666625976562, -64.46315002441406, -62.74964141845703, -61.03612518310547, -59.32261276245117, -57.609100341796875, -55.89558792114258, -54.18207550048828, -52.468563079833984, -50.75505065917969, -49.041542053222656, -47.32802963256836, -45.61451721191406, -43.901004791259766, -42.18749237060547, -40.47397994995117, -38.760467529296875, -37.046958923339844, -35.33344268798828, -33.61993408203125, -31.906421661376953, -30.192909240722656, -28.47939682006836, -26.765884399414062, -25.052371978759766, -23.3388614654541, -21.625349044799805, -19.911834716796875, -18.198322296142578, -16.48480987548828, -14.7712984085083, -13.057785987854004, -11.344273567199707, -9.630762100219727, -7.91724967956543, -6.203737258911133, -4.490224838256836, -2.7767128944396973, -1.0632009506225586, 0.6503114700317383, 2.363823890686035, 4.077335357666016, 5.7908477783203125, 7.504360198974609, 9.217872619628906, 10.931385040283203, 12.644896507263184, 14.35840892791748, 16.071922302246094, 17.785432815551758, 19.498945236206055, 21.21245765686035, 22.92597007751465, 24.639482498168945, 26.35299301147461, 28.066505432128906, 29.780017852783203, 31.4935302734375, 33.2070426940918, 34.920555114746094]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 7.0, 4.0, 7.0, 4.0, 9.0, 11.0, 6.0, 7.0, 17.0, 15.0, 18.0, 19.0, 25.0, 41.0, 30.0, 42.0, 45.0, 76.0, 98.0, 130.0, 71.0, 50.0, 37.0, 35.0, 27.0, 22.0, 29.0, 22.0, 22.0, 17.0, 13.0, 9.0, 13.0, 11.0, 5.0, 4.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.282814025878906, -40.82621383666992, -39.36961364746094, -37.91301345825195, -36.45641326904297, -34.99981689453125, -33.543212890625, -32.08661651611328, -30.630016326904297, -29.173416137695312, -27.716815948486328, -26.260215759277344, -24.803617477416992, -23.347017288208008, -21.890417098999023, -20.433818817138672, -18.977216720581055, -17.52061653137207, -16.064016342163086, -14.607417106628418, -13.15081787109375, -11.694217681884766, -10.237617492675781, -8.781018257141113, -7.324418067932129, -5.867818355560303, -4.411218643188477, -2.954618453979492, -1.498018741607666, -0.041419029235839844, 1.4151811599731445, 2.8717803955078125, 4.328380584716797, 5.784980297088623, 7.241580009460449, 8.698180198669434, 10.154779434204102, 11.611379623413086, 13.06797981262207, 14.524579048156738, 15.981179237365723, 17.43777847290039, 18.894378662109375, 20.35097885131836, 21.807579040527344, 23.264179229736328, 24.720779418945312, 26.177377700805664, 27.63397789001465, 29.090578079223633, 30.547178268432617, 32.00377655029297, 33.46037673950195, 34.91697692871094, 36.37357711791992, 37.830177307128906, 39.28677749633789, 40.743377685546875, 42.19997787475586, 43.656578063964844, 45.11317825317383, 46.56977844238281, 48.02637481689453, 49.482975006103516, 50.9395751953125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 10.0, 10.0, 9.0, 23.0, 22.0, 28.0, 50.0, 81.0, 169.0, 284.0, 572.0, 1128.0, 2645.0, 7500.0, 33813.0, 453020.0, 3361471.0, 298348.0, 24744.0, 5912.0, 2051.0, 1044.0, 528.0, 295.0, 172.0, 99.0, 48.0, 57.0, 40.0, 16.0, 15.0, 12.0, 11.0, 8.0, 9.0, 7.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.62890625, -6.39581298828125, -6.1627197265625, -5.92962646484375, -5.696533203125, -5.46343994140625, -5.2303466796875, -4.99725341796875, -4.76416015625, -4.53106689453125, -4.2979736328125, -4.06488037109375, -3.831787109375, -3.59869384765625, -3.3656005859375, -3.13250732421875, -2.8994140625, -2.66632080078125, -2.4332275390625, -2.20013427734375, -1.967041015625, -1.73394775390625, -1.5008544921875, -1.26776123046875, -1.03466796875, -0.80157470703125, -0.5684814453125, -0.33538818359375, -0.102294921875, 0.13079833984375, 0.3638916015625, 0.59698486328125, 0.830078125, 1.06317138671875, 1.2962646484375, 1.52935791015625, 1.762451171875, 1.99554443359375, 2.2286376953125, 2.46173095703125, 2.69482421875, 2.92791748046875, 3.1610107421875, 3.39410400390625, 3.627197265625, 3.86029052734375, 4.0933837890625, 4.32647705078125, 4.5595703125, 4.79266357421875, 5.0257568359375, 5.25885009765625, 5.491943359375, 5.72503662109375, 5.9581298828125, 6.19122314453125, 6.42431640625, 6.65740966796875, 6.8905029296875, 7.12359619140625, 7.356689453125, 7.58978271484375, 7.8228759765625, 8.05596923828125, 8.2890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 7.0, 16.0, 19.0, 13.0, 21.0, 27.0, 33.0, 31.0, 38.0, 40.0, 57.0, 38.0, 50.0, 58.0, 47.0, 43.0, 51.0, 44.0, 55.0, 51.0, 33.0, 29.0, 30.0, 21.0, 24.0, 25.0, 19.0, 15.0, 9.0, 7.0, 12.0, 5.0, 6.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5078125, -2.41168212890625, -2.3155517578125, -2.21942138671875, -2.123291015625, -2.02716064453125, -1.9310302734375, -1.83489990234375, -1.73876953125, -1.64263916015625, -1.5465087890625, -1.45037841796875, -1.354248046875, -1.25811767578125, -1.1619873046875, -1.06585693359375, -0.9697265625, -0.87359619140625, -0.7774658203125, -0.68133544921875, -0.585205078125, -0.48907470703125, -0.3929443359375, -0.29681396484375, -0.20068359375, -0.10455322265625, -0.0084228515625, 0.08770751953125, 0.183837890625, 0.27996826171875, 0.3760986328125, 0.47222900390625, 0.568359375, 0.66448974609375, 0.7606201171875, 0.85675048828125, 0.952880859375, 1.04901123046875, 1.1451416015625, 1.24127197265625, 1.33740234375, 1.43353271484375, 1.5296630859375, 1.62579345703125, 1.721923828125, 1.81805419921875, 1.9141845703125, 2.01031494140625, 2.1064453125, 2.20257568359375, 2.2987060546875, 2.39483642578125, 2.490966796875, 2.58709716796875, 2.6832275390625, 2.77935791015625, 2.87548828125, 2.97161865234375, 3.0677490234375, 3.16387939453125, 3.260009765625, 3.35614013671875, 3.4522705078125, 3.54840087890625, 3.64453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 11.0, 33.0, 62.0, 118.0, 207.0, 497.0, 1744.0, 23439.0, 3756338.0, 402904.0, 7178.0, 977.0, 392.0, 168.0, 108.0, 54.0, 25.0, 9.0, 9.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.28125, -15.784912109375, -15.28857421875, -14.792236328125, -14.2958984375, -13.799560546875, -13.30322265625, -12.806884765625, -12.310546875, -11.814208984375, -11.31787109375, -10.821533203125, -10.3251953125, -9.828857421875, -9.33251953125, -8.836181640625, -8.33984375, -7.843505859375, -7.34716796875, -6.850830078125, -6.3544921875, -5.858154296875, -5.36181640625, -4.865478515625, -4.369140625, -3.872802734375, -3.37646484375, -2.880126953125, -2.3837890625, -1.887451171875, -1.39111328125, -0.894775390625, -0.3984375, 0.097900390625, 0.59423828125, 1.090576171875, 1.5869140625, 2.083251953125, 2.57958984375, 3.075927734375, 3.572265625, 4.068603515625, 4.56494140625, 5.061279296875, 5.5576171875, 6.053955078125, 6.55029296875, 7.046630859375, 7.54296875, 8.039306640625, 8.53564453125, 9.031982421875, 9.5283203125, 10.024658203125, 10.52099609375, 11.017333984375, 11.513671875, 12.010009765625, 12.50634765625, 13.002685546875, 13.4990234375, 13.995361328125, 14.49169921875, 14.988037109375, 15.484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 3.0, 9.0, 13.0, 13.0, 31.0, 42.0, 61.0, 100.0, 167.0, 331.0, 596.0, 856.0, 769.0, 472.0, 230.0, 132.0, 76.0, 51.0, 37.0, 30.0, 23.0, 10.0, 8.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.7474365234375, -4.494873046875, -4.2423095703125, -3.98974609375, -3.7371826171875, -3.484619140625, -3.2320556640625, -2.9794921875, -2.7269287109375, -2.474365234375, -2.2218017578125, -1.96923828125, -1.7166748046875, -1.464111328125, -1.2115478515625, -0.958984375, -0.7064208984375, -0.453857421875, -0.2012939453125, 0.05126953125, 0.3038330078125, 0.556396484375, 0.8089599609375, 1.0615234375, 1.3140869140625, 1.566650390625, 1.8192138671875, 2.07177734375, 2.3243408203125, 2.576904296875, 2.8294677734375, 3.08203125, 3.3345947265625, 3.587158203125, 3.8397216796875, 4.09228515625, 4.3448486328125, 4.597412109375, 4.8499755859375, 5.1025390625, 5.3551025390625, 5.607666015625, 5.8602294921875, 6.11279296875, 6.3653564453125, 6.617919921875, 6.8704833984375, 7.123046875, 7.3756103515625, 7.628173828125, 7.8807373046875, 8.13330078125, 8.3858642578125, 8.638427734375, 8.8909912109375, 9.1435546875, 9.3961181640625, 9.648681640625, 9.9012451171875, 10.15380859375, 10.4063720703125, 10.658935546875, 10.9114990234375, 11.1640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 14.0, 28.0, 51.0, 103.0, 195.0, 225.0, 162.0, 83.0, 53.0, 26.0, 19.0, 15.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.26677703857422, -45.96961212158203, -43.672447204589844, -41.375282287597656, -39.0781135559082, -36.780948638916016, -34.48378372192383, -32.186614990234375, -29.88945198059082, -27.592287063598633, -25.295120239257812, -22.997955322265625, -20.700790405273438, -18.403623580932617, -16.10645866394043, -13.80929183959961, -11.512126922607422, -9.214961051940918, -6.917795658111572, -4.620630264282227, -2.3234643936157227, -0.02629852294921875, 2.2708663940429688, 4.568033218383789, 6.865198135375977, 9.16236400604248, 11.459529876708984, 13.756694793701172, 16.05385971069336, 18.35102653503418, 20.648191452026367, 22.945358276367188, 25.242523193359375, 27.539688110351562, 29.836854934692383, 32.13401794433594, 34.43118667602539, 36.72835159301758, 39.025516510009766, 41.32268524169922, 43.619850158691406, 45.917015075683594, 48.21417999267578, 50.51134490966797, 52.80851364135742, 55.10567855834961, 57.4028434753418, 59.70001220703125, 61.99717330932617, 64.29434204101562, 66.59150695800781, 68.888671875, 71.18583679199219, 73.48300170898438, 75.78016662597656, 78.07733154296875, 80.37449645996094, 82.67166137695312, 84.96882629394531, 87.2659912109375, 89.56315612792969, 91.86032104492188, 94.15748596191406, 96.45465850830078, 98.75182342529297]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 11.0, 13.0, 12.0, 21.0, 19.0, 28.0, 40.0, 36.0, 51.0, 45.0, 48.0, 48.0, 52.0, 58.0, 61.0, 45.0, 52.0, 50.0, 52.0, 41.0, 45.0, 31.0, 18.0, 21.0, 19.0, 16.0, 8.0, 10.0, 9.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-40.776832580566406, -39.683162689208984, -38.58949279785156, -37.495819091796875, -36.40214920043945, -35.30847930908203, -34.21480941772461, -33.12113952636719, -32.0274658203125, -30.933795928955078, -29.840124130249023, -28.7464542388916, -27.652782440185547, -26.559112548828125, -25.465442657470703, -24.37177085876465, -23.278100967407227, -22.184431076049805, -21.09075927734375, -19.997089385986328, -18.903417587280273, -17.80974769592285, -16.716075897216797, -15.622406005859375, -14.528735160827637, -13.435064315795898, -12.34139347076416, -11.247722625732422, -10.154052734375, -9.060380935668945, -7.966711044311523, -6.873040199279785, -5.779369354248047, -4.685698509216309, -3.5920279026031494, -2.4983572959899902, -1.404686450958252, -0.31101560592651367, 0.7826547622680664, 1.8763256072998047, 2.969996452331543, 4.063667297363281, 5.1573381423950195, 6.2510085105896, 7.344679355621338, 8.438350677490234, 9.532020568847656, 10.625691413879395, 11.719362258911133, 12.813033103942871, 13.90670394897461, 15.000373840332031, 16.094045639038086, 17.187715530395508, 18.281387329101562, 19.375057220458984, 20.468727111816406, 21.562397003173828, 22.656068801879883, 23.749738693237305, 24.84341049194336, 25.93708038330078, 27.030750274658203, 28.124422073364258, 29.218093872070312]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 11.0, 15.0, 23.0, 41.0, 68.0, 120.0, 208.0, 368.0, 747.0, 1520.0, 3178.0, 7098.0, 17575.0, 48334.0, 152424.0, 444787.0, 252395.0, 74941.0, 26256.0, 10012.0, 4310.0, 2003.0, 950.0, 524.0, 288.0, 131.0, 88.0, 48.0, 35.0, 21.0, 15.0, 12.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.17578125, -5.997802734375, -5.81982421875, -5.641845703125, -5.4638671875, -5.285888671875, -5.10791015625, -4.929931640625, -4.751953125, -4.573974609375, -4.39599609375, -4.218017578125, -4.0400390625, -3.862060546875, -3.68408203125, -3.506103515625, -3.328125, -3.150146484375, -2.97216796875, -2.794189453125, -2.6162109375, -2.438232421875, -2.26025390625, -2.082275390625, -1.904296875, -1.726318359375, -1.54833984375, -1.370361328125, -1.1923828125, -1.014404296875, -0.83642578125, -0.658447265625, -0.48046875, -0.302490234375, -0.12451171875, 0.053466796875, 0.2314453125, 0.409423828125, 0.58740234375, 0.765380859375, 0.943359375, 1.121337890625, 1.29931640625, 1.477294921875, 1.6552734375, 1.833251953125, 2.01123046875, 2.189208984375, 2.3671875, 2.545166015625, 2.72314453125, 2.901123046875, 3.0791015625, 3.257080078125, 3.43505859375, 3.613037109375, 3.791015625, 3.968994140625, 4.14697265625, 4.324951171875, 4.5029296875, 4.680908203125, 4.85888671875, 5.036865234375, 5.21484375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 6.0, 11.0, 10.0, 15.0, 22.0, 23.0, 26.0, 17.0, 24.0, 24.0, 37.0, 44.0, 45.0, 50.0, 56.0, 51.0, 53.0, 53.0, 46.0, 36.0, 39.0, 45.0, 43.0, 30.0, 28.0, 28.0, 21.0, 23.0, 18.0, 9.0, 11.0, 8.0, 10.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.798828125, -2.69805908203125, -2.5972900390625, -2.49652099609375, -2.395751953125, -2.29498291015625, -2.1942138671875, -2.09344482421875, -1.99267578125, -1.89190673828125, -1.7911376953125, -1.69036865234375, -1.589599609375, -1.48883056640625, -1.3880615234375, -1.28729248046875, -1.1865234375, -1.08575439453125, -0.9849853515625, -0.88421630859375, -0.783447265625, -0.68267822265625, -0.5819091796875, -0.48114013671875, -0.38037109375, -0.27960205078125, -0.1788330078125, -0.07806396484375, 0.022705078125, 0.12347412109375, 0.2242431640625, 0.32501220703125, 0.42578125, 0.52655029296875, 0.6273193359375, 0.72808837890625, 0.828857421875, 0.92962646484375, 1.0303955078125, 1.13116455078125, 1.23193359375, 1.33270263671875, 1.4334716796875, 1.53424072265625, 1.635009765625, 1.73577880859375, 1.8365478515625, 1.93731689453125, 2.0380859375, 2.13885498046875, 2.2396240234375, 2.34039306640625, 2.441162109375, 2.54193115234375, 2.6427001953125, 2.74346923828125, 2.84423828125, 2.94500732421875, 3.0457763671875, 3.14654541015625, 3.247314453125, 3.34808349609375, 3.4488525390625, 3.54962158203125, 3.650390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 13.0, 13.0, 32.0, 27.0, 53.0, 60.0, 90.0, 107.0, 179.0, 271.0, 329.0, 597.0, 1000.0, 2178.0, 7253.0, 52248.0, 835698.0, 129236.0, 12699.0, 3077.0, 1372.0, 623.0, 478.0, 298.0, 177.0, 115.0, 95.0, 54.0, 48.0, 35.0, 26.0, 12.0, 17.0, 9.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.7890625, -12.420166015625, -12.05126953125, -11.682373046875, -11.3134765625, -10.944580078125, -10.57568359375, -10.206787109375, -9.837890625, -9.468994140625, -9.10009765625, -8.731201171875, -8.3623046875, -7.993408203125, -7.62451171875, -7.255615234375, -6.88671875, -6.517822265625, -6.14892578125, -5.780029296875, -5.4111328125, -5.042236328125, -4.67333984375, -4.304443359375, -3.935546875, -3.566650390625, -3.19775390625, -2.828857421875, -2.4599609375, -2.091064453125, -1.72216796875, -1.353271484375, -0.984375, -0.615478515625, -0.24658203125, 0.122314453125, 0.4912109375, 0.860107421875, 1.22900390625, 1.597900390625, 1.966796875, 2.335693359375, 2.70458984375, 3.073486328125, 3.4423828125, 3.811279296875, 4.18017578125, 4.549072265625, 4.91796875, 5.286865234375, 5.65576171875, 6.024658203125, 6.3935546875, 6.762451171875, 7.13134765625, 7.500244140625, 7.869140625, 8.238037109375, 8.60693359375, 8.975830078125, 9.3447265625, 9.713623046875, 10.08251953125, 10.451416015625, 10.8203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 7.0, 5.0, 3.0, 9.0, 11.0, 10.0, 14.0, 15.0, 19.0, 31.0, 27.0, 32.0, 49.0, 52.0, 63.0, 59.0, 67.0, 57.0, 69.0, 78.0, 54.0, 41.0, 41.0, 43.0, 33.0, 28.0, 22.0, 15.0, 9.0, 8.0, 6.0, 4.0, 11.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.828125, -16.3516845703125, -15.875244140625, -15.3988037109375, -14.92236328125, -14.4459228515625, -13.969482421875, -13.4930419921875, -13.0166015625, -12.5401611328125, -12.063720703125, -11.5872802734375, -11.11083984375, -10.6343994140625, -10.157958984375, -9.6815185546875, -9.205078125, -8.7286376953125, -8.252197265625, -7.7757568359375, -7.29931640625, -6.8228759765625, -6.346435546875, -5.8699951171875, -5.3935546875, -4.9171142578125, -4.440673828125, -3.9642333984375, -3.48779296875, -3.0113525390625, -2.534912109375, -2.0584716796875, -1.58203125, -1.1055908203125, -0.629150390625, -0.1527099609375, 0.32373046875, 0.8001708984375, 1.276611328125, 1.7530517578125, 2.2294921875, 2.7059326171875, 3.182373046875, 3.6588134765625, 4.13525390625, 4.6116943359375, 5.088134765625, 5.5645751953125, 6.041015625, 6.5174560546875, 6.993896484375, 7.4703369140625, 7.94677734375, 8.4232177734375, 8.899658203125, 9.3760986328125, 9.8525390625, 10.3289794921875, 10.805419921875, 11.2818603515625, 11.75830078125, 12.2347412109375, 12.711181640625, 13.1876220703125, 13.6640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 8.0, 9.0, 18.0, 22.0, 15.0, 24.0, 54.0, 59.0, 65.0, 143.0, 233.0, 506.0, 1384.0, 5245.0, 35648.0, 882826.0, 108386.0, 10231.0, 2157.0, 691.0, 296.0, 176.0, 86.0, 64.0, 46.0, 33.0, 29.0, 18.0, 12.0, 12.0, 15.0, 12.0, 8.0, 3.0, 3.0, 0.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.56640625, -4.4267578125, -4.287109375, -4.1474609375, -4.0078125, -3.8681640625, -3.728515625, -3.5888671875, -3.44921875, -3.3095703125, -3.169921875, -3.0302734375, -2.890625, -2.7509765625, -2.611328125, -2.4716796875, -2.33203125, -2.1923828125, -2.052734375, -1.9130859375, -1.7734375, -1.6337890625, -1.494140625, -1.3544921875, -1.21484375, -1.0751953125, -0.935546875, -0.7958984375, -0.65625, -0.5166015625, -0.376953125, -0.2373046875, -0.09765625, 0.0419921875, 0.181640625, 0.3212890625, 0.4609375, 0.6005859375, 0.740234375, 0.8798828125, 1.01953125, 1.1591796875, 1.298828125, 1.4384765625, 1.578125, 1.7177734375, 1.857421875, 1.9970703125, 2.13671875, 2.2763671875, 2.416015625, 2.5556640625, 2.6953125, 2.8349609375, 2.974609375, 3.1142578125, 3.25390625, 3.3935546875, 3.533203125, 3.6728515625, 3.8125, 3.9521484375, 4.091796875, 4.2314453125, 4.37109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 1.0, 4.0, 4.0, 2.0, 10.0, 5.0, 6.0, 10.0, 10.0, 25.0, 24.0, 30.0, 38.0, 69.0, 83.0, 127.0, 154.0, 106.0, 70.0, 48.0, 26.0, 27.0, 27.0, 14.0, 9.0, 9.0, 15.0, 9.0, 6.0, 4.0, 2.0, 9.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005741119384765625, -0.0005544722080230713, -0.0005348324775695801, -0.0005151927471160889, -0.0004955530166625977, -0.00047591328620910645, -0.00045627355575561523, -0.000436633825302124, -0.0004169940948486328, -0.0003973543643951416, -0.0003777146339416504, -0.0003580749034881592, -0.00033843517303466797, -0.00031879544258117676, -0.00029915571212768555, -0.00027951598167419434, -0.0002598762512207031, -0.00024023652076721191, -0.0002205967903137207, -0.0002009570598602295, -0.00018131732940673828, -0.00016167759895324707, -0.00014203786849975586, -0.00012239813804626465, -0.00010275840759277344, -8.311867713928223e-05, -6.347894668579102e-05, -4.3839216232299805e-05, -2.4199485778808594e-05, -4.559755325317383e-06, 1.5079975128173828e-05, 3.471970558166504e-05, 5.435943603515625e-05, 7.399916648864746e-05, 9.363889694213867e-05, 0.00011327862739562988, 0.0001329183578491211, 0.0001525580883026123, 0.00017219781875610352, 0.00019183754920959473, 0.00021147727966308594, 0.00023111701011657715, 0.00025075674057006836, 0.00027039647102355957, 0.0002900362014770508, 0.000309675931930542, 0.0003293156623840332, 0.0003489553928375244, 0.0003685951232910156, 0.00038823485374450684, 0.00040787458419799805, 0.00042751431465148926, 0.00044715404510498047, 0.0004667937755584717, 0.0004864335060119629, 0.0005060732364654541, 0.0005257129669189453, 0.0005453526973724365, 0.0005649924278259277, 0.0005846321582794189, 0.0006042718887329102, 0.0006239116191864014, 0.0006435513496398926, 0.0006631910800933838, 0.000682830810546875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 10.0, 11.0, 12.0, 21.0, 25.0, 40.0, 50.0, 90.0, 136.0, 248.0, 390.0, 792.0, 1613.0, 3894.0, 11535.0, 62170.0, 788000.0, 148772.0, 20390.0, 5729.0, 2238.0, 1007.0, 565.0, 304.0, 163.0, 98.0, 60.0, 44.0, 32.0, 18.0, 10.0, 12.0, 6.0, 8.0, 3.0, 11.0, 3.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.005859375, -2.913909912109375, -2.82196044921875, -2.730010986328125, -2.6380615234375, -2.546112060546875, -2.45416259765625, -2.362213134765625, -2.270263671875, -2.178314208984375, -2.08636474609375, -1.994415283203125, -1.9024658203125, -1.810516357421875, -1.71856689453125, -1.626617431640625, -1.53466796875, -1.442718505859375, -1.35076904296875, -1.258819580078125, -1.1668701171875, -1.074920654296875, -0.98297119140625, -0.891021728515625, -0.799072265625, -0.707122802734375, -0.61517333984375, -0.523223876953125, -0.4312744140625, -0.339324951171875, -0.24737548828125, -0.155426025390625, -0.0634765625, 0.028472900390625, 0.12042236328125, 0.212371826171875, 0.3043212890625, 0.396270751953125, 0.48822021484375, 0.580169677734375, 0.672119140625, 0.764068603515625, 0.85601806640625, 0.947967529296875, 1.0399169921875, 1.131866455078125, 1.22381591796875, 1.315765380859375, 1.40771484375, 1.499664306640625, 1.59161376953125, 1.683563232421875, 1.7755126953125, 1.867462158203125, 1.95941162109375, 2.051361083984375, 2.143310546875, 2.235260009765625, 2.32720947265625, 2.419158935546875, 2.5111083984375, 2.603057861328125, 2.69500732421875, 2.786956787109375, 2.87890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 9.0, 10.0, 1.0, 6.0, 13.0, 22.0, 20.0, 15.0, 35.0, 51.0, 67.0, 92.0, 123.0, 133.0, 104.0, 79.0, 55.0, 35.0, 28.0, 21.0, 21.0, 13.0, 4.0, 10.0, 12.0, 1.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.40625, -3.314239501953125, -3.22222900390625, -3.130218505859375, -3.0382080078125, -2.946197509765625, -2.85418701171875, -2.762176513671875, -2.670166015625, -2.578155517578125, -2.48614501953125, -2.394134521484375, -2.3021240234375, -2.210113525390625, -2.11810302734375, -2.026092529296875, -1.93408203125, -1.842071533203125, -1.75006103515625, -1.658050537109375, -1.5660400390625, -1.474029541015625, -1.38201904296875, -1.290008544921875, -1.197998046875, -1.105987548828125, -1.01397705078125, -0.921966552734375, -0.8299560546875, -0.737945556640625, -0.64593505859375, -0.553924560546875, -0.4619140625, -0.369903564453125, -0.27789306640625, -0.185882568359375, -0.0938720703125, -0.001861572265625, 0.09014892578125, 0.182159423828125, 0.274169921875, 0.366180419921875, 0.45819091796875, 0.550201416015625, 0.6422119140625, 0.734222412109375, 0.82623291015625, 0.918243408203125, 1.01025390625, 1.102264404296875, 1.19427490234375, 1.286285400390625, 1.3782958984375, 1.470306396484375, 1.56231689453125, 1.654327392578125, 1.746337890625, 1.838348388671875, 1.93035888671875, 2.022369384765625, 2.1143798828125, 2.206390380859375, 2.29840087890625, 2.390411376953125, 2.482421875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 18.0, 37.0, 199.0, 631.0, 96.0, 9.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-225.95693969726562, -219.5528564453125, -213.14877319335938, -206.74468994140625, -200.34060668945312, -193.9365234375, -187.53245544433594, -181.1283721923828, -174.7242889404297, -168.32020568847656, -161.91612243652344, -155.5120391845703, -149.10797119140625, -142.70388793945312, -136.2998046875, -129.89572143554688, -123.49163818359375, -117.08755493164062, -110.6834716796875, -104.2793960571289, -97.87531280517578, -91.47122955322266, -85.06715393066406, -78.66307067871094, -72.25898742675781, -65.85490417480469, -59.45082473754883, -53.04674530029297, -46.642662048339844, -40.23857879638672, -33.83449935913086, -27.430419921875, -21.026351928710938, -14.622270584106445, -8.218189239501953, -1.814107894897461, 4.589973449707031, 10.994056701660156, 17.398136138916016, 23.802215576171875, 30.206298828125, 36.610382080078125, 43.014461517333984, 49.418540954589844, 55.82262420654297, 62.226707458496094, 68.63078308105469, 75.03486633300781, 81.43894958496094, 87.84303283691406, 94.24711608886719, 100.65119171142578, 107.0552749633789, 113.45935821533203, 119.86343383789062, 126.26751708984375, 132.67160034179688, 139.07568359375, 145.47976684570312, 151.88385009765625, 158.28793334960938, 164.6920166015625, 171.09608459472656, 177.5001678466797, 183.9042510986328]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 6.0, 8.0, 7.0, 6.0, 13.0, 14.0, 14.0, 23.0, 19.0, 25.0, 39.0, 41.0, 43.0, 42.0, 65.0, 170.0, 125.0, 60.0, 35.0, 34.0, 25.0, 20.0, 25.0, 24.0, 21.0, 21.0, 12.0, 20.0, 5.0, 9.0, 7.0, 3.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.00350570678711, -54.124385833740234, -52.245269775390625, -50.36614990234375, -48.487030029296875, -46.60791015625, -44.728790283203125, -42.849674224853516, -40.97055435180664, -39.091434478759766, -37.212318420410156, -35.33319854736328, -33.454078674316406, -31.57495880126953, -29.69584083557129, -27.816722869873047, -25.937602996826172, -24.058483123779297, -22.179365158081055, -20.300247192382812, -18.421127319335938, -16.542007446289062, -14.66288948059082, -12.783770561218262, -10.904651641845703, -9.025532722473145, -7.146413803100586, -5.267294883728027, -3.3881759643554688, -1.5090570449829102, 0.37006187438964844, 2.249180793762207, 4.128303527832031, 6.00742244720459, 7.886541366577148, 9.765660285949707, 11.644779205322266, 13.523898124694824, 15.403017044067383, 17.282135009765625, 19.1612548828125, 21.040374755859375, 22.919492721557617, 24.79861068725586, 26.677730560302734, 28.55685043334961, 30.43596839904785, 32.315086364746094, 34.19420623779297, 36.073326110839844, 37.95244598388672, 39.83156204223633, 41.7106819152832, 43.58980178833008, 45.46891784667969, 47.34803771972656, 49.22715759277344, 51.10627746582031, 52.98539733886719, 54.8645133972168, 56.74363327026367, 58.62275314331055, 60.501869201660156, 62.38098907470703, 64.2601089477539]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 11.0, 28.0, 42.0, 74.0, 174.0, 365.0, 750.0, 1918.0, 4951.0, 16957.0, 105603.0, 1498876.0, 2353845.0, 178197.0, 22323.0, 6038.0, 2203.0, 934.0, 475.0, 209.0, 115.0, 67.0, 38.0, 30.0, 11.0, 14.0, 12.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48046875, -5.20794677734375, -4.9354248046875, -4.66290283203125, -4.390380859375, -4.11785888671875, -3.8453369140625, -3.57281494140625, -3.30029296875, -3.02777099609375, -2.7552490234375, -2.48272705078125, -2.210205078125, -1.93768310546875, -1.6651611328125, -1.39263916015625, -1.1201171875, -0.84759521484375, -0.5750732421875, -0.30255126953125, -0.030029296875, 0.24249267578125, 0.5150146484375, 0.78753662109375, 1.06005859375, 1.33258056640625, 1.6051025390625, 1.87762451171875, 2.150146484375, 2.42266845703125, 2.6951904296875, 2.96771240234375, 3.240234375, 3.51275634765625, 3.7852783203125, 4.05780029296875, 4.330322265625, 4.60284423828125, 4.8753662109375, 5.14788818359375, 5.42041015625, 5.69293212890625, 5.9654541015625, 6.23797607421875, 6.510498046875, 6.78302001953125, 7.0555419921875, 7.32806396484375, 7.6005859375, 7.87310791015625, 8.1456298828125, 8.41815185546875, 8.690673828125, 8.96319580078125, 9.2357177734375, 9.50823974609375, 9.78076171875, 10.05328369140625, 10.3258056640625, 10.59832763671875, 10.870849609375, 11.14337158203125, 11.4158935546875, 11.68841552734375, 11.9609375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 0.0, 7.0, 3.0, 8.0, 9.0, 11.0, 13.0, 22.0, 22.0, 31.0, 16.0, 34.0, 32.0, 36.0, 28.0, 51.0, 44.0, 49.0, 53.0, 38.0, 43.0, 52.0, 37.0, 33.0, 47.0, 37.0, 37.0, 25.0, 37.0, 20.0, 30.0, 17.0, 13.0, 16.0, 9.0, 11.0, 7.0, 8.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.70703125, -2.61700439453125, -2.5269775390625, -2.43695068359375, -2.346923828125, -2.25689697265625, -2.1668701171875, -2.07684326171875, -1.98681640625, -1.89678955078125, -1.8067626953125, -1.71673583984375, -1.626708984375, -1.53668212890625, -1.4466552734375, -1.35662841796875, -1.2666015625, -1.17657470703125, -1.0865478515625, -0.99652099609375, -0.906494140625, -0.81646728515625, -0.7264404296875, -0.63641357421875, -0.54638671875, -0.45635986328125, -0.3663330078125, -0.27630615234375, -0.186279296875, -0.09625244140625, -0.0062255859375, 0.08380126953125, 0.173828125, 0.26385498046875, 0.3538818359375, 0.44390869140625, 0.533935546875, 0.62396240234375, 0.7139892578125, 0.80401611328125, 0.89404296875, 0.98406982421875, 1.0740966796875, 1.16412353515625, 1.254150390625, 1.34417724609375, 1.4342041015625, 1.52423095703125, 1.6142578125, 1.70428466796875, 1.7943115234375, 1.88433837890625, 1.974365234375, 2.06439208984375, 2.1544189453125, 2.24444580078125, 2.33447265625, 2.42449951171875, 2.5145263671875, 2.60455322265625, 2.694580078125, 2.78460693359375, 2.8746337890625, 2.96466064453125, 3.0546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 9.0, 13.0, 8.0, 38.0, 64.0, 234.0, 668.0, 2984.0, 138883.0, 4040842.0, 8677.0, 1265.0, 340.0, 148.0, 56.0, 27.0, 10.0, 5.0, 13.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.203125, -29.965087890625, -28.72705078125, -27.489013671875, -26.2509765625, -25.012939453125, -23.77490234375, -22.536865234375, -21.298828125, -20.060791015625, -18.82275390625, -17.584716796875, -16.3466796875, -15.108642578125, -13.87060546875, -12.632568359375, -11.39453125, -10.156494140625, -8.91845703125, -7.680419921875, -6.4423828125, -5.204345703125, -3.96630859375, -2.728271484375, -1.490234375, -0.252197265625, 0.98583984375, 2.223876953125, 3.4619140625, 4.699951171875, 5.93798828125, 7.176025390625, 8.4140625, 9.652099609375, 10.89013671875, 12.128173828125, 13.3662109375, 14.604248046875, 15.84228515625, 17.080322265625, 18.318359375, 19.556396484375, 20.79443359375, 22.032470703125, 23.2705078125, 24.508544921875, 25.74658203125, 26.984619140625, 28.22265625, 29.460693359375, 30.69873046875, 31.936767578125, 33.1748046875, 34.412841796875, 35.65087890625, 36.888916015625, 38.126953125, 39.364990234375, 40.60302734375, 41.841064453125, 43.0791015625, 44.317138671875, 45.55517578125, 46.793212890625, 48.03125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 5.0, 10.0, 6.0, 7.0, 22.0, 20.0, 42.0, 48.0, 98.0, 170.0, 306.0, 471.0, 686.0, 793.0, 530.0, 309.0, 181.0, 132.0, 84.0, 62.0, 33.0, 19.0, 16.0, 10.0, 4.0, 6.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.78515625, -7.35736083984375, -6.9295654296875, -6.50177001953125, -6.073974609375, -5.64617919921875, -5.2183837890625, -4.79058837890625, -4.36279296875, -3.93499755859375, -3.5072021484375, -3.07940673828125, -2.651611328125, -2.22381591796875, -1.7960205078125, -1.36822509765625, -0.9404296875, -0.51263427734375, -0.0848388671875, 0.34295654296875, 0.770751953125, 1.19854736328125, 1.6263427734375, 2.05413818359375, 2.48193359375, 2.90972900390625, 3.3375244140625, 3.76531982421875, 4.193115234375, 4.62091064453125, 5.0487060546875, 5.47650146484375, 5.904296875, 6.33209228515625, 6.7598876953125, 7.18768310546875, 7.615478515625, 8.04327392578125, 8.4710693359375, 8.89886474609375, 9.32666015625, 9.75445556640625, 10.1822509765625, 10.61004638671875, 11.037841796875, 11.46563720703125, 11.8934326171875, 12.32122802734375, 12.7490234375, 13.17681884765625, 13.6046142578125, 14.03240966796875, 14.460205078125, 14.88800048828125, 15.3157958984375, 15.74359130859375, 16.17138671875, 16.59918212890625, 17.0269775390625, 17.45477294921875, 17.882568359375, 18.31036376953125, 18.7381591796875, 19.16595458984375, 19.59375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 9.0, 21.0, 38.0, 110.0, 312.0, 333.0, 113.0, 33.0, 12.0, 10.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.89826965332031, -73.56704711914062, -66.23583221435547, -58.90461349487305, -51.573394775390625, -44.2421760559082, -36.91095733642578, -29.57973861694336, -22.248519897460938, -14.917301177978516, -7.586082458496094, -0.2548637390136719, 7.07635498046875, 14.407573699951172, 21.738792419433594, 29.070011138916016, 36.40122985839844, 43.73244857788086, 51.06366729736328, 58.3948860168457, 65.72610473632812, 73.05732727050781, 80.38854217529297, 87.71975708007812, 95.05097961425781, 102.3822021484375, 109.71341705322266, 117.04463195800781, 124.3758544921875, 131.7070770263672, 139.03829956054688, 146.3695068359375, 153.70071411132812, 161.0319366455078, 168.3631591796875, 175.69436645507812, 183.0255889892578, 190.3568115234375, 197.68801879882812, 205.0192413330078, 212.3504638671875, 219.6816864013672, 227.01290893554688, 234.3441162109375, 241.6753387451172, 249.00656127929688, 256.3377685546875, 263.66900634765625, 271.0002136230469, 278.3314208984375, 285.66265869140625, 292.9938659667969, 300.3250732421875, 307.65631103515625, 314.9875183105469, 322.3187561035156, 329.64996337890625, 336.9811706542969, 344.3124084472656, 351.64361572265625, 358.974853515625, 366.3060607910156, 373.63726806640625, 380.968505859375, 388.2997131347656]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 9.0, 8.0, 12.0, 9.0, 12.0, 18.0, 22.0, 33.0, 45.0, 37.0, 61.0, 58.0, 70.0, 69.0, 83.0, 82.0, 68.0, 54.0, 58.0, 39.0, 36.0, 26.0, 17.0, 13.0, 9.0, 14.0, 11.0, 5.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.11614227294922, -61.81248092651367, -59.508819580078125, -57.205162048339844, -54.9015007019043, -52.59783935546875, -50.29418182373047, -47.99052047729492, -45.686859130859375, -43.38319778442383, -41.07953643798828, -38.77587890625, -36.47221755981445, -34.168556213378906, -31.864896774291992, -29.561237335205078, -27.25757598876953, -24.953914642333984, -22.65025520324707, -20.346595764160156, -18.04293441772461, -15.739274024963379, -13.435613632202148, -11.131954193115234, -8.828292846679688, -6.524632453918457, -4.220972061157227, -1.917311668395996, 0.3863487243652344, 2.690009117126465, 4.993669509887695, 7.297328948974609, 9.600997924804688, 11.904658317565918, 14.208318710327148, 16.511978149414062, 18.81563949584961, 21.119300842285156, 23.42296028137207, 25.726619720458984, 28.03028106689453, 30.333942413330078, 32.637603759765625, 34.941261291503906, 37.24492263793945, 39.548583984375, 41.85224151611328, 44.15590286254883, 46.459564208984375, 48.76322555541992, 51.06688690185547, 53.37054443359375, 55.6742057800293, 57.977867126464844, 60.281524658203125, 62.58518600463867, 64.88884735107422, 67.1925048828125, 69.49617004394531, 71.7998275756836, 74.10348510742188, 76.40715026855469, 78.71080780029297, 81.01446533203125, 83.31813049316406]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 11.0, 25.0, 28.0, 36.0, 63.0, 94.0, 186.0, 348.0, 673.0, 1397.0, 3098.0, 8235.0, 28980.0, 183768.0, 714020.0, 80631.0, 17000.0, 5516.0, 2244.0, 1040.0, 502.0, 263.0, 149.0, 77.0, 56.0, 40.0, 16.0, 12.0, 11.0, 6.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.69921875, -7.47479248046875, -7.2503662109375, -7.02593994140625, -6.801513671875, -6.57708740234375, -6.3526611328125, -6.12823486328125, -5.90380859375, -5.67938232421875, -5.4549560546875, -5.23052978515625, -5.006103515625, -4.78167724609375, -4.5572509765625, -4.33282470703125, -4.1083984375, -3.88397216796875, -3.6595458984375, -3.43511962890625, -3.210693359375, -2.98626708984375, -2.7618408203125, -2.53741455078125, -2.31298828125, -2.08856201171875, -1.8641357421875, -1.63970947265625, -1.415283203125, -1.19085693359375, -0.9664306640625, -0.74200439453125, -0.517578125, -0.29315185546875, -0.0687255859375, 0.15570068359375, 0.380126953125, 0.60455322265625, 0.8289794921875, 1.05340576171875, 1.27783203125, 1.50225830078125, 1.7266845703125, 1.95111083984375, 2.175537109375, 2.39996337890625, 2.6243896484375, 2.84881591796875, 3.0732421875, 3.29766845703125, 3.5220947265625, 3.74652099609375, 3.970947265625, 4.19537353515625, 4.4197998046875, 4.64422607421875, 4.86865234375, 5.09307861328125, 5.3175048828125, 5.54193115234375, 5.766357421875, 5.99078369140625, 6.2152099609375, 6.43963623046875, 6.6640625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 14.0, 13.0, 9.0, 20.0, 35.0, 33.0, 42.0, 43.0, 64.0, 67.0, 68.0, 86.0, 72.0, 68.0, 80.0, 63.0, 50.0, 45.0, 33.0, 29.0, 20.0, 12.0, 9.0, 7.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.1109619140625, -4.928955078125, -4.7469482421875, -4.56494140625, -4.3829345703125, -4.200927734375, -4.0189208984375, -3.8369140625, -3.6549072265625, -3.472900390625, -3.2908935546875, -3.10888671875, -2.9268798828125, -2.744873046875, -2.5628662109375, -2.380859375, -2.1988525390625, -2.016845703125, -1.8348388671875, -1.65283203125, -1.4708251953125, -1.288818359375, -1.1068115234375, -0.9248046875, -0.7427978515625, -0.560791015625, -0.3787841796875, -0.19677734375, -0.0147705078125, 0.167236328125, 0.3492431640625, 0.53125, 0.7132568359375, 0.895263671875, 1.0772705078125, 1.25927734375, 1.4412841796875, 1.623291015625, 1.8052978515625, 1.9873046875, 2.1693115234375, 2.351318359375, 2.5333251953125, 2.71533203125, 2.8973388671875, 3.079345703125, 3.2613525390625, 3.443359375, 3.6253662109375, 3.807373046875, 3.9893798828125, 4.17138671875, 4.3533935546875, 4.535400390625, 4.7174072265625, 4.8994140625, 5.0814208984375, 5.263427734375, 5.4454345703125, 5.62744140625, 5.8094482421875, 5.991455078125, 6.1734619140625, 6.35546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 14.0, 7.0, 13.0, 23.0, 30.0, 52.0, 82.0, 90.0, 116.0, 204.0, 262.0, 506.0, 1046.0, 2794.0, 14824.0, 246751.0, 757261.0, 18443.0, 3325.0, 1135.0, 512.0, 352.0, 202.0, 151.0, 84.0, 68.0, 55.0, 36.0, 29.0, 20.0, 16.0, 6.0, 7.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18359375, -6.92755126953125, -6.6715087890625, -6.41546630859375, -6.159423828125, -5.90338134765625, -5.6473388671875, -5.39129638671875, -5.13525390625, -4.87921142578125, -4.6231689453125, -4.36712646484375, -4.111083984375, -3.85504150390625, -3.5989990234375, -3.34295654296875, -3.0869140625, -2.83087158203125, -2.5748291015625, -2.31878662109375, -2.062744140625, -1.80670166015625, -1.5506591796875, -1.29461669921875, -1.03857421875, -0.78253173828125, -0.5264892578125, -0.27044677734375, -0.014404296875, 0.24163818359375, 0.4976806640625, 0.75372314453125, 1.009765625, 1.26580810546875, 1.5218505859375, 1.77789306640625, 2.033935546875, 2.28997802734375, 2.5460205078125, 2.80206298828125, 3.05810546875, 3.31414794921875, 3.5701904296875, 3.82623291015625, 4.082275390625, 4.33831787109375, 4.5943603515625, 4.85040283203125, 5.1064453125, 5.36248779296875, 5.6185302734375, 5.87457275390625, 6.130615234375, 6.38665771484375, 6.6427001953125, 6.89874267578125, 7.15478515625, 7.41082763671875, 7.6668701171875, 7.92291259765625, 8.178955078125, 8.43499755859375, 8.6910400390625, 8.94708251953125, 9.203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 2.0, 8.0, 3.0, 11.0, 12.0, 16.0, 11.0, 19.0, 15.0, 26.0, 30.0, 33.0, 47.0, 35.0, 59.0, 83.0, 77.0, 86.0, 77.0, 60.0, 53.0, 36.0, 31.0, 33.0, 26.0, 19.0, 17.0, 12.0, 14.0, 11.0, 8.0, 5.0, 9.0, 5.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.9188232421875, -13.439208984375, -12.9595947265625, -12.47998046875, -12.0003662109375, -11.520751953125, -11.0411376953125, -10.5615234375, -10.0819091796875, -9.602294921875, -9.1226806640625, -8.64306640625, -8.1634521484375, -7.683837890625, -7.2042236328125, -6.724609375, -6.2449951171875, -5.765380859375, -5.2857666015625, -4.80615234375, -4.3265380859375, -3.846923828125, -3.3673095703125, -2.8876953125, -2.4080810546875, -1.928466796875, -1.4488525390625, -0.96923828125, -0.4896240234375, -0.010009765625, 0.4696044921875, 0.94921875, 1.4288330078125, 1.908447265625, 2.3880615234375, 2.86767578125, 3.3472900390625, 3.826904296875, 4.3065185546875, 4.7861328125, 5.2657470703125, 5.745361328125, 6.2249755859375, 6.70458984375, 7.1842041015625, 7.663818359375, 8.1434326171875, 8.623046875, 9.1026611328125, 9.582275390625, 10.0618896484375, 10.54150390625, 11.0211181640625, 11.500732421875, 11.9803466796875, 12.4599609375, 12.9395751953125, 13.419189453125, 13.8988037109375, 14.37841796875, 14.8580322265625, 15.337646484375, 15.8172607421875, 16.296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 3.0, 4.0, 5.0, 3.0, 10.0, 16.0, 17.0, 32.0, 50.0, 100.0, 142.0, 307.0, 824.0, 3240.0, 23155.0, 962812.0, 50520.0, 5257.0, 1185.0, 395.0, 200.0, 91.0, 54.0, 42.0, 13.0, 27.0, 19.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0859375, -2.017852783203125, -1.94976806640625, -1.881683349609375, -1.8135986328125, -1.745513916015625, -1.67742919921875, -1.609344482421875, -1.541259765625, -1.473175048828125, -1.40509033203125, -1.337005615234375, -1.2689208984375, -1.200836181640625, -1.13275146484375, -1.064666748046875, -0.99658203125, -0.928497314453125, -0.86041259765625, -0.792327880859375, -0.7242431640625, -0.656158447265625, -0.58807373046875, -0.519989013671875, -0.451904296875, -0.383819580078125, -0.31573486328125, -0.247650146484375, -0.1795654296875, -0.111480712890625, -0.04339599609375, 0.024688720703125, 0.0927734375, 0.160858154296875, 0.22894287109375, 0.297027587890625, 0.3651123046875, 0.433197021484375, 0.50128173828125, 0.569366455078125, 0.637451171875, 0.705535888671875, 0.77362060546875, 0.841705322265625, 0.9097900390625, 0.977874755859375, 1.04595947265625, 1.114044189453125, 1.18212890625, 1.250213623046875, 1.31829833984375, 1.386383056640625, 1.4544677734375, 1.522552490234375, 1.59063720703125, 1.658721923828125, 1.726806640625, 1.794891357421875, 1.86297607421875, 1.931060791015625, 1.9991455078125, 2.067230224609375, 2.13531494140625, 2.203399658203125, 2.271484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 3.0, 2.0, 10.0, 13.0, 4.0, 13.0, 16.0, 31.0, 46.0, 52.0, 94.0, 146.0, 144.0, 121.0, 85.0, 54.0, 28.0, 23.0, 16.0, 14.0, 12.0, 11.0, 7.0, 10.0, 9.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00024020671844482422, -0.00023206137120723724, -0.00022391602396965027, -0.0002157706767320633, -0.00020762532949447632, -0.00019947998225688934, -0.00019133463501930237, -0.0001831892877817154, -0.00017504394054412842, -0.00016689859330654144, -0.00015875324606895447, -0.0001506078988313675, -0.00014246255159378052, -0.00013431720435619354, -0.00012617185711860657, -0.00011802650988101959, -0.00010988116264343262, -0.00010173581540584564, -9.359046816825867e-05, -8.544512093067169e-05, -7.729977369308472e-05, -6.915442645549774e-05, -6.1009079217910767e-05, -5.286373198032379e-05, -4.4718384742736816e-05, -3.657303750514984e-05, -2.8427690267562866e-05, -2.028234302997589e-05, -1.2136995792388916e-05, -3.991648554801941e-06, 4.153698682785034e-06, 1.229904592037201e-05, 2.0444393157958984e-05, 2.858974039554596e-05, 3.6735087633132935e-05, 4.488043487071991e-05, 5.3025782108306885e-05, 6.117112934589386e-05, 6.931647658348083e-05, 7.746182382106781e-05, 8.560717105865479e-05, 9.375251829624176e-05, 0.00010189786553382874, 0.00011004321277141571, 0.00011818856000900269, 0.00012633390724658966, 0.00013447925448417664, 0.0001426246017217636, 0.00015076994895935059, 0.00015891529619693756, 0.00016706064343452454, 0.0001752059906721115, 0.00018335133790969849, 0.00019149668514728546, 0.00019964203238487244, 0.0002077873796224594, 0.0002159327268600464, 0.00022407807409763336, 0.00023222342133522034, 0.0002403687685728073, 0.0002485141158103943, 0.00025665946304798126, 0.00026480481028556824, 0.0002729501575231552, 0.0002810955047607422]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 13.0, 9.0, 6.0, 11.0, 13.0, 27.0, 39.0, 42.0, 85.0, 150.0, 273.0, 638.0, 1435.0, 4296.0, 16204.0, 130748.0, 851597.0, 31948.0, 7130.0, 2184.0, 843.0, 368.0, 186.0, 108.0, 61.0, 41.0, 28.0, 15.0, 11.0, 11.0, 12.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4501953125, -1.4051666259765625, -1.360137939453125, -1.3151092529296875, -1.27008056640625, -1.2250518798828125, -1.180023193359375, -1.1349945068359375, -1.0899658203125, -1.0449371337890625, -0.999908447265625, -0.9548797607421875, -0.90985107421875, -0.8648223876953125, -0.819793701171875, -0.7747650146484375, -0.729736328125, -0.6847076416015625, -0.639678955078125, -0.5946502685546875, -0.54962158203125, -0.5045928955078125, -0.459564208984375, -0.4145355224609375, -0.3695068359375, -0.3244781494140625, -0.279449462890625, -0.2344207763671875, -0.18939208984375, -0.1443634033203125, -0.099334716796875, -0.0543060302734375, -0.00927734375, 0.0357513427734375, 0.080780029296875, 0.1258087158203125, 0.17083740234375, 0.2158660888671875, 0.260894775390625, 0.3059234619140625, 0.3509521484375, 0.3959808349609375, 0.441009521484375, 0.4860382080078125, 0.53106689453125, 0.5760955810546875, 0.621124267578125, 0.6661529541015625, 0.711181640625, 0.7562103271484375, 0.801239013671875, 0.8462677001953125, 0.89129638671875, 0.9363250732421875, 0.981353759765625, 1.0263824462890625, 1.0714111328125, 1.1164398193359375, 1.161468505859375, 1.2064971923828125, 1.25152587890625, 1.2965545654296875, 1.341583251953125, 1.3866119384765625, 1.431640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 6.0, 7.0, 4.0, 7.0, 8.0, 8.0, 10.0, 12.0, 12.0, 5.0, 14.0, 28.0, 31.0, 53.0, 70.0, 85.0, 120.0, 110.0, 101.0, 73.0, 60.0, 34.0, 33.0, 15.0, 9.0, 10.0, 14.0, 6.0, 9.0, 8.0, 6.0, 8.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9638671875, -0.93292236328125, -0.9019775390625, -0.87103271484375, -0.840087890625, -0.80914306640625, -0.7781982421875, -0.74725341796875, -0.71630859375, -0.68536376953125, -0.6544189453125, -0.62347412109375, -0.592529296875, -0.56158447265625, -0.5306396484375, -0.49969482421875, -0.46875, -0.43780517578125, -0.4068603515625, -0.37591552734375, -0.344970703125, -0.31402587890625, -0.2830810546875, -0.25213623046875, -0.22119140625, -0.19024658203125, -0.1593017578125, -0.12835693359375, -0.097412109375, -0.06646728515625, -0.0355224609375, -0.00457763671875, 0.0263671875, 0.05731201171875, 0.0882568359375, 0.11920166015625, 0.150146484375, 0.18109130859375, 0.2120361328125, 0.24298095703125, 0.27392578125, 0.30487060546875, 0.3358154296875, 0.36676025390625, 0.397705078125, 0.42864990234375, 0.4595947265625, 0.49053955078125, 0.521484375, 0.55242919921875, 0.5833740234375, 0.61431884765625, 0.645263671875, 0.67620849609375, 0.7071533203125, 0.73809814453125, 0.76904296875, 0.79998779296875, 0.8309326171875, 0.86187744140625, 0.892822265625, 0.92376708984375, 0.9547119140625, 0.98565673828125, 1.0166015625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 11.0, 42.0, 59.0, 122.0, 560.0, 105.0, 39.0, 26.0, 10.0, 8.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.05158996582031, -53.8454475402832, -51.63930892944336, -49.43316650390625, -47.227027893066406, -45.0208854675293, -42.81474304199219, -40.608604431152344, -38.402462005615234, -36.196319580078125, -33.99018096923828, -31.784038543701172, -29.577898025512695, -27.37175750732422, -25.16561508178711, -22.959474563598633, -20.753334045410156, -18.54719352722168, -16.341053009033203, -14.134910583496094, -11.928770065307617, -9.72262954711914, -7.516488075256348, -5.310346603393555, -3.104206085205078, -0.8980650901794434, 1.3080759048461914, 3.514216899871826, 5.720357894897461, 7.9264984130859375, 10.13263988494873, 12.338781356811523, 14.544929504394531, 16.751070022583008, 18.957210540771484, 21.163352966308594, 23.36949348449707, 25.575634002685547, 27.781776428222656, 29.987916946411133, 32.19405746459961, 34.40019989013672, 36.60633850097656, 38.81248092651367, 41.01862335205078, 43.224761962890625, 45.430904388427734, 47.637046813964844, 49.84318542480469, 52.0493278503418, 54.25546646118164, 56.46160888671875, 58.667747497558594, 60.8738899230957, 63.08003234863281, 65.28617095947266, 67.4923095703125, 69.69844818115234, 71.90459442138672, 74.11073303222656, 76.3168716430664, 78.52301025390625, 80.72915649414062, 82.93529510498047, 85.14144134521484]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 5.0, 2.0, 4.0, 8.0, 16.0, 10.0, 9.0, 12.0, 22.0, 15.0, 27.0, 19.0, 35.0, 33.0, 36.0, 295.0, 194.0, 38.0, 30.0, 27.0, 26.0, 32.0, 19.0, 22.0, 14.0, 8.0, 9.0, 12.0, 4.0, 6.0, 7.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.107627868652344, -46.55012893676758, -44.99263381958008, -43.43513488769531, -41.87763595581055, -40.32013702392578, -38.76264190673828, -37.205142974853516, -35.64764404296875, -34.090145111083984, -32.532649993896484, -30.97515106201172, -29.417652130126953, -27.86015510559082, -26.302658081054688, -24.745159149169922, -23.18766212463379, -21.630165100097656, -20.07266616821289, -18.515169143676758, -16.957670211791992, -15.40017318725586, -13.84267520904541, -12.285177230834961, -10.727679252624512, -9.170181274414062, -7.612683296203613, -6.055185794830322, -4.497687816619873, -2.940189838409424, -1.3826923370361328, 0.1748056411743164, 1.7323036193847656, 3.289801597595215, 4.847299575805664, 6.404797077178955, 7.962295055389404, 9.519792556762695, 11.077290534973145, 12.634788513183594, 14.192286491394043, 15.749784469604492, 17.307281494140625, 18.86478042602539, 20.422277450561523, 21.97977638244629, 23.537273406982422, 25.094772338867188, 26.65226936340332, 28.209766387939453, 29.76726531982422, 31.32476234436035, 32.882259368896484, 34.43975830078125, 35.997257232666016, 37.55475616455078, 39.11225128173828, 40.66975021362305, 42.22724533081055, 43.78474426269531, 45.34224319458008, 46.899742126464844, 48.457237243652344, 50.01473617553711, 51.572235107421875]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 10.0, 11.0, 10.0, 19.0, 10.0, 23.0, 28.0, 26.0, 17.0, 29.0, 41.0, 53.0, 74.0, 254.0, 138.0, 42.0, 32.0, 34.0, 26.0, 21.0, 19.0, 15.0, 16.0, 10.0, 12.0, 10.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.884765625, -2.752838134765625, -2.62091064453125, -2.488983154296875, -2.3570556640625, -2.225128173828125, -2.09320068359375, -1.961273193359375, -1.829345703125, -1.697418212890625, -1.56549072265625, -1.433563232421875, -1.3016357421875, -1.169708251953125, -1.03778076171875, -0.905853271484375, -0.77392578125, -0.641998291015625, -0.51007080078125, -0.378143310546875, -0.2462158203125, -0.114288330078125, 0.01763916015625, 0.149566650390625, 0.281494140625, 0.413421630859375, 0.54534912109375, 0.677276611328125, 0.8092041015625, 0.941131591796875, 1.07305908203125, 1.204986572265625, 1.3369140625, 1.468841552734375, 1.60076904296875, 1.732696533203125, 1.8646240234375, 1.996551513671875, 2.12847900390625, 2.260406494140625, 2.392333984375, 2.524261474609375, 2.65618896484375, 2.788116455078125, 2.9200439453125, 3.051971435546875, 3.18389892578125, 3.315826416015625, 3.44775390625, 3.579681396484375, 3.71160888671875, 3.843536376953125, 3.9754638671875, 4.107391357421875, 4.23931884765625, 4.371246337890625, 4.503173828125, 4.635101318359375, 4.76702880859375, 4.898956298828125, 5.0308837890625, 5.162811279296875, 5.29473876953125, 5.426666259765625, 5.55859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 7.0, 2.0, 3.0, 21.0, 13.0, 33.0, 61.0, 125.0, 617.0, 6158.0, 8373290.0, 7269.0, 618.0, 174.0, 73.0, 24.0, 17.0, 15.0, 23.0, 20.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.71324920654297, -88.0074234008789, -85.30159759521484, -82.59577178955078, -79.88994598388672, -77.18412017822266, -74.47830200195312, -71.77247619628906, -69.066650390625, -66.36082458496094, -63.654998779296875, -60.94917297363281, -58.24334716796875, -55.53752136230469, -52.83169937133789, -50.12587356567383, -47.4200439453125, -44.71421813964844, -42.008392333984375, -39.30256652832031, -36.59674072265625, -33.89091491699219, -31.18509292602539, -28.479267120361328, -25.773441314697266, -23.067615509033203, -20.36178970336914, -17.65596580505371, -14.950139999389648, -12.244314193725586, -9.538490295410156, -6.832664489746094, -4.126838684082031, -1.421013355255127, 1.2848119735717773, 3.9906368255615234, 6.696462631225586, 9.402288436889648, 12.108112335205078, 14.81393814086914, 17.519763946533203, 20.225589752197266, 22.931415557861328, 25.637239456176758, 28.34306526184082, 31.048891067504883, 33.75471496582031, 36.460540771484375, 39.16636657714844, 41.8721923828125, 44.57801818847656, 47.283843994140625, 49.98966979980469, 52.69549560546875, 55.40131759643555, 58.10714340209961, 60.81296920776367, 63.518795013427734, 66.22461700439453, 68.9304428100586, 71.63626861572266, 74.34209442138672, 77.04792022705078, 79.75374603271484, 82.4595718383789]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 6.0, 3.0, 8.0, 10.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-72.89608001708984, -70.56991577148438, -68.24375915527344, -65.91759490966797, -63.5914306640625, -61.2652702331543, -58.939109802246094, -56.612945556640625, -54.286781311035156, -51.96062088012695, -49.634456634521484, -47.30829620361328, -44.98213195800781, -42.65597152709961, -40.329811096191406, -38.00364685058594, -35.677486419677734, -33.35132598876953, -31.025161743164062, -28.69900131225586, -26.37283706665039, -24.046676635742188, -21.72051429748535, -19.394351959228516, -17.06818962097168, -14.742027282714844, -12.415864944458008, -10.089703559875488, -7.763541221618652, -5.437378883361816, -3.111217498779297, -0.7850551605224609, 1.541107177734375, 3.867269277572632, 6.193431377410889, 8.519593238830566, 10.845755577087402, 13.171917915344238, 15.498079299926758, 17.824241638183594, 20.15040397644043, 22.476566314697266, 24.8027286529541, 27.128890991210938, 29.45505142211914, 31.78121566772461, 34.10737609863281, 36.43354034423828, 38.759700775146484, 41.08586120605469, 43.412025451660156, 45.73818588256836, 48.06435012817383, 50.39051055908203, 52.7166748046875, 55.0428352355957, 57.368995666503906, 59.69515609741211, 62.02132034301758, 64.34748077392578, 66.67364501953125, 68.99980926513672, 71.32596588134766, 73.65213012695312, 75.9782943725586]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 6.0, 2.0, 6.0, 10.0, 7.0, 12.0, 23.0, 35.0, 54.0, 78.0, 120.0, 193.0, 442.0, 971.0, 2325.0, 7437.0, 26966.0, 117258.0, 254376.0, 83553.0, 20460.0, 5889.0, 2033.0, 878.0, 421.0, 225.0, 131.0, 96.0, 74.0, 51.0, 38.0, 20.0, 24.0, 19.0, 14.0, 1.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-36.875, -35.66162109375, -34.4482421875, -33.23486328125, -32.021484375, -30.80810546875, -29.5947265625, -28.38134765625, -27.16796875, -25.95458984375, -24.7412109375, -23.52783203125, -22.314453125, -21.10107421875, -19.8876953125, -18.67431640625, -17.4609375, -16.24755859375, -15.0341796875, -13.82080078125, -12.607421875, -11.39404296875, -10.1806640625, -8.96728515625, -7.75390625, -6.54052734375, -5.3271484375, -4.11376953125, -2.900390625, -1.68701171875, -0.4736328125, 0.73974609375, 1.953125, 3.16650390625, 4.3798828125, 5.59326171875, 6.806640625, 8.02001953125, 9.2333984375, 10.44677734375, 11.66015625, 12.87353515625, 14.0869140625, 15.30029296875, 16.513671875, 17.72705078125, 18.9404296875, 20.15380859375, 21.3671875, 22.58056640625, 23.7939453125, 25.00732421875, 26.220703125, 27.43408203125, 28.6474609375, 29.86083984375, 31.07421875, 32.28759765625, 33.5009765625, 34.71435546875, 35.927734375, 37.14111328125, 38.3544921875, 39.56787109375, 40.78125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 8.0, 12.0, 19.0, 21.0, 39.0, 42.0, 75.0, 75.0, 79.0, 102.0, 103.0, 83.0, 72.0, 65.0, 54.0, 36.0, 35.0, 24.0, 15.0, 8.0, 13.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.46905517578125, -5.2935791015625, -5.11810302734375, -4.942626953125, -4.76715087890625, -4.5916748046875, -4.41619873046875, -4.24072265625, -4.06524658203125, -3.8897705078125, -3.71429443359375, -3.538818359375, -3.36334228515625, -3.1878662109375, -3.01239013671875, -2.8369140625, -2.66143798828125, -2.4859619140625, -2.31048583984375, -2.135009765625, -1.95953369140625, -1.7840576171875, -1.60858154296875, -1.43310546875, -1.25762939453125, -1.0821533203125, -0.90667724609375, -0.731201171875, -0.55572509765625, -0.3802490234375, -0.20477294921875, -0.029296875, 0.14617919921875, 0.3216552734375, 0.49713134765625, 0.672607421875, 0.84808349609375, 1.0235595703125, 1.19903564453125, 1.37451171875, 1.54998779296875, 1.7254638671875, 1.90093994140625, 2.076416015625, 2.25189208984375, 2.4273681640625, 2.60284423828125, 2.7783203125, 2.95379638671875, 3.1292724609375, 3.30474853515625, 3.480224609375, 3.65570068359375, 3.8311767578125, 4.00665283203125, 4.18212890625, 4.35760498046875, 4.5330810546875, 4.70855712890625, 4.884033203125, 5.05950927734375, 5.2349853515625, 5.41046142578125, 5.5859375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 7.0, 9.0, 14.0, 25.0, 31.0, 44.0, 65.0, 61.0, 59.0, 35.0, 43.0, 25.0, 14.0, 8.0, 7.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.223989486694336, -20.266834259033203, -19.309677124023438, -18.352521896362305, -17.395366668701172, -16.438209533691406, -15.481054306030273, -14.52389907836914, -13.566742897033691, -12.609586715698242, -11.65243148803711, -10.69527530670166, -9.738119125366211, -8.780963897705078, -7.823807716369629, -6.866652011871338, -5.909496307373047, -4.952340602874756, -3.9951846599578857, -3.0380287170410156, -2.0808730125427246, -1.1237173080444336, -0.16656112670898438, 0.7905945777893066, 1.7477502822875977, 2.7049059867858887, 3.662061929702759, 4.619217872619629, 5.57637357711792, 6.533529281616211, 7.49068546295166, 8.44784164428711, 9.40499496459961, 10.362151145935059, 11.319306373596191, 12.27646255493164, 13.233617782592773, 14.190773963928223, 15.147930145263672, 16.105085372924805, 17.062240600585938, 18.01939582824707, 18.976552963256836, 19.93370819091797, 20.8908634185791, 21.848018646240234, 22.80517578125, 23.762331008911133, 24.7194881439209, 25.67664337158203, 26.633800506591797, 27.59095573425293, 28.548110961914062, 29.505268096923828, 30.46242332458496, 31.419578552246094, 32.37673568725586, 33.333892822265625, 34.291046142578125, 35.24820327758789, 36.205360412597656, 37.162513732910156, 38.11967086791992, 39.07682800292969, 40.03398132324219]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 4.0, 1.0, 4.0, 7.0, 3.0, 4.0, 7.0, 11.0, 26.0, 51.0, 84.0, 103.0, 52.0, 39.0, 16.0, 10.0, 7.0, 4.0, 10.0, 13.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.15948486328125, -15.530378341674805, -14.90127182006836, -14.272165298461914, -13.643058776855469, -13.013952255249023, -12.384845733642578, -11.755739212036133, -11.126632690429688, -10.497526168823242, -9.868419647216797, -9.239313125610352, -8.610206604003906, -7.981100082397461, -7.351993083953857, -6.722886562347412, -6.093779563903809, -5.464673042297363, -4.835566520690918, -4.206459999084473, -3.5773532390594482, -2.948246717453003, -2.3191399574279785, -1.6900334358215332, -1.060926914215088, -0.4318203330039978, 0.19728624820709229, 0.8263928890228271, 1.4554994106292725, 2.0846059322357178, 2.713712692260742, 3.3428192138671875, 3.971925735473633, 4.601032257080078, 5.230138778686523, 5.859245300292969, 6.488351821899414, 7.117458343505859, 7.746565341949463, 8.37567138671875, 9.004777908325195, 9.63388442993164, 10.262990951538086, 10.892097473144531, 11.521203994750977, 12.150310516357422, 12.779417037963867, 13.408523559570312, 14.037631034851074, 14.66673755645752, 15.295844078063965, 15.92495059967041, 16.554058074951172, 17.183164596557617, 17.812271118164062, 18.441377639770508, 19.070484161376953, 19.6995906829834, 20.328697204589844, 20.95780372619629, 21.586910247802734, 22.21601676940918, 22.845123291015625, 23.47422981262207, 24.103336334228516]}, "eval/loss": 5.628564834594727, "eval/wer": 1.5293172212631705, "eval/runtime": 963.4096, "eval/samples_per_second": 2.742, "eval/steps_per_second": 0.344} \ No newline at end of file +{"train/loss": 4.4894, "train/learning_rate": 3.4682080924855494e-08, "train/epoch": 5.0, "train/global_step": 4460, "_runtime": 28486, "_timestamp": 1646256169, "_step": 4462, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 99.0, 21.0, 7.0, 6.0, 3.0, 3.0, 8.0, 1.0, 30037.0, 216.0, 45.0, 17.0, 10.0, 9.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-37.90625, -37.05322265625, -36.2001953125, -35.34716796875, -34.494140625, -33.64111328125, -32.7880859375, -31.93505859375, -31.08203125, -30.22900390625, -29.3759765625, -28.52294921875, -27.669921875, -26.81689453125, -25.9638671875, -25.11083984375, -24.2578125, -23.40478515625, -22.5517578125, -21.69873046875, -20.845703125, -19.99267578125, -19.1396484375, -18.28662109375, -17.43359375, -16.58056640625, -15.7275390625, -14.87451171875, -14.021484375, -13.16845703125, -12.3154296875, -11.46240234375, -10.609375, -9.75634765625, -8.9033203125, -8.05029296875, -7.197265625, -6.34423828125, -5.4912109375, -4.63818359375, -3.78515625, -2.93212890625, -2.0791015625, -1.22607421875, -0.373046875, 0.47998046875, 1.3330078125, 2.18603515625, 3.0390625, 3.89208984375, 4.7451171875, 5.59814453125, 6.451171875, 7.30419921875, 8.1572265625, 9.01025390625, 9.86328125, 10.71630859375, 11.5693359375, 12.42236328125, 13.275390625, 14.12841796875, 14.9814453125, 15.83447265625, 16.6875]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 2.0, 6.0, 7.0, 4.0, 4.0, 6.0, 12.0, 9.0, 14.0, 21.0, 15.0, 24.0, 20.0, 27.0, 33.0, 33.0, 27.0, 43.0, 30.0, 41.0, 36.0, 46.0, 47.0, 38.0, 46.0, 42.0, 43.0, 36.0, 41.0, 30.0, 37.0, 29.0, 19.0, 30.0, 25.0, 12.0, 11.0, 6.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.805110931396484, -9.561691284179688, -9.318270683288574, -9.074851036071777, -8.83143138885498, -8.588010787963867, -8.34459114074707, -8.101171493530273, -7.857751369476318, -7.614331245422363, -7.370911598205566, -7.127491474151611, -6.884071350097656, -6.640651702880859, -6.397231578826904, -6.153811454772949, -5.910391807556152, -5.666971683502197, -5.4235520362854, -5.180131912231445, -4.936712265014648, -4.693292140960693, -4.449872016906738, -4.206452369689941, -3.9630322456359863, -3.7196123600006104, -3.4761924743652344, -3.2327723503112793, -2.9893524646759033, -2.7459325790405273, -2.5025124549865723, -2.2590925693511963, -2.0156731605529785, -1.7722532749176025, -1.528833270072937, -1.2854132652282715, -1.0419933795928955, -0.7985734939575195, -0.555153489112854, -0.3117334842681885, -0.0683135986328125, 0.17510634660720825, 0.418526291847229, 0.6619462370872498, 0.9053661823272705, 1.1487860679626465, 1.392206072807312, 1.6356260776519775, 1.8790459632873535, 2.1224658489227295, 2.3658857345581055, 2.6093058586120605, 2.8527257442474365, 3.0961456298828125, 3.3395657539367676, 3.5829856395721436, 3.8264055252075195, 4.069825649261475, 4.3132452964782715, 4.556665420532227, 4.800085067749023, 5.0435051918029785, 5.286925315856934, 5.5303449630737305, 5.7737650871276855]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 11.0, 8.0, 18.0, 13.0, 11.0, 20.0, 17.0, 17.0, 32.0, 21.0, 36.0, 31.0, 45.0, 40.0, 37.0, 50.0, 38.0, 42.0, 51.0, 40.0, 46.0, 35.0, 37.0, 23.0, 35.0, 31.0, 34.0, 24.0, 28.0, 20.0, 19.0, 16.0, 18.0, 13.0, 5.0, 4.0, 3.0, 5.0, 8.0, 0.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.515730857849121, -7.263637065887451, -7.011543273925781, -6.759449481964111, -6.507355690002441, -6.255261421203613, -6.003167629241943, -5.751073837280273, -5.4989800453186035, -5.246886253356934, -4.994792461395264, -4.742698669433594, -4.490604400634766, -4.238511085510254, -3.986416816711426, -3.734323024749756, -3.482229232788086, -3.230135440826416, -2.978041648864746, -2.725947618484497, -2.473853826522827, -2.2217600345611572, -1.9696661233901978, -1.7175722122192383, -1.4654784202575684, -1.2133846282958984, -0.961290717124939, -0.7091968655586243, -0.45710301399230957, -0.20500922203063965, 0.047084689140319824, 0.2991786003112793, 0.5512733459472656, 0.8033671975135803, 1.055461049079895, 1.3075549602508545, 1.5596487522125244, 1.8117425441741943, 2.0638365745544434, 2.3159303665161133, 2.568024158477783, 2.820117950439453, 3.072211742401123, 3.324305772781372, 3.576399564743042, 3.828493356704712, 4.080587387084961, 4.332681179046631, 4.584774971008301, 4.836868762969971, 5.088962554931641, 5.3410563468933105, 5.5931501388549805, 5.845244407653809, 6.0973381996154785, 6.349431991577148, 6.601525783538818, 6.853619575500488, 7.105713367462158, 7.357807159423828, 7.609901428222656, 7.861994743347168, 8.114089012145996, 8.366182327270508, 8.618276596069336]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 8.0, 16.0, 19.0, 35.0, 68.0, 95.0, 158.0, 251.0, 411.0, 623.0, 1083.0, 1743.0, 2828.0, 4714.0, 7535.0, 11752.0, 18425.0, 27274.0, 40217.0, 57174.0, 77683.0, 101516.0, 139276.0, 158053.0, 112234.0, 85687.0, 64222.0, 45651.0, 31301.0, 21287.0, 13941.0, 8838.0, 5490.0, 3435.0, 2130.0, 1269.0, 783.0, 509.0, 310.0, 202.0, 112.0, 59.0, 50.0, 27.0, 22.0, 15.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-24.625, -23.904541015625, -23.18408203125, -22.463623046875, -21.7431640625, -21.022705078125, -20.30224609375, -19.581787109375, -18.861328125, -18.140869140625, -17.42041015625, -16.699951171875, -15.9794921875, -15.259033203125, -14.53857421875, -13.818115234375, -13.09765625, -12.377197265625, -11.65673828125, -10.936279296875, -10.2158203125, -9.495361328125, -8.77490234375, -8.054443359375, -7.333984375, -6.613525390625, -5.89306640625, -5.172607421875, -4.4521484375, -3.731689453125, -3.01123046875, -2.290771484375, -1.5703125, -0.849853515625, -0.12939453125, 0.591064453125, 1.3115234375, 2.031982421875, 2.75244140625, 3.472900390625, 4.193359375, 4.913818359375, 5.63427734375, 6.354736328125, 7.0751953125, 7.795654296875, 8.51611328125, 9.236572265625, 9.95703125, 10.677490234375, 11.39794921875, 12.118408203125, 12.8388671875, 13.559326171875, 14.27978515625, 15.000244140625, 15.720703125, 16.441162109375, 17.16162109375, 17.882080078125, 18.6025390625, 19.322998046875, 20.04345703125, 20.763916015625, 21.484375]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 8.0, 9.0, 6.0, 14.0, 20.0, 25.0, 18.0, 13.0, 26.0, 38.0, 43.0, 42.0, 41.0, 53.0, 61.0, 65.0, 69.0, 62.0, 61.0, 49.0, 32.0, 31.0, 23.0, 24.0, 27.0, 26.0, 12.0, 18.0, 14.0, 15.0, 9.0, 3.0, 5.0, 5.0, 6.0, 5.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.6484375, -9.316650390625, -8.98486328125, -8.653076171875, -8.3212890625, -7.989501953125, -7.65771484375, -7.325927734375, -6.994140625, -6.662353515625, -6.33056640625, -5.998779296875, -5.6669921875, -5.335205078125, -5.00341796875, -4.671630859375, -4.33984375, -4.008056640625, -3.67626953125, -3.344482421875, -3.0126953125, -2.680908203125, -2.34912109375, -2.017333984375, -1.685546875, -1.353759765625, -1.02197265625, -0.690185546875, -0.3583984375, -0.026611328125, 0.30517578125, 0.636962890625, 0.96875, 1.300537109375, 1.63232421875, 1.964111328125, 2.2958984375, 2.627685546875, 2.95947265625, 3.291259765625, 3.623046875, 3.954833984375, 4.28662109375, 4.618408203125, 4.9501953125, 5.281982421875, 5.61376953125, 5.945556640625, 6.27734375, 6.609130859375, 6.94091796875, 7.272705078125, 7.6044921875, 7.936279296875, 8.26806640625, 8.599853515625, 8.931640625, 9.263427734375, 9.59521484375, 9.927001953125, 10.2587890625, 10.590576171875, 10.92236328125, 11.254150390625, 11.5859375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 6.0, 9.0, 13.0, 10.0, 16.0, 16.0, 22.0, 28.0, 28.0, 36.0, 31.0, 39.0, 64.0, 54.0, 49.0, 53.0, 59.0, 43.0, 55.0, 50.0, 34.0, 46.0, 38.0, 37.0, 26.0, 29.0, 19.0, 15.0, 15.0, 8.0, 12.0, 5.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.451366424560547, -6.244081974029541, -6.036797523498535, -5.829513072967529, -5.622228622436523, -5.414944171905518, -5.207659721374512, -5.000375747680664, -4.7930908203125, -4.585806369781494, -4.378521919250488, -4.171237468719482, -3.9639530181884766, -3.7566685676574707, -3.549384355545044, -3.342099905014038, -3.1348156929016113, -2.9275312423706055, -2.7202467918395996, -2.5129623413085938, -2.305677890777588, -2.098393440246582, -1.8911092281341553, -1.6838247776031494, -1.4765403270721436, -1.2692558765411377, -1.0619714260101318, -0.8546870946884155, -0.6474026441574097, -0.4401181936264038, -0.2328338623046875, -0.02554941177368164, 0.18173551559448242, 0.3890199363231659, 0.5963043570518494, 0.8035887479782104, 1.0108731985092163, 1.2181576490402222, 1.4254419803619385, 1.6327264308929443, 1.8400108814239502, 2.047295331954956, 2.254579782485962, 2.4618639945983887, 2.6691484451293945, 2.8764328956604004, 3.0837173461914062, 3.291001796722412, 3.498286247253418, 3.705570697784424, 3.9128551483154297, 4.1201395988464355, 4.327424049377441, 4.534708499908447, 4.741992950439453, 4.949276924133301, 5.156561851501465, 5.363846302032471, 5.571130752563477, 5.778415203094482, 5.985699653625488, 6.192984104156494, 6.4002685546875, 6.607552528381348, 6.8148369789123535]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 9.0, 8.0, 6.0, 13.0, 11.0, 16.0, 23.0, 15.0, 31.0, 28.0, 38.0, 33.0, 35.0, 45.0, 45.0, 48.0, 45.0, 57.0, 41.0, 48.0, 38.0, 36.0, 39.0, 43.0, 33.0, 45.0, 30.0, 29.0, 25.0, 24.0, 7.0, 14.0, 11.0, 7.0, 5.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.627979278564453, -5.424100875854492, -5.220222473144531, -5.01634407043457, -4.812465667724609, -4.608587265014648, -4.404709339141846, -4.200830936431885, -3.996952533721924, -3.793074131011963, -3.589195728302002, -3.38531756401062, -3.181439161300659, -2.9775607585906982, -2.7736825942993164, -2.5698041915893555, -2.3659257888793945, -2.1620473861694336, -1.9581691026687622, -1.7542908191680908, -1.5504124164581299, -1.346534013748169, -1.1426557302474976, -0.9387774467468262, -0.7348990440368652, -0.5310207009315491, -0.3271423578262329, -0.12326401472091675, 0.08061432838439941, 0.28449273109436035, 0.48837101459503174, 0.6922492980957031, 0.8961272239685059, 1.1000056266784668, 1.3038839101791382, 1.5077621936798096, 1.7116405963897705, 1.9155189990997314, 2.1193971633911133, 2.323275566101074, 2.527153968811035, 2.731032371520996, 2.934910774230957, 3.138788938522339, 3.3426673412323, 3.5465457439422607, 3.7504239082336426, 3.9543023109436035, 4.1581807136535645, 4.362059116363525, 4.565937519073486, 4.769815921783447, 4.97369384765625, 5.177572250366211, 5.381450653076172, 5.585329055786133, 5.789207458496094, 5.993085861206055, 6.196964263916016, 6.400842666625977, 6.6047210693359375, 6.808599472045898, 7.012477397918701, 7.216355800628662, 7.420234203338623]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 21.0, 25.0, 34.0, 39.0, 78.0, 102.0, 146.0, 199.0, 330.0, 532.0, 806.0, 1317.0, 2168.0, 3330.0, 5413.0, 8947.0, 14418.0, 23731.0, 38487.0, 62220.0, 101652.0, 165023.0, 262525.0, 398320.0, 545724.0, 634460.0, 601583.0, 471734.0, 321557.0, 203793.0, 126650.0, 76489.0, 47312.0, 29068.0, 17646.0, 10741.0, 6525.0, 4180.0, 2508.0, 1584.0, 995.0, 677.0, 394.0, 235.0, 176.0, 132.0, 77.0, 54.0, 30.0, 27.0, 20.0, 15.0, 5.0, 10.0, 6.0, 4.0], "bins": [-4.8046875, -4.6622314453125, -4.519775390625, -4.3773193359375, -4.23486328125, -4.0924072265625, -3.949951171875, -3.8074951171875, -3.6650390625, -3.5225830078125, -3.380126953125, -3.2376708984375, -3.09521484375, -2.9527587890625, -2.810302734375, -2.6678466796875, -2.525390625, -2.3829345703125, -2.240478515625, -2.0980224609375, -1.95556640625, -1.8131103515625, -1.670654296875, -1.5281982421875, -1.3857421875, -1.2432861328125, -1.100830078125, -0.9583740234375, -0.81591796875, -0.6734619140625, -0.531005859375, -0.3885498046875, -0.24609375, -0.1036376953125, 0.038818359375, 0.1812744140625, 0.32373046875, 0.4661865234375, 0.608642578125, 0.7510986328125, 0.8935546875, 1.0360107421875, 1.178466796875, 1.3209228515625, 1.46337890625, 1.6058349609375, 1.748291015625, 1.8907470703125, 2.033203125, 2.1756591796875, 2.318115234375, 2.4605712890625, 2.60302734375, 2.7454833984375, 2.887939453125, 3.0303955078125, 3.1728515625, 3.3153076171875, 3.457763671875, 3.6002197265625, 3.74267578125, 3.8851318359375, 4.027587890625, 4.1700439453125, 4.3125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 11.0, 12.0, 6.0, 15.0, 18.0, 21.0, 19.0, 25.0, 31.0, 39.0, 35.0, 38.0, 35.0, 46.0, 44.0, 52.0, 25.0, 31.0, 38.0, 43.0, 38.0, 44.0, 43.0, 41.0, 33.0, 37.0, 25.0, 21.0, 21.0, 18.0, 13.0, 10.0, 11.0, 10.0, 13.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.1845703125, -4.037109375, -3.8896484375, -3.7421875, -3.5947265625, -3.447265625, -3.2998046875, -3.15234375, -3.0048828125, -2.857421875, -2.7099609375, -2.5625, -2.4150390625, -2.267578125, -2.1201171875, -1.97265625, -1.8251953125, -1.677734375, -1.5302734375, -1.3828125, -1.2353515625, -1.087890625, -0.9404296875, -0.79296875, -0.6455078125, -0.498046875, -0.3505859375, -0.203125, -0.0556640625, 0.091796875, 0.2392578125, 0.38671875, 0.5341796875, 0.681640625, 0.8291015625, 0.9765625, 1.1240234375, 1.271484375, 1.4189453125, 1.56640625, 1.7138671875, 1.861328125, 2.0087890625, 2.15625, 2.3037109375, 2.451171875, 2.5986328125, 2.74609375, 2.8935546875, 3.041015625, 3.1884765625, 3.3359375, 3.4833984375, 3.630859375, 3.7783203125, 3.92578125, 4.0732421875, 4.220703125, 4.3681640625, 4.515625, 4.6630859375, 4.810546875, 4.9580078125, 5.10546875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 13.0, 20.0, 32.0, 45.0, 50.0, 106.0, 162.0, 265.0, 438.0, 731.0, 1176.0, 2094.0, 3319.0, 5919.0, 9896.0, 16776.0, 27900.0, 46589.0, 76213.0, 122406.0, 190160.0, 285649.0, 405693.0, 530305.0, 598291.0, 555293.0, 436782.0, 312968.0, 211478.0, 136680.0, 85377.0, 52662.0, 31946.0, 19276.0, 11207.0, 6706.0, 3895.0, 2339.0, 1372.0, 789.0, 465.0, 278.0, 195.0, 109.0, 84.0, 53.0, 27.0, 21.0, 7.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.578125, -4.433349609375, -4.28857421875, -4.143798828125, -3.9990234375, -3.854248046875, -3.70947265625, -3.564697265625, -3.419921875, -3.275146484375, -3.13037109375, -2.985595703125, -2.8408203125, -2.696044921875, -2.55126953125, -2.406494140625, -2.26171875, -2.116943359375, -1.97216796875, -1.827392578125, -1.6826171875, -1.537841796875, -1.39306640625, -1.248291015625, -1.103515625, -0.958740234375, -0.81396484375, -0.669189453125, -0.5244140625, -0.379638671875, -0.23486328125, -0.090087890625, 0.0546875, 0.199462890625, 0.34423828125, 0.489013671875, 0.6337890625, 0.778564453125, 0.92333984375, 1.068115234375, 1.212890625, 1.357666015625, 1.50244140625, 1.647216796875, 1.7919921875, 1.936767578125, 2.08154296875, 2.226318359375, 2.37109375, 2.515869140625, 2.66064453125, 2.805419921875, 2.9501953125, 3.094970703125, 3.23974609375, 3.384521484375, 3.529296875, 3.674072265625, 3.81884765625, 3.963623046875, 4.1083984375, 4.253173828125, 4.39794921875, 4.542724609375, 4.6875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 9.0, 10.0, 16.0, 29.0, 33.0, 46.0, 58.0, 83.0, 104.0, 103.0, 140.0, 167.0, 208.0, 213.0, 236.0, 257.0, 287.0, 284.0, 267.0, 258.0, 214.0, 203.0, 145.0, 125.0, 120.0, 99.0, 70.0, 65.0, 62.0, 31.0, 38.0, 22.0, 16.0, 9.0, 9.0, 12.0, 7.0, 3.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.33740234375, -2.2646484375, -2.19189453125, -2.119140625, -2.04638671875, -1.9736328125, -1.90087890625, -1.828125, -1.75537109375, -1.6826171875, -1.60986328125, -1.537109375, -1.46435546875, -1.3916015625, -1.31884765625, -1.24609375, -1.17333984375, -1.1005859375, -1.02783203125, -0.955078125, -0.88232421875, -0.8095703125, -0.73681640625, -0.6640625, -0.59130859375, -0.5185546875, -0.44580078125, -0.373046875, -0.30029296875, -0.2275390625, -0.15478515625, -0.08203125, -0.00927734375, 0.0634765625, 0.13623046875, 0.208984375, 0.28173828125, 0.3544921875, 0.42724609375, 0.5, 0.57275390625, 0.6455078125, 0.71826171875, 0.791015625, 0.86376953125, 0.9365234375, 1.00927734375, 1.08203125, 1.15478515625, 1.2275390625, 1.30029296875, 1.373046875, 1.44580078125, 1.5185546875, 1.59130859375, 1.6640625, 1.73681640625, 1.8095703125, 1.88232421875, 1.955078125, 2.02783203125, 2.1005859375, 2.17333984375, 2.24609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 4.0, 4.0, 5.0, 7.0, 13.0, 11.0, 19.0, 25.0, 28.0, 32.0, 28.0, 33.0, 56.0, 61.0, 54.0, 71.0, 48.0, 50.0, 69.0, 50.0, 52.0, 48.0, 36.0, 38.0, 30.0, 34.0, 21.0, 20.0, 11.0, 8.0, 7.0, 4.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.364202499389648, -7.164638042449951, -6.965073585510254, -6.765509605407715, -6.565945148468018, -6.36638069152832, -6.166816234588623, -5.967251777648926, -5.767687797546387, -5.5681233406066895, -5.368558883666992, -5.168994903564453, -4.969430446624756, -4.769865989685059, -4.570301532745361, -4.370737075805664, -4.171173095703125, -3.9716086387634277, -3.7720444202423096, -3.5724799633026123, -3.372915744781494, -3.173351287841797, -2.9737868309020996, -2.7742226123809814, -2.574657917022705, -2.375093460083008, -2.1755292415618896, -1.9759647846221924, -1.7764005661010742, -1.576836109161377, -1.3772717714309692, -1.1777074337005615, -0.9781432151794434, -0.7785788774490356, -0.5790145397186279, -0.37945014238357544, -0.17988580465316772, 0.01967853307723999, 0.21924293041229248, 0.4188072681427002, 0.6183716058731079, 0.8179359436035156, 1.0175002813339233, 1.217064619064331, 1.4166290760040283, 1.6161932945251465, 1.8157577514648438, 2.015322208404541, 2.214886426925659, 2.4144508838653564, 2.6140151023864746, 2.813579559326172, 3.01314377784729, 3.2127082347869873, 3.4122724533081055, 3.6118369102478027, 3.8114013671875, 4.010965824127197, 4.2105302810668945, 4.410094261169434, 4.609658718109131, 4.809223175048828, 5.008787631988525, 5.208352088928223, 5.407916069030762]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 6.0, 0.0, 2.0, 4.0, 6.0, 14.0, 9.0, 7.0, 11.0, 9.0, 14.0, 14.0, 16.0, 23.0, 15.0, 26.0, 24.0, 27.0, 23.0, 36.0, 32.0, 34.0, 31.0, 48.0, 30.0, 41.0, 31.0, 48.0, 45.0, 41.0, 33.0, 29.0, 28.0, 31.0, 29.0, 27.0, 22.0, 23.0, 19.0, 16.0, 18.0, 12.0, 8.0, 7.0, 7.0, 8.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.708048343658447, -4.56910514831543, -4.430161952972412, -4.2912187576293945, -4.152275562286377, -4.013332366943359, -3.8743889331817627, -3.735445737838745, -3.5965025424957275, -3.45755934715271, -3.3186161518096924, -3.179672956466675, -3.040729522705078, -2.9017863273620605, -2.762843132019043, -2.6238999366760254, -2.484956741333008, -2.3460135459899902, -2.2070703506469727, -2.068127155303955, -1.929183840751648, -1.7902406454086304, -1.6512973308563232, -1.5123541355133057, -1.373410940170288, -1.2344677448272705, -1.095524549484253, -0.9565812349319458, -0.8176380395889282, -0.6786948442459106, -0.5397515892982483, -0.40080833435058594, -0.26186561584472656, -0.1229223906993866, 0.01602083444595337, 0.15496405959129333, 0.2939072847366333, 0.4328504800796509, 0.5717937350273132, 0.7107369899749756, 0.8496801853179932, 0.9886233806610107, 1.1275665760040283, 1.2665098905563354, 1.405453085899353, 1.5443962812423706, 1.6833395957946777, 1.8222827911376953, 1.961225986480713, 2.1001691818237305, 2.239112377166748, 2.3780555725097656, 2.516998767852783, 2.655941963195801, 2.7948853969573975, 2.933828592300415, 3.0727717876434326, 3.21171498298645, 3.3506581783294678, 3.4896013736724854, 3.628544807434082, 3.7674880027770996, 3.906431198120117, 4.045374393463135, 4.184317588806152]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 6.0, 4.0, 9.0, 25.0, 30.0, 41.0, 64.0, 81.0, 140.0, 250.0, 371.0, 638.0, 930.0, 1547.0, 2532.0, 4204.0, 7248.0, 13091.0, 24033.0, 47192.0, 95628.0, 187896.0, 268893.0, 191403.0, 97959.0, 48615.0, 24462.0, 13171.0, 7180.0, 4278.0, 2462.0, 1504.0, 987.0, 614.0, 401.0, 234.0, 155.0, 107.0, 67.0, 39.0, 20.0, 15.0, 16.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19921875, -4.04083251953125, -3.8824462890625, -3.72406005859375, -3.565673828125, -3.40728759765625, -3.2489013671875, -3.09051513671875, -2.93212890625, -2.77374267578125, -2.6153564453125, -2.45697021484375, -2.298583984375, -2.14019775390625, -1.9818115234375, -1.82342529296875, -1.6650390625, -1.50665283203125, -1.3482666015625, -1.18988037109375, -1.031494140625, -0.87310791015625, -0.7147216796875, -0.55633544921875, -0.39794921875, -0.23956298828125, -0.0811767578125, 0.07720947265625, 0.235595703125, 0.39398193359375, 0.5523681640625, 0.71075439453125, 0.869140625, 1.02752685546875, 1.1859130859375, 1.34429931640625, 1.502685546875, 1.66107177734375, 1.8194580078125, 1.97784423828125, 2.13623046875, 2.29461669921875, 2.4530029296875, 2.61138916015625, 2.769775390625, 2.92816162109375, 3.0865478515625, 3.24493408203125, 3.4033203125, 3.56170654296875, 3.7200927734375, 3.87847900390625, 4.036865234375, 4.19525146484375, 4.3536376953125, 4.51202392578125, 4.67041015625, 4.82879638671875, 4.9871826171875, 5.14556884765625, 5.303955078125, 5.46234130859375, 5.6207275390625, 5.77911376953125, 5.9375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 9.0, 6.0, 14.0, 9.0, 10.0, 14.0, 17.0, 22.0, 12.0, 25.0, 26.0, 31.0, 27.0, 43.0, 30.0, 44.0, 36.0, 49.0, 38.0, 58.0, 35.0, 29.0, 46.0, 37.0, 36.0, 33.0, 39.0, 27.0, 33.0, 37.0, 23.0, 17.0, 18.0, 9.0, 10.0, 11.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.41796875, -5.26171875, -5.10546875, -4.94921875, -4.79296875, -4.63671875, -4.48046875, -4.32421875, -4.16796875, -4.01171875, -3.85546875, -3.69921875, -3.54296875, -3.38671875, -3.23046875, -3.07421875, -2.91796875, -2.76171875, -2.60546875, -2.44921875, -2.29296875, -2.13671875, -1.98046875, -1.82421875, -1.66796875, -1.51171875, -1.35546875, -1.19921875, -1.04296875, -0.88671875, -0.73046875, -0.57421875, -0.41796875, -0.26171875, -0.10546875, 0.05078125, 0.20703125, 0.36328125, 0.51953125, 0.67578125, 0.83203125, 0.98828125, 1.14453125, 1.30078125, 1.45703125, 1.61328125, 1.76953125, 1.92578125, 2.08203125, 2.23828125, 2.39453125, 2.55078125, 2.70703125, 2.86328125, 3.01953125, 3.17578125, 3.33203125, 3.48828125, 3.64453125, 3.80078125, 3.95703125, 4.11328125, 4.26953125, 4.42578125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 13.0, 8.0, 10.0, 12.0, 20.0, 34.0, 40.0, 49.0, 64.0, 75.0, 158.0, 207.0, 267.0, 443.0, 608.0, 944.0, 1514.0, 2507.0, 4383.0, 8156.0, 16576.0, 38212.0, 103439.0, 298008.0, 351266.0, 132584.0, 47082.0, 19555.0, 9520.0, 4990.0, 2832.0, 1735.0, 1065.0, 654.0, 459.0, 319.0, 210.0, 148.0, 85.0, 68.0, 63.0, 39.0, 34.0, 28.0, 11.0, 12.0, 15.0, 8.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-4.38671875, -4.2457275390625, -4.104736328125, -3.9637451171875, -3.82275390625, -3.6817626953125, -3.540771484375, -3.3997802734375, -3.2587890625, -3.1177978515625, -2.976806640625, -2.8358154296875, -2.69482421875, -2.5538330078125, -2.412841796875, -2.2718505859375, -2.130859375, -1.9898681640625, -1.848876953125, -1.7078857421875, -1.56689453125, -1.4259033203125, -1.284912109375, -1.1439208984375, -1.0029296875, -0.8619384765625, -0.720947265625, -0.5799560546875, -0.43896484375, -0.2979736328125, -0.156982421875, -0.0159912109375, 0.125, 0.2659912109375, 0.406982421875, 0.5479736328125, 0.68896484375, 0.8299560546875, 0.970947265625, 1.1119384765625, 1.2529296875, 1.3939208984375, 1.534912109375, 1.6759033203125, 1.81689453125, 1.9578857421875, 2.098876953125, 2.2398681640625, 2.380859375, 2.5218505859375, 2.662841796875, 2.8038330078125, 2.94482421875, 3.0858154296875, 3.226806640625, 3.3677978515625, 3.5087890625, 3.6497802734375, 3.790771484375, 3.9317626953125, 4.07275390625, 4.2137451171875, 4.354736328125, 4.4957275390625, 4.63671875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 5.0, 8.0, 17.0, 14.0, 16.0, 16.0, 18.0, 18.0, 20.0, 22.0, 29.0, 37.0, 31.0, 32.0, 31.0, 32.0, 36.0, 29.0, 30.0, 43.0, 44.0, 43.0, 36.0, 48.0, 33.0, 38.0, 32.0, 27.0, 22.0, 30.0, 29.0, 27.0, 11.0, 19.0, 10.0, 10.0, 9.0, 8.0, 7.0, 3.0, 5.0, 2.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.83984375, -2.741546630859375, -2.64324951171875, -2.544952392578125, -2.4466552734375, -2.348358154296875, -2.25006103515625, -2.151763916015625, -2.053466796875, -1.955169677734375, -1.85687255859375, -1.758575439453125, -1.6602783203125, -1.561981201171875, -1.46368408203125, -1.365386962890625, -1.26708984375, -1.168792724609375, -1.07049560546875, -0.972198486328125, -0.8739013671875, -0.775604248046875, -0.67730712890625, -0.579010009765625, -0.480712890625, -0.382415771484375, -0.28411865234375, -0.185821533203125, -0.0875244140625, 0.010772705078125, 0.10906982421875, 0.207366943359375, 0.3056640625, 0.403961181640625, 0.50225830078125, 0.600555419921875, 0.6988525390625, 0.797149658203125, 0.89544677734375, 0.993743896484375, 1.092041015625, 1.190338134765625, 1.28863525390625, 1.386932373046875, 1.4852294921875, 1.583526611328125, 1.68182373046875, 1.780120849609375, 1.87841796875, 1.976715087890625, 2.07501220703125, 2.173309326171875, 2.2716064453125, 2.369903564453125, 2.46820068359375, 2.566497802734375, 2.664794921875, 2.763092041015625, 2.86138916015625, 2.959686279296875, 3.0579833984375, 3.156280517578125, 3.25457763671875, 3.352874755859375, 3.451171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 6.0, 16.0, 18.0, 19.0, 33.0, 49.0, 84.0, 126.0, 213.0, 301.0, 480.0, 878.0, 1626.0, 4419.0, 28056.0, 978213.0, 25996.0, 4214.0, 1618.0, 831.0, 512.0, 292.0, 189.0, 113.0, 77.0, 58.0, 26.0, 20.0, 16.0, 11.0, 12.0, 9.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.064453125, -18.31640625, -17.568359375, -16.8203125, -16.072265625, -15.32421875, -14.576171875, -13.828125, -13.080078125, -12.33203125, -11.583984375, -10.8359375, -10.087890625, -9.33984375, -8.591796875, -7.84375, -7.095703125, -6.34765625, -5.599609375, -4.8515625, -4.103515625, -3.35546875, -2.607421875, -1.859375, -1.111328125, -0.36328125, 0.384765625, 1.1328125, 1.880859375, 2.62890625, 3.376953125, 4.125, 4.873046875, 5.62109375, 6.369140625, 7.1171875, 7.865234375, 8.61328125, 9.361328125, 10.109375, 10.857421875, 11.60546875, 12.353515625, 13.1015625, 13.849609375, 14.59765625, 15.345703125, 16.09375, 16.841796875, 17.58984375, 18.337890625, 19.0859375, 19.833984375, 20.58203125, 21.330078125, 22.078125, 22.826171875, 23.57421875, 24.322265625, 25.0703125, 25.818359375, 26.56640625, 27.314453125, 28.0625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 11.0, 33.0, 58.0, 221.0, 408.0, 136.0, 47.0, 23.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008211135864257812, -0.0007940083742141724, -0.0007669031620025635, -0.0007397979497909546, -0.0007126927375793457, -0.0006855875253677368, -0.0006584823131561279, -0.000631377100944519, -0.0006042718887329102, -0.0005771666765213013, -0.0005500614643096924, -0.0005229562520980835, -0.0004958510398864746, -0.0004687458276748657, -0.00044164061546325684, -0.00041453540325164795, -0.00038743019104003906, -0.0003603249788284302, -0.0003332197666168213, -0.0003061145544052124, -0.0002790093421936035, -0.00025190412998199463, -0.00022479891777038574, -0.00019769370555877686, -0.00017058849334716797, -0.00014348328113555908, -0.0001163780689239502, -8.927285671234131e-05, -6.216764450073242e-05, -3.5062432289123535e-05, -7.957220077514648e-06, 1.9147992134094238e-05, 4.6253204345703125e-05, 7.335841655731201e-05, 0.0001004636287689209, 0.00012756884098052979, 0.00015467405319213867, 0.00018177926540374756, 0.00020888447761535645, 0.00023598968982696533, 0.0002630949020385742, 0.0002902001142501831, 0.000317305326461792, 0.0003444105386734009, 0.00037151575088500977, 0.00039862096309661865, 0.00042572617530822754, 0.0004528313875198364, 0.0004799365997314453, 0.0005070418119430542, 0.0005341470241546631, 0.000561252236366272, 0.0005883574485778809, 0.0006154626607894897, 0.0006425678730010986, 0.0006696730852127075, 0.0006967782974243164, 0.0007238835096359253, 0.0007509887218475342, 0.0007780939340591431, 0.000805199146270752, 0.0008323043584823608, 0.0008594095706939697, 0.0008865147829055786, 0.0009136199951171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 19.0, 8.0, 26.0, 32.0, 40.0, 56.0, 74.0, 115.0, 164.0, 220.0, 303.0, 411.0, 588.0, 824.0, 1158.0, 1546.0, 2312.0, 3710.0, 6001.0, 11396.0, 26493.0, 90347.0, 429666.0, 351747.0, 71797.0, 22815.0, 10104.0, 5605.0, 3465.0, 2207.0, 1549.0, 1081.0, 689.0, 552.0, 407.0, 291.0, 200.0, 156.0, 105.0, 70.0, 58.0, 38.0, 36.0, 31.0, 17.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6015625, -5.42608642578125, -5.2506103515625, -5.07513427734375, -4.899658203125, -4.72418212890625, -4.5487060546875, -4.37322998046875, -4.19775390625, -4.02227783203125, -3.8468017578125, -3.67132568359375, -3.495849609375, -3.32037353515625, -3.1448974609375, -2.96942138671875, -2.7939453125, -2.61846923828125, -2.4429931640625, -2.26751708984375, -2.092041015625, -1.91656494140625, -1.7410888671875, -1.56561279296875, -1.39013671875, -1.21466064453125, -1.0391845703125, -0.86370849609375, -0.688232421875, -0.51275634765625, -0.3372802734375, -0.16180419921875, 0.013671875, 0.18914794921875, 0.3646240234375, 0.54010009765625, 0.715576171875, 0.89105224609375, 1.0665283203125, 1.24200439453125, 1.41748046875, 1.59295654296875, 1.7684326171875, 1.94390869140625, 2.119384765625, 2.29486083984375, 2.4703369140625, 2.64581298828125, 2.8212890625, 2.99676513671875, 3.1722412109375, 3.34771728515625, 3.523193359375, 3.69866943359375, 3.8741455078125, 4.04962158203125, 4.22509765625, 4.40057373046875, 4.5760498046875, 4.75152587890625, 4.927001953125, 5.10247802734375, 5.2779541015625, 5.45343017578125, 5.62890625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 9.0, 8.0, 12.0, 28.0, 48.0, 99.0, 160.0, 208.0, 178.0, 102.0, 58.0, 23.0, 13.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.50732421875, -2.4345703125, -2.36181640625, -2.2890625, -2.21630859375, -2.1435546875, -2.07080078125, -1.998046875, -1.92529296875, -1.8525390625, -1.77978515625, -1.70703125, -1.63427734375, -1.5615234375, -1.48876953125, -1.416015625, -1.34326171875, -1.2705078125, -1.19775390625, -1.125, -1.05224609375, -0.9794921875, -0.90673828125, -0.833984375, -0.76123046875, -0.6884765625, -0.61572265625, -0.54296875, -0.47021484375, -0.3974609375, -0.32470703125, -0.251953125, -0.17919921875, -0.1064453125, -0.03369140625, 0.0390625, 0.11181640625, 0.1845703125, 0.25732421875, 0.330078125, 0.40283203125, 0.4755859375, 0.54833984375, 0.62109375, 0.69384765625, 0.7666015625, 0.83935546875, 0.912109375, 0.98486328125, 1.0576171875, 1.13037109375, 1.203125, 1.27587890625, 1.3486328125, 1.42138671875, 1.494140625, 1.56689453125, 1.6396484375, 1.71240234375, 1.78515625, 1.85791015625, 1.9306640625, 2.00341796875, 2.076171875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 5.0, 4.0, 8.0, 17.0, 8.0, 6.0, 14.0, 25.0, 20.0, 32.0, 26.0, 36.0, 29.0, 47.0, 41.0, 44.0, 64.0, 49.0, 57.0, 54.0, 40.0, 51.0, 39.0, 37.0, 42.0, 44.0, 24.0, 24.0, 22.0, 22.0, 19.0, 7.0, 7.0, 8.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.619289875030518, -5.4501519203186035, -5.281014442443848, -5.111876487731934, -4.942739009857178, -4.773601055145264, -4.604463577270508, -4.435325622558594, -4.266188144683838, -4.097050189971924, -3.927912712097168, -3.758774995803833, -3.589637279510498, -3.420499563217163, -3.251361846923828, -3.082223892211914, -2.913086175918579, -2.743948459625244, -2.574810743331909, -2.405673027038574, -2.2365353107452393, -2.0673975944519043, -1.8982597589492798, -1.7291220426559448, -1.5599843263626099, -1.390846610069275, -1.22170889377594, -1.0525710582733154, -0.8834334015846252, -0.7142956852912903, -0.5451579093933105, -0.3760201930999756, -0.20688247680664062, -0.03774474561214447, 0.13139298558235168, 0.30053073167800903, 0.469668447971344, 0.638806164264679, 0.8079439401626587, 0.9770816564559937, 1.1462193727493286, 1.3153570890426636, 1.4844948053359985, 1.653632640838623, 1.822770357131958, 1.991908073425293, 2.161045789718628, 2.330183506011963, 2.499321222305298, 2.668458938598633, 2.8375966548919678, 3.0067343711853027, 3.1758720874786377, 3.3450098037719727, 3.5141477584838867, 3.6832852363586426, 3.8524231910705566, 4.021561145782471, 4.190698623657227, 4.359836578369141, 4.5289740562438965, 4.6981120109558105, 4.867249488830566, 5.0363874435424805, 5.205524921417236]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 8.0, 5.0, 6.0, 8.0, 10.0, 17.0, 19.0, 15.0, 7.0, 26.0, 21.0, 23.0, 30.0, 32.0, 29.0, 27.0, 35.0, 26.0, 38.0, 37.0, 37.0, 48.0, 30.0, 41.0, 42.0, 36.0, 28.0, 28.0, 30.0, 34.0, 23.0, 33.0, 23.0, 17.0, 21.0, 15.0, 12.0, 13.0, 9.0, 9.0, 9.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-4.382673263549805, -4.250843048095703, -4.119012355804443, -3.987182140350342, -3.8553519248962402, -3.7235214710235596, -3.591691017150879, -3.4598608016967773, -3.328030586242676, -3.196200132369995, -3.0643699169158936, -2.932539463043213, -2.8007092475891113, -2.6688787937164307, -2.53704833984375, -2.4052181243896484, -2.2733876705169678, -2.141557216644287, -2.0097270011901855, -1.8778965473175049, -1.7460663318634033, -1.6142358779907227, -1.4824055433273315, -1.3505752086639404, -1.2187448740005493, -1.0869145393371582, -0.9550842046737671, -0.8232538104057312, -0.6914234757423401, -0.559593141078949, -0.4277627468109131, -0.295932412147522, -0.16410207748413086, -0.03227172791957855, 0.09955862164497375, 0.23138898611068726, 0.36321932077407837, 0.4950496554374695, 0.6268800497055054, 0.7587103843688965, 0.8905407190322876, 1.0223710536956787, 1.1542013883590698, 1.286031723022461, 1.4178621768951416, 1.5496923923492432, 1.6815228462219238, 1.813353180885315, 1.945183515548706, 2.0770139694213867, 2.2088441848754883, 2.340674638748169, 2.4725048542022705, 2.604335308074951, 2.7361655235290527, 2.8679959774017334, 2.999826431274414, 3.1316568851470947, 3.2634871006011963, 3.395317554473877, 3.5271477699279785, 3.658978223800659, 3.79080867767334, 3.9226388931274414, 4.054469108581543]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 12.0, 30.0, 44.0, 53.0, 101.0, 161.0, 264.0, 402.0, 631.0, 978.0, 1594.0, 2510.0, 4238.0, 6575.0, 10311.0, 16142.0, 24500.0, 36111.0, 51080.0, 68924.0, 86676.0, 101723.0, 111442.0, 111356.0, 101975.0, 86930.0, 68407.0, 51169.0, 36173.0, 24162.0, 16151.0, 10241.0, 6521.0, 4033.0, 2610.0, 1686.0, 981.0, 636.0, 372.0, 237.0, 167.0, 98.0, 45.0, 31.0, 21.0, 11.0, 5.0, 16.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.58984375, -4.45074462890625, -4.3116455078125, -4.17254638671875, -4.033447265625, -3.89434814453125, -3.7552490234375, -3.61614990234375, -3.47705078125, -3.33795166015625, -3.1988525390625, -3.05975341796875, -2.920654296875, -2.78155517578125, -2.6424560546875, -2.50335693359375, -2.3642578125, -2.22515869140625, -2.0860595703125, -1.94696044921875, -1.807861328125, -1.66876220703125, -1.5296630859375, -1.39056396484375, -1.25146484375, -1.11236572265625, -0.9732666015625, -0.83416748046875, -0.695068359375, -0.55596923828125, -0.4168701171875, -0.27777099609375, -0.138671875, 0.00042724609375, 0.1395263671875, 0.27862548828125, 0.417724609375, 0.55682373046875, 0.6959228515625, 0.83502197265625, 0.97412109375, 1.11322021484375, 1.2523193359375, 1.39141845703125, 1.530517578125, 1.66961669921875, 1.8087158203125, 1.94781494140625, 2.0869140625, 2.22601318359375, 2.3651123046875, 2.50421142578125, 2.643310546875, 2.78240966796875, 2.9215087890625, 3.06060791015625, 3.19970703125, 3.33880615234375, 3.4779052734375, 3.61700439453125, 3.756103515625, 3.89520263671875, 4.0343017578125, 4.17340087890625, 4.3125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 7.0, 12.0, 7.0, 8.0, 10.0, 13.0, 23.0, 24.0, 21.0, 17.0, 25.0, 37.0, 38.0, 30.0, 31.0, 40.0, 53.0, 34.0, 33.0, 50.0, 48.0, 36.0, 37.0, 42.0, 33.0, 24.0, 28.0, 41.0, 28.0, 23.0, 27.0, 18.0, 16.0, 14.0, 15.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0], "bins": [-5.015625, -4.8765869140625, -4.737548828125, -4.5985107421875, -4.45947265625, -4.3204345703125, -4.181396484375, -4.0423583984375, -3.9033203125, -3.7642822265625, -3.625244140625, -3.4862060546875, -3.34716796875, -3.2081298828125, -3.069091796875, -2.9300537109375, -2.791015625, -2.6519775390625, -2.512939453125, -2.3739013671875, -2.23486328125, -2.0958251953125, -1.956787109375, -1.8177490234375, -1.6787109375, -1.5396728515625, -1.400634765625, -1.2615966796875, -1.12255859375, -0.9835205078125, -0.844482421875, -0.7054443359375, -0.56640625, -0.4273681640625, -0.288330078125, -0.1492919921875, -0.01025390625, 0.1287841796875, 0.267822265625, 0.4068603515625, 0.5458984375, 0.6849365234375, 0.823974609375, 0.9630126953125, 1.10205078125, 1.2410888671875, 1.380126953125, 1.5191650390625, 1.658203125, 1.7972412109375, 1.936279296875, 2.0753173828125, 2.21435546875, 2.3533935546875, 2.492431640625, 2.6314697265625, 2.7705078125, 2.9095458984375, 3.048583984375, 3.1876220703125, 3.32666015625, 3.4656982421875, 3.604736328125, 3.7437744140625, 3.8828125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 10.0, 19.0, 17.0, 33.0, 43.0, 66.0, 146.0, 238.0, 322.0, 505.0, 746.0, 1313.0, 2147.0, 3458.0, 5567.0, 9152.0, 14708.0, 23169.0, 35971.0, 53307.0, 75009.0, 98540.0, 117690.0, 126550.0, 121282.0, 104971.0, 81787.0, 59596.0, 40778.0, 26961.0, 16761.0, 10474.0, 6610.0, 3907.0, 2542.0, 1585.0, 915.0, 560.0, 393.0, 262.0, 171.0, 94.0, 61.0, 43.0, 29.0, 20.0, 8.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2734375, -5.1119384765625, -4.950439453125, -4.7889404296875, -4.62744140625, -4.4659423828125, -4.304443359375, -4.1429443359375, -3.9814453125, -3.8199462890625, -3.658447265625, -3.4969482421875, -3.33544921875, -3.1739501953125, -3.012451171875, -2.8509521484375, -2.689453125, -2.5279541015625, -2.366455078125, -2.2049560546875, -2.04345703125, -1.8819580078125, -1.720458984375, -1.5589599609375, -1.3974609375, -1.2359619140625, -1.074462890625, -0.9129638671875, -0.75146484375, -0.5899658203125, -0.428466796875, -0.2669677734375, -0.10546875, 0.0560302734375, 0.217529296875, 0.3790283203125, 0.54052734375, 0.7020263671875, 0.863525390625, 1.0250244140625, 1.1865234375, 1.3480224609375, 1.509521484375, 1.6710205078125, 1.83251953125, 1.9940185546875, 2.155517578125, 2.3170166015625, 2.478515625, 2.6400146484375, 2.801513671875, 2.9630126953125, 3.12451171875, 3.2860107421875, 3.447509765625, 3.6090087890625, 3.7705078125, 3.9320068359375, 4.093505859375, 4.2550048828125, 4.41650390625, 4.5780029296875, 4.739501953125, 4.9010009765625, 5.0625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 6.0, 5.0, 7.0, 14.0, 12.0, 13.0, 16.0, 12.0, 19.0, 19.0, 21.0, 22.0, 30.0, 35.0, 35.0, 38.0, 37.0, 47.0, 55.0, 51.0, 44.0, 39.0, 49.0, 47.0, 39.0, 39.0, 38.0, 30.0, 23.0, 25.0, 24.0, 20.0, 14.0, 13.0, 12.0, 10.0, 8.0, 4.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.063262939453125, -2.96441650390625, -2.865570068359375, -2.7667236328125, -2.667877197265625, -2.56903076171875, -2.470184326171875, -2.371337890625, -2.272491455078125, -2.17364501953125, -2.074798583984375, -1.9759521484375, -1.877105712890625, -1.77825927734375, -1.679412841796875, -1.58056640625, -1.481719970703125, -1.38287353515625, -1.284027099609375, -1.1851806640625, -1.086334228515625, -0.98748779296875, -0.888641357421875, -0.789794921875, -0.690948486328125, -0.59210205078125, -0.493255615234375, -0.3944091796875, -0.295562744140625, -0.19671630859375, -0.097869873046875, 0.0009765625, 0.099822998046875, 0.19866943359375, 0.297515869140625, 0.3963623046875, 0.495208740234375, 0.59405517578125, 0.692901611328125, 0.791748046875, 0.890594482421875, 0.98944091796875, 1.088287353515625, 1.1871337890625, 1.285980224609375, 1.38482666015625, 1.483673095703125, 1.58251953125, 1.681365966796875, 1.78021240234375, 1.879058837890625, 1.9779052734375, 2.076751708984375, 2.17559814453125, 2.274444580078125, 2.373291015625, 2.472137451171875, 2.57098388671875, 2.669830322265625, 2.7686767578125, 2.867523193359375, 2.96636962890625, 3.065216064453125, 3.1640625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 5.0, 7.0, 10.0, 11.0, 13.0, 23.0, 22.0, 34.0, 41.0, 64.0, 92.0, 120.0, 168.0, 234.0, 373.0, 542.0, 821.0, 1304.0, 2198.0, 3693.0, 6567.0, 12338.0, 23544.0, 45969.0, 85466.0, 141070.0, 190806.0, 192863.0, 145926.0, 90202.0, 48539.0, 25288.0, 13051.0, 6923.0, 3818.0, 2247.0, 1377.0, 877.0, 594.0, 401.0, 252.0, 178.0, 139.0, 94.0, 83.0, 53.0, 32.0, 31.0, 10.0, 22.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.11846923828125, -2.0455322265625, -1.97259521484375, -1.899658203125, -1.82672119140625, -1.7537841796875, -1.68084716796875, -1.60791015625, -1.53497314453125, -1.4620361328125, -1.38909912109375, -1.316162109375, -1.24322509765625, -1.1702880859375, -1.09735107421875, -1.0244140625, -0.95147705078125, -0.8785400390625, -0.80560302734375, -0.732666015625, -0.65972900390625, -0.5867919921875, -0.51385498046875, -0.44091796875, -0.36798095703125, -0.2950439453125, -0.22210693359375, -0.149169921875, -0.07623291015625, -0.0032958984375, 0.06964111328125, 0.142578125, 0.21551513671875, 0.2884521484375, 0.36138916015625, 0.434326171875, 0.50726318359375, 0.5802001953125, 0.65313720703125, 0.72607421875, 0.79901123046875, 0.8719482421875, 0.94488525390625, 1.017822265625, 1.09075927734375, 1.1636962890625, 1.23663330078125, 1.3095703125, 1.38250732421875, 1.4554443359375, 1.52838134765625, 1.601318359375, 1.67425537109375, 1.7471923828125, 1.82012939453125, 1.89306640625, 1.96600341796875, 2.0389404296875, 2.11187744140625, 2.184814453125, 2.25775146484375, 2.3306884765625, 2.40362548828125, 2.4765625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 2.0, 4.0, 10.0, 16.0, 20.0, 28.0, 22.0, 42.0, 34.0, 45.0, 58.0, 55.0, 72.0, 65.0, 87.0, 68.0, 60.0, 62.0, 50.0, 44.0, 41.0, 28.0, 24.0, 13.0, 13.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022530555725097656, -0.00021754205226898193, -0.0002097785472869873, -0.00020201504230499268, -0.00019425153732299805, -0.00018648803234100342, -0.0001787245273590088, -0.00017096102237701416, -0.00016319751739501953, -0.0001554340124130249, -0.00014767050743103027, -0.00013990700244903564, -0.00013214349746704102, -0.0001243799924850464, -0.00011661648750305176, -0.00010885298252105713, -0.0001010894775390625, -9.332597255706787e-05, -8.556246757507324e-05, -7.779896259307861e-05, -7.003545761108398e-05, -6.227195262908936e-05, -5.4508447647094727e-05, -4.67449426651001e-05, -3.898143768310547e-05, -3.121793270111084e-05, -2.345442771911621e-05, -1.5690922737121582e-05, -7.927417755126953e-06, -1.6391277313232422e-07, 7.599592208862305e-06, 1.5363097190856934e-05, 2.3126602172851562e-05, 3.089010715484619e-05, 3.865361213684082e-05, 4.641711711883545e-05, 5.418062210083008e-05, 6.194412708282471e-05, 6.970763206481934e-05, 7.747113704681396e-05, 8.52346420288086e-05, 9.299814701080322e-05, 0.00010076165199279785, 0.00010852515697479248, 0.00011628866195678711, 0.00012405216693878174, 0.00013181567192077637, 0.000139579176902771, 0.00014734268188476562, 0.00015510618686676025, 0.00016286969184875488, 0.0001706331968307495, 0.00017839670181274414, 0.00018616020679473877, 0.0001939237117767334, 0.00020168721675872803, 0.00020945072174072266, 0.00021721422672271729, 0.00022497773170471191, 0.00023274123668670654, 0.00024050474166870117, 0.0002482682466506958, 0.00025603175163269043, 0.00026379525661468506, 0.0002715587615966797]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 1.0, 9.0, 12.0, 16.0, 12.0, 14.0, 26.0, 32.0, 42.0, 61.0, 84.0, 114.0, 116.0, 190.0, 275.0, 495.0, 821.0, 1465.0, 2728.0, 5407.0, 10136.0, 19336.0, 37308.0, 67574.0, 111863.0, 157183.0, 181363.0, 165040.0, 120948.0, 75988.0, 42284.0, 22590.0, 11659.0, 5953.0, 3126.0, 1674.0, 908.0, 575.0, 367.0, 217.0, 143.0, 98.0, 80.0, 58.0, 35.0, 38.0, 23.0, 20.0, 8.0, 13.0, 8.0, 11.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0], "bins": [-2.029296875, -1.9670562744140625, -1.904815673828125, -1.8425750732421875, -1.78033447265625, -1.7180938720703125, -1.655853271484375, -1.5936126708984375, -1.5313720703125, -1.4691314697265625, -1.406890869140625, -1.3446502685546875, -1.28240966796875, -1.2201690673828125, -1.157928466796875, -1.0956878662109375, -1.033447265625, -0.9712066650390625, -0.908966064453125, -0.8467254638671875, -0.78448486328125, -0.7222442626953125, -0.660003662109375, -0.5977630615234375, -0.5355224609375, -0.4732818603515625, -0.411041259765625, -0.3488006591796875, -0.28656005859375, -0.2243194580078125, -0.162078857421875, -0.0998382568359375, -0.03759765625, 0.0246429443359375, 0.086883544921875, 0.1491241455078125, 0.21136474609375, 0.2736053466796875, 0.335845947265625, 0.3980865478515625, 0.4603271484375, 0.5225677490234375, 0.584808349609375, 0.6470489501953125, 0.70928955078125, 0.7715301513671875, 0.833770751953125, 0.8960113525390625, 0.958251953125, 1.0204925537109375, 1.082733154296875, 1.1449737548828125, 1.20721435546875, 1.2694549560546875, 1.331695556640625, 1.3939361572265625, 1.4561767578125, 1.5184173583984375, 1.580657958984375, 1.6428985595703125, 1.70513916015625, 1.7673797607421875, 1.829620361328125, 1.8918609619140625, 1.9541015625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 12.0, 17.0, 14.0, 35.0, 36.0, 44.0, 38.0, 39.0, 42.0, 61.0, 64.0, 62.0, 63.0, 60.0, 55.0, 50.0, 50.0, 43.0, 44.0, 24.0, 30.0, 26.0, 13.0, 12.0, 11.0, 6.0, 9.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6356277465820312, -0.6130523681640625, -0.5904769897460938, -0.567901611328125, -0.5453262329101562, -0.5227508544921875, -0.5001754760742188, -0.47760009765625, -0.45502471923828125, -0.4324493408203125, -0.40987396240234375, -0.387298583984375, -0.36472320556640625, -0.3421478271484375, -0.31957244873046875, -0.2969970703125, -0.27442169189453125, -0.2518463134765625, -0.22927093505859375, -0.206695556640625, -0.18412017822265625, -0.1615447998046875, -0.13896942138671875, -0.11639404296875, -0.09381866455078125, -0.0712432861328125, -0.04866790771484375, -0.026092529296875, -0.00351715087890625, 0.0190582275390625, 0.04163360595703125, 0.064208984375, 0.08678436279296875, 0.1093597412109375, 0.13193511962890625, 0.154510498046875, 0.17708587646484375, 0.1996612548828125, 0.22223663330078125, 0.24481201171875, 0.26738739013671875, 0.2899627685546875, 0.31253814697265625, 0.335113525390625, 0.35768890380859375, 0.3802642822265625, 0.40283966064453125, 0.4254150390625, 0.44799041748046875, 0.4705657958984375, 0.49314117431640625, 0.515716552734375, 0.5382919311523438, 0.5608673095703125, 0.5834426879882812, 0.60601806640625, 0.6285934448242188, 0.6511688232421875, 0.6737442016601562, 0.696319580078125, 0.7188949584960938, 0.7414703369140625, 0.7640457153320312, 0.78662109375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 5.0, 11.0, 14.0, 12.0, 13.0, 13.0, 16.0, 21.0, 19.0, 35.0, 28.0, 33.0, 35.0, 43.0, 45.0, 64.0, 53.0, 45.0, 55.0, 44.0, 47.0, 35.0, 29.0, 39.0, 39.0, 34.0, 28.0, 27.0, 25.0, 21.0, 8.0, 11.0, 13.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.122591495513916, -4.962081432342529, -4.801571369171143, -4.641060829162598, -4.480550765991211, -4.320040702819824, -4.1595306396484375, -3.9990203380584717, -3.838510036468506, -3.677999973297119, -3.5174896717071533, -3.3569796085357666, -3.196469306945801, -3.035959243774414, -2.8754491806030273, -2.7149388790130615, -2.554428815841675, -2.393918752670288, -2.2334084510803223, -2.0728983879089355, -1.9123880863189697, -1.751878023147583, -1.5913678407669067, -1.4308576583862305, -1.2703474760055542, -1.109837293624878, -0.9493271112442017, -0.7888169884681702, -0.6283068060874939, -0.4677966237068176, -0.30728650093078613, -0.14677631855010986, 0.013733863830566406, 0.17424403131008148, 0.33475419878959656, 0.49526435136795044, 0.6557745337486267, 0.816284716129303, 0.9767948389053345, 1.1373050212860107, 1.297815203666687, 1.4583253860473633, 1.6188355684280396, 1.7793457508087158, 1.9398558139801025, 2.1003661155700684, 2.260876178741455, 2.421386241912842, 2.5818965435028076, 2.7424066066741943, 2.90291690826416, 3.063426971435547, 3.2239372730255127, 3.3844473361968994, 3.5449576377868652, 3.705467700958252, 3.8659777641296387, 4.026487827301025, 4.186997890472412, 4.347508430480957, 4.508018493652344, 4.6685285568237305, 4.829038619995117, 4.989548683166504, 5.150059223175049]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 13.0, 11.0, 10.0, 12.0, 15.0, 22.0, 14.0, 30.0, 24.0, 31.0, 29.0, 30.0, 36.0, 53.0, 35.0, 39.0, 42.0, 50.0, 44.0, 47.0, 34.0, 34.0, 36.0, 44.0, 29.0, 31.0, 34.0, 22.0, 21.0, 16.0, 20.0, 11.0, 13.0, 10.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.021089553833008, -4.866550922393799, -4.71201229095459, -4.557473182678223, -4.402934551239014, -4.248395919799805, -4.093857288360596, -3.9393186569213867, -3.7847800254821777, -3.6302413940429688, -3.4757025241851807, -3.3211638927459717, -3.1666252613067627, -3.0120863914489746, -2.8575477600097656, -2.7030091285705566, -2.5484702587127686, -2.3939316272735596, -2.2393927574157715, -2.0848541259765625, -1.9303154945373535, -1.775776743888855, -1.6212379932403564, -1.4666993618011475, -1.312160611152649, -1.1576218605041504, -1.0030832290649414, -0.8485444784164429, -0.6940057873725891, -0.5394670963287354, -0.3849283456802368, -0.23038971424102783, -0.0758509635925293, 0.07868774235248566, 0.2332264482975006, 0.38776516914367676, 0.5423038601875305, 0.6968425512313843, 0.8513813018798828, 1.0059199333190918, 1.1604586839675903, 1.3149974346160889, 1.4695360660552979, 1.6240748167037964, 1.778613567352295, 1.933152198791504, 2.087690830230713, 2.242229461669922, 2.39676833152771, 2.551306962966919, 2.705845832824707, 2.860384464263916, 3.014923095703125, 3.169461727142334, 3.324000597000122, 3.478539228439331, 3.633078098297119, 3.787616729736328, 3.942155599594116, 4.096693992614746, 4.251233100891113, 4.405771732330322, 4.560310363769531, 4.71484899520874, 4.869387626647949]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 6.0, 7.0, 23.0, 20.0, 57.0, 79.0, 129.0, 240.0, 389.0, 644.0, 1086.0, 1690.0, 2903.0, 4884.0, 7936.0, 13549.0, 22353.0, 37250.0, 61627.0, 101512.0, 163475.0, 256915.0, 380127.0, 509729.0, 596424.0, 583854.0, 486224.0, 353835.0, 234928.0, 147725.0, 90589.0, 54667.0, 32431.0, 19222.0, 11378.0, 6745.0, 3961.0, 2298.0, 1391.0, 827.0, 479.0, 264.0, 172.0, 107.0, 53.0, 35.0, 21.0, 15.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.25, -4.128204345703125, -4.00640869140625, -3.884613037109375, -3.7628173828125, -3.641021728515625, -3.51922607421875, -3.397430419921875, -3.275634765625, -3.153839111328125, -3.03204345703125, -2.910247802734375, -2.7884521484375, -2.666656494140625, -2.54486083984375, -2.423065185546875, -2.30126953125, -2.179473876953125, -2.05767822265625, -1.935882568359375, -1.8140869140625, -1.692291259765625, -1.57049560546875, -1.448699951171875, -1.326904296875, -1.205108642578125, -1.08331298828125, -0.961517333984375, -0.8397216796875, -0.717926025390625, -0.59613037109375, -0.474334716796875, -0.3525390625, -0.230743408203125, -0.10894775390625, 0.012847900390625, 0.1346435546875, 0.256439208984375, 0.37823486328125, 0.500030517578125, 0.621826171875, 0.743621826171875, 0.86541748046875, 0.987213134765625, 1.1090087890625, 1.230804443359375, 1.35260009765625, 1.474395751953125, 1.59619140625, 1.717987060546875, 1.83978271484375, 1.961578369140625, 2.0833740234375, 2.205169677734375, 2.32696533203125, 2.448760986328125, 2.570556640625, 2.692352294921875, 2.81414794921875, 2.935943603515625, 3.0577392578125, 3.179534912109375, 3.30133056640625, 3.423126220703125, 3.544921875]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 6.0, 11.0, 4.0, 7.0, 14.0, 14.0, 19.0, 17.0, 18.0, 26.0, 28.0, 38.0, 37.0, 27.0, 44.0, 35.0, 50.0, 34.0, 43.0, 57.0, 42.0, 41.0, 30.0, 50.0, 40.0, 39.0, 34.0, 32.0, 21.0, 26.0, 15.0, 23.0, 15.0, 11.0, 8.0, 11.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.479644775390625, -3.35577392578125, -3.231903076171875, -3.1080322265625, -2.984161376953125, -2.86029052734375, -2.736419677734375, -2.612548828125, -2.488677978515625, -2.36480712890625, -2.240936279296875, -2.1170654296875, -1.993194580078125, -1.86932373046875, -1.745452880859375, -1.62158203125, -1.497711181640625, -1.37384033203125, -1.249969482421875, -1.1260986328125, -1.002227783203125, -0.87835693359375, -0.754486083984375, -0.630615234375, -0.506744384765625, -0.38287353515625, -0.259002685546875, -0.1351318359375, -0.011260986328125, 0.11260986328125, 0.236480712890625, 0.3603515625, 0.484222412109375, 0.60809326171875, 0.731964111328125, 0.8558349609375, 0.979705810546875, 1.10357666015625, 1.227447509765625, 1.351318359375, 1.475189208984375, 1.59906005859375, 1.722930908203125, 1.8468017578125, 1.970672607421875, 2.09454345703125, 2.218414306640625, 2.34228515625, 2.466156005859375, 2.59002685546875, 2.713897705078125, 2.8377685546875, 2.961639404296875, 3.08551025390625, 3.209381103515625, 3.333251953125, 3.457122802734375, 3.58099365234375, 3.704864501953125, 3.8287353515625, 3.952606201171875, 4.07647705078125, 4.200347900390625, 4.32421875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 16.0, 15.0, 31.0, 70.0, 82.0, 164.0, 277.0, 460.0, 914.0, 1554.0, 2873.0, 5252.0, 9363.0, 17180.0, 29773.0, 51312.0, 86806.0, 142476.0, 221547.0, 327103.0, 444346.0, 539694.0, 570593.0, 520358.0, 416514.0, 299272.0, 199450.0, 126904.0, 76408.0, 44967.0, 25758.0, 14409.0, 8047.0, 4601.0, 2482.0, 1438.0, 781.0, 448.0, 216.0, 147.0, 78.0, 38.0, 24.0, 20.0, 7.0, 8.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.359375, -4.23614501953125, -4.1129150390625, -3.98968505859375, -3.866455078125, -3.74322509765625, -3.6199951171875, -3.49676513671875, -3.37353515625, -3.25030517578125, -3.1270751953125, -3.00384521484375, -2.880615234375, -2.75738525390625, -2.6341552734375, -2.51092529296875, -2.3876953125, -2.26446533203125, -2.1412353515625, -2.01800537109375, -1.894775390625, -1.77154541015625, -1.6483154296875, -1.52508544921875, -1.40185546875, -1.27862548828125, -1.1553955078125, -1.03216552734375, -0.908935546875, -0.78570556640625, -0.6624755859375, -0.53924560546875, -0.416015625, -0.29278564453125, -0.1695556640625, -0.04632568359375, 0.076904296875, 0.20013427734375, 0.3233642578125, 0.44659423828125, 0.56982421875, 0.69305419921875, 0.8162841796875, 0.93951416015625, 1.062744140625, 1.18597412109375, 1.3092041015625, 1.43243408203125, 1.5556640625, 1.67889404296875, 1.8021240234375, 1.92535400390625, 2.048583984375, 2.17181396484375, 2.2950439453125, 2.41827392578125, 2.54150390625, 2.66473388671875, 2.7879638671875, 2.91119384765625, 3.034423828125, 3.15765380859375, 3.2808837890625, 3.40411376953125, 3.52734375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 11.0, 14.0, 12.0, 13.0, 25.0, 32.0, 33.0, 45.0, 44.0, 60.0, 93.0, 88.0, 118.0, 137.0, 160.0, 183.0, 183.0, 214.0, 236.0, 252.0, 241.0, 258.0, 233.0, 186.0, 204.0, 166.0, 132.0, 136.0, 107.0, 96.0, 70.0, 69.0, 47.0, 32.0, 28.0, 29.0, 17.0, 21.0, 15.0, 9.0, 5.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.650390625, -1.595611572265625, -1.54083251953125, -1.486053466796875, -1.4312744140625, -1.376495361328125, -1.32171630859375, -1.266937255859375, -1.212158203125, -1.157379150390625, -1.10260009765625, -1.047821044921875, -0.9930419921875, -0.938262939453125, -0.88348388671875, -0.828704833984375, -0.77392578125, -0.719146728515625, -0.66436767578125, -0.609588623046875, -0.5548095703125, -0.500030517578125, -0.44525146484375, -0.390472412109375, -0.335693359375, -0.280914306640625, -0.22613525390625, -0.171356201171875, -0.1165771484375, -0.061798095703125, -0.00701904296875, 0.047760009765625, 0.1025390625, 0.157318115234375, 0.21209716796875, 0.266876220703125, 0.3216552734375, 0.376434326171875, 0.43121337890625, 0.485992431640625, 0.540771484375, 0.595550537109375, 0.65032958984375, 0.705108642578125, 0.7598876953125, 0.814666748046875, 0.86944580078125, 0.924224853515625, 0.97900390625, 1.033782958984375, 1.08856201171875, 1.143341064453125, 1.1981201171875, 1.252899169921875, 1.30767822265625, 1.362457275390625, 1.417236328125, 1.472015380859375, 1.52679443359375, 1.581573486328125, 1.6363525390625, 1.691131591796875, 1.74591064453125, 1.800689697265625, 1.85546875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 10.0, 8.0, 14.0, 17.0, 9.0, 16.0, 22.0, 30.0, 33.0, 36.0, 46.0, 35.0, 50.0, 43.0, 53.0, 56.0, 51.0, 52.0, 52.0, 39.0, 45.0, 36.0, 42.0, 39.0, 29.0, 22.0, 31.0, 15.0, 10.0, 15.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9960076808929443, -3.8486523628234863, -3.7012972831726074, -3.5539419651031494, -3.4065866470336914, -3.2592313289642334, -3.1118760108947754, -2.9645209312438965, -2.8171656131744385, -2.6698102951049805, -2.5224552154541016, -2.3750998973846436, -2.2277445793151855, -2.0803892612457275, -1.933034062385559, -1.7856788635253906, -1.6383235454559326, -1.4909682273864746, -1.3436130285263062, -1.1962578296661377, -1.0489025115966797, -0.9015472531318665, -0.7541919946670532, -0.6068367958068848, -0.45948147773742676, -0.3121262192726135, -0.1647709608078003, -0.01741570234298706, 0.12993955612182617, 0.2772948145866394, 0.42465007305145264, 0.5720052719116211, 0.7193608283996582, 0.8667160868644714, 1.0140713453292847, 1.1614265441894531, 1.3087818622589111, 1.4561371803283691, 1.6034923791885376, 1.750847578048706, 1.898202896118164, 2.045558214187622, 2.19291353225708, 2.340268611907959, 2.487623929977417, 2.634979248046875, 2.782334327697754, 2.929689645767212, 3.07704496383667, 3.224400281906128, 3.371755599975586, 3.519110679626465, 3.666465997695923, 3.813821315765381, 3.9611763954162598, 4.108531951904297, 4.255887031555176, 4.403242111206055, 4.550597667694092, 4.697952747344971, 4.845308303833008, 4.992663383483887, 5.140018463134766, 5.2873735427856445, 5.434729099273682]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 7.0, 11.0, 11.0, 8.0, 13.0, 14.0, 17.0, 14.0, 22.0, 28.0, 26.0, 27.0, 26.0, 32.0, 41.0, 43.0, 33.0, 49.0, 32.0, 38.0, 43.0, 48.0, 27.0, 49.0, 40.0, 39.0, 30.0, 34.0, 23.0, 30.0, 21.0, 18.0, 21.0, 13.0, 16.0, 9.0, 8.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.188475131988525, -4.064115047454834, -3.9397549629211426, -3.815394878387451, -3.6910347938537598, -3.5666747093200684, -3.442314624786377, -3.3179545402526855, -3.193594455718994, -3.0692343711853027, -2.9448742866516113, -2.82051420211792, -2.6961541175842285, -2.571794033050537, -2.4474339485168457, -2.3230738639831543, -2.198714017868042, -2.0743539333343506, -1.9499938488006592, -1.8256337642669678, -1.7012736797332764, -1.576913595199585, -1.452553629875183, -1.3281935453414917, -1.2038334608078003, -1.0794733762741089, -0.9551132917404175, -0.8307532668113708, -0.7063931822776794, -0.582033097743988, -0.4576730728149414, -0.33331298828125, -0.2089526653289795, -0.08459259569644928, 0.03976747393608093, 0.16412752866744995, 0.28848761320114136, 0.41284769773483276, 0.5372077226638794, 0.6615678071975708, 0.7859278917312622, 0.9102879762649536, 1.034648060798645, 1.1590080261230469, 1.2833681106567383, 1.4077281951904297, 1.532088279724121, 1.6564483642578125, 1.780808448791504, 1.9051685333251953, 2.0295286178588867, 2.153888702392578, 2.2782487869262695, 2.402608871459961, 2.5269689559936523, 2.6513290405273438, 2.775689125061035, 2.9000492095947266, 3.024409294128418, 3.1487693786621094, 3.273129463195801, 3.397489547729492, 3.5218496322631836, 3.646209716796875, 3.7705695629119873]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 8.0, 12.0, 20.0, 21.0, 40.0, 43.0, 75.0, 118.0, 201.0, 270.0, 446.0, 753.0, 1254.0, 2168.0, 3897.0, 7795.0, 16462.0, 37349.0, 88790.0, 210077.0, 326745.0, 199994.0, 84234.0, 35627.0, 15628.0, 7339.0, 3846.0, 2159.0, 1229.0, 720.0, 419.0, 287.0, 169.0, 100.0, 91.0, 48.0, 36.0, 21.0, 17.0, 12.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.27288818359375, -5.0809326171875, -4.88897705078125, -4.697021484375, -4.50506591796875, -4.3131103515625, -4.12115478515625, -3.92919921875, -3.73724365234375, -3.5452880859375, -3.35333251953125, -3.161376953125, -2.96942138671875, -2.7774658203125, -2.58551025390625, -2.3935546875, -2.20159912109375, -2.0096435546875, -1.81768798828125, -1.625732421875, -1.43377685546875, -1.2418212890625, -1.04986572265625, -0.85791015625, -0.66595458984375, -0.4739990234375, -0.28204345703125, -0.090087890625, 0.10186767578125, 0.2938232421875, 0.48577880859375, 0.677734375, 0.86968994140625, 1.0616455078125, 1.25360107421875, 1.445556640625, 1.63751220703125, 1.8294677734375, 2.02142333984375, 2.21337890625, 2.40533447265625, 2.5972900390625, 2.78924560546875, 2.981201171875, 3.17315673828125, 3.3651123046875, 3.55706787109375, 3.7490234375, 3.94097900390625, 4.1329345703125, 4.32489013671875, 4.516845703125, 4.70880126953125, 4.9007568359375, 5.09271240234375, 5.28466796875, 5.47662353515625, 5.6685791015625, 5.86053466796875, 6.052490234375, 6.24444580078125, 6.4364013671875, 6.62835693359375, 6.8203125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 4.0, 9.0, 12.0, 11.0, 13.0, 9.0, 20.0, 15.0, 14.0, 22.0, 34.0, 20.0, 32.0, 30.0, 25.0, 30.0, 31.0, 40.0, 40.0, 46.0, 44.0, 37.0, 33.0, 45.0, 44.0, 30.0, 35.0, 21.0, 31.0, 24.0, 22.0, 18.0, 22.0, 19.0, 21.0, 14.0, 19.0, 13.0, 6.0, 9.0, 10.0, 3.0, 1.0, 9.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.728515625, -3.610595703125, -3.49267578125, -3.374755859375, -3.2568359375, -3.138916015625, -3.02099609375, -2.903076171875, -2.78515625, -2.667236328125, -2.54931640625, -2.431396484375, -2.3134765625, -2.195556640625, -2.07763671875, -1.959716796875, -1.841796875, -1.723876953125, -1.60595703125, -1.488037109375, -1.3701171875, -1.252197265625, -1.13427734375, -1.016357421875, -0.8984375, -0.780517578125, -0.66259765625, -0.544677734375, -0.4267578125, -0.308837890625, -0.19091796875, -0.072998046875, 0.044921875, 0.162841796875, 0.28076171875, 0.398681640625, 0.5166015625, 0.634521484375, 0.75244140625, 0.870361328125, 0.98828125, 1.106201171875, 1.22412109375, 1.342041015625, 1.4599609375, 1.577880859375, 1.69580078125, 1.813720703125, 1.931640625, 2.049560546875, 2.16748046875, 2.285400390625, 2.4033203125, 2.521240234375, 2.63916015625, 2.757080078125, 2.875, 2.992919921875, 3.11083984375, 3.228759765625, 3.3466796875, 3.464599609375, 3.58251953125, 3.700439453125, 3.818359375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 5.0, 12.0, 20.0, 27.0, 37.0, 52.0, 86.0, 98.0, 141.0, 180.0, 271.0, 363.0, 508.0, 722.0, 1086.0, 1759.0, 2833.0, 4528.0, 8055.0, 15187.0, 31146.0, 69167.0, 161390.0, 309219.0, 240138.0, 106288.0, 46141.0, 21544.0, 11107.0, 5991.0, 3616.0, 2211.0, 1424.0, 978.0, 662.0, 455.0, 333.0, 229.0, 148.0, 107.0, 80.0, 60.0, 48.0, 22.0, 23.0, 21.0, 11.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-4.29296875, -4.16943359375, -4.0458984375, -3.92236328125, -3.798828125, -3.67529296875, -3.5517578125, -3.42822265625, -3.3046875, -3.18115234375, -3.0576171875, -2.93408203125, -2.810546875, -2.68701171875, -2.5634765625, -2.43994140625, -2.31640625, -2.19287109375, -2.0693359375, -1.94580078125, -1.822265625, -1.69873046875, -1.5751953125, -1.45166015625, -1.328125, -1.20458984375, -1.0810546875, -0.95751953125, -0.833984375, -0.71044921875, -0.5869140625, -0.46337890625, -0.33984375, -0.21630859375, -0.0927734375, 0.03076171875, 0.154296875, 0.27783203125, 0.4013671875, 0.52490234375, 0.6484375, 0.77197265625, 0.8955078125, 1.01904296875, 1.142578125, 1.26611328125, 1.3896484375, 1.51318359375, 1.63671875, 1.76025390625, 1.8837890625, 2.00732421875, 2.130859375, 2.25439453125, 2.3779296875, 2.50146484375, 2.625, 2.74853515625, 2.8720703125, 2.99560546875, 3.119140625, 3.24267578125, 3.3662109375, 3.48974609375, 3.61328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 6.0, 8.0, 10.0, 12.0, 13.0, 13.0, 19.0, 13.0, 20.0, 19.0, 28.0, 28.0, 18.0, 27.0, 32.0, 42.0, 43.0, 24.0, 33.0, 31.0, 32.0, 39.0, 48.0, 38.0, 40.0, 42.0, 34.0, 41.0, 24.0, 34.0, 24.0, 21.0, 19.0, 20.0, 14.0, 15.0, 17.0, 7.0, 14.0, 7.0, 5.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.404296875, -2.32501220703125, -2.2457275390625, -2.16644287109375, -2.087158203125, -2.00787353515625, -1.9285888671875, -1.84930419921875, -1.77001953125, -1.69073486328125, -1.6114501953125, -1.53216552734375, -1.452880859375, -1.37359619140625, -1.2943115234375, -1.21502685546875, -1.1357421875, -1.05645751953125, -0.9771728515625, -0.89788818359375, -0.818603515625, -0.73931884765625, -0.6600341796875, -0.58074951171875, -0.50146484375, -0.42218017578125, -0.3428955078125, -0.26361083984375, -0.184326171875, -0.10504150390625, -0.0257568359375, 0.05352783203125, 0.1328125, 0.21209716796875, 0.2913818359375, 0.37066650390625, 0.449951171875, 0.52923583984375, 0.6085205078125, 0.68780517578125, 0.76708984375, 0.84637451171875, 0.9256591796875, 1.00494384765625, 1.084228515625, 1.16351318359375, 1.2427978515625, 1.32208251953125, 1.4013671875, 1.48065185546875, 1.5599365234375, 1.63922119140625, 1.718505859375, 1.79779052734375, 1.8770751953125, 1.95635986328125, 2.03564453125, 2.11492919921875, 2.1942138671875, 2.27349853515625, 2.352783203125, 2.43206787109375, 2.5113525390625, 2.59063720703125, 2.669921875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 7.0, 16.0, 29.0, 47.0, 63.0, 104.0, 187.0, 272.0, 453.0, 649.0, 1083.0, 1812.0, 3224.0, 6522.0, 15726.0, 61687.0, 695563.0, 210619.0, 29825.0, 10017.0, 4678.0, 2360.0, 1365.0, 771.0, 487.0, 339.0, 234.0, 136.0, 105.0, 58.0, 35.0, 22.0, 19.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.0645751953125, -5.867431640625, -5.6702880859375, -5.47314453125, -5.2760009765625, -5.078857421875, -4.8817138671875, -4.6845703125, -4.4874267578125, -4.290283203125, -4.0931396484375, -3.89599609375, -3.6988525390625, -3.501708984375, -3.3045654296875, -3.107421875, -2.9102783203125, -2.713134765625, -2.5159912109375, -2.31884765625, -2.1217041015625, -1.924560546875, -1.7274169921875, -1.5302734375, -1.3331298828125, -1.135986328125, -0.9388427734375, -0.74169921875, -0.5445556640625, -0.347412109375, -0.1502685546875, 0.046875, 0.2440185546875, 0.441162109375, 0.6383056640625, 0.83544921875, 1.0325927734375, 1.229736328125, 1.4268798828125, 1.6240234375, 1.8211669921875, 2.018310546875, 2.2154541015625, 2.41259765625, 2.6097412109375, 2.806884765625, 3.0040283203125, 3.201171875, 3.3983154296875, 3.595458984375, 3.7926025390625, 3.98974609375, 4.1868896484375, 4.384033203125, 4.5811767578125, 4.7783203125, 4.9754638671875, 5.172607421875, 5.3697509765625, 5.56689453125, 5.7640380859375, 5.961181640625, 6.1583251953125, 6.35546875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 10.0, 9.0, 22.0, 27.0, 68.0, 142.0, 287.0, 206.0, 94.0, 51.0, 20.0, 22.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008754730224609375, -0.0008528754115104675, -0.0008302778005599976, -0.0008076801896095276, -0.0007850825786590576, -0.0007624849677085876, -0.0007398873567581177, -0.0007172897458076477, -0.0006946921348571777, -0.0006720945239067078, -0.0006494969129562378, -0.0006268993020057678, -0.0006043016910552979, -0.0005817040801048279, -0.0005591064691543579, -0.0005365088582038879, -0.000513911247253418, -0.000491313636302948, -0.00046871602535247803, -0.00044611841440200806, -0.0004235208034515381, -0.0004009231925010681, -0.00037832558155059814, -0.0003557279706001282, -0.0003331303596496582, -0.00031053274869918823, -0.00028793513774871826, -0.0002653375267982483, -0.00024273991584777832, -0.00022014230489730835, -0.00019754469394683838, -0.0001749470829963684, -0.00015234947204589844, -0.00012975186109542847, -0.0001071542501449585, -8.455663919448853e-05, -6.195902824401855e-05, -3.9361417293548584e-05, -1.6763806343078613e-05, 5.833804607391357e-06, 2.8431415557861328e-05, 5.10290265083313e-05, 7.362663745880127e-05, 9.622424840927124e-05, 0.00011882185935974121, 0.00014141947031021118, 0.00016401708126068115, 0.00018661469221115112, 0.0002092123031616211, 0.00023180991411209106, 0.00025440752506256104, 0.000277005136013031, 0.000299602746963501, 0.00032220035791397095, 0.0003447979688644409, 0.0003673955798149109, 0.00038999319076538086, 0.00041259080171585083, 0.0004351884126663208, 0.00045778602361679077, 0.00048038363456726074, 0.0005029812455177307, 0.0005255788564682007, 0.0005481764674186707, 0.0005707740783691406]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 12.0, 16.0, 23.0, 32.0, 48.0, 52.0, 85.0, 126.0, 179.0, 230.0, 373.0, 496.0, 657.0, 986.0, 1409.0, 2205.0, 3412.0, 5424.0, 9344.0, 18558.0, 42486.0, 120809.0, 370820.0, 304261.0, 93817.0, 34234.0, 15770.0, 8360.0, 4780.0, 3125.0, 2008.0, 1319.0, 909.0, 615.0, 477.0, 316.0, 236.0, 145.0, 121.0, 87.0, 65.0, 37.0, 27.0, 17.0, 13.0, 9.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.935546875, -3.808135986328125, -3.68072509765625, -3.553314208984375, -3.4259033203125, -3.298492431640625, -3.17108154296875, -3.043670654296875, -2.916259765625, -2.788848876953125, -2.66143798828125, -2.534027099609375, -2.4066162109375, -2.279205322265625, -2.15179443359375, -2.024383544921875, -1.89697265625, -1.769561767578125, -1.64215087890625, -1.514739990234375, -1.3873291015625, -1.259918212890625, -1.13250732421875, -1.005096435546875, -0.877685546875, -0.750274658203125, -0.62286376953125, -0.495452880859375, -0.3680419921875, -0.240631103515625, -0.11322021484375, 0.014190673828125, 0.1416015625, 0.269012451171875, 0.39642333984375, 0.523834228515625, 0.6512451171875, 0.778656005859375, 0.90606689453125, 1.033477783203125, 1.160888671875, 1.288299560546875, 1.41571044921875, 1.543121337890625, 1.6705322265625, 1.797943115234375, 1.92535400390625, 2.052764892578125, 2.18017578125, 2.307586669921875, 2.43499755859375, 2.562408447265625, 2.6898193359375, 2.817230224609375, 2.94464111328125, 3.072052001953125, 3.199462890625, 3.326873779296875, 3.45428466796875, 3.581695556640625, 3.7091064453125, 3.836517333984375, 3.96392822265625, 4.091339111328125, 4.21875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 4.0, 4.0, 4.0, 4.0, 6.0, 15.0, 14.0, 19.0, 31.0, 40.0, 63.0, 49.0, 71.0, 72.0, 103.0, 92.0, 86.0, 69.0, 60.0, 46.0, 27.0, 25.0, 15.0, 13.0, 11.0, 8.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.97802734375, -0.95001220703125, -0.9219970703125, -0.89398193359375, -0.865966796875, -0.83795166015625, -0.8099365234375, -0.78192138671875, -0.75390625, -0.72589111328125, -0.6978759765625, -0.66986083984375, -0.641845703125, -0.61383056640625, -0.5858154296875, -0.55780029296875, -0.52978515625, -0.50177001953125, -0.4737548828125, -0.44573974609375, -0.417724609375, -0.38970947265625, -0.3616943359375, -0.33367919921875, -0.3056640625, -0.27764892578125, -0.2496337890625, -0.22161865234375, -0.193603515625, -0.16558837890625, -0.1375732421875, -0.10955810546875, -0.08154296875, -0.05352783203125, -0.0255126953125, 0.00250244140625, 0.030517578125, 0.05853271484375, 0.0865478515625, 0.11456298828125, 0.142578125, 0.17059326171875, 0.1986083984375, 0.22662353515625, 0.254638671875, 0.28265380859375, 0.3106689453125, 0.33868408203125, 0.36669921875, 0.39471435546875, 0.4227294921875, 0.45074462890625, 0.478759765625, 0.50677490234375, 0.5347900390625, 0.56280517578125, 0.5908203125, 0.61883544921875, 0.6468505859375, 0.67486572265625, 0.702880859375, 0.73089599609375, 0.7589111328125, 0.78692626953125, 0.81494140625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 8.0, 8.0, 14.0, 12.0, 10.0, 14.0, 18.0, 17.0, 30.0, 26.0, 30.0, 40.0, 45.0, 37.0, 37.0, 37.0, 35.0, 39.0, 49.0, 54.0, 49.0, 42.0, 33.0, 38.0, 24.0, 32.0, 32.0, 26.0, 31.0, 17.0, 24.0, 19.0, 11.0, 12.0, 6.0, 6.0, 13.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6007587909698486, -3.4782354831695557, -3.3557121753692627, -3.2331888675689697, -3.1106653213500977, -2.9881420135498047, -2.8656187057495117, -2.7430953979492188, -2.620572090148926, -2.498048782348633, -2.37552547454834, -2.253002166748047, -2.130478858947754, -2.007955551147461, -1.8854320049285889, -1.762908697128296, -1.640385389328003, -1.51786208152771, -1.395338773727417, -1.2728153467178345, -1.1502920389175415, -1.0277687311172485, -0.9052453637123108, -0.782721996307373, -0.6601986885070801, -0.5376753807067871, -0.41515201330184937, -0.292628675699234, -0.17010533809661865, -0.047582030296325684, 0.07494133710861206, 0.1974647045135498, 0.3199882507324219, 0.44251158833503723, 0.5650349259376526, 0.6875582933425903, 0.8100816011428833, 0.9326049089431763, 1.0551283359527588, 1.1776516437530518, 1.3001749515533447, 1.4226982593536377, 1.5452215671539307, 1.6677449941635132, 1.7902683019638062, 1.9127916097640991, 2.0353150367736816, 2.1578383445739746, 2.2803616523742676, 2.4028849601745605, 2.5254082679748535, 2.6479315757751465, 2.7704548835754395, 2.8929781913757324, 3.0155017375946045, 3.1380250453948975, 3.2605483531951904, 3.3830716609954834, 3.5055949687957764, 3.6281182765960693, 3.7506418228149414, 3.8731651306152344, 3.9956884384155273, 4.11821174621582, 4.240735054016113]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0, 13.0, 11.0, 7.0, 15.0, 12.0, 21.0, 12.0, 23.0, 17.0, 26.0, 25.0, 29.0, 33.0, 39.0, 30.0, 42.0, 40.0, 43.0, 52.0, 30.0, 38.0, 39.0, 41.0, 49.0, 39.0, 34.0, 34.0, 19.0, 25.0, 26.0, 23.0, 14.0, 15.0, 14.0, 12.0, 7.0, 3.0, 12.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.016229152679443, -3.8973805904388428, -3.778532028198242, -3.6596834659576416, -3.540834903717041, -3.4219865798950195, -3.303138017654419, -3.1842894554138184, -3.0654408931732178, -2.946592330932617, -2.8277437686920166, -2.708895206451416, -2.5900468826293945, -2.471198081970215, -2.3523497581481934, -2.2335011959075928, -2.114652633666992, -1.9958040714263916, -1.876955509185791, -1.75810706615448, -1.6392585039138794, -1.5204099416732788, -1.4015614986419678, -1.2827129364013672, -1.1638643741607666, -1.045015811920166, -0.9261673092842102, -0.8073188066482544, -0.6884702444076538, -0.5696216821670532, -0.4507731795310974, -0.3319246768951416, -0.21307611465454102, -0.09422758221626282, 0.02462095022201538, 0.14346948266029358, 0.2623180150985718, 0.38116657733917236, 0.5000150799751282, 0.618863582611084, 0.7377121448516846, 0.8565607070922852, 0.975409209728241, 1.0942577123641968, 1.2131062746047974, 1.331954836845398, 1.450803279876709, 1.5696518421173096, 1.6885004043579102, 1.8073489665985107, 1.9261975288391113, 2.045046091079712, 2.1638946533203125, 2.282742977142334, 2.4015915393829346, 2.520440101623535, 2.6392886638641357, 2.7581372261047363, 2.876985788345337, 2.9958343505859375, 3.114682674407959, 3.2335314750671387, 3.35237979888916, 3.4712283611297607, 3.5900769233703613]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 13.0, 12.0, 16.0, 31.0, 41.0, 61.0, 97.0, 136.0, 200.0, 310.0, 487.0, 710.0, 1082.0, 1701.0, 2751.0, 4259.0, 6712.0, 10392.0, 16315.0, 24860.0, 37364.0, 53346.0, 72787.0, 92835.0, 110228.0, 118796.0, 115629.0, 102177.0, 82811.0, 62211.0, 44310.0, 30027.0, 19990.0, 12816.0, 8378.0, 5220.0, 3376.0, 2107.0, 1356.0, 857.0, 602.0, 352.0, 246.0, 183.0, 134.0, 65.0, 48.0, 36.0, 20.0, 19.0, 13.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0], "bins": [-4.2578125, -4.12774658203125, -3.9976806640625, -3.86761474609375, -3.737548828125, -3.60748291015625, -3.4774169921875, -3.34735107421875, -3.21728515625, -3.08721923828125, -2.9571533203125, -2.82708740234375, -2.697021484375, -2.56695556640625, -2.4368896484375, -2.30682373046875, -2.1767578125, -2.04669189453125, -1.9166259765625, -1.78656005859375, -1.656494140625, -1.52642822265625, -1.3963623046875, -1.26629638671875, -1.13623046875, -1.00616455078125, -0.8760986328125, -0.74603271484375, -0.615966796875, -0.48590087890625, -0.3558349609375, -0.22576904296875, -0.095703125, 0.03436279296875, 0.1644287109375, 0.29449462890625, 0.424560546875, 0.55462646484375, 0.6846923828125, 0.81475830078125, 0.94482421875, 1.07489013671875, 1.2049560546875, 1.33502197265625, 1.465087890625, 1.59515380859375, 1.7252197265625, 1.85528564453125, 1.9853515625, 2.11541748046875, 2.2454833984375, 2.37554931640625, 2.505615234375, 2.63568115234375, 2.7657470703125, 2.89581298828125, 3.02587890625, 3.15594482421875, 3.2860107421875, 3.41607666015625, 3.546142578125, 3.67620849609375, 3.8062744140625, 3.93634033203125, 4.06640625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 11.0, 9.0, 16.0, 12.0, 15.0, 18.0, 30.0, 18.0, 19.0, 39.0, 23.0, 26.0, 35.0, 41.0, 40.0, 32.0, 43.0, 41.0, 42.0, 42.0, 46.0, 36.0, 46.0, 41.0, 38.0, 29.0, 26.0, 36.0, 26.0, 18.0, 16.0, 14.0, 14.0, 10.0, 10.0, 7.0, 4.0, 8.0, 1.0, 6.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.865234375, -3.747894287109375, -3.63055419921875, -3.513214111328125, -3.3958740234375, -3.278533935546875, -3.16119384765625, -3.043853759765625, -2.926513671875, -2.809173583984375, -2.69183349609375, -2.574493408203125, -2.4571533203125, -2.339813232421875, -2.22247314453125, -2.105133056640625, -1.98779296875, -1.870452880859375, -1.75311279296875, -1.635772705078125, -1.5184326171875, -1.401092529296875, -1.28375244140625, -1.166412353515625, -1.049072265625, -0.931732177734375, -0.81439208984375, -0.697052001953125, -0.5797119140625, -0.462371826171875, -0.34503173828125, -0.227691650390625, -0.1103515625, 0.006988525390625, 0.12432861328125, 0.241668701171875, 0.3590087890625, 0.476348876953125, 0.59368896484375, 0.711029052734375, 0.828369140625, 0.945709228515625, 1.06304931640625, 1.180389404296875, 1.2977294921875, 1.415069580078125, 1.53240966796875, 1.649749755859375, 1.76708984375, 1.884429931640625, 2.00177001953125, 2.119110107421875, 2.2364501953125, 2.353790283203125, 2.47113037109375, 2.588470458984375, 2.705810546875, 2.823150634765625, 2.94049072265625, 3.057830810546875, 3.1751708984375, 3.292510986328125, 3.40985107421875, 3.527191162109375, 3.64453125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 13.0, 14.0, 29.0, 43.0, 79.0, 125.0, 191.0, 292.0, 549.0, 790.0, 1393.0, 2312.0, 3759.0, 6144.0, 10282.0, 16606.0, 26349.0, 40187.0, 58723.0, 81777.0, 105485.0, 121920.0, 126443.0, 118413.0, 99664.0, 76025.0, 53878.0, 35964.0, 23340.0, 14671.0, 9080.0, 5587.0, 3328.0, 2023.0, 1261.0, 683.0, 440.0, 285.0, 152.0, 82.0, 72.0, 40.0, 23.0, 15.0, 10.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.15625, -4.0194091796875, -3.882568359375, -3.7457275390625, -3.60888671875, -3.4720458984375, -3.335205078125, -3.1983642578125, -3.0615234375, -2.9246826171875, -2.787841796875, -2.6510009765625, -2.51416015625, -2.3773193359375, -2.240478515625, -2.1036376953125, -1.966796875, -1.8299560546875, -1.693115234375, -1.5562744140625, -1.41943359375, -1.2825927734375, -1.145751953125, -1.0089111328125, -0.8720703125, -0.7352294921875, -0.598388671875, -0.4615478515625, -0.32470703125, -0.1878662109375, -0.051025390625, 0.0858154296875, 0.22265625, 0.3594970703125, 0.496337890625, 0.6331787109375, 0.77001953125, 0.9068603515625, 1.043701171875, 1.1805419921875, 1.3173828125, 1.4542236328125, 1.591064453125, 1.7279052734375, 1.86474609375, 2.0015869140625, 2.138427734375, 2.2752685546875, 2.412109375, 2.5489501953125, 2.685791015625, 2.8226318359375, 2.95947265625, 3.0963134765625, 3.233154296875, 3.3699951171875, 3.5068359375, 3.6436767578125, 3.780517578125, 3.9173583984375, 4.05419921875, 4.1910400390625, 4.327880859375, 4.4647216796875, 4.6015625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 6.0, 4.0, 10.0, 11.0, 18.0, 8.0, 11.0, 14.0, 22.0, 21.0, 31.0, 28.0, 31.0, 39.0, 36.0, 24.0, 37.0, 41.0, 41.0, 46.0, 44.0, 38.0, 44.0, 53.0, 29.0, 41.0, 36.0, 27.0, 20.0, 29.0, 25.0, 17.0, 18.0, 15.0, 21.0, 18.0, 11.0, 8.0, 8.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.303192138671875, -2.22552490234375, -2.147857666015625, -2.0701904296875, -1.992523193359375, -1.91485595703125, -1.837188720703125, -1.759521484375, -1.681854248046875, -1.60418701171875, -1.526519775390625, -1.4488525390625, -1.371185302734375, -1.29351806640625, -1.215850830078125, -1.13818359375, -1.060516357421875, -0.98284912109375, -0.905181884765625, -0.8275146484375, -0.749847412109375, -0.67218017578125, -0.594512939453125, -0.516845703125, -0.439178466796875, -0.36151123046875, -0.283843994140625, -0.2061767578125, -0.128509521484375, -0.05084228515625, 0.026824951171875, 0.1044921875, 0.182159423828125, 0.25982666015625, 0.337493896484375, 0.4151611328125, 0.492828369140625, 0.57049560546875, 0.648162841796875, 0.725830078125, 0.803497314453125, 0.88116455078125, 0.958831787109375, 1.0364990234375, 1.114166259765625, 1.19183349609375, 1.269500732421875, 1.34716796875, 1.424835205078125, 1.50250244140625, 1.580169677734375, 1.6578369140625, 1.735504150390625, 1.81317138671875, 1.890838623046875, 1.968505859375, 2.046173095703125, 2.12384033203125, 2.201507568359375, 2.2791748046875, 2.356842041015625, 2.43450927734375, 2.512176513671875, 2.58984375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 12.0, 13.0, 22.0, 19.0, 42.0, 54.0, 78.0, 110.0, 167.0, 191.0, 348.0, 452.0, 686.0, 991.0, 1628.0, 2673.0, 4959.0, 9748.0, 21169.0, 48439.0, 111224.0, 213081.0, 267553.0, 191670.0, 95153.0, 40639.0, 17735.0, 8366.0, 4438.0, 2430.0, 1563.0, 908.0, 598.0, 430.0, 284.0, 207.0, 155.0, 81.0, 72.0, 44.0, 36.0, 22.0, 20.0, 15.0, 15.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.25616455078125, -3.1490478515625, -3.04193115234375, -2.934814453125, -2.82769775390625, -2.7205810546875, -2.61346435546875, -2.50634765625, -2.39923095703125, -2.2921142578125, -2.18499755859375, -2.077880859375, -1.97076416015625, -1.8636474609375, -1.75653076171875, -1.6494140625, -1.54229736328125, -1.4351806640625, -1.32806396484375, -1.220947265625, -1.11383056640625, -1.0067138671875, -0.89959716796875, -0.79248046875, -0.68536376953125, -0.5782470703125, -0.47113037109375, -0.364013671875, -0.25689697265625, -0.1497802734375, -0.04266357421875, 0.064453125, 0.17156982421875, 0.2786865234375, 0.38580322265625, 0.492919921875, 0.60003662109375, 0.7071533203125, 0.81427001953125, 0.92138671875, 1.02850341796875, 1.1356201171875, 1.24273681640625, 1.349853515625, 1.45697021484375, 1.5640869140625, 1.67120361328125, 1.7783203125, 1.88543701171875, 1.9925537109375, 2.09967041015625, 2.206787109375, 2.31390380859375, 2.4210205078125, 2.52813720703125, 2.63525390625, 2.74237060546875, 2.8494873046875, 2.95660400390625, 3.063720703125, 3.17083740234375, 3.2779541015625, 3.38507080078125, 3.4921875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 13.0, 9.0, 9.0, 31.0, 27.0, 32.0, 57.0, 61.0, 71.0, 70.0, 68.0, 78.0, 82.0, 59.0, 62.0, 53.0, 31.0, 39.0, 28.0, 30.0, 22.0, 21.0, 5.0, 4.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003304481506347656, -0.00032163411378860474, -0.00031282007694244385, -0.00030400604009628296, -0.00029519200325012207, -0.0002863779664039612, -0.0002775639295578003, -0.0002687498927116394, -0.0002599358558654785, -0.0002511218190193176, -0.00024230778217315674, -0.00023349374532699585, -0.00022467970848083496, -0.00021586567163467407, -0.00020705163478851318, -0.0001982375979423523, -0.0001894235610961914, -0.00018060952425003052, -0.00017179548740386963, -0.00016298145055770874, -0.00015416741371154785, -0.00014535337686538696, -0.00013653934001922607, -0.00012772530317306519, -0.0001189112663269043, -0.00011009722948074341, -0.00010128319263458252, -9.246915578842163e-05, -8.365511894226074e-05, -7.484108209609985e-05, -6.602704524993896e-05, -5.7213008403778076e-05, -4.839897155761719e-05, -3.95849347114563e-05, -3.077089786529541e-05, -2.195686101913452e-05, -1.3142824172973633e-05, -4.328787326812744e-06, 4.4852495193481445e-06, 1.3299286365509033e-05, 2.2113323211669922e-05, 3.092736005783081e-05, 3.97413969039917e-05, 4.855543375015259e-05, 5.7369470596313477e-05, 6.618350744247437e-05, 7.499754428863525e-05, 8.381158113479614e-05, 9.262561798095703e-05, 0.00010143965482711792, 0.00011025369167327881, 0.0001190677285194397, 0.00012788176536560059, 0.00013669580221176147, 0.00014550983905792236, 0.00015432387590408325, 0.00016313791275024414, 0.00017195194959640503, 0.00018076598644256592, 0.0001895800232887268, 0.0001983940601348877, 0.00020720809698104858, 0.00021602213382720947, 0.00022483617067337036, 0.00023365020751953125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 20.0, 23.0, 54.0, 61.0, 86.0, 168.0, 233.0, 325.0, 496.0, 722.0, 1231.0, 2039.0, 3574.0, 6433.0, 11765.0, 22186.0, 41990.0, 77182.0, 129225.0, 180852.0, 194642.0, 155637.0, 98937.0, 55483.0, 29726.0, 15757.0, 8454.0, 4484.0, 2549.0, 1542.0, 862.0, 593.0, 395.0, 220.0, 184.0, 134.0, 81.0, 64.0, 42.0, 25.0, 21.0, 15.0, 13.0, 13.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4609375, -2.386871337890625, -2.31280517578125, -2.238739013671875, -2.1646728515625, -2.090606689453125, -2.01654052734375, -1.942474365234375, -1.868408203125, -1.794342041015625, -1.72027587890625, -1.646209716796875, -1.5721435546875, -1.498077392578125, -1.42401123046875, -1.349945068359375, -1.27587890625, -1.201812744140625, -1.12774658203125, -1.053680419921875, -0.9796142578125, -0.905548095703125, -0.83148193359375, -0.757415771484375, -0.683349609375, -0.609283447265625, -0.53521728515625, -0.461151123046875, -0.3870849609375, -0.313018798828125, -0.23895263671875, -0.164886474609375, -0.0908203125, -0.016754150390625, 0.05731201171875, 0.131378173828125, 0.2054443359375, 0.279510498046875, 0.35357666015625, 0.427642822265625, 0.501708984375, 0.575775146484375, 0.64984130859375, 0.723907470703125, 0.7979736328125, 0.872039794921875, 0.94610595703125, 1.020172119140625, 1.09423828125, 1.168304443359375, 1.24237060546875, 1.316436767578125, 1.3905029296875, 1.464569091796875, 1.53863525390625, 1.612701416015625, 1.686767578125, 1.760833740234375, 1.83489990234375, 1.908966064453125, 1.9830322265625, 2.057098388671875, 2.13116455078125, 2.205230712890625, 2.279296875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 7.0, 4.0, 9.0, 15.0, 12.0, 16.0, 13.0, 23.0, 22.0, 28.0, 31.0, 46.0, 37.0, 50.0, 47.0, 60.0, 49.0, 53.0, 49.0, 54.0, 60.0, 47.0, 46.0, 32.0, 36.0, 30.0, 24.0, 19.0, 15.0, 15.0, 9.0, 8.0, 5.0, 4.0, 7.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.79541015625, -0.7714614868164062, -0.7475128173828125, -0.7235641479492188, -0.699615478515625, -0.6756668090820312, -0.6517181396484375, -0.6277694702148438, -0.60382080078125, -0.5798721313476562, -0.5559234619140625, -0.5319747924804688, -0.508026123046875, -0.48407745361328125, -0.4601287841796875, -0.43618011474609375, -0.4122314453125, -0.38828277587890625, -0.3643341064453125, -0.34038543701171875, -0.316436767578125, -0.29248809814453125, -0.2685394287109375, -0.24459075927734375, -0.22064208984375, -0.19669342041015625, -0.1727447509765625, -0.14879608154296875, -0.124847412109375, -0.10089874267578125, -0.0769500732421875, -0.05300140380859375, -0.029052734375, -0.00510406494140625, 0.0188446044921875, 0.04279327392578125, 0.066741943359375, 0.09069061279296875, 0.1146392822265625, 0.13858795166015625, 0.16253662109375, 0.18648529052734375, 0.2104339599609375, 0.23438262939453125, 0.258331298828125, 0.28227996826171875, 0.3062286376953125, 0.33017730712890625, 0.3541259765625, 0.37807464599609375, 0.4020233154296875, 0.42597198486328125, 0.449920654296875, 0.47386932373046875, 0.4978179931640625, 0.5217666625976562, 0.54571533203125, 0.5696640014648438, 0.5936126708984375, 0.6175613403320312, 0.641510009765625, 0.6654586791992188, 0.6894073486328125, 0.7133560180664062, 0.7373046875]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 8.0, 14.0, 9.0, 8.0, 11.0, 12.0, 18.0, 22.0, 28.0, 24.0, 22.0, 37.0, 40.0, 45.0, 44.0, 44.0, 53.0, 47.0, 41.0, 45.0, 44.0, 46.0, 29.0, 41.0, 39.0, 22.0, 27.0, 25.0, 23.0, 21.0, 22.0, 11.0, 16.0, 13.0, 7.0, 9.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.6092023849487305, -3.489184856414795, -3.3691673278808594, -3.249149799346924, -3.1291322708129883, -3.0091147422790527, -2.889097213745117, -2.7690794467926025, -2.649061918258667, -2.5290443897247314, -2.409026861190796, -2.2890093326568604, -2.168991804122925, -2.04897403717041, -1.9289566278457642, -1.808938980102539, -1.688921570777893, -1.5689040422439575, -1.448886513710022, -1.3288688659667969, -1.2088513374328613, -1.0888338088989258, -0.9688162803649902, -0.8487986922264099, -0.7287811636924744, -0.6087636351585388, -0.4887460470199585, -0.36872851848602295, -0.24871096014976501, -0.12869340181350708, -0.008675873279571533, 0.11134171485900879, 0.23135924339294434, 0.35137680172920227, 0.4713943600654602, 0.5914118885993958, 0.7114294767379761, 0.8314470052719116, 0.9514645338058472, 1.0714821815490723, 1.1914997100830078, 1.3115172386169434, 1.431534767150879, 1.5515522956848145, 1.6715699434280396, 1.791587471961975, 1.9116050004959106, 2.0316226482391357, 2.151639938354492, 2.2716574668884277, 2.3916749954223633, 2.511692523956299, 2.6317100524902344, 2.75172758102417, 2.8717451095581055, 2.99176287651062, 3.1117804050445557, 3.231797933578491, 3.3518154621124268, 3.4718329906463623, 3.591850519180298, 3.7118682861328125, 3.831885814666748, 3.9519033432006836, 4.071920871734619]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 9.0, 8.0, 9.0, 15.0, 12.0, 14.0, 10.0, 10.0, 15.0, 23.0, 19.0, 34.0, 30.0, 37.0, 32.0, 44.0, 49.0, 31.0, 42.0, 45.0, 45.0, 35.0, 38.0, 36.0, 42.0, 33.0, 42.0, 26.0, 32.0, 17.0, 23.0, 20.0, 16.0, 22.0, 9.0, 12.0, 8.0, 14.0, 11.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.8113772869110107, -3.691875696182251, -3.572374105453491, -3.4528725147247314, -3.3333709239959717, -3.213869333267212, -3.094367742538452, -2.9748661518096924, -2.8553645610809326, -2.735862970352173, -2.616361379623413, -2.4968597888946533, -2.3773581981658936, -2.257856607437134, -2.138355016708374, -2.0188534259796143, -1.8993518352508545, -1.7798502445220947, -1.660348653793335, -1.5408470630645752, -1.4213454723358154, -1.3018438816070557, -1.182342290878296, -1.0628407001495361, -0.9433391094207764, -0.8238375186920166, -0.7043359279632568, -0.5848343372344971, -0.4653327465057373, -0.34583115577697754, -0.22632956504821777, -0.10682797431945801, 0.012673377990722656, 0.13217496871948242, 0.2516765594482422, 0.37117815017700195, 0.4906797409057617, 0.6101813316345215, 0.7296829223632812, 0.849184513092041, 0.9686861038208008, 1.0881876945495605, 1.2076892852783203, 1.32719087600708, 1.4466924667358398, 1.5661940574645996, 1.6856956481933594, 1.8051972389221191, 1.924698829650879, 2.0442004203796387, 2.1637020111083984, 2.283203601837158, 2.402705192565918, 2.5222067832946777, 2.6417083740234375, 2.7612099647521973, 2.880711555480957, 3.000213146209717, 3.1197147369384766, 3.2392163276672363, 3.358717918395996, 3.478219509124756, 3.5977210998535156, 3.7172226905822754, 3.836724281311035]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 10.0, 10.0, 8.0, 19.0, 29.0, 41.0, 71.0, 147.0, 202.0, 342.0, 498.0, 861.0, 1453.0, 2343.0, 3724.0, 6109.0, 9958.0, 16278.0, 26585.0, 42211.0, 67967.0, 107281.0, 166552.0, 249078.0, 354256.0, 459905.0, 533483.0, 541889.0, 477075.0, 374384.0, 267073.0, 179271.0, 115153.0, 72621.0, 45410.0, 28037.0, 16967.0, 10563.0, 6354.0, 3959.0, 2421.0, 1408.0, 870.0, 564.0, 318.0, 201.0, 123.0, 85.0, 52.0, 30.0, 14.0, 16.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.919921875, -2.826019287109375, -2.73211669921875, -2.638214111328125, -2.5443115234375, -2.450408935546875, -2.35650634765625, -2.262603759765625, -2.168701171875, -2.074798583984375, -1.98089599609375, -1.886993408203125, -1.7930908203125, -1.699188232421875, -1.60528564453125, -1.511383056640625, -1.41748046875, -1.323577880859375, -1.22967529296875, -1.135772705078125, -1.0418701171875, -0.947967529296875, -0.85406494140625, -0.760162353515625, -0.666259765625, -0.572357177734375, -0.47845458984375, -0.384552001953125, -0.2906494140625, -0.196746826171875, -0.10284423828125, -0.008941650390625, 0.0849609375, 0.178863525390625, 0.27276611328125, 0.366668701171875, 0.4605712890625, 0.554473876953125, 0.64837646484375, 0.742279052734375, 0.836181640625, 0.930084228515625, 1.02398681640625, 1.117889404296875, 1.2117919921875, 1.305694580078125, 1.39959716796875, 1.493499755859375, 1.58740234375, 1.681304931640625, 1.77520751953125, 1.869110107421875, 1.9630126953125, 2.056915283203125, 2.15081787109375, 2.244720458984375, 2.338623046875, 2.432525634765625, 2.52642822265625, 2.620330810546875, 2.7142333984375, 2.808135986328125, 2.90203857421875, 2.995941162109375, 3.08984375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 2.0, 7.0, 12.0, 10.0, 16.0, 8.0, 14.0, 13.0, 21.0, 20.0, 18.0, 27.0, 31.0, 44.0, 36.0, 37.0, 33.0, 38.0, 35.0, 42.0, 33.0, 51.0, 44.0, 40.0, 38.0, 29.0, 28.0, 27.0, 27.0, 24.0, 29.0, 20.0, 17.0, 22.0, 21.0, 21.0, 8.0, 12.0, 9.0, 5.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6171875, -2.526580810546875, -2.43597412109375, -2.345367431640625, -2.2547607421875, -2.164154052734375, -2.07354736328125, -1.982940673828125, -1.892333984375, -1.801727294921875, -1.71112060546875, -1.620513916015625, -1.5299072265625, -1.439300537109375, -1.34869384765625, -1.258087158203125, -1.16748046875, -1.076873779296875, -0.98626708984375, -0.895660400390625, -0.8050537109375, -0.714447021484375, -0.62384033203125, -0.533233642578125, -0.442626953125, -0.352020263671875, -0.26141357421875, -0.170806884765625, -0.0802001953125, 0.010406494140625, 0.10101318359375, 0.191619873046875, 0.2822265625, 0.372833251953125, 0.46343994140625, 0.554046630859375, 0.6446533203125, 0.735260009765625, 0.82586669921875, 0.916473388671875, 1.007080078125, 1.097686767578125, 1.18829345703125, 1.278900146484375, 1.3695068359375, 1.460113525390625, 1.55072021484375, 1.641326904296875, 1.73193359375, 1.822540283203125, 1.91314697265625, 2.003753662109375, 2.0943603515625, 2.184967041015625, 2.27557373046875, 2.366180419921875, 2.456787109375, 2.547393798828125, 2.63800048828125, 2.728607177734375, 2.8192138671875, 2.909820556640625, 3.00042724609375, 3.091033935546875, 3.181640625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 24.0, 29.0, 41.0, 67.0, 145.0, 267.0, 450.0, 807.0, 1671.0, 3110.0, 6082.0, 11950.0, 22364.0, 41566.0, 76856.0, 134260.0, 224595.0, 348208.0, 488313.0, 596026.0, 619137.0, 544317.0, 410737.0, 275480.0, 171091.0, 98577.0, 55544.0, 29649.0, 15491.0, 8332.0, 4204.0, 2271.0, 1262.0, 618.0, 307.0, 188.0, 102.0, 57.0, 37.0, 21.0, 7.0, 5.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.998046875, -3.8812255859375, -3.764404296875, -3.6475830078125, -3.53076171875, -3.4139404296875, -3.297119140625, -3.1802978515625, -3.0634765625, -2.9466552734375, -2.829833984375, -2.7130126953125, -2.59619140625, -2.4793701171875, -2.362548828125, -2.2457275390625, -2.12890625, -2.0120849609375, -1.895263671875, -1.7784423828125, -1.66162109375, -1.5447998046875, -1.427978515625, -1.3111572265625, -1.1943359375, -1.0775146484375, -0.960693359375, -0.8438720703125, -0.72705078125, -0.6102294921875, -0.493408203125, -0.3765869140625, -0.259765625, -0.1429443359375, -0.026123046875, 0.0906982421875, 0.20751953125, 0.3243408203125, 0.441162109375, 0.5579833984375, 0.6748046875, 0.7916259765625, 0.908447265625, 1.0252685546875, 1.14208984375, 1.2589111328125, 1.375732421875, 1.4925537109375, 1.609375, 1.7261962890625, 1.843017578125, 1.9598388671875, 2.07666015625, 2.1934814453125, 2.310302734375, 2.4271240234375, 2.5439453125, 2.6607666015625, 2.777587890625, 2.8944091796875, 3.01123046875, 3.1280517578125, 3.244873046875, 3.3616943359375, 3.478515625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 11.0, 14.0, 25.0, 28.0, 27.0, 54.0, 54.0, 71.0, 96.0, 82.0, 128.0, 155.0, 168.0, 216.0, 235.0, 258.0, 247.0, 242.0, 253.0, 255.0, 245.0, 203.0, 192.0, 173.0, 128.0, 123.0, 86.0, 73.0, 65.0, 35.0, 37.0, 26.0, 23.0, 10.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6337890625, -1.582061767578125, -1.53033447265625, -1.478607177734375, -1.4268798828125, -1.375152587890625, -1.32342529296875, -1.271697998046875, -1.219970703125, -1.168243408203125, -1.11651611328125, -1.064788818359375, -1.0130615234375, -0.961334228515625, -0.90960693359375, -0.857879638671875, -0.80615234375, -0.754425048828125, -0.70269775390625, -0.650970458984375, -0.5992431640625, -0.547515869140625, -0.49578857421875, -0.444061279296875, -0.392333984375, -0.340606689453125, -0.28887939453125, -0.237152099609375, -0.1854248046875, -0.133697509765625, -0.08197021484375, -0.030242919921875, 0.021484375, 0.073211669921875, 0.12493896484375, 0.176666259765625, 0.2283935546875, 0.280120849609375, 0.33184814453125, 0.383575439453125, 0.435302734375, 0.487030029296875, 0.53875732421875, 0.590484619140625, 0.6422119140625, 0.693939208984375, 0.74566650390625, 0.797393798828125, 0.84912109375, 0.900848388671875, 0.95257568359375, 1.004302978515625, 1.0560302734375, 1.107757568359375, 1.15948486328125, 1.211212158203125, 1.262939453125, 1.314666748046875, 1.36639404296875, 1.418121337890625, 1.4698486328125, 1.521575927734375, 1.57330322265625, 1.625030517578125, 1.6767578125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 6.0, 11.0, 8.0, 5.0, 9.0, 14.0, 16.0, 20.0, 27.0, 30.0, 16.0, 27.0, 49.0, 35.0, 40.0, 43.0, 49.0, 50.0, 49.0, 45.0, 39.0, 47.0, 53.0, 38.0, 43.0, 32.0, 35.0, 25.0, 18.0, 19.0, 20.0, 18.0, 18.0, 13.0, 6.0, 8.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.854025363922119, -3.737438917160034, -3.620852470397949, -3.5042660236358643, -3.3876795768737793, -3.2710931301116943, -3.1545066833496094, -3.0379204750061035, -2.9213337898254395, -2.8047473430633545, -2.6881608963012695, -2.5715744495391846, -2.4549880027770996, -2.3384015560150146, -2.2218151092529297, -2.105228900909424, -1.9886424541473389, -1.872056007385254, -1.755469560623169, -1.638883113861084, -1.522296667098999, -1.405710220336914, -1.2891238927841187, -1.1725374460220337, -1.0559509992599487, -0.9393645524978638, -0.8227781057357788, -0.7061917185783386, -0.5896052718162537, -0.4730188250541687, -0.3564324378967285, -0.23984599113464355, -0.1232595443725586, -0.006673112511634827, 0.10991331934928894, 0.2264997363090515, 0.3430861830711365, 0.45967262983322144, 0.5762590169906616, 0.6928454637527466, 0.8094319105148315, 0.9260183572769165, 1.0426048040390015, 1.1591911315917969, 1.2757775783538818, 1.3923640251159668, 1.5089504718780518, 1.6255369186401367, 1.7421233654022217, 1.8587098121643066, 1.9752962589263916, 2.0918827056884766, 2.2084691524505615, 2.3250555992126465, 2.4416418075561523, 2.5582284927368164, 2.6748147010803223, 2.7914011478424072, 2.907987594604492, 3.024574041366577, 3.141160488128662, 3.257746934890747, 3.374333381652832, 3.490919589996338, 3.607506275177002]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 1.0, 3.0, 5.0, 10.0, 8.0, 16.0, 14.0, 8.0, 17.0, 20.0, 20.0, 24.0, 27.0, 31.0, 34.0, 42.0, 29.0, 33.0, 36.0, 42.0, 40.0, 44.0, 50.0, 45.0, 44.0, 31.0, 33.0, 42.0, 34.0, 21.0, 32.0, 23.0, 24.0, 24.0, 14.0, 9.0, 10.0, 11.0, 12.0, 5.0, 9.0, 7.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.6561279296875, -3.55086612701416, -3.4456043243408203, -3.3403425216674805, -3.2350807189941406, -3.129818916320801, -3.024557113647461, -2.919295310974121, -2.8140335083007812, -2.7087717056274414, -2.6035099029541016, -2.4982481002807617, -2.392986297607422, -2.287724494934082, -2.182462692260742, -2.0772008895874023, -1.9719388484954834, -1.8666770458221436, -1.7614152431488037, -1.6561534404754639, -1.550891637802124, -1.4456298351287842, -1.3403679132461548, -1.235106110572815, -1.129844307899475, -1.0245825052261353, -0.9193207025527954, -0.8140588402748108, -0.708797037601471, -0.6035352349281311, -0.4982733726501465, -0.39301156997680664, -0.2877495288848877, -0.18248771131038666, -0.07722589373588562, 0.02803593873977661, 0.13329774141311646, 0.2385595440864563, 0.3438214063644409, 0.44908320903778076, 0.5543450117111206, 0.6596068143844604, 0.7648686170578003, 0.8701304793357849, 0.9753922820091248, 1.0806541442871094, 1.1859159469604492, 1.291177749633789, 1.396439552307129, 1.5017013549804688, 1.6069631576538086, 1.7122249603271484, 1.8174867630004883, 1.9227485656738281, 2.028010368347168, 2.133272171020508, 2.2385339736938477, 2.3437957763671875, 2.4490575790405273, 2.554319381713867, 2.659581184387207, 2.764842987060547, 2.8701047897338867, 2.9753665924072266, 3.0806286334991455]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 6.0, 19.0, 26.0, 49.0, 63.0, 96.0, 146.0, 222.0, 302.0, 430.0, 629.0, 925.0, 1337.0, 1958.0, 2953.0, 4453.0, 6807.0, 10514.0, 16383.0, 26178.0, 41741.0, 67147.0, 105428.0, 155079.0, 182426.0, 149921.0, 100633.0, 63528.0, 39225.0, 24912.0, 15551.0, 10067.0, 6485.0, 4162.0, 2790.0, 1890.0, 1256.0, 839.0, 613.0, 435.0, 278.0, 202.0, 164.0, 105.0, 62.0, 42.0, 28.0, 16.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.613372802734375, -2.52752685546875, -2.441680908203125, -2.3558349609375, -2.269989013671875, -2.18414306640625, -2.098297119140625, -2.012451171875, -1.926605224609375, -1.84075927734375, -1.754913330078125, -1.6690673828125, -1.583221435546875, -1.49737548828125, -1.411529541015625, -1.32568359375, -1.239837646484375, -1.15399169921875, -1.068145751953125, -0.9822998046875, -0.896453857421875, -0.81060791015625, -0.724761962890625, -0.638916015625, -0.553070068359375, -0.46722412109375, -0.381378173828125, -0.2955322265625, -0.209686279296875, -0.12384033203125, -0.037994384765625, 0.0478515625, 0.133697509765625, 0.21954345703125, 0.305389404296875, 0.3912353515625, 0.477081298828125, 0.56292724609375, 0.648773193359375, 0.734619140625, 0.820465087890625, 0.90631103515625, 0.992156982421875, 1.0780029296875, 1.163848876953125, 1.24969482421875, 1.335540771484375, 1.42138671875, 1.507232666015625, 1.59307861328125, 1.678924560546875, 1.7647705078125, 1.850616455078125, 1.93646240234375, 2.022308349609375, 2.108154296875, 2.194000244140625, 2.27984619140625, 2.365692138671875, 2.4515380859375, 2.537384033203125, 2.62322998046875, 2.709075927734375, 2.794921875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 4.0, 6.0, 11.0, 8.0, 15.0, 14.0, 17.0, 26.0, 20.0, 13.0, 27.0, 30.0, 27.0, 33.0, 37.0, 35.0, 45.0, 40.0, 47.0, 43.0, 40.0, 29.0, 46.0, 29.0, 39.0, 32.0, 31.0, 35.0, 25.0, 26.0, 32.0, 22.0, 22.0, 8.0, 14.0, 10.0, 7.0, 8.0, 11.0, 10.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.5625, -3.45538330078125, -3.3482666015625, -3.24114990234375, -3.134033203125, -3.02691650390625, -2.9197998046875, -2.81268310546875, -2.70556640625, -2.59844970703125, -2.4913330078125, -2.38421630859375, -2.277099609375, -2.16998291015625, -2.0628662109375, -1.95574951171875, -1.8486328125, -1.74151611328125, -1.6343994140625, -1.52728271484375, -1.420166015625, -1.31304931640625, -1.2059326171875, -1.09881591796875, -0.99169921875, -0.88458251953125, -0.7774658203125, -0.67034912109375, -0.563232421875, -0.45611572265625, -0.3489990234375, -0.24188232421875, -0.134765625, -0.02764892578125, 0.0794677734375, 0.18658447265625, 0.293701171875, 0.40081787109375, 0.5079345703125, 0.61505126953125, 0.72216796875, 0.82928466796875, 0.9364013671875, 1.04351806640625, 1.150634765625, 1.25775146484375, 1.3648681640625, 1.47198486328125, 1.5791015625, 1.68621826171875, 1.7933349609375, 1.90045166015625, 2.007568359375, 2.11468505859375, 2.2218017578125, 2.32891845703125, 2.43603515625, 2.54315185546875, 2.6502685546875, 2.75738525390625, 2.864501953125, 2.97161865234375, 3.0787353515625, 3.18585205078125, 3.29296875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 13.0, 6.0, 13.0, 30.0, 29.0, 47.0, 73.0, 107.0, 177.0, 238.0, 378.0, 578.0, 1010.0, 1621.0, 2760.0, 4887.0, 8876.0, 16460.0, 33230.0, 70466.0, 153697.0, 283381.0, 241621.0, 118397.0, 54255.0, 25792.0, 13323.0, 7056.0, 3998.0, 2349.0, 1389.0, 799.0, 488.0, 352.0, 199.0, 136.0, 98.0, 70.0, 45.0, 32.0, 16.0, 13.0, 12.0, 8.0, 8.0, 4.0, 6.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.973846435546875, -2.87738037109375, -2.780914306640625, -2.6844482421875, -2.587982177734375, -2.49151611328125, -2.395050048828125, -2.298583984375, -2.202117919921875, -2.10565185546875, -2.009185791015625, -1.9127197265625, -1.816253662109375, -1.71978759765625, -1.623321533203125, -1.52685546875, -1.430389404296875, -1.33392333984375, -1.237457275390625, -1.1409912109375, -1.044525146484375, -0.94805908203125, -0.851593017578125, -0.755126953125, -0.658660888671875, -0.56219482421875, -0.465728759765625, -0.3692626953125, -0.272796630859375, -0.17633056640625, -0.079864501953125, 0.0166015625, 0.113067626953125, 0.20953369140625, 0.305999755859375, 0.4024658203125, 0.498931884765625, 0.59539794921875, 0.691864013671875, 0.788330078125, 0.884796142578125, 0.98126220703125, 1.077728271484375, 1.1741943359375, 1.270660400390625, 1.36712646484375, 1.463592529296875, 1.56005859375, 1.656524658203125, 1.75299072265625, 1.849456787109375, 1.9459228515625, 2.042388916015625, 2.13885498046875, 2.235321044921875, 2.331787109375, 2.428253173828125, 2.52471923828125, 2.621185302734375, 2.7176513671875, 2.814117431640625, 2.91058349609375, 3.007049560546875, 3.103515625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 11.0, 7.0, 10.0, 10.0, 14.0, 11.0, 11.0, 26.0, 22.0, 20.0, 19.0, 43.0, 23.0, 30.0, 30.0, 31.0, 35.0, 30.0, 39.0, 39.0, 47.0, 37.0, 34.0, 44.0, 44.0, 41.0, 26.0, 40.0, 26.0, 25.0, 20.0, 26.0, 21.0, 11.0, 16.0, 12.0, 12.0, 10.0, 6.0, 6.0, 9.0, 9.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.01171875, -1.9432373046875, -1.874755859375, -1.8062744140625, -1.73779296875, -1.6693115234375, -1.600830078125, -1.5323486328125, -1.4638671875, -1.3953857421875, -1.326904296875, -1.2584228515625, -1.18994140625, -1.1214599609375, -1.052978515625, -0.9844970703125, -0.916015625, -0.8475341796875, -0.779052734375, -0.7105712890625, -0.64208984375, -0.5736083984375, -0.505126953125, -0.4366455078125, -0.3681640625, -0.2996826171875, -0.231201171875, -0.1627197265625, -0.09423828125, -0.0257568359375, 0.042724609375, 0.1112060546875, 0.1796875, 0.2481689453125, 0.316650390625, 0.3851318359375, 0.45361328125, 0.5220947265625, 0.590576171875, 0.6590576171875, 0.7275390625, 0.7960205078125, 0.864501953125, 0.9329833984375, 1.00146484375, 1.0699462890625, 1.138427734375, 1.2069091796875, 1.275390625, 1.3438720703125, 1.412353515625, 1.4808349609375, 1.54931640625, 1.6177978515625, 1.686279296875, 1.7547607421875, 1.8232421875, 1.8917236328125, 1.960205078125, 2.0286865234375, 2.09716796875, 2.1656494140625, 2.234130859375, 2.3026123046875, 2.37109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 10.0, 9.0, 13.0, 11.0, 25.0, 47.0, 61.0, 75.0, 98.0, 133.0, 199.0, 269.0, 348.0, 497.0, 724.0, 1111.0, 1626.0, 2412.0, 3848.0, 6490.0, 11274.0, 22789.0, 59159.0, 281531.0, 497077.0, 92870.0, 30456.0, 14030.0, 7763.0, 4579.0, 2891.0, 1921.0, 1232.0, 837.0, 602.0, 451.0, 302.0, 198.0, 160.0, 132.0, 70.0, 62.0, 41.0, 40.0, 24.0, 16.0, 8.0, 11.0, 5.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.455078125, -3.340576171875, -3.22607421875, -3.111572265625, -2.9970703125, -2.882568359375, -2.76806640625, -2.653564453125, -2.5390625, -2.424560546875, -2.31005859375, -2.195556640625, -2.0810546875, -1.966552734375, -1.85205078125, -1.737548828125, -1.623046875, -1.508544921875, -1.39404296875, -1.279541015625, -1.1650390625, -1.050537109375, -0.93603515625, -0.821533203125, -0.70703125, -0.592529296875, -0.47802734375, -0.363525390625, -0.2490234375, -0.134521484375, -0.02001953125, 0.094482421875, 0.208984375, 0.323486328125, 0.43798828125, 0.552490234375, 0.6669921875, 0.781494140625, 0.89599609375, 1.010498046875, 1.125, 1.239501953125, 1.35400390625, 1.468505859375, 1.5830078125, 1.697509765625, 1.81201171875, 1.926513671875, 2.041015625, 2.155517578125, 2.27001953125, 2.384521484375, 2.4990234375, 2.613525390625, 2.72802734375, 2.842529296875, 2.95703125, 3.071533203125, 3.18603515625, 3.300537109375, 3.4150390625, 3.529541015625, 3.64404296875, 3.758544921875, 3.873046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 0.0, 7.0, 6.0, 4.0, 6.0, 7.0, 16.0, 12.0, 23.0, 39.0, 40.0, 58.0, 94.0, 160.0, 164.0, 111.0, 69.0, 39.0, 31.0, 23.0, 13.0, 15.0, 8.0, 12.0, 9.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003421306610107422, -0.00032897666096687317, -0.00031582266092300415, -0.00030266866087913513, -0.0002895146608352661, -0.0002763606607913971, -0.0002632066607475281, -0.00025005266070365906, -0.00023689866065979004, -0.00022374466061592102, -0.000210590660572052, -0.00019743666052818298, -0.00018428266048431396, -0.00017112866044044495, -0.00015797466039657593, -0.0001448206603527069, -0.0001316666603088379, -0.00011851266026496887, -0.00010535866022109985, -9.220466017723083e-05, -7.905066013336182e-05, -6.58966600894928e-05, -5.274266004562378e-05, -3.958866000175476e-05, -2.6434659957885742e-05, -1.3280659914016724e-05, -1.2665987014770508e-07, 1.3027340173721313e-05, 2.6181340217590332e-05, 3.933534026145935e-05, 5.248934030532837e-05, 6.564334034919739e-05, 7.87973403930664e-05, 9.195134043693542e-05, 0.00010510534048080444, 0.00011825934052467346, 0.00013141334056854248, 0.0001445673406124115, 0.00015772134065628052, 0.00017087534070014954, 0.00018402934074401855, 0.00019718334078788757, 0.0002103373408317566, 0.0002234913408756256, 0.00023664534091949463, 0.00024979934096336365, 0.00026295334100723267, 0.0002761073410511017, 0.0002892613410949707, 0.0003024153411388397, 0.00031556934118270874, 0.00032872334122657776, 0.0003418773412704468, 0.0003550313413143158, 0.0003681853413581848, 0.00038133934140205383, 0.00039449334144592285, 0.00040764734148979187, 0.0004208013415336609, 0.0004339553415775299, 0.0004471093416213989, 0.00046026334166526794, 0.00047341734170913696, 0.000486571341753006, 0.000499725341796875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 11.0, 9.0, 16.0, 24.0, 49.0, 55.0, 81.0, 102.0, 168.0, 244.0, 350.0, 533.0, 827.0, 1240.0, 1911.0, 3218.0, 5084.0, 8338.0, 14519.0, 27435.0, 61338.0, 165420.0, 393606.0, 213638.0, 76011.0, 32646.0, 16700.0, 9547.0, 5602.0, 3580.0, 2175.0, 1437.0, 942.0, 560.0, 351.0, 257.0, 155.0, 103.0, 73.0, 63.0, 45.0, 29.0, 22.0, 11.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.375, -3.26824951171875, -3.1614990234375, -3.05474853515625, -2.947998046875, -2.84124755859375, -2.7344970703125, -2.62774658203125, -2.52099609375, -2.41424560546875, -2.3074951171875, -2.20074462890625, -2.093994140625, -1.98724365234375, -1.8804931640625, -1.77374267578125, -1.6669921875, -1.56024169921875, -1.4534912109375, -1.34674072265625, -1.239990234375, -1.13323974609375, -1.0264892578125, -0.91973876953125, -0.81298828125, -0.70623779296875, -0.5994873046875, -0.49273681640625, -0.385986328125, -0.27923583984375, -0.1724853515625, -0.06573486328125, 0.041015625, 0.14776611328125, 0.2545166015625, 0.36126708984375, 0.468017578125, 0.57476806640625, 0.6815185546875, 0.78826904296875, 0.89501953125, 1.00177001953125, 1.1085205078125, 1.21527099609375, 1.322021484375, 1.42877197265625, 1.5355224609375, 1.64227294921875, 1.7490234375, 1.85577392578125, 1.9625244140625, 2.06927490234375, 2.176025390625, 2.28277587890625, 2.3895263671875, 2.49627685546875, 2.60302734375, 2.70977783203125, 2.8165283203125, 2.92327880859375, 3.030029296875, 3.13677978515625, 3.2435302734375, 3.35028076171875, 3.45703125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 9.0, 5.0, 12.0, 14.0, 14.0, 27.0, 20.0, 21.0, 37.0, 30.0, 47.0, 74.0, 63.0, 89.0, 115.0, 86.0, 54.0, 54.0, 38.0, 48.0, 25.0, 17.0, 29.0, 12.0, 11.0, 12.0, 4.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77734375, -0.7531204223632812, -0.7288970947265625, -0.7046737670898438, -0.680450439453125, -0.6562271118164062, -0.6320037841796875, -0.6077804565429688, -0.58355712890625, -0.5593338012695312, -0.5351104736328125, -0.5108871459960938, -0.486663818359375, -0.46244049072265625, -0.4382171630859375, -0.41399383544921875, -0.3897705078125, -0.36554718017578125, -0.3413238525390625, -0.31710052490234375, -0.292877197265625, -0.26865386962890625, -0.2444305419921875, -0.22020721435546875, -0.19598388671875, -0.17176055908203125, -0.1475372314453125, -0.12331390380859375, -0.099090576171875, -0.07486724853515625, -0.0506439208984375, -0.02642059326171875, -0.002197265625, 0.02202606201171875, 0.0462493896484375, 0.07047271728515625, 0.094696044921875, 0.11891937255859375, 0.1431427001953125, 0.16736602783203125, 0.19158935546875, 0.21581268310546875, 0.2400360107421875, 0.26425933837890625, 0.288482666015625, 0.31270599365234375, 0.3369293212890625, 0.36115264892578125, 0.3853759765625, 0.40959930419921875, 0.4338226318359375, 0.45804595947265625, 0.482269287109375, 0.5064926147460938, 0.5307159423828125, 0.5549392700195312, 0.57916259765625, 0.6033859252929688, 0.6276092529296875, 0.6518325805664062, 0.676055908203125, 0.7002792358398438, 0.7245025634765625, 0.7487258911132812, 0.77294921875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 12.0, 15.0, 15.0, 17.0, 24.0, 34.0, 27.0, 23.0, 43.0, 46.0, 44.0, 48.0, 42.0, 54.0, 56.0, 53.0, 57.0, 54.0, 53.0, 43.0, 32.0, 45.0, 27.0, 21.0, 20.0, 17.0, 16.0, 8.0, 7.0, 7.0, 5.0, 3.0, 8.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.982191801071167, -3.8511953353881836, -3.7201988697052, -3.589202404022217, -3.4582056999206543, -3.327209234237671, -3.1962127685546875, -3.065216302871704, -2.9342198371887207, -2.8032233715057373, -2.672226905822754, -2.5412302017211914, -2.410233736038208, -2.2792372703552246, -2.148240804672241, -2.017244338989258, -1.8862476348876953, -1.755251169204712, -1.624254584312439, -1.4932581186294556, -1.3622615337371826, -1.2312650680541992, -1.1002686023712158, -0.9692720770835876, -0.8382755517959595, -0.7072790265083313, -0.5762825012207031, -0.4452860355377197, -0.31428951025009155, -0.18329298496246338, -0.05229651927947998, 0.0787000060081482, 0.20969676971435547, 0.34069329500198364, 0.47168979048728943, 0.6026862859725952, 0.7336828112602234, 0.8646793365478516, 0.995675802230835, 1.1266722679138184, 1.2576688528060913, 1.3886653184890747, 1.5196619033813477, 1.650658369064331, 1.7816548347473145, 1.9126514196395874, 2.0436477661132812, 2.1746444702148438, 2.305640935897827, 2.4366374015808105, 2.567633867263794, 2.6986303329467773, 2.82962703704834, 2.9606235027313232, 3.0916199684143066, 3.22261643409729, 3.3536128997802734, 3.484609365463257, 3.6156058311462402, 3.7466025352478027, 3.877599000930786, 4.0085954666137695, 4.139592170715332, 4.270588397979736, 4.401585102081299]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 3.0, 6.0, 13.0, 15.0, 16.0, 11.0, 12.0, 21.0, 27.0, 24.0, 25.0, 35.0, 37.0, 26.0, 43.0, 33.0, 39.0, 41.0, 47.0, 46.0, 46.0, 42.0, 40.0, 36.0, 27.0, 39.0, 34.0, 19.0, 31.0, 17.0, 32.0, 12.0, 22.0, 14.0, 9.0, 13.0, 10.0, 6.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.6701035499572754, -3.5632424354553223, -3.4563815593719482, -3.349520444869995, -3.242659330368042, -3.135798454284668, -3.028937339782715, -2.9220762252807617, -2.8152151107788086, -2.7083539962768555, -2.6014931201934814, -2.4946320056915283, -2.387770891189575, -2.280910015106201, -2.174048900604248, -2.067187786102295, -1.960326910018921, -1.8534659147262573, -1.7466048002243042, -1.6397438049316406, -1.5328826904296875, -1.426021695137024, -1.3191606998443604, -1.2122995853424072, -1.1054385900497437, -0.9985775351524353, -0.891716480255127, -0.7848554849624634, -0.677994430065155, -0.5711333751678467, -0.4642723798751831, -0.35741132497787476, -0.2505500316619873, -0.14368899166584015, -0.03682795166969299, 0.07003307342529297, 0.17689412832260132, 0.28375518321990967, 0.39061617851257324, 0.4974772334098816, 0.6043382883071899, 0.7111993432044983, 0.8180603981018066, 0.9249213933944702, 1.0317823886871338, 1.138643503189087, 1.2455044984817505, 1.352365493774414, 1.4592266082763672, 1.5660876035690308, 1.6729487180709839, 1.7798097133636475, 1.8866708278656006, 1.9935318231582642, 2.1003928184509277, 2.207253932952881, 2.314115047454834, 2.420976161956787, 2.527837038040161, 2.6346981525421143, 2.7415592670440674, 2.8484201431274414, 2.9552812576293945, 3.0621423721313477, 3.1690032482147217]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 9.0, 3.0, 2.0, 19.0, 13.0, 41.0, 60.0, 88.0, 153.0, 186.0, 323.0, 506.0, 689.0, 1133.0, 1786.0, 2650.0, 4091.0, 6081.0, 9229.0, 13578.0, 19701.0, 27911.0, 39051.0, 51711.0, 67357.0, 82172.0, 94945.0, 102395.0, 102096.0, 94698.0, 82118.0, 66362.0, 51554.0, 38081.0, 27809.0, 19560.0, 13222.0, 9183.0, 6142.0, 4073.0, 2701.0, 1830.0, 1139.0, 728.0, 537.0, 295.0, 193.0, 122.0, 88.0, 52.0, 34.0, 25.0, 19.0, 7.0, 8.0, 5.0, 2.0, 0.0, 3.0], "bins": [-3.361328125, -3.259429931640625, -3.15753173828125, -3.055633544921875, -2.9537353515625, -2.851837158203125, -2.74993896484375, -2.648040771484375, -2.546142578125, -2.444244384765625, -2.34234619140625, -2.240447998046875, -2.1385498046875, -2.036651611328125, -1.93475341796875, -1.832855224609375, -1.73095703125, -1.629058837890625, -1.52716064453125, -1.425262451171875, -1.3233642578125, -1.221466064453125, -1.11956787109375, -1.017669677734375, -0.915771484375, -0.813873291015625, -0.71197509765625, -0.610076904296875, -0.5081787109375, -0.406280517578125, -0.30438232421875, -0.202484130859375, -0.1005859375, 0.001312255859375, 0.10321044921875, 0.205108642578125, 0.3070068359375, 0.408905029296875, 0.51080322265625, 0.612701416015625, 0.714599609375, 0.816497802734375, 0.91839599609375, 1.020294189453125, 1.1221923828125, 1.224090576171875, 1.32598876953125, 1.427886962890625, 1.52978515625, 1.631683349609375, 1.73358154296875, 1.835479736328125, 1.9373779296875, 2.039276123046875, 2.14117431640625, 2.243072509765625, 2.344970703125, 2.446868896484375, 2.54876708984375, 2.650665283203125, 2.7525634765625, 2.854461669921875, 2.95635986328125, 3.058258056640625, 3.16015625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 5.0, 10.0, 10.0, 7.0, 13.0, 15.0, 21.0, 14.0, 23.0, 32.0, 39.0, 26.0, 33.0, 36.0, 32.0, 30.0, 33.0, 36.0, 38.0, 53.0, 39.0, 45.0, 36.0, 38.0, 34.0, 28.0, 41.0, 25.0, 32.0, 22.0, 29.0, 15.0, 21.0, 17.0, 10.0, 9.0, 18.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.447265625, -3.344970703125, -3.24267578125, -3.140380859375, -3.0380859375, -2.935791015625, -2.83349609375, -2.731201171875, -2.62890625, -2.526611328125, -2.42431640625, -2.322021484375, -2.2197265625, -2.117431640625, -2.01513671875, -1.912841796875, -1.810546875, -1.708251953125, -1.60595703125, -1.503662109375, -1.4013671875, -1.299072265625, -1.19677734375, -1.094482421875, -0.9921875, -0.889892578125, -0.78759765625, -0.685302734375, -0.5830078125, -0.480712890625, -0.37841796875, -0.276123046875, -0.173828125, -0.071533203125, 0.03076171875, 0.133056640625, 0.2353515625, 0.337646484375, 0.43994140625, 0.542236328125, 0.64453125, 0.746826171875, 0.84912109375, 0.951416015625, 1.0537109375, 1.156005859375, 1.25830078125, 1.360595703125, 1.462890625, 1.565185546875, 1.66748046875, 1.769775390625, 1.8720703125, 1.974365234375, 2.07666015625, 2.178955078125, 2.28125, 2.383544921875, 2.48583984375, 2.588134765625, 2.6904296875, 2.792724609375, 2.89501953125, 2.997314453125, 3.099609375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 25.0, 23.0, 54.0, 83.0, 93.0, 195.0, 318.0, 519.0, 810.0, 1446.0, 2322.0, 3945.0, 6564.0, 10437.0, 16807.0, 26084.0, 39631.0, 57727.0, 78152.0, 99556.0, 115591.0, 121551.0, 116269.0, 100996.0, 79646.0, 58073.0, 40366.0, 26835.0, 17084.0, 10741.0, 6526.0, 3997.0, 2389.0, 1450.0, 866.0, 535.0, 337.0, 198.0, 123.0, 66.0, 49.0, 19.0, 14.0, 14.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.681640625, -3.564849853515625, -3.44805908203125, -3.331268310546875, -3.2144775390625, -3.097686767578125, -2.98089599609375, -2.864105224609375, -2.747314453125, -2.630523681640625, -2.51373291015625, -2.396942138671875, -2.2801513671875, -2.163360595703125, -2.04656982421875, -1.929779052734375, -1.81298828125, -1.696197509765625, -1.57940673828125, -1.462615966796875, -1.3458251953125, -1.229034423828125, -1.11224365234375, -0.995452880859375, -0.878662109375, -0.761871337890625, -0.64508056640625, -0.528289794921875, -0.4114990234375, -0.294708251953125, -0.17791748046875, -0.061126708984375, 0.0556640625, 0.172454833984375, 0.28924560546875, 0.406036376953125, 0.5228271484375, 0.639617919921875, 0.75640869140625, 0.873199462890625, 0.989990234375, 1.106781005859375, 1.22357177734375, 1.340362548828125, 1.4571533203125, 1.573944091796875, 1.69073486328125, 1.807525634765625, 1.92431640625, 2.041107177734375, 2.15789794921875, 2.274688720703125, 2.3914794921875, 2.508270263671875, 2.62506103515625, 2.741851806640625, 2.858642578125, 2.975433349609375, 3.09222412109375, 3.209014892578125, 3.3258056640625, 3.442596435546875, 3.55938720703125, 3.676177978515625, 3.79296875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 1.0, 8.0, 12.0, 10.0, 10.0, 12.0, 21.0, 17.0, 24.0, 21.0, 25.0, 16.0, 29.0, 36.0, 32.0, 46.0, 37.0, 43.0, 37.0, 43.0, 50.0, 36.0, 43.0, 41.0, 40.0, 39.0, 28.0, 33.0, 31.0, 26.0, 19.0, 27.0, 15.0, 12.0, 15.0, 14.0, 6.0, 10.0, 9.0, 5.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.171875, -2.103607177734375, -2.03533935546875, -1.967071533203125, -1.8988037109375, -1.830535888671875, -1.76226806640625, -1.694000244140625, -1.625732421875, -1.557464599609375, -1.48919677734375, -1.420928955078125, -1.3526611328125, -1.284393310546875, -1.21612548828125, -1.147857666015625, -1.07958984375, -1.011322021484375, -0.94305419921875, -0.874786376953125, -0.8065185546875, -0.738250732421875, -0.66998291015625, -0.601715087890625, -0.533447265625, -0.465179443359375, -0.39691162109375, -0.328643798828125, -0.2603759765625, -0.192108154296875, -0.12384033203125, -0.055572509765625, 0.0126953125, 0.080963134765625, 0.14923095703125, 0.217498779296875, 0.2857666015625, 0.354034423828125, 0.42230224609375, 0.490570068359375, 0.558837890625, 0.627105712890625, 0.69537353515625, 0.763641357421875, 0.8319091796875, 0.900177001953125, 0.96844482421875, 1.036712646484375, 1.10498046875, 1.173248291015625, 1.24151611328125, 1.309783935546875, 1.3780517578125, 1.446319580078125, 1.51458740234375, 1.582855224609375, 1.651123046875, 1.719390869140625, 1.78765869140625, 1.855926513671875, 1.9241943359375, 1.992462158203125, 2.06072998046875, 2.128997802734375, 2.197265625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 7.0, 9.0, 14.0, 26.0, 35.0, 54.0, 74.0, 114.0, 171.0, 214.0, 309.0, 464.0, 659.0, 1069.0, 1631.0, 2518.0, 4450.0, 8460.0, 17438.0, 38248.0, 89579.0, 190745.0, 277061.0, 217166.0, 107261.0, 46866.0, 20808.0, 9741.0, 5282.0, 2869.0, 1758.0, 1043.0, 773.0, 482.0, 371.0, 228.0, 183.0, 123.0, 83.0, 43.0, 30.0, 25.0, 27.0, 17.0, 12.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.968170166015625, -3.84649658203125, -3.724822998046875, -3.6031494140625, -3.481475830078125, -3.35980224609375, -3.238128662109375, -3.116455078125, -2.994781494140625, -2.87310791015625, -2.751434326171875, -2.6297607421875, -2.508087158203125, -2.38641357421875, -2.264739990234375, -2.14306640625, -2.021392822265625, -1.89971923828125, -1.778045654296875, -1.6563720703125, -1.534698486328125, -1.41302490234375, -1.291351318359375, -1.169677734375, -1.048004150390625, -0.92633056640625, -0.804656982421875, -0.6829833984375, -0.561309814453125, -0.43963623046875, -0.317962646484375, -0.1962890625, -0.074615478515625, 0.04705810546875, 0.168731689453125, 0.2904052734375, 0.412078857421875, 0.53375244140625, 0.655426025390625, 0.777099609375, 0.898773193359375, 1.02044677734375, 1.142120361328125, 1.2637939453125, 1.385467529296875, 1.50714111328125, 1.628814697265625, 1.75048828125, 1.872161865234375, 1.99383544921875, 2.115509033203125, 2.2371826171875, 2.358856201171875, 2.48052978515625, 2.602203369140625, 2.723876953125, 2.845550537109375, 2.96722412109375, 3.088897705078125, 3.2105712890625, 3.332244873046875, 3.45391845703125, 3.575592041015625, 3.697265625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 9.0, 23.0, 20.0, 38.0, 32.0, 57.0, 57.0, 95.0, 85.0, 123.0, 93.0, 78.0, 56.0, 70.0, 35.0, 29.0, 25.0, 16.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0005211830139160156, -0.0005088746547698975, -0.0004965662956237793, -0.00048425793647766113, -0.00047194957733154297, -0.0004596412181854248, -0.00044733285903930664, -0.0004350244998931885, -0.0004227161407470703, -0.00041040778160095215, -0.000398099422454834, -0.0003857910633087158, -0.00037348270416259766, -0.0003611743450164795, -0.00034886598587036133, -0.00033655762672424316, -0.000324249267578125, -0.00031194090843200684, -0.00029963254928588867, -0.0002873241901397705, -0.00027501583099365234, -0.0002627074718475342, -0.000250399112701416, -0.00023809075355529785, -0.0002257823944091797, -0.00021347403526306152, -0.00020116567611694336, -0.0001888573169708252, -0.00017654895782470703, -0.00016424059867858887, -0.0001519322395324707, -0.00013962388038635254, -0.00012731552124023438, -0.00011500716209411621, -0.00010269880294799805, -9.039044380187988e-05, -7.808208465576172e-05, -6.577372550964355e-05, -5.346536636352539e-05, -4.1157007217407227e-05, -2.8848648071289062e-05, -1.65402889251709e-05, -4.231929779052734e-06, 8.07642936706543e-06, 2.0384788513183594e-05, 3.269314765930176e-05, 4.500150680541992e-05, 5.7309865951538086e-05, 6.961822509765625e-05, 8.192658424377441e-05, 9.423494338989258e-05, 0.00010654330253601074, 0.0001188516616821289, 0.00013116002082824707, 0.00014346837997436523, 0.0001557767391204834, 0.00016808509826660156, 0.00018039345741271973, 0.0001927018165588379, 0.00020501017570495605, 0.00021731853485107422, 0.00022962689399719238, 0.00024193525314331055, 0.0002542436122894287, 0.0002665519714355469]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 10.0, 20.0, 27.0, 33.0, 48.0, 85.0, 124.0, 174.0, 317.0, 464.0, 704.0, 1134.0, 1798.0, 3086.0, 5074.0, 8710.0, 14711.0, 24937.0, 41823.0, 68069.0, 102617.0, 138919.0, 159228.0, 150393.0, 117837.0, 81310.0, 51355.0, 30510.0, 18253.0, 10589.0, 6284.0, 3758.0, 2324.0, 1433.0, 816.0, 580.0, 329.0, 230.0, 150.0, 95.0, 63.0, 52.0, 26.0, 18.0, 14.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0703125, -2.0050048828125, -1.939697265625, -1.8743896484375, -1.80908203125, -1.7437744140625, -1.678466796875, -1.6131591796875, -1.5478515625, -1.4825439453125, -1.417236328125, -1.3519287109375, -1.28662109375, -1.2213134765625, -1.156005859375, -1.0906982421875, -1.025390625, -0.9600830078125, -0.894775390625, -0.8294677734375, -0.76416015625, -0.6988525390625, -0.633544921875, -0.5682373046875, -0.5029296875, -0.4376220703125, -0.372314453125, -0.3070068359375, -0.24169921875, -0.1763916015625, -0.111083984375, -0.0457763671875, 0.01953125, 0.0848388671875, 0.150146484375, 0.2154541015625, 0.28076171875, 0.3460693359375, 0.411376953125, 0.4766845703125, 0.5419921875, 0.6072998046875, 0.672607421875, 0.7379150390625, 0.80322265625, 0.8685302734375, 0.933837890625, 0.9991455078125, 1.064453125, 1.1297607421875, 1.195068359375, 1.2603759765625, 1.32568359375, 1.3909912109375, 1.456298828125, 1.5216064453125, 1.5869140625, 1.6522216796875, 1.717529296875, 1.7828369140625, 1.84814453125, 1.9134521484375, 1.978759765625, 2.0440673828125, 2.109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 8.0, 7.0, 23.0, 14.0, 19.0, 19.0, 25.0, 28.0, 42.0, 45.0, 67.0, 62.0, 57.0, 51.0, 63.0, 66.0, 62.0, 56.0, 50.0, 41.0, 29.0, 35.0, 25.0, 19.0, 17.0, 19.0, 12.0, 9.0, 5.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77783203125, -0.750335693359375, -0.72283935546875, -0.695343017578125, -0.6678466796875, -0.640350341796875, -0.61285400390625, -0.585357666015625, -0.557861328125, -0.530364990234375, -0.50286865234375, -0.475372314453125, -0.4478759765625, -0.420379638671875, -0.39288330078125, -0.365386962890625, -0.337890625, -0.310394287109375, -0.28289794921875, -0.255401611328125, -0.2279052734375, -0.200408935546875, -0.17291259765625, -0.145416259765625, -0.117919921875, -0.090423583984375, -0.06292724609375, -0.035430908203125, -0.0079345703125, 0.019561767578125, 0.04705810546875, 0.074554443359375, 0.10205078125, 0.129547119140625, 0.15704345703125, 0.184539794921875, 0.2120361328125, 0.239532470703125, 0.26702880859375, 0.294525146484375, 0.322021484375, 0.349517822265625, 0.37701416015625, 0.404510498046875, 0.4320068359375, 0.459503173828125, 0.48699951171875, 0.514495849609375, 0.5419921875, 0.569488525390625, 0.59698486328125, 0.624481201171875, 0.6519775390625, 0.679473876953125, 0.70697021484375, 0.734466552734375, 0.761962890625, 0.789459228515625, 0.81695556640625, 0.844451904296875, 0.8719482421875, 0.899444580078125, 0.92694091796875, 0.954437255859375, 0.98193359375]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 8.0, 8.0, 12.0, 16.0, 12.0, 11.0, 9.0, 20.0, 20.0, 26.0, 29.0, 31.0, 44.0, 31.0, 44.0, 47.0, 43.0, 34.0, 38.0, 56.0, 45.0, 43.0, 42.0, 34.0, 39.0, 44.0, 30.0, 23.0, 20.0, 15.0, 23.0, 18.0, 13.0, 10.0, 12.0, 10.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.3753297328948975, -3.2676143646240234, -3.1598987579345703, -3.0521833896636963, -2.9444680213928223, -2.8367526531219482, -2.729037284851074, -2.621321678161621, -2.513606309890747, -2.405890941619873, -2.29817533493042, -2.190459966659546, -2.082744598388672, -1.9750292301177979, -1.8673137426376343, -1.7595982551574707, -1.6518828868865967, -1.5441675186157227, -1.436452031135559, -1.3287365436553955, -1.2210211753845215, -1.1133058071136475, -1.0055903196334839, -0.8978748917579651, -0.7901594638824463, -0.6824440360069275, -0.5747286081314087, -0.4670131802558899, -0.3592977523803711, -0.2515823245048523, -0.1438668966293335, -0.0361514687538147, 0.0715641975402832, 0.179279625415802, 0.2869950532913208, 0.3947104811668396, 0.5024259090423584, 0.6101413369178772, 0.717856764793396, 0.8255721926689148, 0.9332876205444336, 1.0410029888153076, 1.1487184762954712, 1.2564339637756348, 1.3641493320465088, 1.4718647003173828, 1.5795801877975464, 1.68729567527771, 1.795011043548584, 1.902726411819458, 2.010441780090332, 2.118157386779785, 2.225872755050659, 2.333588123321533, 2.4413037300109863, 2.5490190982818604, 2.6567344665527344, 2.7644498348236084, 2.8721652030944824, 2.9798808097839355, 3.0875961780548096, 3.1953115463256836, 3.3030271530151367, 3.4107425212860107, 3.5184578895568848]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 8.0, 8.0, 7.0, 13.0, 15.0, 25.0, 21.0, 14.0, 22.0, 27.0, 29.0, 25.0, 34.0, 38.0, 31.0, 39.0, 52.0, 41.0, 37.0, 47.0, 37.0, 49.0, 57.0, 22.0, 32.0, 34.0, 26.0, 19.0, 26.0, 23.0, 21.0, 12.0, 10.0, 19.0, 19.0, 12.0, 8.0, 9.0, 5.0, 2.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.945760726928711, -2.8403706550598145, -2.734980583190918, -2.6295905113220215, -2.524200677871704, -2.4188106060028076, -2.313420534133911, -2.2080304622650146, -2.1026406288146973, -1.9972505569458008, -1.8918606042861938, -1.7864705324172974, -1.6810805797576904, -1.575690507888794, -1.4703004360198975, -1.364910364151001, -1.2595202922821045, -1.154130220413208, -1.048740267753601, -0.9433501958847046, -0.8379601836204529, -0.7325701713562012, -0.6271800994873047, -0.521790087223053, -0.41640007495880127, -0.31101006269454956, -0.20562002062797546, -0.10022997856140137, 0.005160033702850342, 0.11055004596710205, 0.21594011783599854, 0.32133013010025024, 0.42672038078308105, 0.5321103930473328, 0.6375004053115845, 0.742890477180481, 0.8482804894447327, 0.9536705017089844, 1.0590605735778809, 1.1644506454467773, 1.2698405981063843, 1.3752306699752808, 1.4806206226348877, 1.5860106945037842, 1.6914007663726807, 1.7967907190322876, 1.902180790901184, 2.007570743560791, 2.1129608154296875, 2.218350887298584, 2.3237409591674805, 2.429131031036377, 2.5345208644866943, 2.639910936355591, 2.7453010082244873, 2.850691080093384, 2.956080913543701, 3.0614709854125977, 3.166861057281494, 3.2722511291503906, 3.377640962600708, 3.4830310344696045, 3.588421106338501, 3.6938111782073975, 3.799201250076294]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 9.0, 13.0, 42.0, 50.0, 90.0, 144.0, 253.0, 415.0, 766.0, 1288.0, 2212.0, 3723.0, 6901.0, 12516.0, 22660.0, 40935.0, 75409.0, 135952.0, 239532.0, 395004.0, 572624.0, 692871.0, 669715.0, 520854.0, 343113.0, 202895.0, 114621.0, 62913.0, 34303.0, 18776.0, 10421.0, 5706.0, 3186.0, 1796.0, 1026.0, 627.0, 345.0, 204.0, 152.0, 86.0, 39.0, 32.0, 23.0, 12.0, 7.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-3.263671875, -3.15789794921875, -3.0521240234375, -2.94635009765625, -2.840576171875, -2.73480224609375, -2.6290283203125, -2.52325439453125, -2.41748046875, -2.31170654296875, -2.2059326171875, -2.10015869140625, -1.994384765625, -1.88861083984375, -1.7828369140625, -1.67706298828125, -1.5712890625, -1.46551513671875, -1.3597412109375, -1.25396728515625, -1.148193359375, -1.04241943359375, -0.9366455078125, -0.83087158203125, -0.72509765625, -0.61932373046875, -0.5135498046875, -0.40777587890625, -0.302001953125, -0.19622802734375, -0.0904541015625, 0.01531982421875, 0.12109375, 0.22686767578125, 0.3326416015625, 0.43841552734375, 0.544189453125, 0.64996337890625, 0.7557373046875, 0.86151123046875, 0.96728515625, 1.07305908203125, 1.1788330078125, 1.28460693359375, 1.390380859375, 1.49615478515625, 1.6019287109375, 1.70770263671875, 1.8134765625, 1.91925048828125, 2.0250244140625, 2.13079833984375, 2.236572265625, 2.34234619140625, 2.4481201171875, 2.55389404296875, 2.65966796875, 2.76544189453125, 2.8712158203125, 2.97698974609375, 3.082763671875, 3.18853759765625, 3.2943115234375, 3.40008544921875, 3.505859375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 5.0, 7.0, 7.0, 6.0, 18.0, 16.0, 17.0, 16.0, 21.0, 21.0, 17.0, 23.0, 33.0, 27.0, 42.0, 40.0, 32.0, 45.0, 51.0, 40.0, 53.0, 42.0, 36.0, 51.0, 48.0, 40.0, 26.0, 27.0, 27.0, 23.0, 15.0, 23.0, 16.0, 23.0, 13.0, 12.0, 7.0, 8.0, 4.0, 6.0, 6.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.29656982421875, -2.2122802734375, -2.12799072265625, -2.043701171875, -1.95941162109375, -1.8751220703125, -1.79083251953125, -1.70654296875, -1.62225341796875, -1.5379638671875, -1.45367431640625, -1.369384765625, -1.28509521484375, -1.2008056640625, -1.11651611328125, -1.0322265625, -0.94793701171875, -0.8636474609375, -0.77935791015625, -0.695068359375, -0.61077880859375, -0.5264892578125, -0.44219970703125, -0.35791015625, -0.27362060546875, -0.1893310546875, -0.10504150390625, -0.020751953125, 0.06353759765625, 0.1478271484375, 0.23211669921875, 0.31640625, 0.40069580078125, 0.4849853515625, 0.56927490234375, 0.653564453125, 0.73785400390625, 0.8221435546875, 0.90643310546875, 0.99072265625, 1.07501220703125, 1.1593017578125, 1.24359130859375, 1.327880859375, 1.41217041015625, 1.4964599609375, 1.58074951171875, 1.6650390625, 1.74932861328125, 1.8336181640625, 1.91790771484375, 2.002197265625, 2.08648681640625, 2.1707763671875, 2.25506591796875, 2.33935546875, 2.42364501953125, 2.5079345703125, 2.59222412109375, 2.676513671875, 2.76080322265625, 2.8450927734375, 2.92938232421875, 3.013671875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 28.0, 29.0, 44.0, 66.0, 110.0, 171.0, 317.0, 460.0, 730.0, 1145.0, 1851.0, 3119.0, 4697.0, 7517.0, 11720.0, 18551.0, 28126.0, 44187.0, 65869.0, 98796.0, 142659.0, 201026.0, 270242.0, 344086.0, 409945.0, 450180.0, 448690.0, 407470.0, 342459.0, 268034.0, 197844.0, 140808.0, 96534.0, 65353.0, 43292.0, 28456.0, 17860.0, 11682.0, 7422.0, 4683.0, 2922.0, 1929.0, 1211.0, 743.0, 440.0, 297.0, 170.0, 104.0, 83.0, 37.0, 30.0, 24.0, 10.0, 10.0, 5.0, 5.0, 1.0], "bins": [-2.427734375, -2.3541259765625, -2.280517578125, -2.2069091796875, -2.13330078125, -2.0596923828125, -1.986083984375, -1.9124755859375, -1.8388671875, -1.7652587890625, -1.691650390625, -1.6180419921875, -1.54443359375, -1.4708251953125, -1.397216796875, -1.3236083984375, -1.25, -1.1763916015625, -1.102783203125, -1.0291748046875, -0.95556640625, -0.8819580078125, -0.808349609375, -0.7347412109375, -0.6611328125, -0.5875244140625, -0.513916015625, -0.4403076171875, -0.36669921875, -0.2930908203125, -0.219482421875, -0.1458740234375, -0.072265625, 0.0013427734375, 0.074951171875, 0.1485595703125, 0.22216796875, 0.2957763671875, 0.369384765625, 0.4429931640625, 0.5166015625, 0.5902099609375, 0.663818359375, 0.7374267578125, 0.81103515625, 0.8846435546875, 0.958251953125, 1.0318603515625, 1.10546875, 1.1790771484375, 1.252685546875, 1.3262939453125, 1.39990234375, 1.4735107421875, 1.547119140625, 1.6207275390625, 1.6943359375, 1.7679443359375, 1.841552734375, 1.9151611328125, 1.98876953125, 2.0623779296875, 2.135986328125, 2.2095947265625, 2.283203125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 1.0, 6.0, 8.0, 13.0, 20.0, 15.0, 15.0, 32.0, 43.0, 63.0, 44.0, 59.0, 69.0, 90.0, 91.0, 114.0, 138.0, 152.0, 169.0, 176.0, 178.0, 220.0, 212.0, 223.0, 223.0, 204.0, 178.0, 187.0, 160.0, 173.0, 117.0, 122.0, 101.0, 71.0, 77.0, 70.0, 59.0, 44.0, 23.0, 23.0, 20.0, 18.0, 14.0, 11.0, 6.0, 10.0, 4.0, 8.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2314453125, -1.195556640625, -1.15966796875, -1.123779296875, -1.087890625, -1.052001953125, -1.01611328125, -0.980224609375, -0.9443359375, -0.908447265625, -0.87255859375, -0.836669921875, -0.80078125, -0.764892578125, -0.72900390625, -0.693115234375, -0.6572265625, -0.621337890625, -0.58544921875, -0.549560546875, -0.513671875, -0.477783203125, -0.44189453125, -0.406005859375, -0.3701171875, -0.334228515625, -0.29833984375, -0.262451171875, -0.2265625, -0.190673828125, -0.15478515625, -0.118896484375, -0.0830078125, -0.047119140625, -0.01123046875, 0.024658203125, 0.060546875, 0.096435546875, 0.13232421875, 0.168212890625, 0.2041015625, 0.239990234375, 0.27587890625, 0.311767578125, 0.34765625, 0.383544921875, 0.41943359375, 0.455322265625, 0.4912109375, 0.527099609375, 0.56298828125, 0.598876953125, 0.634765625, 0.670654296875, 0.70654296875, 0.742431640625, 0.7783203125, 0.814208984375, 0.85009765625, 0.885986328125, 0.921875, 0.957763671875, 0.99365234375, 1.029541015625, 1.0654296875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 4.0, 1.0, 3.0, 6.0, 8.0, 8.0, 9.0, 10.0, 17.0, 17.0, 19.0, 15.0, 28.0, 27.0, 31.0, 30.0, 35.0, 31.0, 37.0, 34.0, 41.0, 34.0, 47.0, 40.0, 45.0, 38.0, 33.0, 41.0, 40.0, 42.0, 24.0, 25.0, 27.0, 25.0, 19.0, 17.0, 12.0, 10.0, 12.0, 16.0, 8.0, 7.0, 5.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.152416706085205, -3.0596210956573486, -2.966825485229492, -2.874030113220215, -2.7812345027923584, -2.688438892364502, -2.5956432819366455, -2.502847671508789, -2.4100522994995117, -2.3172566890716553, -2.224461078643799, -2.1316657066345215, -2.038870096206665, -1.9460744857788086, -1.8532788753509521, -1.7604832649230957, -1.6676876544952393, -1.5748920440673828, -1.482096552848816, -1.3893009424209595, -1.2965054512023926, -1.2037098407745361, -1.1109142303466797, -1.0181186199188232, -0.9253231287002563, -0.8325275778770447, -0.739732027053833, -0.6469364166259766, -0.5541408658027649, -0.4613453149795532, -0.3685497045516968, -0.2757541537284851, -0.18295836448669434, -0.09016279876232147, 0.0026327669620513916, 0.09542834758758545, 0.18822389841079712, 0.2810194492340088, 0.37381505966186523, 0.4666106104850769, 0.5594061613082886, 0.6522017121315002, 0.7449972629547119, 0.8377928733825684, 0.93058842420578, 1.0233839750289917, 1.1161795854568481, 1.208975076675415, 1.3017706871032715, 1.394566297531128, 1.4873617887496948, 1.5801573991775513, 1.6729528903961182, 1.7657485008239746, 1.858544111251831, 1.9513397216796875, 2.044135093688965, 2.1369307041168213, 2.2297263145446777, 2.322521686553955, 2.4153172969818115, 2.508112907409668, 2.6009085178375244, 2.693704128265381, 2.7864997386932373]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 22.0, 14.0, 19.0, 14.0, 15.0, 28.0, 24.0, 26.0, 32.0, 35.0, 34.0, 39.0, 39.0, 36.0, 40.0, 42.0, 51.0, 39.0, 33.0, 33.0, 41.0, 32.0, 40.0, 24.0, 20.0, 30.0, 16.0, 23.0, 21.0, 17.0, 13.0, 13.0, 15.0, 7.0, 9.0, 12.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.8398711681365967, -2.7512996196746826, -2.6627280712127686, -2.5741565227508545, -2.4855849742889404, -2.3970134258270264, -2.3084418773651123, -2.2198703289031982, -2.131298780441284, -2.04272723197937, -1.954155683517456, -1.865584135055542, -1.777012586593628, -1.6884410381317139, -1.5998694896697998, -1.5112979412078857, -1.4227263927459717, -1.3341548442840576, -1.2455832958221436, -1.1570117473602295, -1.0684401988983154, -0.9798686504364014, -0.8912971019744873, -0.8027255535125732, -0.7141540050506592, -0.6255824565887451, -0.537010908126831, -0.448439359664917, -0.35986781120300293, -0.27129626274108887, -0.1827247142791748, -0.09415316581726074, -0.005581855773925781, 0.08298969268798828, 0.17156124114990234, 0.2601327896118164, 0.34870433807373047, 0.43727588653564453, 0.5258474349975586, 0.6144189834594727, 0.7029905319213867, 0.7915620803833008, 0.8801336288452148, 0.9687051773071289, 1.057276725769043, 1.145848274230957, 1.234419822692871, 1.3229913711547852, 1.4115629196166992, 1.5001344680786133, 1.5887060165405273, 1.6772775650024414, 1.7658491134643555, 1.8544206619262695, 1.9429922103881836, 2.0315637588500977, 2.1201353073120117, 2.208706855773926, 2.29727840423584, 2.385849952697754, 2.474421501159668, 2.562993049621582, 2.651564598083496, 2.74013614654541, 2.828707695007324]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 2.0, 2.0, 4.0, 13.0, 21.0, 22.0, 29.0, 49.0, 68.0, 92.0, 115.0, 192.0, 271.0, 337.0, 484.0, 699.0, 1083.0, 1524.0, 2506.0, 3839.0, 6468.0, 11483.0, 22072.0, 46646.0, 104451.0, 237465.0, 313001.0, 157298.0, 68453.0, 31705.0, 15762.0, 8478.0, 4894.0, 3008.0, 1921.0, 1273.0, 818.0, 602.0, 399.0, 289.0, 204.0, 131.0, 117.0, 73.0, 55.0, 37.0, 32.0, 12.0, 17.0, 13.0, 10.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.9017333984375, -3.768310546875, -3.6348876953125, -3.50146484375, -3.3680419921875, -3.234619140625, -3.1011962890625, -2.9677734375, -2.8343505859375, -2.700927734375, -2.5675048828125, -2.43408203125, -2.3006591796875, -2.167236328125, -2.0338134765625, -1.900390625, -1.7669677734375, -1.633544921875, -1.5001220703125, -1.36669921875, -1.2332763671875, -1.099853515625, -0.9664306640625, -0.8330078125, -0.6995849609375, -0.566162109375, -0.4327392578125, -0.29931640625, -0.1658935546875, -0.032470703125, 0.1009521484375, 0.234375, 0.3677978515625, 0.501220703125, 0.6346435546875, 0.76806640625, 0.9014892578125, 1.034912109375, 1.1683349609375, 1.3017578125, 1.4351806640625, 1.568603515625, 1.7020263671875, 1.83544921875, 1.9688720703125, 2.102294921875, 2.2357177734375, 2.369140625, 2.5025634765625, 2.635986328125, 2.7694091796875, 2.90283203125, 3.0362548828125, 3.169677734375, 3.3031005859375, 3.4365234375, 3.5699462890625, 3.703369140625, 3.8367919921875, 3.97021484375, 4.1036376953125, 4.237060546875, 4.3704833984375, 4.50390625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 9.0, 10.0, 6.0, 11.0, 16.0, 16.0, 16.0, 19.0, 23.0, 38.0, 32.0, 21.0, 33.0, 30.0, 28.0, 46.0, 38.0, 36.0, 42.0, 35.0, 39.0, 42.0, 39.0, 22.0, 46.0, 29.0, 31.0, 32.0, 27.0, 22.0, 20.0, 21.0, 13.0, 14.0, 14.0, 14.0, 8.0, 8.0, 9.0, 11.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.80859375, -2.71929931640625, -2.6300048828125, -2.54071044921875, -2.451416015625, -2.36212158203125, -2.2728271484375, -2.18353271484375, -2.09423828125, -2.00494384765625, -1.9156494140625, -1.82635498046875, -1.737060546875, -1.64776611328125, -1.5584716796875, -1.46917724609375, -1.3798828125, -1.29058837890625, -1.2012939453125, -1.11199951171875, -1.022705078125, -0.93341064453125, -0.8441162109375, -0.75482177734375, -0.66552734375, -0.57623291015625, -0.4869384765625, -0.39764404296875, -0.308349609375, -0.21905517578125, -0.1297607421875, -0.04046630859375, 0.048828125, 0.13812255859375, 0.2274169921875, 0.31671142578125, 0.406005859375, 0.49530029296875, 0.5845947265625, 0.67388916015625, 0.76318359375, 0.85247802734375, 0.9417724609375, 1.03106689453125, 1.120361328125, 1.20965576171875, 1.2989501953125, 1.38824462890625, 1.4775390625, 1.56683349609375, 1.6561279296875, 1.74542236328125, 1.834716796875, 1.92401123046875, 2.0133056640625, 2.10260009765625, 2.19189453125, 2.28118896484375, 2.3704833984375, 2.45977783203125, 2.549072265625, 2.63836669921875, 2.7276611328125, 2.81695556640625, 2.90625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 9.0, 14.0, 27.0, 29.0, 42.0, 56.0, 89.0, 127.0, 200.0, 265.0, 501.0, 719.0, 1161.0, 1938.0, 3525.0, 6547.0, 13789.0, 31677.0, 84733.0, 254156.0, 391021.0, 159702.0, 54669.0, 21714.0, 9856.0, 5035.0, 2731.0, 1539.0, 979.0, 544.0, 339.0, 236.0, 173.0, 116.0, 85.0, 56.0, 34.0, 30.0, 20.0, 9.0, 11.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.66015625, -3.539306640625, -3.41845703125, -3.297607421875, -3.1767578125, -3.055908203125, -2.93505859375, -2.814208984375, -2.693359375, -2.572509765625, -2.45166015625, -2.330810546875, -2.2099609375, -2.089111328125, -1.96826171875, -1.847412109375, -1.7265625, -1.605712890625, -1.48486328125, -1.364013671875, -1.2431640625, -1.122314453125, -1.00146484375, -0.880615234375, -0.759765625, -0.638916015625, -0.51806640625, -0.397216796875, -0.2763671875, -0.155517578125, -0.03466796875, 0.086181640625, 0.20703125, 0.327880859375, 0.44873046875, 0.569580078125, 0.6904296875, 0.811279296875, 0.93212890625, 1.052978515625, 1.173828125, 1.294677734375, 1.41552734375, 1.536376953125, 1.6572265625, 1.778076171875, 1.89892578125, 2.019775390625, 2.140625, 2.261474609375, 2.38232421875, 2.503173828125, 2.6240234375, 2.744873046875, 2.86572265625, 2.986572265625, 3.107421875, 3.228271484375, 3.34912109375, 3.469970703125, 3.5908203125, 3.711669921875, 3.83251953125, 3.953369140625, 4.07421875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 8.0, 10.0, 10.0, 16.0, 23.0, 28.0, 23.0, 31.0, 35.0, 32.0, 40.0, 44.0, 29.0, 52.0, 55.0, 45.0, 45.0, 41.0, 42.0, 47.0, 33.0, 37.0, 47.0, 33.0, 28.0, 31.0, 21.0, 22.0, 18.0, 17.0, 15.0, 8.0, 9.0, 5.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.77734375, -2.701263427734375, -2.62518310546875, -2.549102783203125, -2.4730224609375, -2.396942138671875, -2.32086181640625, -2.244781494140625, -2.168701171875, -2.092620849609375, -2.01654052734375, -1.940460205078125, -1.8643798828125, -1.788299560546875, -1.71221923828125, -1.636138916015625, -1.56005859375, -1.483978271484375, -1.40789794921875, -1.331817626953125, -1.2557373046875, -1.179656982421875, -1.10357666015625, -1.027496337890625, -0.951416015625, -0.875335693359375, -0.79925537109375, -0.723175048828125, -0.6470947265625, -0.571014404296875, -0.49493408203125, -0.418853759765625, -0.3427734375, -0.266693115234375, -0.19061279296875, -0.114532470703125, -0.0384521484375, 0.037628173828125, 0.11370849609375, 0.189788818359375, 0.265869140625, 0.341949462890625, 0.41802978515625, 0.494110107421875, 0.5701904296875, 0.646270751953125, 0.72235107421875, 0.798431396484375, 0.87451171875, 0.950592041015625, 1.02667236328125, 1.102752685546875, 1.1788330078125, 1.254913330078125, 1.33099365234375, 1.407073974609375, 1.483154296875, 1.559234619140625, 1.63531494140625, 1.711395263671875, 1.7874755859375, 1.863555908203125, 1.93963623046875, 2.015716552734375, 2.091796875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 8.0, 19.0, 19.0, 15.0, 37.0, 43.0, 56.0, 83.0, 112.0, 133.0, 146.0, 205.0, 248.0, 409.0, 535.0, 765.0, 1223.0, 2007.0, 3742.0, 7620.0, 20970.0, 106441.0, 767546.0, 98922.0, 20142.0, 7623.0, 3575.0, 1962.0, 1206.0, 739.0, 500.0, 370.0, 270.0, 219.0, 165.0, 119.0, 88.0, 60.0, 49.0, 40.0, 22.0, 23.0, 16.0, 18.0, 5.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.41796875, -5.25616455078125, -5.0943603515625, -4.93255615234375, -4.770751953125, -4.60894775390625, -4.4471435546875, -4.28533935546875, -4.12353515625, -3.96173095703125, -3.7999267578125, -3.63812255859375, -3.476318359375, -3.31451416015625, -3.1527099609375, -2.99090576171875, -2.8291015625, -2.66729736328125, -2.5054931640625, -2.34368896484375, -2.181884765625, -2.02008056640625, -1.8582763671875, -1.69647216796875, -1.53466796875, -1.37286376953125, -1.2110595703125, -1.04925537109375, -0.887451171875, -0.72564697265625, -0.5638427734375, -0.40203857421875, -0.240234375, -0.07843017578125, 0.0833740234375, 0.24517822265625, 0.406982421875, 0.56878662109375, 0.7305908203125, 0.89239501953125, 1.05419921875, 1.21600341796875, 1.3778076171875, 1.53961181640625, 1.701416015625, 1.86322021484375, 2.0250244140625, 2.18682861328125, 2.3486328125, 2.51043701171875, 2.6722412109375, 2.83404541015625, 2.995849609375, 3.15765380859375, 3.3194580078125, 3.48126220703125, 3.64306640625, 3.80487060546875, 3.9666748046875, 4.12847900390625, 4.290283203125, 4.45208740234375, 4.6138916015625, 4.77569580078125, 4.9375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 7.0, 9.0, 3.0, 12.0, 19.0, 30.0, 55.0, 110.0, 185.0, 244.0, 125.0, 73.0, 43.0, 28.0, 13.0, 8.0, 7.0, 6.0, 5.0, 3.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004253387451171875, -0.00041211768984794617, -0.00039889663457870483, -0.0003856755793094635, -0.00037245452404022217, -0.00035923346877098083, -0.0003460124135017395, -0.00033279135823249817, -0.00031957030296325684, -0.0003063492476940155, -0.00029312819242477417, -0.00027990713715553284, -0.0002666860818862915, -0.00025346502661705017, -0.00024024397134780884, -0.0002270229160785675, -0.00021380186080932617, -0.00020058080554008484, -0.0001873597502708435, -0.00017413869500160217, -0.00016091763973236084, -0.0001476965844631195, -0.00013447552919387817, -0.00012125447392463684, -0.00010803341865539551, -9.481236338615417e-05, -8.159130811691284e-05, -6.837025284767151e-05, -5.5149197578430176e-05, -4.192814230918884e-05, -2.870708703994751e-05, -1.5486031770706177e-05, -2.2649765014648438e-06, 1.095607876777649e-05, 2.4177134037017822e-05, 3.7398189306259155e-05, 5.061924457550049e-05, 6.384029984474182e-05, 7.706135511398315e-05, 9.028241038322449e-05, 0.00010350346565246582, 0.00011672452092170715, 0.00012994557619094849, 0.00014316663146018982, 0.00015638768672943115, 0.00016960874199867249, 0.00018282979726791382, 0.00019605085253715515, 0.00020927190780639648, 0.00022249296307563782, 0.00023571401834487915, 0.0002489350736141205, 0.0002621561288833618, 0.00027537718415260315, 0.0002885982394218445, 0.0003018192946910858, 0.00031504034996032715, 0.0003282614052295685, 0.0003414824604988098, 0.00035470351576805115, 0.0003679245710372925, 0.0003811456263065338, 0.00039436668157577515, 0.0004075877368450165, 0.0004208087921142578]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 11.0, 19.0, 33.0, 56.0, 72.0, 88.0, 133.0, 163.0, 199.0, 288.0, 435.0, 678.0, 1041.0, 1640.0, 2424.0, 3801.0, 6716.0, 12820.0, 29486.0, 90729.0, 436349.0, 337131.0, 71840.0, 24842.0, 11313.0, 6151.0, 3524.0, 2198.0, 1399.0, 947.0, 586.0, 403.0, 274.0, 211.0, 149.0, 116.0, 83.0, 54.0, 44.0, 36.0, 22.0, 10.0, 10.0, 7.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.845703125, -3.721282958984375, -3.59686279296875, -3.472442626953125, -3.3480224609375, -3.223602294921875, -3.09918212890625, -2.974761962890625, -2.850341796875, -2.725921630859375, -2.60150146484375, -2.477081298828125, -2.3526611328125, -2.228240966796875, -2.10382080078125, -1.979400634765625, -1.85498046875, -1.730560302734375, -1.60614013671875, -1.481719970703125, -1.3572998046875, -1.232879638671875, -1.10845947265625, -0.984039306640625, -0.859619140625, -0.735198974609375, -0.61077880859375, -0.486358642578125, -0.3619384765625, -0.237518310546875, -0.11309814453125, 0.011322021484375, 0.1357421875, 0.260162353515625, 0.38458251953125, 0.509002685546875, 0.6334228515625, 0.757843017578125, 0.88226318359375, 1.006683349609375, 1.131103515625, 1.255523681640625, 1.37994384765625, 1.504364013671875, 1.6287841796875, 1.753204345703125, 1.87762451171875, 2.002044677734375, 2.12646484375, 2.250885009765625, 2.37530517578125, 2.499725341796875, 2.6241455078125, 2.748565673828125, 2.87298583984375, 2.997406005859375, 3.121826171875, 3.246246337890625, 3.37066650390625, 3.495086669921875, 3.6195068359375, 3.743927001953125, 3.86834716796875, 3.992767333984375, 4.1171875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 9.0, 9.0, 9.0, 14.0, 13.0, 9.0, 29.0, 42.0, 55.0, 104.0, 188.0, 165.0, 107.0, 62.0, 55.0, 32.0, 20.0, 21.0, 14.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.974609375, -0.9459228515625, -0.917236328125, -0.8885498046875, -0.85986328125, -0.8311767578125, -0.802490234375, -0.7738037109375, -0.7451171875, -0.7164306640625, -0.687744140625, -0.6590576171875, -0.63037109375, -0.6016845703125, -0.572998046875, -0.5443115234375, -0.515625, -0.4869384765625, -0.458251953125, -0.4295654296875, -0.40087890625, -0.3721923828125, -0.343505859375, -0.3148193359375, -0.2861328125, -0.2574462890625, -0.228759765625, -0.2000732421875, -0.17138671875, -0.1427001953125, -0.114013671875, -0.0853271484375, -0.056640625, -0.0279541015625, 0.000732421875, 0.0294189453125, 0.05810546875, 0.0867919921875, 0.115478515625, 0.1441650390625, 0.1728515625, 0.2015380859375, 0.230224609375, 0.2589111328125, 0.28759765625, 0.3162841796875, 0.344970703125, 0.3736572265625, 0.40234375, 0.4310302734375, 0.459716796875, 0.4884033203125, 0.51708984375, 0.5457763671875, 0.574462890625, 0.6031494140625, 0.6318359375, 0.6605224609375, 0.689208984375, 0.7178955078125, 0.74658203125, 0.7752685546875, 0.803955078125, 0.8326416015625, 0.861328125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 4.0, 1.0, 13.0, 12.0, 6.0, 15.0, 13.0, 26.0, 23.0, 26.0, 27.0, 27.0, 32.0, 28.0, 35.0, 32.0, 36.0, 34.0, 42.0, 32.0, 57.0, 52.0, 44.0, 34.0, 37.0, 32.0, 28.0, 24.0, 33.0, 25.0, 17.0, 17.0, 19.0, 21.0, 19.0, 10.0, 11.0, 7.0, 6.0, 11.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.174232006072998, -3.0808262825012207, -2.9874205589294434, -2.894014596939087, -2.8006088733673096, -2.7072031497955322, -2.613797426223755, -2.5203914642333984, -2.426985740661621, -2.3335800170898438, -2.2401742935180664, -2.14676833152771, -2.0533626079559326, -1.9599568843841553, -1.866551160812378, -1.773145318031311, -1.6797395944595337, -1.5863338708877563, -1.4929280281066895, -1.399522304534912, -1.3061164617538452, -1.2127107381820679, -1.119304895401001, -1.0258991718292236, -0.9324933886528015, -0.8390876054763794, -0.7456818222999573, -0.6522760391235352, -0.5588703155517578, -0.4654645025730133, -0.3720587491989136, -0.27865296602249146, -0.18524718284606934, -0.09184140712022781, 0.0015643686056137085, 0.09497013688087463, 0.18837592005729675, 0.28178170323371887, 0.3751874566078186, 0.4685932397842407, 0.5619990229606628, 0.655404806137085, 0.7488105893135071, 0.8422163724899292, 0.9356220960617065, 1.0290279388427734, 1.1224336624145508, 1.2158393859863281, 1.309245228767395, 1.4026509523391724, 1.4960567951202393, 1.5894625186920166, 1.6828683614730835, 1.7762740850448608, 1.8696799278259277, 1.963085651397705, 2.0564913749694824, 2.1498970985412598, 2.243302822113037, 2.3367087841033936, 2.430114507675171, 2.5235202312469482, 2.6169259548187256, 2.710331916809082, 2.8037376403808594]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 8.0, 2.0, 20.0, 16.0, 15.0, 11.0, 15.0, 19.0, 20.0, 28.0, 32.0, 28.0, 29.0, 28.0, 48.0, 49.0, 27.0, 36.0, 45.0, 37.0, 44.0, 39.0, 37.0, 48.0, 34.0, 41.0, 25.0, 20.0, 18.0, 22.0, 29.0, 12.0, 21.0, 21.0, 12.0, 11.0, 13.0, 10.0, 3.0, 9.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.7933664321899414, -2.7040176391601562, -2.614668846130371, -2.525320053100586, -2.4359710216522217, -2.3466222286224365, -2.2572734355926514, -2.167924642562866, -2.078575611114502, -1.9892268180847168, -1.899877905845642, -1.810529112815857, -1.7211802005767822, -1.631831407546997, -1.542482614517212, -1.4531338214874268, -1.3637850284576416, -1.2744362354278564, -1.1850873231887817, -1.0957385301589966, -1.0063896179199219, -0.9170408248901367, -0.8276920318603516, -0.7383431792259216, -0.6489943265914917, -0.5596454739570618, -0.4702966511249542, -0.3809478282928467, -0.29159897565841675, -0.20225012302398682, -0.11290132999420166, -0.02355247735977173, 0.0657963752746582, 0.15514521300792694, 0.24449405074119568, 0.3338428735733032, 0.42319172620773315, 0.5125405788421631, 0.6018893718719482, 0.6912382245063782, 0.7805870771408081, 0.869935929775238, 0.959284782409668, 1.0486335754394531, 1.1379823684692383, 1.227331280708313, 1.3166800737380981, 1.4060289859771729, 1.495377779006958, 1.5847265720367432, 1.6740754842758179, 1.763424277305603, 1.8527731895446777, 1.942121982574463, 2.031470775604248, 2.120819568634033, 2.2101683616638184, 2.2995171546936035, 2.3888659477233887, 2.478214740753174, 2.567563772201538, 2.6569125652313232, 2.7462613582611084, 2.8356101512908936, 2.924959182739258]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 14.0, 23.0, 45.0, 66.0, 93.0, 130.0, 221.0, 299.0, 523.0, 730.0, 1283.0, 1939.0, 3103.0, 4794.0, 7696.0, 11811.0, 18349.0, 28291.0, 41647.0, 58858.0, 79424.0, 100235.0, 115517.0, 119991.0, 112949.0, 96590.0, 76039.0, 55562.0, 38503.0, 26410.0, 17105.0, 10993.0, 7077.0, 4440.0, 2772.0, 1825.0, 1125.0, 730.0, 506.0, 347.0, 192.0, 104.0, 62.0, 41.0, 41.0, 22.0, 16.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-3.765625, -3.65618896484375, -3.5467529296875, -3.43731689453125, -3.327880859375, -3.21844482421875, -3.1090087890625, -2.99957275390625, -2.89013671875, -2.78070068359375, -2.6712646484375, -2.56182861328125, -2.452392578125, -2.34295654296875, -2.2335205078125, -2.12408447265625, -2.0146484375, -1.90521240234375, -1.7957763671875, -1.68634033203125, -1.576904296875, -1.46746826171875, -1.3580322265625, -1.24859619140625, -1.13916015625, -1.02972412109375, -0.9202880859375, -0.81085205078125, -0.701416015625, -0.59197998046875, -0.4825439453125, -0.37310791015625, -0.263671875, -0.15423583984375, -0.0447998046875, 0.06463623046875, 0.174072265625, 0.28350830078125, 0.3929443359375, 0.50238037109375, 0.61181640625, 0.72125244140625, 0.8306884765625, 0.94012451171875, 1.049560546875, 1.15899658203125, 1.2684326171875, 1.37786865234375, 1.4873046875, 1.59674072265625, 1.7061767578125, 1.81561279296875, 1.925048828125, 2.03448486328125, 2.1439208984375, 2.25335693359375, 2.36279296875, 2.47222900390625, 2.5816650390625, 2.69110107421875, 2.800537109375, 2.90997314453125, 3.0194091796875, 3.12884521484375, 3.23828125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 11.0, 10.0, 15.0, 16.0, 11.0, 26.0, 23.0, 25.0, 24.0, 24.0, 37.0, 29.0, 34.0, 31.0, 45.0, 39.0, 36.0, 44.0, 37.0, 43.0, 45.0, 31.0, 36.0, 39.0, 39.0, 27.0, 17.0, 29.0, 25.0, 20.0, 15.0, 15.0, 16.0, 11.0, 12.0, 13.0, 9.0, 12.0, 6.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.330169677734375, -2.24432373046875, -2.158477783203125, -2.0726318359375, -1.986785888671875, -1.90093994140625, -1.815093994140625, -1.729248046875, -1.643402099609375, -1.55755615234375, -1.471710205078125, -1.3858642578125, -1.300018310546875, -1.21417236328125, -1.128326416015625, -1.04248046875, -0.956634521484375, -0.87078857421875, -0.784942626953125, -0.6990966796875, -0.613250732421875, -0.52740478515625, -0.441558837890625, -0.355712890625, -0.269866943359375, -0.18402099609375, -0.098175048828125, -0.0123291015625, 0.073516845703125, 0.15936279296875, 0.245208740234375, 0.3310546875, 0.416900634765625, 0.50274658203125, 0.588592529296875, 0.6744384765625, 0.760284423828125, 0.84613037109375, 0.931976318359375, 1.017822265625, 1.103668212890625, 1.18951416015625, 1.275360107421875, 1.3612060546875, 1.447052001953125, 1.53289794921875, 1.618743896484375, 1.70458984375, 1.790435791015625, 1.87628173828125, 1.962127685546875, 2.0479736328125, 2.133819580078125, 2.21966552734375, 2.305511474609375, 2.391357421875, 2.477203369140625, 2.56304931640625, 2.648895263671875, 2.7347412109375, 2.820587158203125, 2.90643310546875, 2.992279052734375, 3.078125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 16.0, 21.0, 31.0, 45.0, 95.0, 123.0, 188.0, 301.0, 490.0, 748.0, 1207.0, 1884.0, 3011.0, 4532.0, 7134.0, 11006.0, 16454.0, 25095.0, 36265.0, 50526.0, 67738.0, 85888.0, 101337.0, 110327.0, 110202.0, 101222.0, 85537.0, 67968.0, 50687.0, 35781.0, 24820.0, 16604.0, 11159.0, 7252.0, 4701.0, 2849.0, 1895.0, 1226.0, 820.0, 481.0, 309.0, 207.0, 136.0, 86.0, 51.0, 40.0, 20.0, 14.0, 9.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.984375, -2.89111328125, -2.7978515625, -2.70458984375, -2.611328125, -2.51806640625, -2.4248046875, -2.33154296875, -2.23828125, -2.14501953125, -2.0517578125, -1.95849609375, -1.865234375, -1.77197265625, -1.6787109375, -1.58544921875, -1.4921875, -1.39892578125, -1.3056640625, -1.21240234375, -1.119140625, -1.02587890625, -0.9326171875, -0.83935546875, -0.74609375, -0.65283203125, -0.5595703125, -0.46630859375, -0.373046875, -0.27978515625, -0.1865234375, -0.09326171875, 0.0, 0.09326171875, 0.1865234375, 0.27978515625, 0.373046875, 0.46630859375, 0.5595703125, 0.65283203125, 0.74609375, 0.83935546875, 0.9326171875, 1.02587890625, 1.119140625, 1.21240234375, 1.3056640625, 1.39892578125, 1.4921875, 1.58544921875, 1.6787109375, 1.77197265625, 1.865234375, 1.95849609375, 2.0517578125, 2.14501953125, 2.23828125, 2.33154296875, 2.4248046875, 2.51806640625, 2.611328125, 2.70458984375, 2.7978515625, 2.89111328125, 2.984375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 3.0, 5.0, 6.0, 12.0, 12.0, 14.0, 13.0, 15.0, 23.0, 20.0, 23.0, 33.0, 36.0, 44.0, 28.0, 42.0, 27.0, 38.0, 33.0, 43.0, 37.0, 42.0, 43.0, 34.0, 41.0, 37.0, 38.0, 25.0, 26.0, 22.0, 24.0, 20.0, 27.0, 20.0, 17.0, 9.0, 13.0, 10.0, 6.0, 6.0, 5.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.7958984375, -1.739959716796875, -1.68402099609375, -1.628082275390625, -1.5721435546875, -1.516204833984375, -1.46026611328125, -1.404327392578125, -1.348388671875, -1.292449951171875, -1.23651123046875, -1.180572509765625, -1.1246337890625, -1.068695068359375, -1.01275634765625, -0.956817626953125, -0.90087890625, -0.844940185546875, -0.78900146484375, -0.733062744140625, -0.6771240234375, -0.621185302734375, -0.56524658203125, -0.509307861328125, -0.453369140625, -0.397430419921875, -0.34149169921875, -0.285552978515625, -0.2296142578125, -0.173675537109375, -0.11773681640625, -0.061798095703125, -0.005859375, 0.050079345703125, 0.10601806640625, 0.161956787109375, 0.2178955078125, 0.273834228515625, 0.32977294921875, 0.385711669921875, 0.441650390625, 0.497589111328125, 0.55352783203125, 0.609466552734375, 0.6654052734375, 0.721343994140625, 0.77728271484375, 0.833221435546875, 0.88916015625, 0.945098876953125, 1.00103759765625, 1.056976318359375, 1.1129150390625, 1.168853759765625, 1.22479248046875, 1.280731201171875, 1.336669921875, 1.392608642578125, 1.44854736328125, 1.504486083984375, 1.5604248046875, 1.616363525390625, 1.67230224609375, 1.728240966796875, 1.7841796875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 16.0, 21.0, 34.0, 35.0, 56.0, 69.0, 114.0, 148.0, 228.0, 311.0, 460.0, 663.0, 1018.0, 1496.0, 2350.0, 3549.0, 5894.0, 9731.0, 17415.0, 33431.0, 66910.0, 132532.0, 217598.0, 231647.0, 153825.0, 79651.0, 39736.0, 20362.0, 11113.0, 6506.0, 3977.0, 2474.0, 1688.0, 1082.0, 768.0, 524.0, 347.0, 229.0, 160.0, 111.0, 89.0, 76.0, 32.0, 19.0, 25.0, 12.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.458984375, -3.34783935546875, -3.2366943359375, -3.12554931640625, -3.014404296875, -2.90325927734375, -2.7921142578125, -2.68096923828125, -2.56982421875, -2.45867919921875, -2.3475341796875, -2.23638916015625, -2.125244140625, -2.01409912109375, -1.9029541015625, -1.79180908203125, -1.6806640625, -1.56951904296875, -1.4583740234375, -1.34722900390625, -1.236083984375, -1.12493896484375, -1.0137939453125, -0.90264892578125, -0.79150390625, -0.68035888671875, -0.5692138671875, -0.45806884765625, -0.346923828125, -0.23577880859375, -0.1246337890625, -0.01348876953125, 0.09765625, 0.20880126953125, 0.3199462890625, 0.43109130859375, 0.542236328125, 0.65338134765625, 0.7645263671875, 0.87567138671875, 0.98681640625, 1.09796142578125, 1.2091064453125, 1.32025146484375, 1.431396484375, 1.54254150390625, 1.6536865234375, 1.76483154296875, 1.8759765625, 1.98712158203125, 2.0982666015625, 2.20941162109375, 2.320556640625, 2.43170166015625, 2.5428466796875, 2.65399169921875, 2.76513671875, 2.87628173828125, 2.9874267578125, 3.09857177734375, 3.209716796875, 3.32086181640625, 3.4320068359375, 3.54315185546875, 3.654296875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 9.0, 10.0, 15.0, 27.0, 32.0, 42.0, 79.0, 85.0, 96.0, 111.0, 94.0, 71.0, 81.0, 63.0, 47.0, 38.0, 19.0, 18.0, 13.0, 13.0, 11.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047779083251953125, -0.00046325474977493286, -0.00044871866703033447, -0.0004341825842857361, -0.0004196465015411377, -0.0004051104187965393, -0.0003905743360519409, -0.00037603825330734253, -0.00036150217056274414, -0.00034696608781814575, -0.00033243000507354736, -0.000317893922328949, -0.0003033578395843506, -0.0002888217568397522, -0.0002742856740951538, -0.0002597495913505554, -0.00024521350860595703, -0.00023067742586135864, -0.00021614134311676025, -0.00020160526037216187, -0.00018706917762756348, -0.0001725330948829651, -0.0001579970121383667, -0.0001434609293937683, -0.00012892484664916992, -0.00011438876390457153, -9.985268115997314e-05, -8.531659841537476e-05, -7.078051567077637e-05, -5.624443292617798e-05, -4.170835018157959e-05, -2.71722674369812e-05, -1.2636184692382812e-05, 1.8998980522155762e-06, 1.6435980796813965e-05, 3.0972063541412354e-05, 4.550814628601074e-05, 6.004422903060913e-05, 7.458031177520752e-05, 8.911639451980591e-05, 0.0001036524772644043, 0.00011818856000900269, 0.00013272464275360107, 0.00014726072549819946, 0.00016179680824279785, 0.00017633289098739624, 0.00019086897373199463, 0.00020540505647659302, 0.0002199411392211914, 0.0002344772219657898, 0.0002490133047103882, 0.00026354938745498657, 0.00027808547019958496, 0.00029262155294418335, 0.00030715763568878174, 0.0003216937184333801, 0.0003362298011779785, 0.0003507658839225769, 0.0003653019666671753, 0.0003798380494117737, 0.00039437413215637207, 0.00040891021490097046, 0.00042344629764556885, 0.00043798238039016724, 0.0004525184631347656]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 7.0, 7.0, 9.0, 14.0, 22.0, 27.0, 33.0, 35.0, 64.0, 112.0, 168.0, 228.0, 360.0, 512.0, 842.0, 1307.0, 2104.0, 3298.0, 5192.0, 8411.0, 14035.0, 23373.0, 38006.0, 61430.0, 93142.0, 128271.0, 152090.0, 150744.0, 124570.0, 88632.0, 58383.0, 36039.0, 22086.0, 13382.0, 8056.0, 4998.0, 3038.0, 1966.0, 1197.0, 777.0, 552.0, 328.0, 222.0, 150.0, 123.0, 67.0, 48.0, 35.0, 26.0, 14.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0], "bins": [-2.1484375, -2.083221435546875, -2.01800537109375, -1.952789306640625, -1.8875732421875, -1.822357177734375, -1.75714111328125, -1.691925048828125, -1.626708984375, -1.561492919921875, -1.49627685546875, -1.431060791015625, -1.3658447265625, -1.300628662109375, -1.23541259765625, -1.170196533203125, -1.10498046875, -1.039764404296875, -0.97454833984375, -0.909332275390625, -0.8441162109375, -0.778900146484375, -0.71368408203125, -0.648468017578125, -0.583251953125, -0.518035888671875, -0.45281982421875, -0.387603759765625, -0.3223876953125, -0.257171630859375, -0.19195556640625, -0.126739501953125, -0.0615234375, 0.003692626953125, 0.06890869140625, 0.134124755859375, 0.1993408203125, 0.264556884765625, 0.32977294921875, 0.394989013671875, 0.460205078125, 0.525421142578125, 0.59063720703125, 0.655853271484375, 0.7210693359375, 0.786285400390625, 0.85150146484375, 0.916717529296875, 0.98193359375, 1.047149658203125, 1.11236572265625, 1.177581787109375, 1.2427978515625, 1.308013916015625, 1.37322998046875, 1.438446044921875, 1.503662109375, 1.568878173828125, 1.63409423828125, 1.699310302734375, 1.7645263671875, 1.829742431640625, 1.89495849609375, 1.960174560546875, 2.025390625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 8.0, 5.0, 8.0, 7.0, 9.0, 7.0, 11.0, 13.0, 18.0, 13.0, 15.0, 23.0, 32.0, 20.0, 35.0, 44.0, 49.0, 44.0, 47.0, 40.0, 47.0, 53.0, 39.0, 45.0, 46.0, 43.0, 45.0, 30.0, 42.0, 22.0, 25.0, 17.0, 19.0, 18.0, 10.0, 12.0, 7.0, 8.0, 7.0, 3.0, 4.0, 3.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.88916015625, -0.86395263671875, -0.8387451171875, -0.81353759765625, -0.788330078125, -0.76312255859375, -0.7379150390625, -0.71270751953125, -0.6875, -0.66229248046875, -0.6370849609375, -0.61187744140625, -0.586669921875, -0.56146240234375, -0.5362548828125, -0.51104736328125, -0.48583984375, -0.46063232421875, -0.4354248046875, -0.41021728515625, -0.385009765625, -0.35980224609375, -0.3345947265625, -0.30938720703125, -0.2841796875, -0.25897216796875, -0.2337646484375, -0.20855712890625, -0.183349609375, -0.15814208984375, -0.1329345703125, -0.10772705078125, -0.08251953125, -0.05731201171875, -0.0321044921875, -0.00689697265625, 0.018310546875, 0.04351806640625, 0.0687255859375, 0.09393310546875, 0.119140625, 0.14434814453125, 0.1695556640625, 0.19476318359375, 0.219970703125, 0.24517822265625, 0.2703857421875, 0.29559326171875, 0.32080078125, 0.34600830078125, 0.3712158203125, 0.39642333984375, 0.421630859375, 0.44683837890625, 0.4720458984375, 0.49725341796875, 0.5224609375, 0.54766845703125, 0.5728759765625, 0.59808349609375, 0.623291015625, 0.64849853515625, 0.6737060546875, 0.69891357421875, 0.72412109375]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 4.0, 3.0, 5.0, 2.0, 13.0, 23.0, 23.0, 18.0, 20.0, 31.0, 27.0, 28.0, 23.0, 28.0, 30.0, 45.0, 36.0, 44.0, 45.0, 43.0, 45.0, 44.0, 40.0, 45.0, 33.0, 49.0, 31.0, 27.0, 22.0, 29.0, 26.0, 16.0, 20.0, 17.0, 3.0, 11.0, 10.0, 11.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0], "bins": [-3.302363872528076, -3.2079219818115234, -3.1134800910949707, -3.019038200378418, -2.924596071243286, -2.8301541805267334, -2.7357122898101807, -2.641270399093628, -2.546828269958496, -2.4523863792419434, -2.3579444885253906, -2.263502597808838, -2.169060468673706, -2.0746185779571533, -1.9801766872406006, -1.8857347965240479, -1.7912929058074951, -1.6968510150909424, -1.6024090051651, -1.5079671144485474, -1.413525104522705, -1.3190832138061523, -1.2246413230895996, -1.1301994323730469, -1.0357574224472046, -0.9413154721260071, -0.8468735218048096, -0.7524316310882568, -0.6579896807670593, -0.5635477304458618, -0.4691058397293091, -0.3746638894081116, -0.28022170066833496, -0.18577976524829865, -0.09133782982826233, 0.003104090690612793, 0.0975460410118103, 0.1919879913330078, 0.28642988204956055, 0.38087183237075806, 0.47531378269195557, 0.5697557330131531, 0.6641976833343506, 0.7586395740509033, 0.8530815243721008, 0.9475234746932983, 1.041965365409851, 1.1364073753356934, 1.230849266052246, 1.3252911567687988, 1.4197331666946411, 1.5141750574111938, 1.6086170673370361, 1.7030589580535889, 1.7975008487701416, 1.8919427394866943, 1.9863847494125366, 2.080826759338379, 2.1752686500549316, 2.2697105407714844, 2.364152431488037, 2.45859432220459, 2.5530362129211426, 2.6474783420562744, 2.741920232772827]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 10.0, 11.0, 11.0, 10.0, 13.0, 14.0, 18.0, 23.0, 24.0, 28.0, 28.0, 32.0, 32.0, 26.0, 51.0, 42.0, 41.0, 41.0, 37.0, 44.0, 47.0, 34.0, 29.0, 43.0, 32.0, 30.0, 39.0, 30.0, 30.0, 21.0, 14.0, 16.0, 17.0, 15.0, 18.0, 9.0, 2.0, 10.0, 3.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.664181709289551, -2.571289300918579, -2.4783968925476074, -2.3855044841766357, -2.292612075805664, -2.1997196674346924, -2.1068272590637207, -2.01393461227417, -1.9210423231124878, -1.8281499147415161, -1.7352575063705444, -1.6423649787902832, -1.5494725704193115, -1.4565801620483398, -1.3636877536773682, -1.2707953453063965, -1.1779029369354248, -1.0850105285644531, -0.9921181201934814, -0.899225652217865, -0.8063332438468933, -0.7134408354759216, -0.6205483675003052, -0.5276559591293335, -0.4347635507583618, -0.34187114238739014, -0.24897870421409607, -0.156086266040802, -0.06319385766983032, 0.029698550701141357, 0.12259101867675781, 0.2154834270477295, 0.30837583541870117, 0.40126824378967285, 0.4941606819629669, 0.587053120136261, 0.6799455285072327, 0.7728379368782043, 0.8657304048538208, 0.9586228132247925, 1.0515152215957642, 1.1444076299667358, 1.2373000383377075, 1.3301925659179688, 1.4230849742889404, 1.515977382659912, 1.6088697910308838, 1.7017621994018555, 1.7946546077728271, 1.8875470161437988, 1.9804394245147705, 2.073331832885742, 2.166224241256714, 2.2591166496276855, 2.3520092964172363, 2.444901466369629, 2.5377941131591797, 2.6306865215301514, 2.723578929901123, 2.8164713382720947, 2.9093637466430664, 3.002256155014038, 3.0951485633850098, 3.1880412101745605, 3.280933380126953]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 6.0, 13.0, 25.0, 31.0, 42.0, 62.0, 136.0, 215.0, 377.0, 618.0, 1086.0, 1722.0, 3036.0, 5018.0, 8500.0, 14598.0, 24543.0, 41199.0, 69894.0, 114159.0, 185315.0, 285838.0, 412390.0, 531399.0, 593869.0, 560884.0, 454996.0, 326476.0, 217120.0, 135424.0, 83259.0, 49723.0, 29332.0, 17410.0, 10443.0, 6141.0, 3608.0, 2082.0, 1373.0, 757.0, 475.0, 251.0, 164.0, 106.0, 69.0, 40.0, 22.0, 15.0, 6.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.6796875, -2.600067138671875, -2.52044677734375, -2.440826416015625, -2.3612060546875, -2.281585693359375, -2.20196533203125, -2.122344970703125, -2.042724609375, -1.963104248046875, -1.88348388671875, -1.803863525390625, -1.7242431640625, -1.644622802734375, -1.56500244140625, -1.485382080078125, -1.40576171875, -1.326141357421875, -1.24652099609375, -1.166900634765625, -1.0872802734375, -1.007659912109375, -0.92803955078125, -0.848419189453125, -0.768798828125, -0.689178466796875, -0.60955810546875, -0.529937744140625, -0.4503173828125, -0.370697021484375, -0.29107666015625, -0.211456298828125, -0.1318359375, -0.052215576171875, 0.02740478515625, 0.107025146484375, 0.1866455078125, 0.266265869140625, 0.34588623046875, 0.425506591796875, 0.505126953125, 0.584747314453125, 0.66436767578125, 0.743988037109375, 0.8236083984375, 0.903228759765625, 0.98284912109375, 1.062469482421875, 1.14208984375, 1.221710205078125, 1.30133056640625, 1.380950927734375, 1.4605712890625, 1.540191650390625, 1.61981201171875, 1.699432373046875, 1.779052734375, 1.858673095703125, 1.93829345703125, 2.017913818359375, 2.0975341796875, 2.177154541015625, 2.25677490234375, 2.336395263671875, 2.416015625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 8.0, 12.0, 9.0, 17.0, 16.0, 13.0, 21.0, 25.0, 27.0, 27.0, 34.0, 38.0, 32.0, 41.0, 46.0, 37.0, 39.0, 48.0, 33.0, 46.0, 44.0, 40.0, 36.0, 38.0, 38.0, 35.0, 33.0, 23.0, 23.0, 17.0, 14.0, 12.0, 14.0, 8.0, 11.0, 7.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.029296875, -1.95849609375, -1.8876953125, -1.81689453125, -1.74609375, -1.67529296875, -1.6044921875, -1.53369140625, -1.462890625, -1.39208984375, -1.3212890625, -1.25048828125, -1.1796875, -1.10888671875, -1.0380859375, -0.96728515625, -0.896484375, -0.82568359375, -0.7548828125, -0.68408203125, -0.61328125, -0.54248046875, -0.4716796875, -0.40087890625, -0.330078125, -0.25927734375, -0.1884765625, -0.11767578125, -0.046875, 0.02392578125, 0.0947265625, 0.16552734375, 0.236328125, 0.30712890625, 0.3779296875, 0.44873046875, 0.51953125, 0.59033203125, 0.6611328125, 0.73193359375, 0.802734375, 0.87353515625, 0.9443359375, 1.01513671875, 1.0859375, 1.15673828125, 1.2275390625, 1.29833984375, 1.369140625, 1.43994140625, 1.5107421875, 1.58154296875, 1.65234375, 1.72314453125, 1.7939453125, 1.86474609375, 1.935546875, 2.00634765625, 2.0771484375, 2.14794921875, 2.21875, 2.28955078125, 2.3603515625, 2.43115234375, 2.501953125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 33.0, 41.0, 71.0, 126.0, 200.0, 358.0, 611.0, 1054.0, 1768.0, 3103.0, 5271.0, 9154.0, 16049.0, 27037.0, 45753.0, 75324.0, 122266.0, 189562.0, 278947.0, 383194.0, 481017.0, 535683.0, 526642.0, 454338.0, 353029.0, 250271.0, 167287.0, 106250.0, 65386.0, 38969.0, 23369.0, 13525.0, 7743.0, 4542.0, 2602.0, 1592.0, 848.0, 530.0, 286.0, 184.0, 106.0, 70.0, 39.0, 16.0, 11.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587890625, -2.511444091796875, -2.43499755859375, -2.358551025390625, -2.2821044921875, -2.205657958984375, -2.12921142578125, -2.052764892578125, -1.976318359375, -1.899871826171875, -1.82342529296875, -1.746978759765625, -1.6705322265625, -1.594085693359375, -1.51763916015625, -1.441192626953125, -1.36474609375, -1.288299560546875, -1.21185302734375, -1.135406494140625, -1.0589599609375, -0.982513427734375, -0.90606689453125, -0.829620361328125, -0.753173828125, -0.676727294921875, -0.60028076171875, -0.523834228515625, -0.4473876953125, -0.370941162109375, -0.29449462890625, -0.218048095703125, -0.1416015625, -0.065155029296875, 0.01129150390625, 0.087738037109375, 0.1641845703125, 0.240631103515625, 0.31707763671875, 0.393524169921875, 0.469970703125, 0.546417236328125, 0.62286376953125, 0.699310302734375, 0.7757568359375, 0.852203369140625, 0.92864990234375, 1.005096435546875, 1.08154296875, 1.157989501953125, 1.23443603515625, 1.310882568359375, 1.3873291015625, 1.463775634765625, 1.54022216796875, 1.616668701171875, 1.693115234375, 1.769561767578125, 1.84600830078125, 1.922454833984375, 1.9989013671875, 2.075347900390625, 2.15179443359375, 2.228240966796875, 2.3046875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 12.0, 7.0, 14.0, 20.0, 31.0, 41.0, 40.0, 61.0, 53.0, 82.0, 100.0, 112.0, 117.0, 142.0, 137.0, 182.0, 187.0, 213.0, 232.0, 185.0, 211.0, 206.0, 201.0, 193.0, 172.0, 167.0, 151.0, 115.0, 114.0, 108.0, 93.0, 78.0, 58.0, 52.0, 44.0, 28.0, 33.0, 21.0, 15.0, 16.0, 3.0, 6.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0595703125, -1.0271148681640625, -0.994659423828125, -0.9622039794921875, -0.92974853515625, -0.8972930908203125, -0.864837646484375, -0.8323822021484375, -0.7999267578125, -0.7674713134765625, -0.735015869140625, -0.7025604248046875, -0.67010498046875, -0.6376495361328125, -0.605194091796875, -0.5727386474609375, -0.540283203125, -0.5078277587890625, -0.475372314453125, -0.4429168701171875, -0.41046142578125, -0.3780059814453125, -0.345550537109375, -0.3130950927734375, -0.2806396484375, -0.2481842041015625, -0.215728759765625, -0.1832733154296875, -0.15081787109375, -0.1183624267578125, -0.085906982421875, -0.0534515380859375, -0.02099609375, 0.0114593505859375, 0.043914794921875, 0.0763702392578125, 0.10882568359375, 0.1412811279296875, 0.173736572265625, 0.2061920166015625, 0.2386474609375, 0.2711029052734375, 0.303558349609375, 0.3360137939453125, 0.36846923828125, 0.4009246826171875, 0.433380126953125, 0.4658355712890625, 0.498291015625, 0.5307464599609375, 0.563201904296875, 0.5956573486328125, 0.62811279296875, 0.6605682373046875, 0.693023681640625, 0.7254791259765625, 0.7579345703125, 0.7903900146484375, 0.822845458984375, 0.8553009033203125, 0.88775634765625, 0.9202117919921875, 0.952667236328125, 0.9851226806640625, 1.017578125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 8.0, 6.0, 6.0, 10.0, 7.0, 16.0, 17.0, 23.0, 23.0, 32.0, 34.0, 28.0, 41.0, 36.0, 40.0, 53.0, 62.0, 46.0, 46.0, 54.0, 47.0, 53.0, 45.0, 38.0, 36.0, 33.0, 31.0, 23.0, 21.0, 12.0, 14.0, 17.0, 14.0, 5.0, 8.0, 9.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3508079051971436, -3.2532224655151367, -3.155637264251709, -3.0580520629882812, -2.9604666233062744, -2.8628811836242676, -2.76529598236084, -2.667710781097412, -2.5701253414154053, -2.4725399017333984, -2.3749547004699707, -2.277369499206543, -2.179784059524536, -2.0821986198425293, -1.9846134185791016, -1.8870280981063843, -1.789442777633667, -1.6918574571609497, -1.5942721366882324, -1.4966868162155151, -1.3991014957427979, -1.3015161752700806, -1.2039308547973633, -1.106345534324646, -1.0087602138519287, -0.9111748933792114, -0.8135895729064941, -0.7160042524337769, -0.6184189319610596, -0.5208336114883423, -0.423248291015625, -0.3256629705429077, -0.22807741165161133, -0.13049209117889404, -0.03290677070617676, 0.06467854976654053, 0.1622638702392578, 0.2598491907119751, 0.3574345111846924, 0.45501983165740967, 0.552605152130127, 0.6501904726028442, 0.7477757930755615, 0.8453611135482788, 0.9429464340209961, 1.0405317544937134, 1.1381170749664307, 1.235702395439148, 1.3332877159118652, 1.4308730363845825, 1.5284583568572998, 1.626043677330017, 1.7236289978027344, 1.8212143182754517, 1.918799638748169, 2.016385078430176, 2.1139702796936035, 2.2115554809570312, 2.309140920639038, 2.406726360321045, 2.5043115615844727, 2.6018967628479004, 2.6994822025299072, 2.797067642211914, 2.894652843475342]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 9.0, 2.0, 3.0, 6.0, 16.0, 14.0, 8.0, 16.0, 30.0, 23.0, 27.0, 27.0, 28.0, 34.0, 26.0, 32.0, 49.0, 49.0, 48.0, 42.0, 41.0, 34.0, 30.0, 39.0, 29.0, 39.0, 40.0, 33.0, 30.0, 30.0, 26.0, 18.0, 25.0, 19.0, 17.0, 12.0, 8.0, 6.0, 12.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.750286102294922, -2.670217990875244, -2.5901501178741455, -2.5100820064544678, -2.430014133453369, -2.3499460220336914, -2.2698781490325928, -2.189810037612915, -2.1097421646118164, -2.0296740531921387, -1.94960618019104, -1.8695381879806519, -1.7894701957702637, -1.7094022035598755, -1.6293342113494873, -1.5492660999298096, -1.4691981077194214, -1.3891301155090332, -1.309062123298645, -1.2289941310882568, -1.1489261388778687, -1.0688581466674805, -0.9887900948524475, -0.9087221026420593, -0.8286541104316711, -0.748586118221283, -0.6685181260108948, -0.5884500741958618, -0.5083820819854736, -0.42831411957740784, -0.34824609756469727, -0.2681781053543091, -0.1881101131439209, -0.10804211348295212, -0.027974113821983337, 0.05209389328956604, 0.13216188549995422, 0.2122298777103424, 0.292297899723053, 0.37236589193344116, 0.45243388414382935, 0.5325018763542175, 0.6125698685646057, 0.6926379203796387, 0.7727059125900269, 0.852773904800415, 0.9328418970108032, 1.0129098892211914, 1.0929778814315796, 1.1730458736419678, 1.253113865852356, 1.3331818580627441, 1.4132498502731323, 1.4933178424835205, 1.5733859539031982, 1.6534538269042969, 1.7335219383239746, 1.8135899305343628, 1.893657922744751, 1.9737259149551392, 2.0537939071655273, 2.133862018585205, 2.2139298915863037, 2.2939980030059814, 2.37406587600708]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 8.0, 17.0, 27.0, 25.0, 36.0, 45.0, 76.0, 119.0, 178.0, 251.0, 441.0, 734.0, 1246.0, 2374.0, 4394.0, 8666.0, 18709.0, 39206.0, 83009.0, 169491.0, 265414.0, 223873.0, 120114.0, 57149.0, 26871.0, 12506.0, 6161.0, 3138.0, 1664.0, 974.0, 584.0, 362.0, 238.0, 150.0, 97.0, 69.0, 48.0, 28.0, 13.0, 7.0, 12.0, 10.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.46484375, -2.38720703125, -2.3095703125, -2.23193359375, -2.154296875, -2.07666015625, -1.9990234375, -1.92138671875, -1.84375, -1.76611328125, -1.6884765625, -1.61083984375, -1.533203125, -1.45556640625, -1.3779296875, -1.30029296875, -1.22265625, -1.14501953125, -1.0673828125, -0.98974609375, -0.912109375, -0.83447265625, -0.7568359375, -0.67919921875, -0.6015625, -0.52392578125, -0.4462890625, -0.36865234375, -0.291015625, -0.21337890625, -0.1357421875, -0.05810546875, 0.01953125, 0.09716796875, 0.1748046875, 0.25244140625, 0.330078125, 0.40771484375, 0.4853515625, 0.56298828125, 0.640625, 0.71826171875, 0.7958984375, 0.87353515625, 0.951171875, 1.02880859375, 1.1064453125, 1.18408203125, 1.26171875, 1.33935546875, 1.4169921875, 1.49462890625, 1.572265625, 1.64990234375, 1.7275390625, 1.80517578125, 1.8828125, 1.96044921875, 2.0380859375, 2.11572265625, 2.193359375, 2.27099609375, 2.3486328125, 2.42626953125, 2.50390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 6.0, 5.0, 11.0, 6.0, 12.0, 16.0, 10.0, 20.0, 22.0, 24.0, 18.0, 18.0, 39.0, 33.0, 39.0, 35.0, 38.0, 45.0, 44.0, 39.0, 40.0, 39.0, 38.0, 31.0, 32.0, 40.0, 35.0, 28.0, 23.0, 30.0, 33.0, 31.0, 19.0, 12.0, 15.0, 13.0, 10.0, 12.0, 11.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.71484375, -2.633209228515625, -2.55157470703125, -2.469940185546875, -2.3883056640625, -2.306671142578125, -2.22503662109375, -2.143402099609375, -2.061767578125, -1.980133056640625, -1.89849853515625, -1.816864013671875, -1.7352294921875, -1.653594970703125, -1.57196044921875, -1.490325927734375, -1.40869140625, -1.327056884765625, -1.24542236328125, -1.163787841796875, -1.0821533203125, -1.000518798828125, -0.91888427734375, -0.837249755859375, -0.755615234375, -0.673980712890625, -0.59234619140625, -0.510711669921875, -0.4290771484375, -0.347442626953125, -0.26580810546875, -0.184173583984375, -0.1025390625, -0.020904541015625, 0.06072998046875, 0.142364501953125, 0.2239990234375, 0.305633544921875, 0.38726806640625, 0.468902587890625, 0.550537109375, 0.632171630859375, 0.71380615234375, 0.795440673828125, 0.8770751953125, 0.958709716796875, 1.04034423828125, 1.121978759765625, 1.20361328125, 1.285247802734375, 1.36688232421875, 1.448516845703125, 1.5301513671875, 1.611785888671875, 1.69342041015625, 1.775054931640625, 1.856689453125, 1.938323974609375, 2.01995849609375, 2.101593017578125, 2.1832275390625, 2.264862060546875, 2.34649658203125, 2.428131103515625, 2.509765625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 11.0, 11.0, 22.0, 25.0, 37.0, 51.0, 73.0, 114.0, 174.0, 279.0, 396.0, 624.0, 976.0, 1635.0, 2886.0, 5246.0, 9743.0, 19743.0, 41563.0, 89975.0, 191591.0, 294144.0, 203112.0, 96953.0, 44387.0, 21044.0, 10648.0, 5398.0, 2984.0, 1767.0, 1083.0, 633.0, 440.0, 234.0, 206.0, 118.0, 64.0, 58.0, 33.0, 26.0, 17.0, 11.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.669525146484375, -1.60662841796875, -1.543731689453125, -1.4808349609375, -1.417938232421875, -1.35504150390625, -1.292144775390625, -1.229248046875, -1.166351318359375, -1.10345458984375, -1.040557861328125, -0.9776611328125, -0.914764404296875, -0.85186767578125, -0.788970947265625, -0.72607421875, -0.663177490234375, -0.60028076171875, -0.537384033203125, -0.4744873046875, -0.411590576171875, -0.34869384765625, -0.285797119140625, -0.222900390625, -0.160003662109375, -0.09710693359375, -0.034210205078125, 0.0286865234375, 0.091583251953125, 0.15447998046875, 0.217376708984375, 0.2802734375, 0.343170166015625, 0.40606689453125, 0.468963623046875, 0.5318603515625, 0.594757080078125, 0.65765380859375, 0.720550537109375, 0.783447265625, 0.846343994140625, 0.90924072265625, 0.972137451171875, 1.0350341796875, 1.097930908203125, 1.16082763671875, 1.223724365234375, 1.28662109375, 1.349517822265625, 1.41241455078125, 1.475311279296875, 1.5382080078125, 1.601104736328125, 1.66400146484375, 1.726898193359375, 1.789794921875, 1.852691650390625, 1.91558837890625, 1.978485107421875, 2.0413818359375, 2.104278564453125, 2.16717529296875, 2.230072021484375, 2.29296875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 6.0, 3.0, 6.0, 11.0, 9.0, 17.0, 15.0, 16.0, 20.0, 30.0, 27.0, 36.0, 38.0, 31.0, 44.0, 39.0, 42.0, 46.0, 48.0, 46.0, 35.0, 44.0, 41.0, 36.0, 32.0, 30.0, 41.0, 27.0, 29.0, 22.0, 22.0, 16.0, 19.0, 11.0, 14.0, 10.0, 8.0, 7.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67578125, -1.61602783203125, -1.5562744140625, -1.49652099609375, -1.436767578125, -1.37701416015625, -1.3172607421875, -1.25750732421875, -1.19775390625, -1.13800048828125, -1.0782470703125, -1.01849365234375, -0.958740234375, -0.89898681640625, -0.8392333984375, -0.77947998046875, -0.7197265625, -0.65997314453125, -0.6002197265625, -0.54046630859375, -0.480712890625, -0.42095947265625, -0.3612060546875, -0.30145263671875, -0.24169921875, -0.18194580078125, -0.1221923828125, -0.06243896484375, -0.002685546875, 0.05706787109375, 0.1168212890625, 0.17657470703125, 0.236328125, 0.29608154296875, 0.3558349609375, 0.41558837890625, 0.475341796875, 0.53509521484375, 0.5948486328125, 0.65460205078125, 0.71435546875, 0.77410888671875, 0.8338623046875, 0.89361572265625, 0.953369140625, 1.01312255859375, 1.0728759765625, 1.13262939453125, 1.1923828125, 1.25213623046875, 1.3118896484375, 1.37164306640625, 1.431396484375, 1.49114990234375, 1.5509033203125, 1.61065673828125, 1.67041015625, 1.73016357421875, 1.7899169921875, 1.84967041015625, 1.909423828125, 1.96917724609375, 2.0289306640625, 2.08868408203125, 2.1484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 14.0, 16.0, 23.0, 17.0, 20.0, 37.0, 44.0, 53.0, 71.0, 87.0, 132.0, 177.0, 209.0, 313.0, 436.0, 599.0, 1003.0, 1487.0, 2583.0, 4692.0, 10438.0, 31674.0, 187744.0, 665094.0, 101128.0, 22067.0, 8155.0, 3914.0, 2080.0, 1276.0, 855.0, 547.0, 417.0, 290.0, 186.0, 156.0, 113.0, 98.0, 61.0, 51.0, 48.0, 38.0, 19.0, 16.0, 16.0, 10.0, 11.0, 10.0, 8.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.28515625, -2.2122802734375, -2.139404296875, -2.0665283203125, -1.99365234375, -1.9207763671875, -1.847900390625, -1.7750244140625, -1.7021484375, -1.6292724609375, -1.556396484375, -1.4835205078125, -1.41064453125, -1.3377685546875, -1.264892578125, -1.1920166015625, -1.119140625, -1.0462646484375, -0.973388671875, -0.9005126953125, -0.82763671875, -0.7547607421875, -0.681884765625, -0.6090087890625, -0.5361328125, -0.4632568359375, -0.390380859375, -0.3175048828125, -0.24462890625, -0.1717529296875, -0.098876953125, -0.0260009765625, 0.046875, 0.1197509765625, 0.192626953125, 0.2655029296875, 0.33837890625, 0.4112548828125, 0.484130859375, 0.5570068359375, 0.6298828125, 0.7027587890625, 0.775634765625, 0.8485107421875, 0.92138671875, 0.9942626953125, 1.067138671875, 1.1400146484375, 1.212890625, 1.2857666015625, 1.358642578125, 1.4315185546875, 1.50439453125, 1.5772705078125, 1.650146484375, 1.7230224609375, 1.7958984375, 1.8687744140625, 1.941650390625, 2.0145263671875, 2.08740234375, 2.1602783203125, 2.233154296875, 2.3060302734375, 2.37890625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 10.0, 12.0, 14.0, 16.0, 26.0, 52.0, 55.0, 113.0, 118.0, 114.0, 126.0, 92.0, 86.0, 44.0, 35.0, 16.0, 10.0, 12.0, 11.0, 7.0, 2.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00014328956604003906, -0.00013889558613300323, -0.0001345016062259674, -0.00013010762631893158, -0.00012571364641189575, -0.00012131966650485992, -0.0001169256865978241, -0.00011253170669078827, -0.00010813772678375244, -0.00010374374687671661, -9.934976696968079e-05, -9.495578706264496e-05, -9.056180715560913e-05, -8.61678272485733e-05, -8.177384734153748e-05, -7.737986743450165e-05, -7.298588752746582e-05, -6.859190762042999e-05, -6.419792771339417e-05, -5.980394780635834e-05, -5.540996789932251e-05, -5.101598799228668e-05, -4.6622008085250854e-05, -4.222802817821503e-05, -3.78340482711792e-05, -3.344006836414337e-05, -2.9046088457107544e-05, -2.4652108550071716e-05, -2.025812864303589e-05, -1.586414873600006e-05, -1.1470168828964233e-05, -7.076188921928406e-06, -2.682209014892578e-06, 1.7117708921432495e-06, 6.105750799179077e-06, 1.0499730706214905e-05, 1.4893710613250732e-05, 1.928769052028656e-05, 2.3681670427322388e-05, 2.8075650334358215e-05, 3.246963024139404e-05, 3.686361014842987e-05, 4.12575900554657e-05, 4.5651569962501526e-05, 5.0045549869537354e-05, 5.443952977657318e-05, 5.883350968360901e-05, 6.322748959064484e-05, 6.762146949768066e-05, 7.201544940471649e-05, 7.640942931175232e-05, 8.080340921878815e-05, 8.519738912582397e-05, 8.95913690328598e-05, 9.398534893989563e-05, 9.837932884693146e-05, 0.00010277330875396729, 0.00010716728866100311, 0.00011156126856803894, 0.00011595524847507477, 0.0001203492283821106, 0.00012474320828914642, 0.00012913718819618225, 0.00013353116810321808, 0.0001379251480102539]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 9.0, 13.0, 16.0, 17.0, 37.0, 36.0, 42.0, 64.0, 103.0, 157.0, 179.0, 245.0, 329.0, 498.0, 680.0, 924.0, 1231.0, 1853.0, 2985.0, 4684.0, 8207.0, 17532.0, 44549.0, 130059.0, 336648.0, 308034.0, 113843.0, 39050.0, 15756.0, 7590.0, 4355.0, 2657.0, 1758.0, 1201.0, 914.0, 620.0, 461.0, 338.0, 223.0, 175.0, 137.0, 94.0, 72.0, 66.0, 31.0, 20.0, 17.0, 18.0, 11.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.50390625, -1.455291748046875, -1.40667724609375, -1.358062744140625, -1.3094482421875, -1.260833740234375, -1.21221923828125, -1.163604736328125, -1.114990234375, -1.066375732421875, -1.01776123046875, -0.969146728515625, -0.9205322265625, -0.871917724609375, -0.82330322265625, -0.774688720703125, -0.72607421875, -0.677459716796875, -0.62884521484375, -0.580230712890625, -0.5316162109375, -0.483001708984375, -0.43438720703125, -0.385772705078125, -0.337158203125, -0.288543701171875, -0.23992919921875, -0.191314697265625, -0.1427001953125, -0.094085693359375, -0.04547119140625, 0.003143310546875, 0.0517578125, 0.100372314453125, 0.14898681640625, 0.197601318359375, 0.2462158203125, 0.294830322265625, 0.34344482421875, 0.392059326171875, 0.440673828125, 0.489288330078125, 0.53790283203125, 0.586517333984375, 0.6351318359375, 0.683746337890625, 0.73236083984375, 0.780975341796875, 0.82958984375, 0.878204345703125, 0.92681884765625, 0.975433349609375, 1.0240478515625, 1.072662353515625, 1.12127685546875, 1.169891357421875, 1.218505859375, 1.267120361328125, 1.31573486328125, 1.364349365234375, 1.4129638671875, 1.461578369140625, 1.51019287109375, 1.558807373046875, 1.607421875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 8.0, 9.0, 5.0, 13.0, 12.0, 10.0, 28.0, 20.0, 31.0, 44.0, 63.0, 68.0, 76.0, 105.0, 103.0, 76.0, 69.0, 56.0, 45.0, 39.0, 21.0, 18.0, 13.0, 12.0, 11.0, 7.0, 2.0, 2.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.365966796875, -0.3542289733886719, -0.34249114990234375, -0.3307533264160156, -0.3190155029296875, -0.3072776794433594, -0.29553985595703125, -0.2838020324707031, -0.272064208984375, -0.2603263854980469, -0.24858856201171875, -0.23685073852539062, -0.2251129150390625, -0.21337509155273438, -0.20163726806640625, -0.18989944458007812, -0.17816162109375, -0.16642379760742188, -0.15468597412109375, -0.14294815063476562, -0.1312103271484375, -0.11947250366210938, -0.10773468017578125, -0.09599685668945312, -0.084259033203125, -0.07252120971679688, -0.06078338623046875, -0.049045562744140625, -0.0373077392578125, -0.025569915771484375, -0.01383209228515625, -0.002094268798828125, 0.0096435546875, 0.021381378173828125, 0.03311920166015625, 0.044857025146484375, 0.0565948486328125, 0.06833267211914062, 0.08007049560546875, 0.09180831909179688, 0.103546142578125, 0.11528396606445312, 0.12702178955078125, 0.13875961303710938, 0.1504974365234375, 0.16223526000976562, 0.17397308349609375, 0.18571090698242188, 0.19744873046875, 0.20918655395507812, 0.22092437744140625, 0.23266220092773438, 0.2444000244140625, 0.2561378479003906, 0.26787567138671875, 0.2796134948730469, 0.291351318359375, 0.3030891418457031, 0.31482696533203125, 0.3265647888183594, 0.3383026123046875, 0.3500404357910156, 0.36177825927734375, 0.3735160827636719, 0.38525390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 2.0, 5.0, 10.0, 18.0, 20.0, 12.0, 20.0, 32.0, 27.0, 27.0, 31.0, 30.0, 33.0, 56.0, 55.0, 62.0, 51.0, 46.0, 54.0, 43.0, 46.0, 46.0, 42.0, 39.0, 26.0, 31.0, 34.0, 20.0, 9.0, 12.0, 13.0, 16.0, 6.0, 5.0, 7.0, 3.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265214204788208, -3.1674351692199707, -3.0696561336517334, -2.971877098083496, -2.874098062515259, -2.7763190269470215, -2.678539991378784, -2.580760955810547, -2.4829819202423096, -2.3852028846740723, -2.287423849105835, -2.1896448135375977, -2.0918657779693604, -1.994086742401123, -1.8963077068328857, -1.7985286712646484, -1.7007497549057007, -1.6029707193374634, -1.505191683769226, -1.4074126482009888, -1.3096336126327515, -1.2118545770645142, -1.1140756607055664, -1.016296625137329, -0.918517529964447, -0.8207384943962097, -0.7229594588279724, -0.6251804828643799, -0.5274014472961426, -0.4296223819255829, -0.33184337615966797, -0.23406434059143066, -0.13628530502319336, -0.03850627690553665, 0.059272751212120056, 0.15705177187919617, 0.25483080744743347, 0.3526098430156708, 0.4503888487815857, 0.548167884349823, 0.6459469199180603, 0.7437259554862976, 0.8415049910545349, 0.9392839670181274, 1.0370630025863647, 1.134842038154602, 1.2326210737228394, 1.3304001092910767, 1.428179144859314, 1.5259581804275513, 1.6237372159957886, 1.7215162515640259, 1.8192952871322632, 1.9170743227005005, 2.0148532390594482, 2.1126322746276855, 2.210411310195923, 2.30819034576416, 2.4059693813323975, 2.5037484169006348, 2.601527452468872, 2.6993064880371094, 2.7970855236053467, 2.894864559173584, 2.9926435947418213]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 7.0, 13.0, 12.0, 11.0, 18.0, 20.0, 30.0, 31.0, 23.0, 27.0, 25.0, 28.0, 39.0, 48.0, 48.0, 38.0, 34.0, 45.0, 48.0, 28.0, 33.0, 31.0, 35.0, 38.0, 35.0, 30.0, 23.0, 36.0, 20.0, 23.0, 19.0, 19.0, 16.0, 10.0, 4.0, 12.0, 10.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.642449140548706, -2.5643460750579834, -2.4862427711486816, -2.408139705657959, -2.3300366401672363, -2.2519335746765137, -2.173830270767212, -2.0957272052764893, -2.0176239013671875, -1.9395207166671753, -1.8614176511764526, -1.7833144664764404, -1.7052114009857178, -1.6271082162857056, -1.5490050315856934, -1.4709019660949707, -1.392798900604248, -1.3146957159042358, -1.2365926504135132, -1.158489465713501, -1.0803864002227783, -1.0022832155227661, -0.9241800308227539, -0.8460769057273865, -0.767973780632019, -0.6898706555366516, -0.6117675304412842, -0.533664345741272, -0.45556122064590454, -0.3774580955505371, -0.2993549406528473, -0.22125178575515747, -0.14314889907836914, -0.06504575908184052, 0.01305738091468811, 0.09116052091121674, 0.16926366090774536, 0.2473667860031128, 0.3254699409008026, 0.40357309579849243, 0.48167622089385986, 0.5597793459892273, 0.6378824710845947, 0.7159856557846069, 0.7940887808799744, 0.8721919059753418, 0.950295090675354, 1.0283982753753662, 1.1065013408660889, 1.184604525566101, 1.2627075910568237, 1.340810775756836, 1.4189138412475586, 1.4970170259475708, 1.575120210647583, 1.6532232761383057, 1.7313264608383179, 1.80942964553833, 1.8875327110290527, 1.965635895729065, 2.043739080429077, 2.1218421459198, 2.1999452114105225, 2.278048515319824, 2.356151580810547]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 13.0, 17.0, 37.0, 36.0, 61.0, 97.0, 158.0, 210.0, 363.0, 574.0, 894.0, 1542.0, 2436.0, 3994.0, 6380.0, 9952.0, 15611.0, 23825.0, 35609.0, 51795.0, 70984.0, 91955.0, 110038.0, 119786.0, 117408.0, 104729.0, 84257.0, 63918.0, 45160.0, 30615.0, 20240.0, 13445.0, 8208.0, 5314.0, 3329.0, 2143.0, 1316.0, 769.0, 509.0, 328.0, 169.0, 115.0, 80.0, 53.0, 33.0, 24.0, 12.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.826171875, -2.74005126953125, -2.6539306640625, -2.56781005859375, -2.481689453125, -2.39556884765625, -2.3094482421875, -2.22332763671875, -2.13720703125, -2.05108642578125, -1.9649658203125, -1.87884521484375, -1.792724609375, -1.70660400390625, -1.6204833984375, -1.53436279296875, -1.4482421875, -1.36212158203125, -1.2760009765625, -1.18988037109375, -1.103759765625, -1.01763916015625, -0.9315185546875, -0.84539794921875, -0.75927734375, -0.67315673828125, -0.5870361328125, -0.50091552734375, -0.414794921875, -0.32867431640625, -0.2425537109375, -0.15643310546875, -0.0703125, 0.01580810546875, 0.1019287109375, 0.18804931640625, 0.274169921875, 0.36029052734375, 0.4464111328125, 0.53253173828125, 0.61865234375, 0.70477294921875, 0.7908935546875, 0.87701416015625, 0.963134765625, 1.04925537109375, 1.1353759765625, 1.22149658203125, 1.3076171875, 1.39373779296875, 1.4798583984375, 1.56597900390625, 1.652099609375, 1.73822021484375, 1.8243408203125, 1.91046142578125, 1.99658203125, 2.08270263671875, 2.1688232421875, 2.25494384765625, 2.341064453125, 2.42718505859375, 2.5133056640625, 2.59942626953125, 2.685546875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 7.0, 10.0, 4.0, 16.0, 14.0, 17.0, 22.0, 17.0, 27.0, 27.0, 36.0, 32.0, 32.0, 35.0, 45.0, 32.0, 44.0, 47.0, 34.0, 37.0, 38.0, 48.0, 36.0, 38.0, 23.0, 34.0, 35.0, 21.0, 23.0, 29.0, 19.0, 24.0, 22.0, 14.0, 10.0, 10.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.6484375, -2.57012939453125, -2.4918212890625, -2.41351318359375, -2.335205078125, -2.25689697265625, -2.1785888671875, -2.10028076171875, -2.02197265625, -1.94366455078125, -1.8653564453125, -1.78704833984375, -1.708740234375, -1.63043212890625, -1.5521240234375, -1.47381591796875, -1.3955078125, -1.31719970703125, -1.2388916015625, -1.16058349609375, -1.082275390625, -1.00396728515625, -0.9256591796875, -0.84735107421875, -0.76904296875, -0.69073486328125, -0.6124267578125, -0.53411865234375, -0.455810546875, -0.37750244140625, -0.2991943359375, -0.22088623046875, -0.142578125, -0.06427001953125, 0.0140380859375, 0.09234619140625, 0.170654296875, 0.24896240234375, 0.3272705078125, 0.40557861328125, 0.48388671875, 0.56219482421875, 0.6405029296875, 0.71881103515625, 0.797119140625, 0.87542724609375, 0.9537353515625, 1.03204345703125, 1.1103515625, 1.18865966796875, 1.2669677734375, 1.34527587890625, 1.423583984375, 1.50189208984375, 1.5802001953125, 1.65850830078125, 1.73681640625, 1.81512451171875, 1.8934326171875, 1.97174072265625, 2.050048828125, 2.12835693359375, 2.2066650390625, 2.28497314453125, 2.36328125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 13.0, 13.0, 10.0, 16.0, 33.0, 48.0, 86.0, 86.0, 128.0, 190.0, 325.0, 462.0, 739.0, 1079.0, 1589.0, 2474.0, 3640.0, 5332.0, 8377.0, 12243.0, 18133.0, 26326.0, 37081.0, 51792.0, 67703.0, 84323.0, 98260.0, 107617.0, 107504.0, 98450.0, 83229.0, 66027.0, 49940.0, 36218.0, 25937.0, 17412.0, 11973.0, 8121.0, 5262.0, 3438.0, 2274.0, 1558.0, 1041.0, 623.0, 485.0, 303.0, 195.0, 132.0, 107.0, 71.0, 59.0, 28.0, 10.0, 20.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0], "bins": [-2.330078125, -2.257171630859375, -2.18426513671875, -2.111358642578125, -2.0384521484375, -1.965545654296875, -1.89263916015625, -1.819732666015625, -1.746826171875, -1.673919677734375, -1.60101318359375, -1.528106689453125, -1.4552001953125, -1.382293701171875, -1.30938720703125, -1.236480712890625, -1.16357421875, -1.090667724609375, -1.01776123046875, -0.944854736328125, -0.8719482421875, -0.799041748046875, -0.72613525390625, -0.653228759765625, -0.580322265625, -0.507415771484375, -0.43450927734375, -0.361602783203125, -0.2886962890625, -0.215789794921875, -0.14288330078125, -0.069976806640625, 0.0029296875, 0.075836181640625, 0.14874267578125, 0.221649169921875, 0.2945556640625, 0.367462158203125, 0.44036865234375, 0.513275146484375, 0.586181640625, 0.659088134765625, 0.73199462890625, 0.804901123046875, 0.8778076171875, 0.950714111328125, 1.02362060546875, 1.096527099609375, 1.16943359375, 1.242340087890625, 1.31524658203125, 1.388153076171875, 1.4610595703125, 1.533966064453125, 1.60687255859375, 1.679779052734375, 1.752685546875, 1.825592041015625, 1.89849853515625, 1.971405029296875, 2.0443115234375, 2.117218017578125, 2.19012451171875, 2.263031005859375, 2.3359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 10.0, 5.0, 5.0, 5.0, 9.0, 9.0, 7.0, 16.0, 14.0, 11.0, 17.0, 21.0, 25.0, 20.0, 33.0, 26.0, 38.0, 35.0, 40.0, 32.0, 32.0, 40.0, 45.0, 37.0, 50.0, 38.0, 28.0, 30.0, 33.0, 30.0, 29.0, 17.0, 20.0, 22.0, 18.0, 20.0, 20.0, 26.0, 12.0, 13.0, 14.0, 13.0, 11.0, 5.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.43359375, -1.387115478515625, -1.34063720703125, -1.294158935546875, -1.2476806640625, -1.201202392578125, -1.15472412109375, -1.108245849609375, -1.061767578125, -1.015289306640625, -0.96881103515625, -0.922332763671875, -0.8758544921875, -0.829376220703125, -0.78289794921875, -0.736419677734375, -0.68994140625, -0.643463134765625, -0.59698486328125, -0.550506591796875, -0.5040283203125, -0.457550048828125, -0.41107177734375, -0.364593505859375, -0.318115234375, -0.271636962890625, -0.22515869140625, -0.178680419921875, -0.1322021484375, -0.085723876953125, -0.03924560546875, 0.007232666015625, 0.0537109375, 0.100189208984375, 0.14666748046875, 0.193145751953125, 0.2396240234375, 0.286102294921875, 0.33258056640625, 0.379058837890625, 0.425537109375, 0.472015380859375, 0.51849365234375, 0.564971923828125, 0.6114501953125, 0.657928466796875, 0.70440673828125, 0.750885009765625, 0.79736328125, 0.843841552734375, 0.89031982421875, 0.936798095703125, 0.9832763671875, 1.029754638671875, 1.07623291015625, 1.122711181640625, 1.169189453125, 1.215667724609375, 1.26214599609375, 1.308624267578125, 1.3551025390625, 1.401580810546875, 1.44805908203125, 1.494537353515625, 1.541015625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 9.0, 20.0, 28.0, 47.0, 56.0, 70.0, 116.0, 175.0, 244.0, 368.0, 528.0, 736.0, 1116.0, 1884.0, 3040.0, 5412.0, 9753.0, 19544.0, 43548.0, 100710.0, 209204.0, 280337.0, 198141.0, 92559.0, 40248.0, 18322.0, 9207.0, 5009.0, 2899.0, 1810.0, 1038.0, 726.0, 498.0, 348.0, 254.0, 167.0, 114.0, 81.0, 52.0, 31.0, 21.0, 22.0, 13.0, 16.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05859375, -2.954742431640625, -2.85089111328125, -2.747039794921875, -2.6431884765625, -2.539337158203125, -2.43548583984375, -2.331634521484375, -2.227783203125, -2.123931884765625, -2.02008056640625, -1.916229248046875, -1.8123779296875, -1.708526611328125, -1.60467529296875, -1.500823974609375, -1.39697265625, -1.293121337890625, -1.18927001953125, -1.085418701171875, -0.9815673828125, -0.877716064453125, -0.77386474609375, -0.670013427734375, -0.566162109375, -0.462310791015625, -0.35845947265625, -0.254608154296875, -0.1507568359375, -0.046905517578125, 0.05694580078125, 0.160797119140625, 0.2646484375, 0.368499755859375, 0.47235107421875, 0.576202392578125, 0.6800537109375, 0.783905029296875, 0.88775634765625, 0.991607666015625, 1.095458984375, 1.199310302734375, 1.30316162109375, 1.407012939453125, 1.5108642578125, 1.614715576171875, 1.71856689453125, 1.822418212890625, 1.92626953125, 2.030120849609375, 2.13397216796875, 2.237823486328125, 2.3416748046875, 2.445526123046875, 2.54937744140625, 2.653228759765625, 2.757080078125, 2.860931396484375, 2.96478271484375, 3.068634033203125, 3.1724853515625, 3.276336669921875, 3.38018798828125, 3.484039306640625, 3.587890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 6.0, 14.0, 8.0, 20.0, 38.0, 64.0, 75.0, 109.0, 111.0, 107.0, 124.0, 91.0, 65.0, 52.0, 33.0, 23.0, 20.0, 4.0, 5.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004410743713378906, -0.0004278421401977539, -0.0004146099090576172, -0.00040137767791748047, -0.00038814544677734375, -0.00037491321563720703, -0.0003616809844970703, -0.0003484487533569336, -0.0003352165222167969, -0.00032198429107666016, -0.00030875205993652344, -0.0002955198287963867, -0.00028228759765625, -0.0002690553665161133, -0.00025582313537597656, -0.00024259090423583984, -0.00022935867309570312, -0.0002161264419555664, -0.0002028942108154297, -0.00018966197967529297, -0.00017642974853515625, -0.00016319751739501953, -0.0001499652862548828, -0.0001367330551147461, -0.00012350082397460938, -0.00011026859283447266, -9.703636169433594e-05, -8.380413055419922e-05, -7.05718994140625e-05, -5.733966827392578e-05, -4.410743713378906e-05, -3.0875205993652344e-05, -1.7642974853515625e-05, -4.410743713378906e-06, 8.821487426757812e-06, 2.205371856689453e-05, 3.528594970703125e-05, 4.851818084716797e-05, 6.175041198730469e-05, 7.49826431274414e-05, 8.821487426757812e-05, 0.00010144710540771484, 0.00011467933654785156, 0.00012791156768798828, 0.000141143798828125, 0.00015437602996826172, 0.00016760826110839844, 0.00018084049224853516, 0.00019407272338867188, 0.0002073049545288086, 0.0002205371856689453, 0.00023376941680908203, 0.00024700164794921875, 0.00026023387908935547, 0.0002734661102294922, 0.0002866983413696289, 0.0002999305725097656, 0.00031316280364990234, 0.00032639503479003906, 0.0003396272659301758, 0.0003528594970703125, 0.0003660917282104492, 0.00037932395935058594, 0.00039255619049072266, 0.0004057884216308594]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 7.0, 16.0, 21.0, 36.0, 39.0, 55.0, 59.0, 115.0, 178.0, 278.0, 408.0, 621.0, 940.0, 1536.0, 2281.0, 3789.0, 6237.0, 10406.0, 18017.0, 30099.0, 50877.0, 83858.0, 126549.0, 163657.0, 169286.0, 138581.0, 94878.0, 58745.0, 35242.0, 20592.0, 11919.0, 7235.0, 4366.0, 2700.0, 1789.0, 1070.0, 684.0, 459.0, 290.0, 195.0, 135.0, 99.0, 58.0, 51.0, 29.0, 20.0, 16.0, 6.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.78515625, -1.7278289794921875, -1.670501708984375, -1.6131744384765625, -1.55584716796875, -1.4985198974609375, -1.441192626953125, -1.3838653564453125, -1.3265380859375, -1.2692108154296875, -1.211883544921875, -1.1545562744140625, -1.09722900390625, -1.0399017333984375, -0.982574462890625, -0.9252471923828125, -0.867919921875, -0.8105926513671875, -0.753265380859375, -0.6959381103515625, -0.63861083984375, -0.5812835693359375, -0.523956298828125, -0.4666290283203125, -0.4093017578125, -0.3519744873046875, -0.294647216796875, -0.2373199462890625, -0.17999267578125, -0.1226654052734375, -0.065338134765625, -0.0080108642578125, 0.04931640625, 0.1066436767578125, 0.163970947265625, 0.2212982177734375, 0.27862548828125, 0.3359527587890625, 0.393280029296875, 0.4506072998046875, 0.5079345703125, 0.5652618408203125, 0.622589111328125, 0.6799163818359375, 0.73724365234375, 0.7945709228515625, 0.851898193359375, 0.9092254638671875, 0.966552734375, 1.0238800048828125, 1.081207275390625, 1.1385345458984375, 1.19586181640625, 1.2531890869140625, 1.310516357421875, 1.3678436279296875, 1.4251708984375, 1.4824981689453125, 1.539825439453125, 1.5971527099609375, 1.65447998046875, 1.7118072509765625, 1.769134521484375, 1.8264617919921875, 1.8837890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 9.0, 11.0, 6.0, 8.0, 15.0, 14.0, 15.0, 23.0, 22.0, 32.0, 37.0, 31.0, 38.0, 51.0, 49.0, 39.0, 45.0, 45.0, 50.0, 60.0, 58.0, 34.0, 33.0, 31.0, 39.0, 31.0, 23.0, 21.0, 24.0, 8.0, 19.0, 12.0, 6.0, 9.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0], "bins": [-0.51513671875, -0.49948883056640625, -0.4838409423828125, -0.46819305419921875, -0.452545166015625, -0.43689727783203125, -0.4212493896484375, -0.40560150146484375, -0.38995361328125, -0.37430572509765625, -0.3586578369140625, -0.34300994873046875, -0.327362060546875, -0.31171417236328125, -0.2960662841796875, -0.28041839599609375, -0.2647705078125, -0.24912261962890625, -0.2334747314453125, -0.21782684326171875, -0.202178955078125, -0.18653106689453125, -0.1708831787109375, -0.15523529052734375, -0.13958740234375, -0.12393951416015625, -0.1082916259765625, -0.09264373779296875, -0.076995849609375, -0.06134796142578125, -0.0457000732421875, -0.03005218505859375, -0.014404296875, 0.00124359130859375, 0.0168914794921875, 0.03253936767578125, 0.048187255859375, 0.06383514404296875, 0.0794830322265625, 0.09513092041015625, 0.11077880859375, 0.12642669677734375, 0.1420745849609375, 0.15772247314453125, 0.173370361328125, 0.18901824951171875, 0.2046661376953125, 0.22031402587890625, 0.2359619140625, 0.25160980224609375, 0.2672576904296875, 0.28290557861328125, 0.298553466796875, 0.31420135498046875, 0.3298492431640625, 0.34549713134765625, 0.36114501953125, 0.37679290771484375, 0.3924407958984375, 0.40808868408203125, 0.423736572265625, 0.43938446044921875, 0.4550323486328125, 0.47068023681640625, 0.486328125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 7.0, 6.0, 9.0, 12.0, 18.0, 20.0, 20.0, 18.0, 23.0, 25.0, 30.0, 27.0, 40.0, 38.0, 53.0, 49.0, 32.0, 47.0, 50.0, 56.0, 43.0, 36.0, 44.0, 40.0, 33.0, 25.0, 26.0, 30.0, 24.0, 17.0, 18.0, 13.0, 17.0, 11.0, 2.0, 9.0, 8.0, 5.0, 2.0, 2.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.74275541305542, -2.6544618606567383, -2.5661680698394775, -2.477874279022217, -2.389580726623535, -2.3012871742248535, -2.2129933834075928, -2.124699592590332, -2.0364060401916504, -1.9481123685836792, -1.859818696975708, -1.7715250253677368, -1.6832313537597656, -1.5949376821517944, -1.5066440105438232, -1.418350338935852, -1.3300566673278809, -1.2417629957199097, -1.1534693241119385, -1.0651756525039673, -0.9768819808959961, -0.8885883092880249, -0.8002946376800537, -0.7120009660720825, -0.6237072944641113, -0.5354136228561401, -0.44711995124816895, -0.35882627964019775, -0.27053260803222656, -0.18223893642425537, -0.09394526481628418, -0.005651593208312988, 0.0826418399810791, 0.1709355115890503, 0.2592291831970215, 0.3475228548049927, 0.43581652641296387, 0.5241101980209351, 0.6124038696289062, 0.7006975412368774, 0.7889912128448486, 0.8772848844528198, 0.965578556060791, 1.0538722276687622, 1.1421658992767334, 1.2304595708847046, 1.3187532424926758, 1.407046914100647, 1.4953405857086182, 1.5836342573165894, 1.6719279289245605, 1.7602216005325317, 1.848515272140503, 1.9368089437484741, 2.0251026153564453, 2.113396167755127, 2.2016899585723877, 2.2899837493896484, 2.37827730178833, 2.4665708541870117, 2.5548646450042725, 2.643158435821533, 2.731451988220215, 2.8197455406188965, 2.9080393314361572]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 12.0, 17.0, 13.0, 12.0, 18.0, 18.0, 11.0, 21.0, 21.0, 22.0, 29.0, 25.0, 35.0, 44.0, 31.0, 45.0, 38.0, 35.0, 41.0, 38.0, 50.0, 36.0, 35.0, 30.0, 35.0, 29.0, 31.0, 25.0, 26.0, 20.0, 23.0, 24.0, 17.0, 17.0, 13.0, 9.0, 7.0, 8.0, 1.0, 7.0, 7.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5127570629119873, -2.4362292289733887, -2.35970139503479, -2.2831737995147705, -2.206645965576172, -2.1301181316375732, -2.0535902976989746, -1.977062463760376, -1.900534749031067, -1.8240069150924683, -1.7474792003631592, -1.6709513664245605, -1.594423532485962, -1.5178958177566528, -1.4413679838180542, -1.3648402690887451, -1.2883124351501465, -1.2117846012115479, -1.1352568864822388, -1.0587290525436401, -0.9822012782096863, -0.9056735038757324, -0.8291456699371338, -0.7526178956031799, -0.6760901212692261, -0.5995623469352722, -0.5230345726013184, -0.4465067386627197, -0.36997896432876587, -0.293451189994812, -0.21692338585853577, -0.14039558172225952, -0.06386804580688477, 0.012659743428230286, 0.08918753266334534, 0.1657153218984604, 0.24224311113357544, 0.3187708854675293, 0.39529868960380554, 0.4718264937400818, 0.5483542680740356, 0.6248820424079895, 0.7014098167419434, 0.777937650680542, 0.8544654250144958, 0.9309931993484497, 1.0075210332870483, 1.0840487480163574, 1.160576581954956, 1.2371044158935547, 1.3136321306228638, 1.3901599645614624, 1.4666876792907715, 1.5432155132293701, 1.6197433471679688, 1.6962711811065674, 1.7727988958358765, 1.849326729774475, 1.9258544445037842, 2.002382278442383, 2.0789101123809814, 2.15543794631958, 2.2319655418395996, 2.3084933757781982, 2.385021209716797]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 6.0, 6.0, 10.0, 21.0, 21.0, 41.0, 82.0, 159.0, 239.0, 390.0, 668.0, 1130.0, 1920.0, 3135.0, 5245.0, 8943.0, 15356.0, 26283.0, 43784.0, 73951.0, 121924.0, 195773.0, 300346.0, 427972.0, 543121.0, 593948.0, 550498.0, 439748.0, 312250.0, 205893.0, 128274.0, 78963.0, 46810.0, 27504.0, 16233.0, 9442.0, 5712.0, 3344.0, 2006.0, 1213.0, 724.0, 465.0, 299.0, 164.0, 114.0, 60.0, 31.0, 42.0, 11.0, 8.0, 1.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8932037353515625, -1.824493408203125, -1.7557830810546875, -1.68707275390625, -1.6183624267578125, -1.549652099609375, -1.4809417724609375, -1.4122314453125, -1.3435211181640625, -1.274810791015625, -1.2061004638671875, -1.13739013671875, -1.0686798095703125, -0.999969482421875, -0.9312591552734375, -0.862548828125, -0.7938385009765625, -0.725128173828125, -0.6564178466796875, -0.58770751953125, -0.5189971923828125, -0.450286865234375, -0.3815765380859375, -0.3128662109375, -0.2441558837890625, -0.175445556640625, -0.1067352294921875, -0.03802490234375, 0.0306854248046875, 0.099395751953125, 0.1681060791015625, 0.23681640625, 0.3055267333984375, 0.374237060546875, 0.4429473876953125, 0.51165771484375, 0.5803680419921875, 0.649078369140625, 0.7177886962890625, 0.7864990234375, 0.8552093505859375, 0.923919677734375, 0.9926300048828125, 1.06134033203125, 1.1300506591796875, 1.198760986328125, 1.2674713134765625, 1.336181640625, 1.4048919677734375, 1.473602294921875, 1.5423126220703125, 1.61102294921875, 1.6797332763671875, 1.748443603515625, 1.8171539306640625, 1.8858642578125, 1.9545745849609375, 2.023284912109375, 2.0919952392578125, 2.16070556640625, 2.2294158935546875, 2.298126220703125, 2.3668365478515625, 2.435546875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 3.0, 4.0, 8.0, 12.0, 13.0, 19.0, 8.0, 17.0, 29.0, 30.0, 17.0, 36.0, 35.0, 32.0, 40.0, 40.0, 38.0, 45.0, 37.0, 45.0, 44.0, 46.0, 44.0, 38.0, 34.0, 35.0, 26.0, 31.0, 24.0, 26.0, 26.0, 15.0, 20.0, 12.0, 16.0, 16.0, 11.0, 6.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9421234130859375, -1.882293701171875, -1.8224639892578125, -1.76263427734375, -1.7028045654296875, -1.642974853515625, -1.5831451416015625, -1.5233154296875, -1.4634857177734375, -1.403656005859375, -1.3438262939453125, -1.28399658203125, -1.2241668701171875, -1.164337158203125, -1.1045074462890625, -1.044677734375, -0.9848480224609375, -0.925018310546875, -0.8651885986328125, -0.80535888671875, -0.7455291748046875, -0.685699462890625, -0.6258697509765625, -0.5660400390625, -0.5062103271484375, -0.446380615234375, -0.3865509033203125, -0.32672119140625, -0.2668914794921875, -0.207061767578125, -0.1472320556640625, -0.08740234375, -0.0275726318359375, 0.032257080078125, 0.0920867919921875, 0.15191650390625, 0.2117462158203125, 0.271575927734375, 0.3314056396484375, 0.3912353515625, 0.4510650634765625, 0.510894775390625, 0.5707244873046875, 0.63055419921875, 0.6903839111328125, 0.750213623046875, 0.8100433349609375, 0.869873046875, 0.9297027587890625, 0.989532470703125, 1.0493621826171875, 1.10919189453125, 1.1690216064453125, 1.228851318359375, 1.2886810302734375, 1.3485107421875, 1.4083404541015625, 1.468170166015625, 1.5279998779296875, 1.58782958984375, 1.6476593017578125, 1.707489013671875, 1.7673187255859375, 1.8271484375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 7.0, 9.0, 8.0, 19.0, 37.0, 48.0, 70.0, 121.0, 167.0, 305.0, 522.0, 747.0, 1175.0, 1888.0, 3016.0, 4639.0, 7535.0, 11887.0, 18713.0, 29477.0, 45899.0, 70096.0, 105526.0, 151809.0, 214589.0, 287922.0, 365575.0, 428604.0, 462047.0, 449901.0, 399661.0, 328065.0, 250259.0, 182285.0, 127444.0, 85086.0, 57148.0, 37173.0, 23739.0, 15027.0, 9676.0, 5978.0, 3814.0, 2405.0, 1584.0, 941.0, 611.0, 388.0, 230.0, 144.0, 83.0, 92.0, 36.0, 26.0, 18.0, 12.0, 6.0, 4.0, 3.0, 2.0], "bins": [-1.8271484375, -1.7713623046875, -1.715576171875, -1.6597900390625, -1.60400390625, -1.5482177734375, -1.492431640625, -1.4366455078125, -1.380859375, -1.3250732421875, -1.269287109375, -1.2135009765625, -1.15771484375, -1.1019287109375, -1.046142578125, -0.9903564453125, -0.9345703125, -0.8787841796875, -0.822998046875, -0.7672119140625, -0.71142578125, -0.6556396484375, -0.599853515625, -0.5440673828125, -0.48828125, -0.4324951171875, -0.376708984375, -0.3209228515625, -0.26513671875, -0.2093505859375, -0.153564453125, -0.0977783203125, -0.0419921875, 0.0137939453125, 0.069580078125, 0.1253662109375, 0.18115234375, 0.2369384765625, 0.292724609375, 0.3485107421875, 0.404296875, 0.4600830078125, 0.515869140625, 0.5716552734375, 0.62744140625, 0.6832275390625, 0.739013671875, 0.7947998046875, 0.8505859375, 0.9063720703125, 0.962158203125, 1.0179443359375, 1.07373046875, 1.1295166015625, 1.185302734375, 1.2410888671875, 1.296875, 1.3526611328125, 1.408447265625, 1.4642333984375, 1.52001953125, 1.5758056640625, 1.631591796875, 1.6873779296875, 1.7431640625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 17.0, 15.0, 19.0, 14.0, 21.0, 18.0, 38.0, 35.0, 45.0, 55.0, 65.0, 106.0, 108.0, 117.0, 120.0, 146.0, 155.0, 174.0, 173.0, 199.0, 202.0, 188.0, 197.0, 193.0, 198.0, 167.0, 179.0, 164.0, 144.0, 129.0, 104.0, 106.0, 79.0, 56.0, 84.0, 58.0, 39.0, 27.0, 20.0, 23.0, 21.0, 9.0, 8.0, 12.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.88037109375, -0.8539810180664062, -0.8275909423828125, -0.8012008666992188, -0.774810791015625, -0.7484207153320312, -0.7220306396484375, -0.6956405639648438, -0.66925048828125, -0.6428604125976562, -0.6164703369140625, -0.5900802612304688, -0.563690185546875, -0.5373001098632812, -0.5109100341796875, -0.48451995849609375, -0.4581298828125, -0.43173980712890625, -0.4053497314453125, -0.37895965576171875, -0.352569580078125, -0.32617950439453125, -0.2997894287109375, -0.27339935302734375, -0.24700927734375, -0.22061920166015625, -0.1942291259765625, -0.16783905029296875, -0.141448974609375, -0.11505889892578125, -0.0886688232421875, -0.06227874755859375, -0.035888671875, -0.00949859619140625, 0.0168914794921875, 0.04328155517578125, 0.069671630859375, 0.09606170654296875, 0.1224517822265625, 0.14884185791015625, 0.17523193359375, 0.20162200927734375, 0.2280120849609375, 0.25440216064453125, 0.280792236328125, 0.30718231201171875, 0.3335723876953125, 0.35996246337890625, 0.3863525390625, 0.41274261474609375, 0.4391326904296875, 0.46552276611328125, 0.491912841796875, 0.5183029174804688, 0.5446929931640625, 0.5710830688476562, 0.59747314453125, 0.6238632202148438, 0.6502532958984375, 0.6766433715820312, 0.703033447265625, 0.7294235229492188, 0.7558135986328125, 0.7822036743164062, 0.80859375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 11.0, 11.0, 11.0, 18.0, 21.0, 28.0, 26.0, 25.0, 44.0, 35.0, 38.0, 41.0, 48.0, 41.0, 53.0, 54.0, 62.0, 55.0, 44.0, 40.0, 44.0, 34.0, 41.0, 40.0, 27.0, 22.0, 13.0, 16.0, 12.0, 6.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.011713743209839, -2.9235851764678955, -2.835456609725952, -2.747328042984009, -2.6591994762420654, -2.571070909500122, -2.482942581176758, -2.3948140144348145, -2.306685447692871, -2.2185568809509277, -2.1304283142089844, -2.042299747467041, -1.9541711807250977, -1.8660426139831543, -1.7779141664505005, -1.6897855997085571, -1.6016569137573242, -1.5135283470153809, -1.4253997802734375, -1.3372712135314941, -1.2491426467895508, -1.1610140800476074, -1.0728856325149536, -0.9847570657730103, -0.8966284990310669, -0.8084999322891235, -0.7203713655471802, -0.6322428584098816, -0.5441142916679382, -0.4559857249259949, -0.3678572177886963, -0.27972865104675293, -0.19160032272338867, -0.1034717708826065, -0.01534321904182434, 0.07278531789779663, 0.16091388463974, 0.24904245138168335, 0.33717095851898193, 0.4252995252609253, 0.5134280920028687, 0.601556658744812, 0.6896852254867554, 0.777813732624054, 0.8659422993659973, 0.9540708661079407, 1.0421993732452393, 1.1303279399871826, 1.218456506729126, 1.3065850734710693, 1.3947136402130127, 1.482842206954956, 1.5709707736968994, 1.6590993404388428, 1.7472277879714966, 1.83535635471344, 1.9234849214553833, 2.011613368988037, 2.0997419357299805, 2.187870502471924, 2.275999069213867, 2.3641276359558105, 2.452256202697754, 2.5403847694396973, 2.6285133361816406]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 3.0, 4.0, 6.0, 12.0, 12.0, 14.0, 12.0, 15.0, 16.0, 16.0, 22.0, 19.0, 35.0, 35.0, 24.0, 23.0, 22.0, 24.0, 34.0, 42.0, 40.0, 31.0, 47.0, 35.0, 44.0, 37.0, 34.0, 27.0, 35.0, 27.0, 32.0, 26.0, 15.0, 26.0, 20.0, 15.0, 13.0, 16.0, 16.0, 15.0, 7.0, 11.0, 7.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.096761703491211, -2.035475492477417, -1.9741891622543335, -1.91290283203125, -1.851616621017456, -1.790330410003662, -1.7290440797805786, -1.6677577495574951, -1.6064715385437012, -1.5451853275299072, -1.4838989973068237, -1.4226126670837402, -1.3613264560699463, -1.3000402450561523, -1.2387539148330688, -1.1774675846099854, -1.1161813735961914, -1.0548951625823975, -0.993608832359314, -0.9323225617408752, -0.8710362911224365, -0.8097500205039978, -0.7484637498855591, -0.6871774792671204, -0.6258912086486816, -0.5646049380302429, -0.5033186674118042, -0.4420323967933655, -0.38074612617492676, -0.31945985555648804, -0.2581735849380493, -0.1968873143196106, -0.13560104370117188, -0.07431477308273315, -0.013028502464294434, 0.04825776815414429, 0.10954403877258301, 0.17083030939102173, 0.23211658000946045, 0.29340285062789917, 0.3546891212463379, 0.4159753918647766, 0.47726166248321533, 0.538547933101654, 0.5998342037200928, 0.6611204743385315, 0.7224067449569702, 0.7836930155754089, 0.8449792861938477, 0.9062655568122864, 0.9675518274307251, 1.0288381576538086, 1.0901243686676025, 1.1514105796813965, 1.21269690990448, 1.2739832401275635, 1.3352694511413574, 1.3965556621551514, 1.4578419923782349, 1.5191283226013184, 1.5804145336151123, 1.6417007446289062, 1.7029870748519897, 1.7642734050750732, 1.8255596160888672]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 10.0, 9.0, 20.0, 18.0, 25.0, 37.0, 46.0, 61.0, 91.0, 128.0, 177.0, 265.0, 417.0, 556.0, 812.0, 1361.0, 2705.0, 5607.0, 14257.0, 43241.0, 140649.0, 375635.0, 308765.0, 101030.0, 31303.0, 10988.0, 4435.0, 2184.0, 1269.0, 779.0, 503.0, 344.0, 251.0, 156.0, 122.0, 82.0, 51.0, 43.0, 29.0, 28.0, 20.0, 16.0, 6.0, 9.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.629638671875, -2.54443359375, -2.459228515625, -2.3740234375, -2.288818359375, -2.20361328125, -2.118408203125, -2.033203125, -1.947998046875, -1.86279296875, -1.777587890625, -1.6923828125, -1.607177734375, -1.52197265625, -1.436767578125, -1.3515625, -1.266357421875, -1.18115234375, -1.095947265625, -1.0107421875, -0.925537109375, -0.84033203125, -0.755126953125, -0.669921875, -0.584716796875, -0.49951171875, -0.414306640625, -0.3291015625, -0.243896484375, -0.15869140625, -0.073486328125, 0.01171875, 0.096923828125, 0.18212890625, 0.267333984375, 0.3525390625, 0.437744140625, 0.52294921875, 0.608154296875, 0.693359375, 0.778564453125, 0.86376953125, 0.948974609375, 1.0341796875, 1.119384765625, 1.20458984375, 1.289794921875, 1.375, 1.460205078125, 1.54541015625, 1.630615234375, 1.7158203125, 1.801025390625, 1.88623046875, 1.971435546875, 2.056640625, 2.141845703125, 2.22705078125, 2.312255859375, 2.3974609375, 2.482666015625, 2.56787109375, 2.653076171875, 2.73828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 7.0, 14.0, 10.0, 9.0, 14.0, 9.0, 7.0, 10.0, 13.0, 21.0, 20.0, 21.0, 26.0, 28.0, 34.0, 31.0, 28.0, 30.0, 35.0, 32.0, 34.0, 35.0, 46.0, 47.0, 38.0, 38.0, 33.0, 33.0, 21.0, 30.0, 28.0, 24.0, 22.0, 14.0, 29.0, 15.0, 15.0, 22.0, 18.0, 10.0, 8.0, 7.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-2.134765625, -2.0708160400390625, -2.006866455078125, -1.9429168701171875, -1.87896728515625, -1.8150177001953125, -1.751068115234375, -1.6871185302734375, -1.6231689453125, -1.5592193603515625, -1.495269775390625, -1.4313201904296875, -1.36737060546875, -1.3034210205078125, -1.239471435546875, -1.1755218505859375, -1.111572265625, -1.0476226806640625, -0.983673095703125, -0.9197235107421875, -0.85577392578125, -0.7918243408203125, -0.727874755859375, -0.6639251708984375, -0.5999755859375, -0.5360260009765625, -0.472076416015625, -0.4081268310546875, -0.34417724609375, -0.2802276611328125, -0.216278076171875, -0.1523284912109375, -0.08837890625, -0.0244293212890625, 0.039520263671875, 0.1034698486328125, 0.16741943359375, 0.2313690185546875, 0.295318603515625, 0.3592681884765625, 0.4232177734375, 0.4871673583984375, 0.551116943359375, 0.6150665283203125, 0.67901611328125, 0.7429656982421875, 0.806915283203125, 0.8708648681640625, 0.934814453125, 0.9987640380859375, 1.062713623046875, 1.1266632080078125, 1.19061279296875, 1.2545623779296875, 1.318511962890625, 1.3824615478515625, 1.4464111328125, 1.5103607177734375, 1.574310302734375, 1.6382598876953125, 1.70220947265625, 1.7661590576171875, 1.830108642578125, 1.8940582275390625, 1.9580078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 4.0, 9.0, 5.0, 12.0, 15.0, 19.0, 20.0, 35.0, 42.0, 65.0, 84.0, 101.0, 149.0, 214.0, 318.0, 477.0, 797.0, 1312.0, 2466.0, 5516.0, 13967.0, 39360.0, 128808.0, 370817.0, 324835.0, 104280.0, 32704.0, 11659.0, 4724.0, 2312.0, 1175.0, 725.0, 433.0, 311.0, 216.0, 177.0, 96.0, 76.0, 49.0, 41.0, 24.0, 24.0, 21.0, 17.0, 9.0, 10.0, 7.0, 3.0, 5.0, 4.0, 6.0, 1.0, 3.0], "bins": [-2.76171875, -2.6826171875, -2.603515625, -2.5244140625, -2.4453125, -2.3662109375, -2.287109375, -2.2080078125, -2.12890625, -2.0498046875, -1.970703125, -1.8916015625, -1.8125, -1.7333984375, -1.654296875, -1.5751953125, -1.49609375, -1.4169921875, -1.337890625, -1.2587890625, -1.1796875, -1.1005859375, -1.021484375, -0.9423828125, -0.86328125, -0.7841796875, -0.705078125, -0.6259765625, -0.546875, -0.4677734375, -0.388671875, -0.3095703125, -0.23046875, -0.1513671875, -0.072265625, 0.0068359375, 0.0859375, 0.1650390625, 0.244140625, 0.3232421875, 0.40234375, 0.4814453125, 0.560546875, 0.6396484375, 0.71875, 0.7978515625, 0.876953125, 0.9560546875, 1.03515625, 1.1142578125, 1.193359375, 1.2724609375, 1.3515625, 1.4306640625, 1.509765625, 1.5888671875, 1.66796875, 1.7470703125, 1.826171875, 1.9052734375, 1.984375, 2.0634765625, 2.142578125, 2.2216796875, 2.30078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 8.0, 8.0, 14.0, 11.0, 11.0, 14.0, 24.0, 22.0, 28.0, 26.0, 27.0, 22.0, 38.0, 39.0, 23.0, 30.0, 40.0, 43.0, 51.0, 49.0, 53.0, 40.0, 38.0, 34.0, 46.0, 36.0, 40.0, 23.0, 24.0, 19.0, 28.0, 18.0, 16.0, 7.0, 10.0, 10.0, 2.0, 6.0, 3.0, 4.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.734375, -1.6830291748046875, -1.631683349609375, -1.5803375244140625, -1.52899169921875, -1.4776458740234375, -1.426300048828125, -1.3749542236328125, -1.3236083984375, -1.2722625732421875, -1.220916748046875, -1.1695709228515625, -1.11822509765625, -1.0668792724609375, -1.015533447265625, -0.9641876220703125, -0.912841796875, -0.8614959716796875, -0.810150146484375, -0.7588043212890625, -0.70745849609375, -0.6561126708984375, -0.604766845703125, -0.5534210205078125, -0.5020751953125, -0.4507293701171875, -0.399383544921875, -0.3480377197265625, -0.29669189453125, -0.2453460693359375, -0.194000244140625, -0.1426544189453125, -0.09130859375, -0.0399627685546875, 0.011383056640625, 0.0627288818359375, 0.11407470703125, 0.1654205322265625, 0.216766357421875, 0.2681121826171875, 0.3194580078125, 0.3708038330078125, 0.422149658203125, 0.4734954833984375, 0.52484130859375, 0.5761871337890625, 0.627532958984375, 0.6788787841796875, 0.730224609375, 0.7815704345703125, 0.832916259765625, 0.8842620849609375, 0.93560791015625, 0.9869537353515625, 1.038299560546875, 1.0896453857421875, 1.1409912109375, 1.1923370361328125, 1.243682861328125, 1.2950286865234375, 1.34637451171875, 1.3977203369140625, 1.449066162109375, 1.5004119873046875, 1.5517578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 1.0, 5.0, 10.0, 9.0, 8.0, 19.0, 28.0, 21.0, 31.0, 52.0, 91.0, 116.0, 173.0, 269.0, 380.0, 556.0, 871.0, 1501.0, 2573.0, 4553.0, 10212.0, 30174.0, 135434.0, 560332.0, 229287.0, 44475.0, 13761.0, 5808.0, 3035.0, 1658.0, 1054.0, 670.0, 436.0, 302.0, 189.0, 126.0, 79.0, 66.0, 49.0, 40.0, 34.0, 16.0, 19.0, 10.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.205078125, -1.1681671142578125, -1.131256103515625, -1.0943450927734375, -1.05743408203125, -1.0205230712890625, -0.983612060546875, -0.9467010498046875, -0.9097900390625, -0.8728790283203125, -0.835968017578125, -0.7990570068359375, -0.76214599609375, -0.7252349853515625, -0.688323974609375, -0.6514129638671875, -0.614501953125, -0.5775909423828125, -0.540679931640625, -0.5037689208984375, -0.46685791015625, -0.4299468994140625, -0.393035888671875, -0.3561248779296875, -0.3192138671875, -0.2823028564453125, -0.245391845703125, -0.2084808349609375, -0.17156982421875, -0.1346588134765625, -0.097747802734375, -0.0608367919921875, -0.02392578125, 0.0129852294921875, 0.049896240234375, 0.0868072509765625, 0.12371826171875, 0.1606292724609375, 0.197540283203125, 0.2344512939453125, 0.2713623046875, 0.3082733154296875, 0.345184326171875, 0.3820953369140625, 0.41900634765625, 0.4559173583984375, 0.492828369140625, 0.5297393798828125, 0.566650390625, 0.6035614013671875, 0.640472412109375, 0.6773834228515625, 0.71429443359375, 0.7512054443359375, 0.788116455078125, 0.8250274658203125, 0.8619384765625, 0.8988494873046875, 0.935760498046875, 0.9726715087890625, 1.00958251953125, 1.0464935302734375, 1.083404541015625, 1.1203155517578125, 1.1572265625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 11.0, 9.0, 10.0, 20.0, 31.0, 34.0, 38.0, 54.0, 67.0, 70.0, 62.0, 74.0, 94.0, 76.0, 68.0, 47.0, 35.0, 41.0, 26.0, 30.0, 21.0, 18.0, 8.0, 9.0, 4.0, 4.0, 1.0, 7.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.99758529663086e-05, -6.81411474943161e-05, -6.630644202232361e-05, -6.447173655033112e-05, -6.263703107833862e-05, -6.080232560634613e-05, -5.896762013435364e-05, -5.7132914662361145e-05, -5.529820919036865e-05, -5.346350371837616e-05, -5.162879824638367e-05, -4.9794092774391174e-05, -4.795938730239868e-05, -4.612468183040619e-05, -4.4289976358413696e-05, -4.2455270886421204e-05, -4.062056541442871e-05, -3.878585994243622e-05, -3.6951154470443726e-05, -3.511644899845123e-05, -3.328174352645874e-05, -3.144703805446625e-05, -2.9612332582473755e-05, -2.7777627110481262e-05, -2.594292163848877e-05, -2.4108216166496277e-05, -2.2273510694503784e-05, -2.043880522251129e-05, -1.86040997505188e-05, -1.6769394278526306e-05, -1.4934688806533813e-05, -1.309998333454132e-05, -1.1265277862548828e-05, -9.430572390556335e-06, -7.595866918563843e-06, -5.76116144657135e-06, -3.926455974578857e-06, -2.0917505025863647e-06, -2.5704503059387207e-07, 1.5776604413986206e-06, 3.4123659133911133e-06, 5.247071385383606e-06, 7.081776857376099e-06, 8.916482329368591e-06, 1.0751187801361084e-05, 1.2585893273353577e-05, 1.442059874534607e-05, 1.6255304217338562e-05, 1.8090009689331055e-05, 1.9924715161323547e-05, 2.175942063331604e-05, 2.3594126105308533e-05, 2.5428831577301025e-05, 2.7263537049293518e-05, 2.909824252128601e-05, 3.0932947993278503e-05, 3.2767653465270996e-05, 3.460235893726349e-05, 3.643706440925598e-05, 3.8271769881248474e-05, 4.010647535324097e-05, 4.194118082523346e-05, 4.377588629722595e-05, 4.5610591769218445e-05, 4.744529724121094e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 14.0, 15.0, 30.0, 39.0, 55.0, 83.0, 105.0, 178.0, 249.0, 384.0, 560.0, 839.0, 1297.0, 1942.0, 3400.0, 5662.0, 10182.0, 19208.0, 38796.0, 81446.0, 169774.0, 276304.0, 218826.0, 110166.0, 52086.0, 25528.0, 13194.0, 7150.0, 4109.0, 2352.0, 1586.0, 958.0, 682.0, 441.0, 288.0, 199.0, 135.0, 95.0, 63.0, 40.0, 21.0, 16.0, 17.0, 6.0, 10.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72607421875, -0.7031707763671875, -0.680267333984375, -0.6573638916015625, -0.63446044921875, -0.6115570068359375, -0.588653564453125, -0.5657501220703125, -0.5428466796875, -0.5199432373046875, -0.497039794921875, -0.4741363525390625, -0.45123291015625, -0.4283294677734375, -0.405426025390625, -0.3825225830078125, -0.359619140625, -0.3367156982421875, -0.313812255859375, -0.2909088134765625, -0.26800537109375, -0.2451019287109375, -0.222198486328125, -0.1992950439453125, -0.1763916015625, -0.1534881591796875, -0.130584716796875, -0.1076812744140625, -0.08477783203125, -0.0618743896484375, -0.038970947265625, -0.0160675048828125, 0.0068359375, 0.0297393798828125, 0.052642822265625, 0.0755462646484375, 0.09844970703125, 0.1213531494140625, 0.144256591796875, 0.1671600341796875, 0.1900634765625, 0.2129669189453125, 0.235870361328125, 0.2587738037109375, 0.28167724609375, 0.3045806884765625, 0.327484130859375, 0.3503875732421875, 0.373291015625, 0.3961944580078125, 0.419097900390625, 0.4420013427734375, 0.46490478515625, 0.4878082275390625, 0.510711669921875, 0.5336151123046875, 0.5565185546875, 0.5794219970703125, 0.602325439453125, 0.6252288818359375, 0.64813232421875, 0.6710357666015625, 0.693939208984375, 0.7168426513671875, 0.73974609375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 11.0, 6.0, 12.0, 22.0, 28.0, 25.0, 55.0, 65.0, 77.0, 97.0, 116.0, 105.0, 97.0, 74.0, 64.0, 43.0, 22.0, 28.0, 9.0, 13.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2763671875, -0.2656707763671875, -0.254974365234375, -0.2442779541015625, -0.23358154296875, -0.2228851318359375, -0.212188720703125, -0.2014923095703125, -0.1907958984375, -0.1800994873046875, -0.169403076171875, -0.1587066650390625, -0.14801025390625, -0.1373138427734375, -0.126617431640625, -0.1159210205078125, -0.105224609375, -0.0945281982421875, -0.083831787109375, -0.0731353759765625, -0.06243896484375, -0.0517425537109375, -0.041046142578125, -0.0303497314453125, -0.0196533203125, -0.0089569091796875, 0.001739501953125, 0.0124359130859375, 0.02313232421875, 0.0338287353515625, 0.044525146484375, 0.0552215576171875, 0.06591796875, 0.0766143798828125, 0.087310791015625, 0.0980072021484375, 0.10870361328125, 0.1194000244140625, 0.130096435546875, 0.1407928466796875, 0.1514892578125, 0.1621856689453125, 0.172882080078125, 0.1835784912109375, 0.19427490234375, 0.2049713134765625, 0.215667724609375, 0.2263641357421875, 0.237060546875, 0.2477569580078125, 0.258453369140625, 0.2691497802734375, 0.27984619140625, 0.2905426025390625, 0.301239013671875, 0.3119354248046875, 0.3226318359375, 0.3333282470703125, 0.344024658203125, 0.3547210693359375, 0.36541748046875, 0.3761138916015625, 0.386810302734375, 0.3975067138671875, 0.408203125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 10.0, 4.0, 7.0, 11.0, 6.0, 8.0, 18.0, 28.0, 29.0, 18.0, 41.0, 36.0, 43.0, 33.0, 42.0, 48.0, 54.0, 45.0, 73.0, 54.0, 51.0, 46.0, 39.0, 39.0, 42.0, 39.0, 28.0, 26.0, 16.0, 12.0, 16.0, 13.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.925477981567383, -2.8365590572357178, -2.7476401329040527, -2.6587212085723877, -2.5698022842407227, -2.4808833599090576, -2.3919644355773926, -2.3030452728271484, -2.2141265869140625, -2.1252076625823975, -2.0362887382507324, -1.9473698139190674, -1.8584508895874023, -1.7695319652557373, -1.6806129217147827, -1.5916939973831177, -1.502774953842163, -1.413856029510498, -1.324937105178833, -1.236018180847168, -1.147099256515503, -1.058180332183838, -0.9692612886428833, -0.8803423643112183, -0.7914234399795532, -0.7025045156478882, -0.6135855913162231, -0.5246666073799133, -0.4357476830482483, -0.34682875871658325, -0.25790977478027344, -0.1689908504486084, -0.08007168769836426, 0.008847251534461975, 0.09776619076728821, 0.18668514490127563, 0.2756040692329407, 0.3645229935646057, 0.4534419775009155, 0.5423609018325806, 0.6312798261642456, 0.7201987504959106, 0.8091176748275757, 0.8980366587638855, 0.9869555830955505, 1.0758745670318604, 1.1647934913635254, 1.2537124156951904, 1.3426313400268555, 1.4315502643585205, 1.5204691886901855, 1.6093881130218506, 1.6983070373535156, 1.7872259616851807, 1.8761450052261353, 1.9650639295578003, 2.053982734680176, 2.142901659011841, 2.231820583343506, 2.320739507675171, 2.409658432006836, 2.498577356338501, 2.587496280670166, 2.67641544342041, 2.765334367752075]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 4.0, 6.0, 4.0, 12.0, 8.0, 10.0, 16.0, 10.0, 16.0, 11.0, 18.0, 32.0, 28.0, 22.0, 30.0, 34.0, 24.0, 16.0, 29.0, 36.0, 40.0, 47.0, 46.0, 40.0, 32.0, 41.0, 35.0, 39.0, 40.0, 33.0, 22.0, 21.0, 24.0, 22.0, 17.0, 22.0, 10.0, 15.0, 15.0, 16.0, 13.0, 10.0, 9.0, 7.0, 8.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.1321260929107666, -2.0693349838256836, -2.0065436363220215, -1.9437525272369385, -1.880961298942566, -1.8181700706481934, -1.7553788423538208, -1.6925876140594482, -1.6297965049743652, -1.5670052766799927, -1.5042140483856201, -1.441422939300537, -1.3786317110061646, -1.315840482711792, -1.2530492544174194, -1.1902580261230469, -1.1274667978286743, -1.0646755695343018, -1.0018843412399292, -0.9390931725502014, -0.8763020038604736, -0.8135107755661011, -0.7507195472717285, -0.687928318977356, -0.6251371502876282, -0.5623459219932556, -0.49955475330352783, -0.4367635250091553, -0.3739723265171051, -0.31118112802505493, -0.24838989973068237, -0.1855987012386322, -0.12280738353729248, -0.06001617759466171, 0.002775028347969055, 0.06556624174118042, 0.1283574402332306, 0.19114863872528076, 0.2539398670196533, 0.3167310655117035, 0.37952226400375366, 0.44231346249580383, 0.505104660987854, 0.5678958892822266, 0.6306871175765991, 0.6934782862663269, 0.7562695145606995, 0.8190606832504272, 0.8818519115447998, 0.9446431398391724, 1.007434368133545, 1.070225477218628, 1.1330167055130005, 1.195807933807373, 1.2585991621017456, 1.3213903903961182, 1.3841814994812012, 1.4469727277755737, 1.5097639560699463, 1.5725550651550293, 1.6353462934494019, 1.6981375217437744, 1.760928750038147, 1.8237199783325195, 1.886511206626892]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 7.0, 13.0, 13.0, 15.0, 38.0, 58.0, 85.0, 113.0, 178.0, 277.0, 402.0, 590.0, 847.0, 1352.0, 1984.0, 2889.0, 4574.0, 6788.0, 9948.0, 15071.0, 21892.0, 31813.0, 44284.0, 60720.0, 79197.0, 95565.0, 108340.0, 111284.0, 104707.0, 90615.0, 73121.0, 55075.0, 39756.0, 27912.0, 19219.0, 13079.0, 8825.0, 5909.0, 4038.0, 2730.0, 1805.0, 1146.0, 801.0, 496.0, 345.0, 214.0, 139.0, 87.0, 65.0, 34.0, 39.0, 21.0, 8.0, 9.0, 10.0, 6.0, 5.0, 5.0], "bins": [-2.111328125, -2.0479888916015625, -1.984649658203125, -1.9213104248046875, -1.85797119140625, -1.7946319580078125, -1.731292724609375, -1.6679534912109375, -1.6046142578125, -1.5412750244140625, -1.477935791015625, -1.4145965576171875, -1.35125732421875, -1.2879180908203125, -1.224578857421875, -1.1612396240234375, -1.097900390625, -1.0345611572265625, -0.971221923828125, -0.9078826904296875, -0.84454345703125, -0.7812042236328125, -0.717864990234375, -0.6545257568359375, -0.5911865234375, -0.5278472900390625, -0.464508056640625, -0.4011688232421875, -0.33782958984375, -0.2744903564453125, -0.211151123046875, -0.1478118896484375, -0.08447265625, -0.0211334228515625, 0.042205810546875, 0.1055450439453125, 0.16888427734375, 0.2322235107421875, 0.295562744140625, 0.3589019775390625, 0.4222412109375, 0.4855804443359375, 0.548919677734375, 0.6122589111328125, 0.67559814453125, 0.7389373779296875, 0.802276611328125, 0.8656158447265625, 0.928955078125, 0.9922943115234375, 1.055633544921875, 1.1189727783203125, 1.18231201171875, 1.2456512451171875, 1.308990478515625, 1.3723297119140625, 1.4356689453125, 1.4990081787109375, 1.562347412109375, 1.6256866455078125, 1.68902587890625, 1.7523651123046875, 1.815704345703125, 1.8790435791015625, 1.9423828125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 10.0, 19.0, 16.0, 19.0, 19.0, 17.0, 19.0, 34.0, 21.0, 30.0, 27.0, 35.0, 36.0, 40.0, 38.0, 51.0, 36.0, 40.0, 45.0, 52.0, 36.0, 39.0, 28.0, 34.0, 29.0, 18.0, 16.0, 29.0, 21.0, 21.0, 17.0, 16.0, 11.0, 7.0, 7.0, 13.0, 11.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.974609375, -1.91070556640625, -1.8468017578125, -1.78289794921875, -1.718994140625, -1.65509033203125, -1.5911865234375, -1.52728271484375, -1.46337890625, -1.39947509765625, -1.3355712890625, -1.27166748046875, -1.207763671875, -1.14385986328125, -1.0799560546875, -1.01605224609375, -0.9521484375, -0.88824462890625, -0.8243408203125, -0.76043701171875, -0.696533203125, -0.63262939453125, -0.5687255859375, -0.50482177734375, -0.44091796875, -0.37701416015625, -0.3131103515625, -0.24920654296875, -0.185302734375, -0.12139892578125, -0.0574951171875, 0.00640869140625, 0.0703125, 0.13421630859375, 0.1981201171875, 0.26202392578125, 0.325927734375, 0.38983154296875, 0.4537353515625, 0.51763916015625, 0.58154296875, 0.64544677734375, 0.7093505859375, 0.77325439453125, 0.837158203125, 0.90106201171875, 0.9649658203125, 1.02886962890625, 1.0927734375, 1.15667724609375, 1.2205810546875, 1.28448486328125, 1.348388671875, 1.41229248046875, 1.4761962890625, 1.54010009765625, 1.60400390625, 1.66790771484375, 1.7318115234375, 1.79571533203125, 1.859619140625, 1.92352294921875, 1.9874267578125, 2.05133056640625, 2.115234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 7.0, 22.0, 20.0, 33.0, 57.0, 106.0, 160.0, 276.0, 439.0, 734.0, 1193.0, 2015.0, 3604.0, 5963.0, 9842.0, 16141.0, 26400.0, 40745.0, 60684.0, 85314.0, 110673.0, 128409.0, 131738.0, 120376.0, 97600.0, 72003.0, 49639.0, 32462.0, 20363.0, 12548.0, 7641.0, 4443.0, 2739.0, 1672.0, 993.0, 591.0, 340.0, 237.0, 144.0, 84.0, 45.0, 30.0, 9.0, 12.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.841796875, -1.7716064453125, -1.701416015625, -1.6312255859375, -1.56103515625, -1.4908447265625, -1.420654296875, -1.3504638671875, -1.2802734375, -1.2100830078125, -1.139892578125, -1.0697021484375, -0.99951171875, -0.9293212890625, -0.859130859375, -0.7889404296875, -0.71875, -0.6485595703125, -0.578369140625, -0.5081787109375, -0.43798828125, -0.3677978515625, -0.297607421875, -0.2274169921875, -0.1572265625, -0.0870361328125, -0.016845703125, 0.0533447265625, 0.12353515625, 0.1937255859375, 0.263916015625, 0.3341064453125, 0.404296875, 0.4744873046875, 0.544677734375, 0.6148681640625, 0.68505859375, 0.7552490234375, 0.825439453125, 0.8956298828125, 0.9658203125, 1.0360107421875, 1.106201171875, 1.1763916015625, 1.24658203125, 1.3167724609375, 1.386962890625, 1.4571533203125, 1.52734375, 1.5975341796875, 1.667724609375, 1.7379150390625, 1.80810546875, 1.8782958984375, 1.948486328125, 2.0186767578125, 2.0888671875, 2.1590576171875, 2.229248046875, 2.2994384765625, 2.36962890625, 2.4398193359375, 2.510009765625, 2.5802001953125, 2.650390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 12.0, 9.0, 21.0, 17.0, 12.0, 23.0, 26.0, 25.0, 21.0, 39.0, 28.0, 45.0, 31.0, 39.0, 41.0, 39.0, 51.0, 43.0, 47.0, 46.0, 45.0, 34.0, 41.0, 46.0, 33.0, 29.0, 23.0, 13.0, 22.0, 10.0, 18.0, 14.0, 6.0, 13.0, 10.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.344024658203125, -1.29742431640625, -1.250823974609375, -1.2042236328125, -1.157623291015625, -1.11102294921875, -1.064422607421875, -1.017822265625, -0.971221923828125, -0.92462158203125, -0.878021240234375, -0.8314208984375, -0.784820556640625, -0.73822021484375, -0.691619873046875, -0.64501953125, -0.598419189453125, -0.55181884765625, -0.505218505859375, -0.4586181640625, -0.412017822265625, -0.36541748046875, -0.318817138671875, -0.272216796875, -0.225616455078125, -0.17901611328125, -0.132415771484375, -0.0858154296875, -0.039215087890625, 0.00738525390625, 0.053985595703125, 0.1005859375, 0.147186279296875, 0.19378662109375, 0.240386962890625, 0.2869873046875, 0.333587646484375, 0.38018798828125, 0.426788330078125, 0.473388671875, 0.519989013671875, 0.56658935546875, 0.613189697265625, 0.6597900390625, 0.706390380859375, 0.75299072265625, 0.799591064453125, 0.84619140625, 0.892791748046875, 0.93939208984375, 0.985992431640625, 1.0325927734375, 1.079193115234375, 1.12579345703125, 1.172393798828125, 1.218994140625, 1.265594482421875, 1.31219482421875, 1.358795166015625, 1.4053955078125, 1.451995849609375, 1.49859619140625, 1.545196533203125, 1.591796875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 4.0, 24.0, 30.0, 38.0, 48.0, 91.0, 99.0, 190.0, 250.0, 426.0, 647.0, 917.0, 1489.0, 2503.0, 4192.0, 7742.0, 15272.0, 31301.0, 69323.0, 162597.0, 299850.0, 243930.0, 110974.0, 48205.0, 22566.0, 11142.0, 5880.0, 3379.0, 1930.0, 1237.0, 799.0, 476.0, 318.0, 227.0, 137.0, 91.0, 71.0, 48.0, 35.0, 23.0, 19.0, 6.0, 4.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.408203125, -3.289764404296875, -3.17132568359375, -3.052886962890625, -2.9344482421875, -2.816009521484375, -2.69757080078125, -2.579132080078125, -2.460693359375, -2.342254638671875, -2.22381591796875, -2.105377197265625, -1.9869384765625, -1.868499755859375, -1.75006103515625, -1.631622314453125, -1.51318359375, -1.394744873046875, -1.27630615234375, -1.157867431640625, -1.0394287109375, -0.920989990234375, -0.80255126953125, -0.684112548828125, -0.565673828125, -0.447235107421875, -0.32879638671875, -0.210357666015625, -0.0919189453125, 0.026519775390625, 0.14495849609375, 0.263397216796875, 0.3818359375, 0.500274658203125, 0.61871337890625, 0.737152099609375, 0.8555908203125, 0.974029541015625, 1.09246826171875, 1.210906982421875, 1.329345703125, 1.447784423828125, 1.56622314453125, 1.684661865234375, 1.8031005859375, 1.921539306640625, 2.03997802734375, 2.158416748046875, 2.27685546875, 2.395294189453125, 2.51373291015625, 2.632171630859375, 2.7506103515625, 2.869049072265625, 2.98748779296875, 3.105926513671875, 3.224365234375, 3.342803955078125, 3.46124267578125, 3.579681396484375, 3.6981201171875, 3.816558837890625, 3.93499755859375, 4.053436279296875, 4.171875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 8.0, 15.0, 19.0, 17.0, 23.0, 31.0, 51.0, 59.0, 55.0, 66.0, 90.0, 70.0, 56.0, 76.0, 49.0, 52.0, 46.0, 42.0, 19.0, 27.0, 15.0, 18.0, 5.0, 12.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00020325183868408203, -0.00019521452486515045, -0.00018717721104621887, -0.0001791398972272873, -0.0001711025834083557, -0.00016306526958942413, -0.00015502795577049255, -0.00014699064195156097, -0.0001389533281326294, -0.00013091601431369781, -0.00012287870049476624, -0.00011484138667583466, -0.00010680407285690308, -9.87667590379715e-05, -9.072944521903992e-05, -8.269213140010834e-05, -7.465481758117676e-05, -6.661750376224518e-05, -5.85801899433136e-05, -5.054287612438202e-05, -4.250556230545044e-05, -3.446824848651886e-05, -2.643093466758728e-05, -1.83936208486557e-05, -1.0356307029724121e-05, -2.3189932107925415e-06, 5.718320608139038e-06, 1.3755634427070618e-05, 2.1792948246002197e-05, 2.9830262064933777e-05, 3.7867575883865356e-05, 4.5904889702796936e-05, 5.3942203521728516e-05, 6.19795173406601e-05, 7.001683115959167e-05, 7.805414497852325e-05, 8.609145879745483e-05, 9.412877261638641e-05, 0.00010216608643531799, 0.00011020340025424957, 0.00011824071407318115, 0.00012627802789211273, 0.0001343153417110443, 0.0001423526555299759, 0.00015038996934890747, 0.00015842728316783905, 0.00016646459698677063, 0.0001745019108057022, 0.0001825392246246338, 0.00019057653844356537, 0.00019861385226249695, 0.00020665116608142853, 0.0002146884799003601, 0.0002227257937192917, 0.00023076310753822327, 0.00023880042135715485, 0.0002468377351760864, 0.000254875048995018, 0.0002629123628139496, 0.00027094967663288116, 0.00027898699045181274, 0.0002870243042707443, 0.0002950616180896759, 0.0003030989319086075, 0.00031113624572753906]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 12.0, 17.0, 24.0, 37.0, 43.0, 83.0, 109.0, 158.0, 232.0, 340.0, 500.0, 727.0, 1038.0, 1526.0, 2483.0, 3754.0, 6155.0, 10440.0, 17877.0, 32690.0, 60087.0, 108852.0, 175784.0, 213301.0, 172608.0, 105094.0, 58427.0, 31708.0, 17327.0, 10101.0, 6087.0, 3734.0, 2395.0, 1488.0, 1046.0, 702.0, 469.0, 319.0, 233.0, 151.0, 118.0, 76.0, 64.0, 42.0, 34.0, 16.0, 15.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.132720947265625, -2.06036376953125, -1.988006591796875, -1.9156494140625, -1.843292236328125, -1.77093505859375, -1.698577880859375, -1.626220703125, -1.553863525390625, -1.48150634765625, -1.409149169921875, -1.3367919921875, -1.264434814453125, -1.19207763671875, -1.119720458984375, -1.04736328125, -0.975006103515625, -0.90264892578125, -0.830291748046875, -0.7579345703125, -0.685577392578125, -0.61322021484375, -0.540863037109375, -0.468505859375, -0.396148681640625, -0.32379150390625, -0.251434326171875, -0.1790771484375, -0.106719970703125, -0.03436279296875, 0.037994384765625, 0.1103515625, 0.182708740234375, 0.25506591796875, 0.327423095703125, 0.3997802734375, 0.472137451171875, 0.54449462890625, 0.616851806640625, 0.689208984375, 0.761566162109375, 0.83392333984375, 0.906280517578125, 0.9786376953125, 1.050994873046875, 1.12335205078125, 1.195709228515625, 1.26806640625, 1.340423583984375, 1.41278076171875, 1.485137939453125, 1.5574951171875, 1.629852294921875, 1.70220947265625, 1.774566650390625, 1.846923828125, 1.919281005859375, 1.99163818359375, 2.063995361328125, 2.1363525390625, 2.208709716796875, 2.28106689453125, 2.353424072265625, 2.42578125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 6.0, 10.0, 15.0, 14.0, 14.0, 28.0, 30.0, 28.0, 41.0, 47.0, 55.0, 89.0, 61.0, 77.0, 67.0, 65.0, 54.0, 47.0, 44.0, 44.0, 23.0, 30.0, 17.0, 14.0, 17.0, 10.0, 7.0, 3.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8664016723632812, -0.8397369384765625, -0.8130722045898438, -0.786407470703125, -0.7597427368164062, -0.7330780029296875, -0.7064132690429688, -0.67974853515625, -0.6530838012695312, -0.6264190673828125, -0.5997543334960938, -0.573089599609375, -0.5464248657226562, -0.5197601318359375, -0.49309539794921875, -0.4664306640625, -0.43976593017578125, -0.4131011962890625, -0.38643646240234375, -0.359771728515625, -0.33310699462890625, -0.3064422607421875, -0.27977752685546875, -0.25311279296875, -0.22644805908203125, -0.1997833251953125, -0.17311859130859375, -0.146453857421875, -0.11978912353515625, -0.0931243896484375, -0.06645965576171875, -0.039794921875, -0.01313018798828125, 0.0135345458984375, 0.04019927978515625, 0.066864013671875, 0.09352874755859375, 0.1201934814453125, 0.14685821533203125, 0.17352294921875, 0.20018768310546875, 0.2268524169921875, 0.25351715087890625, 0.280181884765625, 0.30684661865234375, 0.3335113525390625, 0.36017608642578125, 0.3868408203125, 0.41350555419921875, 0.4401702880859375, 0.46683502197265625, 0.493499755859375, 0.5201644897460938, 0.5468292236328125, 0.5734939575195312, 0.60015869140625, 0.6268234252929688, 0.6534881591796875, 0.6801528930664062, 0.706817626953125, 0.7334823608398438, 0.7601470947265625, 0.7868118286132812, 0.8134765625]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 16.0, 11.0, 13.0, 17.0, 31.0, 29.0, 35.0, 34.0, 33.0, 43.0, 31.0, 42.0, 48.0, 46.0, 47.0, 55.0, 52.0, 45.0, 47.0, 34.0, 47.0, 24.0, 25.0, 33.0, 31.0, 22.0, 11.0, 22.0, 16.0, 5.0, 12.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6193525791168213, -2.537788152694702, -2.456223487854004, -2.3746590614318848, -2.2930946350097656, -2.2115302085876465, -2.1299655437469482, -2.048401117324829, -1.96683669090271, -1.8852721452713013, -1.8037077188491821, -1.7221431732177734, -1.6405787467956543, -1.5590142011642456, -1.477449655532837, -1.3958852291107178, -1.314320683479309, -1.2327561378479004, -1.1511917114257812, -1.0696271657943726, -0.9880627393722534, -0.9064981937408447, -0.8249337077140808, -0.7433692216873169, -0.661804735660553, -0.5802402496337891, -0.49867576360702515, -0.41711124777793884, -0.3355467617511749, -0.253982275724411, -0.1724177598953247, -0.09085327386856079, -0.009288787841796875, 0.07227570563554764, 0.15384019911289215, 0.23540470004081726, 0.3169691860675812, 0.3985336720943451, 0.4800981879234314, 0.5616626739501953, 0.6432271599769592, 0.7247916460037231, 0.8063561320304871, 0.887920618057251, 0.9694851636886597, 1.0510495901107788, 1.1326141357421875, 1.2141785621643066, 1.2957431077957153, 1.377307653427124, 1.4588720798492432, 1.5404366254806519, 1.622001051902771, 1.7035655975341797, 1.7851300239562988, 1.8666945695877075, 1.9482591152191162, 2.0298235416412354, 2.1113882064819336, 2.1929526329040527, 2.274517059326172, 2.356081485748291, 2.4376461505889893, 2.5192105770111084, 2.6007750034332275]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 6.0, 4.0, 11.0, 11.0, 12.0, 13.0, 11.0, 21.0, 13.0, 20.0, 25.0, 30.0, 24.0, 30.0, 28.0, 33.0, 33.0, 34.0, 31.0, 42.0, 34.0, 41.0, 35.0, 43.0, 52.0, 32.0, 39.0, 29.0, 32.0, 29.0, 32.0, 20.0, 31.0, 18.0, 11.0, 12.0, 12.0, 9.0, 8.0, 8.0, 9.0, 5.0, 7.0, 1.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.2677392959594727, -2.201488494873047, -2.135237693786621, -2.0689868927001953, -2.0027360916137695, -1.9364852905273438, -1.870234489440918, -1.8039836883544922, -1.7377328872680664, -1.6714820861816406, -1.6052312850952148, -1.538980484008789, -1.4727296829223633, -1.4064788818359375, -1.3402280807495117, -1.273977279663086, -1.2077263593673706, -1.1414755582809448, -1.075224757194519, -1.0089739561080933, -0.9427231550216675, -0.8764723539352417, -0.8102214932441711, -0.7439706921577454, -0.6777198910713196, -0.6114690899848938, -0.545218288898468, -0.47896745800971985, -0.41271665692329407, -0.3464658558368683, -0.2802150249481201, -0.21396422386169434, -0.147713303565979, -0.08146249502897263, -0.015211686491966248, 0.05103912949562073, 0.11728993058204651, 0.1835407316684723, 0.24979156255722046, 0.31604236364364624, 0.382293164730072, 0.4485439658164978, 0.5147947669029236, 0.5810456275939941, 0.6472964286804199, 0.7135472297668457, 0.7797980308532715, 0.8460488319396973, 0.912299633026123, 0.9785504341125488, 1.0448012351989746, 1.1110520362854004, 1.1773028373718262, 1.243553638458252, 1.3098044395446777, 1.3760552406311035, 1.4423060417175293, 1.508556842803955, 1.5748076438903809, 1.6410584449768066, 1.7073092460632324, 1.7735600471496582, 1.839810848236084, 1.9060616493225098, 1.972312569618225]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 11.0, 17.0, 27.0, 29.0, 62.0, 97.0, 121.0, 240.0, 347.0, 570.0, 910.0, 1470.0, 2229.0, 3561.0, 5886.0, 9420.0, 15350.0, 24762.0, 39929.0, 63640.0, 100979.0, 155739.0, 235136.0, 336935.0, 446928.0, 529459.0, 548992.0, 491119.0, 387947.0, 277860.0, 187169.0, 121414.0, 77488.0, 48558.0, 30053.0, 18491.0, 11992.0, 7183.0, 4417.0, 2896.0, 1747.0, 1111.0, 720.0, 448.0, 292.0, 170.0, 143.0, 85.0, 47.0, 30.0, 20.0, 14.0, 10.0, 5.0, 13.0, 1.0, 1.0, 2.0], "bins": [-1.78125, -1.7259368896484375, -1.670623779296875, -1.6153106689453125, -1.55999755859375, -1.5046844482421875, -1.449371337890625, -1.3940582275390625, -1.3387451171875, -1.2834320068359375, -1.228118896484375, -1.1728057861328125, -1.11749267578125, -1.0621795654296875, -1.006866455078125, -0.9515533447265625, -0.896240234375, -0.8409271240234375, -0.785614013671875, -0.7303009033203125, -0.67498779296875, -0.6196746826171875, -0.564361572265625, -0.5090484619140625, -0.4537353515625, -0.3984222412109375, -0.343109130859375, -0.2877960205078125, -0.23248291015625, -0.1771697998046875, -0.121856689453125, -0.0665435791015625, -0.01123046875, 0.0440826416015625, 0.099395751953125, 0.1547088623046875, 0.21002197265625, 0.2653350830078125, 0.320648193359375, 0.3759613037109375, 0.4312744140625, 0.4865875244140625, 0.541900634765625, 0.5972137451171875, 0.65252685546875, 0.7078399658203125, 0.763153076171875, 0.8184661865234375, 0.873779296875, 0.9290924072265625, 0.984405517578125, 1.0397186279296875, 1.09503173828125, 1.1503448486328125, 1.205657958984375, 1.2609710693359375, 1.3162841796875, 1.3715972900390625, 1.426910400390625, 1.4822235107421875, 1.53753662109375, 1.5928497314453125, 1.648162841796875, 1.7034759521484375, 1.7587890625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 11.0, 13.0, 11.0, 13.0, 9.0, 19.0, 13.0, 25.0, 22.0, 32.0, 30.0, 30.0, 37.0, 30.0, 33.0, 45.0, 54.0, 43.0, 51.0, 43.0, 44.0, 41.0, 41.0, 51.0, 33.0, 28.0, 29.0, 30.0, 22.0, 25.0, 18.0, 13.0, 8.0, 14.0, 6.0, 10.0, 3.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.9931640625, -1.9395599365234375, -1.885955810546875, -1.8323516845703125, -1.77874755859375, -1.7251434326171875, -1.671539306640625, -1.6179351806640625, -1.5643310546875, -1.5107269287109375, -1.457122802734375, -1.4035186767578125, -1.34991455078125, -1.2963104248046875, -1.242706298828125, -1.1891021728515625, -1.135498046875, -1.0818939208984375, -1.028289794921875, -0.9746856689453125, -0.92108154296875, -0.8674774169921875, -0.813873291015625, -0.7602691650390625, -0.7066650390625, -0.6530609130859375, -0.599456787109375, -0.5458526611328125, -0.49224853515625, -0.4386444091796875, -0.385040283203125, -0.3314361572265625, -0.27783203125, -0.2242279052734375, -0.170623779296875, -0.1170196533203125, -0.06341552734375, -0.0098114013671875, 0.043792724609375, 0.0973968505859375, 0.1510009765625, 0.2046051025390625, 0.258209228515625, 0.3118133544921875, 0.36541748046875, 0.4190216064453125, 0.472625732421875, 0.5262298583984375, 0.579833984375, 0.6334381103515625, 0.687042236328125, 0.7406463623046875, 0.79425048828125, 0.8478546142578125, 0.901458740234375, 0.9550628662109375, 1.0086669921875, 1.0622711181640625, 1.115875244140625, 1.1694793701171875, 1.22308349609375, 1.2766876220703125, 1.330291748046875, 1.3838958740234375, 1.4375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 14.0, 18.0, 31.0, 43.0, 97.0, 110.0, 204.0, 326.0, 611.0, 993.0, 1628.0, 2723.0, 4560.0, 8034.0, 13451.0, 22727.0, 37434.0, 61894.0, 99186.0, 154213.0, 229733.0, 323447.0, 422384.0, 499957.0, 524608.0, 487044.0, 404648.0, 305777.0, 213974.0, 142143.0, 90702.0, 56274.0, 34481.0, 20740.0, 12222.0, 7384.0, 4226.0, 2523.0, 1455.0, 885.0, 548.0, 318.0, 183.0, 132.0, 69.0, 42.0, 35.0, 20.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6689453125, -1.6140594482421875, -1.559173583984375, -1.5042877197265625, -1.44940185546875, -1.3945159912109375, -1.339630126953125, -1.2847442626953125, -1.2298583984375, -1.1749725341796875, -1.120086669921875, -1.0652008056640625, -1.01031494140625, -0.9554290771484375, -0.900543212890625, -0.8456573486328125, -0.790771484375, -0.7358856201171875, -0.680999755859375, -0.6261138916015625, -0.57122802734375, -0.5163421630859375, -0.461456298828125, -0.4065704345703125, -0.3516845703125, -0.2967987060546875, -0.241912841796875, -0.1870269775390625, -0.13214111328125, -0.0772552490234375, -0.022369384765625, 0.0325164794921875, 0.08740234375, 0.1422882080078125, 0.197174072265625, 0.2520599365234375, 0.30694580078125, 0.3618316650390625, 0.416717529296875, 0.4716033935546875, 0.5264892578125, 0.5813751220703125, 0.636260986328125, 0.6911468505859375, 0.74603271484375, 0.8009185791015625, 0.855804443359375, 0.9106903076171875, 0.965576171875, 1.0204620361328125, 1.075347900390625, 1.1302337646484375, 1.18511962890625, 1.2400054931640625, 1.294891357421875, 1.3497772216796875, 1.4046630859375, 1.4595489501953125, 1.514434814453125, 1.5693206787109375, 1.62420654296875, 1.6790924072265625, 1.733978271484375, 1.7888641357421875, 1.84375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 10.0, 7.0, 11.0, 22.0, 21.0, 27.0, 27.0, 31.0, 52.0, 51.0, 75.0, 91.0, 83.0, 112.0, 130.0, 118.0, 152.0, 163.0, 176.0, 203.0, 191.0, 216.0, 231.0, 201.0, 204.0, 192.0, 181.0, 172.0, 140.0, 123.0, 115.0, 103.0, 74.0, 80.0, 57.0, 43.0, 47.0, 35.0, 27.0, 23.0, 13.0, 10.0, 5.0, 11.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.7119140625, -0.6884918212890625, -0.665069580078125, -0.6416473388671875, -0.61822509765625, -0.5948028564453125, -0.571380615234375, -0.5479583740234375, -0.5245361328125, -0.5011138916015625, -0.477691650390625, -0.4542694091796875, -0.43084716796875, -0.4074249267578125, -0.384002685546875, -0.3605804443359375, -0.337158203125, -0.3137359619140625, -0.290313720703125, -0.2668914794921875, -0.24346923828125, -0.2200469970703125, -0.196624755859375, -0.1732025146484375, -0.1497802734375, -0.1263580322265625, -0.102935791015625, -0.0795135498046875, -0.05609130859375, -0.0326690673828125, -0.009246826171875, 0.0141754150390625, 0.03759765625, 0.0610198974609375, 0.084442138671875, 0.1078643798828125, 0.13128662109375, 0.1547088623046875, 0.178131103515625, 0.2015533447265625, 0.2249755859375, 0.2483978271484375, 0.271820068359375, 0.2952423095703125, 0.31866455078125, 0.3420867919921875, 0.365509033203125, 0.3889312744140625, 0.412353515625, 0.4357757568359375, 0.459197998046875, 0.4826202392578125, 0.50604248046875, 0.5294647216796875, 0.552886962890625, 0.5763092041015625, 0.5997314453125, 0.6231536865234375, 0.646575927734375, 0.6699981689453125, 0.69342041015625, 0.7168426513671875, 0.740264892578125, 0.7636871337890625, 0.787109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 1.0, 8.0, 6.0, 10.0, 9.0, 17.0, 16.0, 27.0, 31.0, 34.0, 30.0, 59.0, 60.0, 63.0, 60.0, 69.0, 70.0, 62.0, 38.0, 42.0, 43.0, 56.0, 33.0, 33.0, 22.0, 31.0, 24.0, 20.0, 7.0, 5.0, 4.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.988922595977783, -2.9013919830322266, -2.813861131668091, -2.726330518722534, -2.6387999057769775, -2.551269054412842, -2.463738441467285, -2.3762078285217285, -2.288677215576172, -2.2011466026306152, -2.1136157512664795, -2.026085138320923, -1.9385545253753662, -1.85102379322052, -1.7634930610656738, -1.6759624481201172, -1.5884315967559814, -1.5009008646011353, -1.4133702516555786, -1.3258395195007324, -1.2383089065551758, -1.1507781744003296, -1.0632474422454834, -0.975716769695282, -0.8881860971450806, -0.8006554245948792, -0.7131247520446777, -0.6255940198898315, -0.5380633473396301, -0.4505326747894287, -0.3630019426345825, -0.2754712700843811, -0.1879405975341797, -0.10040991008281708, -0.012879222631454468, 0.07465147972106934, 0.16218215227127075, 0.24971282482147217, 0.33724355697631836, 0.4247742295265198, 0.5123049020767212, 0.5998355746269226, 0.687366247177124, 0.7748969793319702, 0.8624276518821716, 0.949958324432373, 1.0374890565872192, 1.1250197887420654, 1.212550401687622, 1.3000811338424683, 1.387611746788025, 1.475142478942871, 1.5626730918884277, 1.650203824043274, 1.7377345561981201, 1.8252651691436768, 1.912795901298523, 2.000326633453369, 2.087857246398926, 2.1753878593444824, 2.262918710708618, 2.350449323654175, 2.4379801750183105, 2.525510787963867, 2.613041400909424]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 9.0, 9.0, 10.0, 8.0, 6.0, 10.0, 11.0, 14.0, 15.0, 16.0, 15.0, 18.0, 28.0, 24.0, 21.0, 29.0, 31.0, 33.0, 34.0, 39.0, 34.0, 40.0, 30.0, 46.0, 30.0, 38.0, 35.0, 37.0, 26.0, 30.0, 30.0, 21.0, 24.0, 31.0, 21.0, 16.0, 21.0, 18.0, 14.0, 15.0, 13.0, 12.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.6044965982437134, -1.5532957315444946, -1.5020948648452759, -1.4508939981460571, -1.3996931314468384, -1.3484922647476196, -1.2972913980484009, -1.2460905313491821, -1.1948896646499634, -1.1436887979507446, -1.0924879312515259, -1.0412870645523071, -0.9900861978530884, -0.9388853311538696, -0.8876844644546509, -0.8364835977554321, -0.7852827310562134, -0.7340818643569946, -0.6828809976577759, -0.6316801309585571, -0.5804792642593384, -0.5292783975601196, -0.4780775308609009, -0.42687666416168213, -0.3756757974624634, -0.32447493076324463, -0.2732740640640259, -0.22207319736480713, -0.17087233066558838, -0.11967146396636963, -0.06847059726715088, -0.01726973056793213, 0.03393101692199707, 0.08513188362121582, 0.13633275032043457, 0.18753361701965332, 0.23873448371887207, 0.2899353504180908, 0.34113621711730957, 0.3923370838165283, 0.44353795051574707, 0.4947388172149658, 0.5459396839141846, 0.5971405506134033, 0.6483414173126221, 0.6995422840118408, 0.7507431507110596, 0.8019440174102783, 0.8531448841094971, 0.9043457508087158, 0.9555466175079346, 1.0067474842071533, 1.057948350906372, 1.1091492176055908, 1.1603500843048096, 1.2115509510040283, 1.262751817703247, 1.3139526844024658, 1.3651535511016846, 1.4163544178009033, 1.467555284500122, 1.5187561511993408, 1.5699570178985596, 1.6211578845977783, 1.672358751296997]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 13.0, 28.0, 18.0, 40.0, 55.0, 76.0, 81.0, 137.0, 178.0, 266.0, 399.0, 557.0, 779.0, 1109.0, 1719.0, 2903.0, 5997.0, 17535.0, 72549.0, 313259.0, 452580.0, 130021.0, 29278.0, 8687.0, 3818.0, 2127.0, 1303.0, 860.0, 690.0, 394.0, 329.0, 229.0, 160.0, 97.0, 80.0, 55.0, 37.0, 33.0, 20.0, 16.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.939453125, -2.84814453125, -2.7568359375, -2.66552734375, -2.57421875, -2.48291015625, -2.3916015625, -2.30029296875, -2.208984375, -2.11767578125, -2.0263671875, -1.93505859375, -1.84375, -1.75244140625, -1.6611328125, -1.56982421875, -1.478515625, -1.38720703125, -1.2958984375, -1.20458984375, -1.11328125, -1.02197265625, -0.9306640625, -0.83935546875, -0.748046875, -0.65673828125, -0.5654296875, -0.47412109375, -0.3828125, -0.29150390625, -0.2001953125, -0.10888671875, -0.017578125, 0.07373046875, 0.1650390625, 0.25634765625, 0.34765625, 0.43896484375, 0.5302734375, 0.62158203125, 0.712890625, 0.80419921875, 0.8955078125, 0.98681640625, 1.078125, 1.16943359375, 1.2607421875, 1.35205078125, 1.443359375, 1.53466796875, 1.6259765625, 1.71728515625, 1.80859375, 1.89990234375, 1.9912109375, 2.08251953125, 2.173828125, 2.26513671875, 2.3564453125, 2.44775390625, 2.5390625, 2.63037109375, 2.7216796875, 2.81298828125, 2.904296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 5.0, 9.0, 8.0, 12.0, 7.0, 12.0, 17.0, 17.0, 17.0, 23.0, 26.0, 22.0, 39.0, 28.0, 34.0, 35.0, 39.0, 33.0, 31.0, 29.0, 38.0, 47.0, 34.0, 46.0, 44.0, 31.0, 28.0, 32.0, 30.0, 31.0, 25.0, 18.0, 19.0, 24.0, 28.0, 19.0, 8.0, 7.0, 11.0, 3.0, 7.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7255859375, -1.6685028076171875, -1.611419677734375, -1.5543365478515625, -1.49725341796875, -1.4401702880859375, -1.383087158203125, -1.3260040283203125, -1.2689208984375, -1.2118377685546875, -1.154754638671875, -1.0976715087890625, -1.04058837890625, -0.9835052490234375, -0.926422119140625, -0.8693389892578125, -0.812255859375, -0.7551727294921875, -0.698089599609375, -0.6410064697265625, -0.58392333984375, -0.5268402099609375, -0.469757080078125, -0.4126739501953125, -0.3555908203125, -0.2985076904296875, -0.241424560546875, -0.1843414306640625, -0.12725830078125, -0.0701751708984375, -0.013092041015625, 0.0439910888671875, 0.10107421875, 0.1581573486328125, 0.215240478515625, 0.2723236083984375, 0.32940673828125, 0.3864898681640625, 0.443572998046875, 0.5006561279296875, 0.5577392578125, 0.6148223876953125, 0.671905517578125, 0.7289886474609375, 0.78607177734375, 0.8431549072265625, 0.900238037109375, 0.9573211669921875, 1.014404296875, 1.0714874267578125, 1.128570556640625, 1.1856536865234375, 1.24273681640625, 1.2998199462890625, 1.356903076171875, 1.4139862060546875, 1.4710693359375, 1.5281524658203125, 1.585235595703125, 1.6423187255859375, 1.69940185546875, 1.7564849853515625, 1.813568115234375, 1.8706512451171875, 1.927734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 9.0, 16.0, 17.0, 22.0, 29.0, 42.0, 51.0, 71.0, 94.0, 128.0, 167.0, 199.0, 293.0, 417.0, 628.0, 1095.0, 1970.0, 4683.0, 12812.0, 41546.0, 155245.0, 454129.0, 270118.0, 70632.0, 20574.0, 6905.0, 2748.0, 1354.0, 739.0, 480.0, 340.0, 235.0, 168.0, 150.0, 129.0, 75.0, 53.0, 50.0, 34.0, 18.0, 20.0, 20.0, 12.0, 6.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.1875, -2.113861083984375, -2.04022216796875, -1.966583251953125, -1.8929443359375, -1.819305419921875, -1.74566650390625, -1.672027587890625, -1.598388671875, -1.524749755859375, -1.45111083984375, -1.377471923828125, -1.3038330078125, -1.230194091796875, -1.15655517578125, -1.082916259765625, -1.00927734375, -0.935638427734375, -0.86199951171875, -0.788360595703125, -0.7147216796875, -0.641082763671875, -0.56744384765625, -0.493804931640625, -0.420166015625, -0.346527099609375, -0.27288818359375, -0.199249267578125, -0.1256103515625, -0.051971435546875, 0.02166748046875, 0.095306396484375, 0.1689453125, 0.242584228515625, 0.31622314453125, 0.389862060546875, 0.4635009765625, 0.537139892578125, 0.61077880859375, 0.684417724609375, 0.758056640625, 0.831695556640625, 0.90533447265625, 0.978973388671875, 1.0526123046875, 1.126251220703125, 1.19989013671875, 1.273529052734375, 1.34716796875, 1.420806884765625, 1.49444580078125, 1.568084716796875, 1.6417236328125, 1.715362548828125, 1.78900146484375, 1.862640380859375, 1.936279296875, 2.009918212890625, 2.08355712890625, 2.157196044921875, 2.2308349609375, 2.304473876953125, 2.37811279296875, 2.451751708984375, 2.525390625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 10.0, 7.0, 13.0, 16.0, 8.0, 8.0, 23.0, 11.0, 20.0, 19.0, 30.0, 28.0, 32.0, 26.0, 26.0, 38.0, 27.0, 41.0, 45.0, 42.0, 46.0, 41.0, 42.0, 45.0, 29.0, 36.0, 30.0, 32.0, 23.0, 24.0, 37.0, 21.0, 20.0, 15.0, 15.0, 18.0, 6.0, 14.0, 6.0, 12.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.072052001953125, -1.03472900390625, -0.997406005859375, -0.9600830078125, -0.922760009765625, -0.88543701171875, -0.848114013671875, -0.810791015625, -0.773468017578125, -0.73614501953125, -0.698822021484375, -0.6614990234375, -0.624176025390625, -0.58685302734375, -0.549530029296875, -0.51220703125, -0.474884033203125, -0.43756103515625, -0.400238037109375, -0.3629150390625, -0.325592041015625, -0.28826904296875, -0.250946044921875, -0.213623046875, -0.176300048828125, -0.13897705078125, -0.101654052734375, -0.0643310546875, -0.027008056640625, 0.01031494140625, 0.047637939453125, 0.0849609375, 0.122283935546875, 0.15960693359375, 0.196929931640625, 0.2342529296875, 0.271575927734375, 0.30889892578125, 0.346221923828125, 0.383544921875, 0.420867919921875, 0.45819091796875, 0.495513916015625, 0.5328369140625, 0.570159912109375, 0.60748291015625, 0.644805908203125, 0.68212890625, 0.719451904296875, 0.75677490234375, 0.794097900390625, 0.8314208984375, 0.868743896484375, 0.90606689453125, 0.943389892578125, 0.980712890625, 1.018035888671875, 1.05535888671875, 1.092681884765625, 1.1300048828125, 1.167327880859375, 1.20465087890625, 1.241973876953125, 1.279296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 9.0, 10.0, 12.0, 17.0, 25.0, 30.0, 53.0, 68.0, 118.0, 139.0, 197.0, 278.0, 422.0, 618.0, 959.0, 1456.0, 2382.0, 4098.0, 8088.0, 18773.0, 58960.0, 243558.0, 485528.0, 153105.0, 39866.0, 14057.0, 6401.0, 3440.0, 2025.0, 1266.0, 841.0, 496.0, 375.0, 259.0, 150.0, 113.0, 109.0, 61.0, 42.0, 29.0, 28.0, 26.0, 13.0, 12.0, 12.0, 6.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.70556640625, -0.68231201171875, -0.6590576171875, -0.63580322265625, -0.612548828125, -0.58929443359375, -0.5660400390625, -0.54278564453125, -0.51953125, -0.49627685546875, -0.4730224609375, -0.44976806640625, -0.426513671875, -0.40325927734375, -0.3800048828125, -0.35675048828125, -0.33349609375, -0.31024169921875, -0.2869873046875, -0.26373291015625, -0.240478515625, -0.21722412109375, -0.1939697265625, -0.17071533203125, -0.1474609375, -0.12420654296875, -0.1009521484375, -0.07769775390625, -0.054443359375, -0.03118896484375, -0.0079345703125, 0.01531982421875, 0.03857421875, 0.06182861328125, 0.0850830078125, 0.10833740234375, 0.131591796875, 0.15484619140625, 0.1781005859375, 0.20135498046875, 0.224609375, 0.24786376953125, 0.2711181640625, 0.29437255859375, 0.317626953125, 0.34088134765625, 0.3641357421875, 0.38739013671875, 0.41064453125, 0.43389892578125, 0.4571533203125, 0.48040771484375, 0.503662109375, 0.52691650390625, 0.5501708984375, 0.57342529296875, 0.5966796875, 0.61993408203125, 0.6431884765625, 0.66644287109375, 0.689697265625, 0.71295166015625, 0.7362060546875, 0.75946044921875, 0.78271484375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 19.0, 34.0, 36.0, 59.0, 111.0, 151.0, 139.0, 136.0, 99.0, 74.0, 33.0, 25.0, 13.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.861852645874023e-05, -7.612258195877075e-05, -7.362663745880127e-05, -7.113069295883179e-05, -6.86347484588623e-05, -6.613880395889282e-05, -6.364285945892334e-05, -6.114691495895386e-05, -5.8650970458984375e-05, -5.615502595901489e-05, -5.365908145904541e-05, -5.116313695907593e-05, -4.8667192459106445e-05, -4.617124795913696e-05, -4.367530345916748e-05, -4.1179358959198e-05, -3.8683414459228516e-05, -3.618746995925903e-05, -3.369152545928955e-05, -3.119558095932007e-05, -2.8699636459350586e-05, -2.6203691959381104e-05, -2.370774745941162e-05, -2.121180295944214e-05, -1.8715858459472656e-05, -1.6219913959503174e-05, -1.3723969459533691e-05, -1.1228024959564209e-05, -8.732080459594727e-06, -6.236135959625244e-06, -3.7401914596557617e-06, -1.2442469596862793e-06, 1.2516975402832031e-06, 3.7476420402526855e-06, 6.243586540222168e-06, 8.73953104019165e-06, 1.1235475540161133e-05, 1.3731420040130615e-05, 1.6227364540100098e-05, 1.872330904006958e-05, 2.1219253540039062e-05, 2.3715198040008545e-05, 2.6211142539978027e-05, 2.870708703994751e-05, 3.120303153991699e-05, 3.3698976039886475e-05, 3.619492053985596e-05, 3.869086503982544e-05, 4.118680953979492e-05, 4.3682754039764404e-05, 4.617869853973389e-05, 4.867464303970337e-05, 5.117058753967285e-05, 5.3666532039642334e-05, 5.6162476539611816e-05, 5.86584210395813e-05, 6.115436553955078e-05, 6.365031003952026e-05, 6.614625453948975e-05, 6.864219903945923e-05, 7.113814353942871e-05, 7.36340880393982e-05, 7.613003253936768e-05, 7.862597703933716e-05, 8.112192153930664e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 3.0, 10.0, 25.0, 30.0, 54.0, 57.0, 88.0, 128.0, 172.0, 250.0, 389.0, 580.0, 783.0, 1313.0, 1985.0, 3159.0, 5028.0, 8559.0, 15204.0, 28684.0, 57454.0, 115493.0, 211057.0, 252402.0, 166083.0, 85360.0, 42431.0, 21734.0, 11677.0, 6845.0, 4109.0, 2504.0, 1643.0, 1078.0, 689.0, 489.0, 309.0, 196.0, 145.0, 126.0, 71.0, 51.0, 30.0, 16.0, 15.0, 14.0, 9.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.58349609375, -0.5659637451171875, -0.548431396484375, -0.5308990478515625, -0.51336669921875, -0.4958343505859375, -0.478302001953125, -0.4607696533203125, -0.4432373046875, -0.4257049560546875, -0.408172607421875, -0.3906402587890625, -0.37310791015625, -0.3555755615234375, -0.338043212890625, -0.3205108642578125, -0.302978515625, -0.2854461669921875, -0.267913818359375, -0.2503814697265625, -0.23284912109375, -0.2153167724609375, -0.197784423828125, -0.1802520751953125, -0.1627197265625, -0.1451873779296875, -0.127655029296875, -0.1101226806640625, -0.09259033203125, -0.0750579833984375, -0.057525634765625, -0.0399932861328125, -0.0224609375, -0.0049285888671875, 0.012603759765625, 0.0301361083984375, 0.04766845703125, 0.0652008056640625, 0.082733154296875, 0.1002655029296875, 0.1177978515625, 0.1353302001953125, 0.152862548828125, 0.1703948974609375, 0.18792724609375, 0.2054595947265625, 0.222991943359375, 0.2405242919921875, 0.258056640625, 0.2755889892578125, 0.293121337890625, 0.3106536865234375, 0.32818603515625, 0.3457183837890625, 0.363250732421875, 0.3807830810546875, 0.3983154296875, 0.4158477783203125, 0.433380126953125, 0.4509124755859375, 0.46844482421875, 0.4859771728515625, 0.503509521484375, 0.5210418701171875, 0.53857421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 18.0, 17.0, 33.0, 52.0, 47.0, 93.0, 141.0, 148.0, 135.0, 88.0, 67.0, 48.0, 24.0, 25.0, 13.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.285369873046875, -0.27630615234375, -0.267242431640625, -0.2581787109375, -0.249114990234375, -0.24005126953125, -0.230987548828125, -0.221923828125, -0.212860107421875, -0.20379638671875, -0.194732666015625, -0.1856689453125, -0.176605224609375, -0.16754150390625, -0.158477783203125, -0.1494140625, -0.140350341796875, -0.13128662109375, -0.122222900390625, -0.1131591796875, -0.104095458984375, -0.09503173828125, -0.085968017578125, -0.076904296875, -0.067840576171875, -0.05877685546875, -0.049713134765625, -0.0406494140625, -0.031585693359375, -0.02252197265625, -0.013458251953125, -0.00439453125, 0.004669189453125, 0.01373291015625, 0.022796630859375, 0.0318603515625, 0.040924072265625, 0.04998779296875, 0.059051513671875, 0.068115234375, 0.077178955078125, 0.08624267578125, 0.095306396484375, 0.1043701171875, 0.113433837890625, 0.12249755859375, 0.131561279296875, 0.140625, 0.149688720703125, 0.15875244140625, 0.167816162109375, 0.1768798828125, 0.185943603515625, 0.19500732421875, 0.204071044921875, 0.213134765625, 0.222198486328125, 0.23126220703125, 0.240325927734375, 0.2493896484375, 0.258453369140625, 0.26751708984375, 0.276580810546875, 0.28564453125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 14.0, 25.0, 18.0, 26.0, 32.0, 33.0, 50.0, 49.0, 60.0, 69.0, 62.0, 68.0, 49.0, 51.0, 47.0, 47.0, 52.0, 45.0, 43.0, 28.0, 19.0, 29.0, 16.0, 16.0, 9.0, 5.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.003823757171631, -2.9175076484680176, -2.8311917781829834, -2.74487566947937, -2.658559560775757, -2.5722436904907227, -2.4859275817871094, -2.399611473083496, -2.313295364379883, -2.2269792556762695, -2.1406633853912354, -2.054347276687622, -1.9680311679840088, -1.881715178489685, -1.7953991889953613, -1.709083080291748, -1.6227672100067139, -1.5364512205123901, -1.4501351118087769, -1.3638191223144531, -1.2775030136108398, -1.1911870241165161, -1.1048710346221924, -1.018554925918579, -0.9322389364242554, -0.8459228873252869, -0.7596068382263184, -0.6732908487319946, -0.5869747996330261, -0.5006587505340576, -0.4143427610397339, -0.3280267119407654, -0.24171066284179688, -0.15539462864398956, -0.06907859444618225, 0.017237424850463867, 0.10355347394943237, 0.18986952304840088, 0.2761855125427246, 0.3625015616416931, 0.4488176107406616, 0.5351336598396301, 0.6214497089385986, 0.7077656984329224, 0.7940817475318909, 0.8803977966308594, 0.9667137861251831, 1.0530297756195068, 1.1393458843231201, 1.2256618738174438, 1.3119779825210571, 1.3982939720153809, 1.4846100807189941, 1.5709260702133179, 1.6572420597076416, 1.7435581684112549, 1.8298741579055786, 1.9161901473999023, 2.0025062561035156, 2.088822364807129, 2.175138235092163, 2.2614543437957764, 2.3477702140808105, 2.434086322784424, 2.520402431488037]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 8.0, 8.0, 8.0, 15.0, 16.0, 12.0, 13.0, 16.0, 18.0, 19.0, 29.0, 24.0, 26.0, 27.0, 28.0, 37.0, 37.0, 46.0, 30.0, 41.0, 30.0, 37.0, 38.0, 38.0, 41.0, 17.0, 38.0, 24.0, 30.0, 22.0, 23.0, 21.0, 26.0, 16.0, 22.0, 12.0, 15.0, 12.0, 17.0, 4.0, 11.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.5719082355499268, -1.5209792852401733, -1.4700504541397095, -1.419121503829956, -1.3681925535202026, -1.3172636032104492, -1.2663347721099854, -1.215405821800232, -1.1644768714904785, -1.113547921180725, -1.0626190900802612, -1.0116901397705078, -0.9607611894607544, -0.9098322987556458, -0.8589034080505371, -0.8079744577407837, -0.7570456266403198, -0.7061167359352112, -0.6551877856254578, -0.6042588949203491, -0.5533299446105957, -0.5024010539054871, -0.4514721632003784, -0.4005432426929474, -0.34961432218551636, -0.2986854016780853, -0.2477564960718155, -0.19682759046554565, -0.14589866995811462, -0.0949697494506836, -0.04404085874557495, 0.006888061761856079, 0.05781710147857666, 0.1087460145354271, 0.15967492759227753, 0.21060383319854736, 0.2615327537059784, 0.3124616742134094, 0.36339056491851807, 0.4143194854259491, 0.4652484059333801, 0.5161772966384888, 0.5671062469482422, 0.6180351376533508, 0.6689640283584595, 0.7198929786682129, 0.7708218693733215, 0.8217507600784302, 0.8726797103881836, 0.9236086010932922, 0.9745375514030457, 1.0254664421081543, 1.0763953924179077, 1.1273243427276611, 1.178253173828125, 1.2291821241378784, 1.2801110744476318, 1.3310400247573853, 1.3819688558578491, 1.4328978061676025, 1.483826756477356, 1.5347557067871094, 1.5856845378875732, 1.6366134881973267, 1.6875423192977905]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 12.0, 23.0, 21.0, 36.0, 46.0, 68.0, 86.0, 141.0, 189.0, 324.0, 470.0, 663.0, 1151.0, 1766.0, 2768.0, 4536.0, 7436.0, 12099.0, 19240.0, 31222.0, 48183.0, 70618.0, 96769.0, 120000.0, 133898.0, 129632.0, 111419.0, 86059.0, 61073.0, 40393.0, 25955.0, 16270.0, 9791.0, 5963.0, 3684.0, 2295.0, 1468.0, 935.0, 576.0, 415.0, 255.0, 177.0, 120.0, 100.0, 71.0, 41.0, 34.0, 27.0, 12.0, 5.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.0078125, -1.944671630859375, -1.88153076171875, -1.818389892578125, -1.7552490234375, -1.692108154296875, -1.62896728515625, -1.565826416015625, -1.502685546875, -1.439544677734375, -1.37640380859375, -1.313262939453125, -1.2501220703125, -1.186981201171875, -1.12384033203125, -1.060699462890625, -0.99755859375, -0.934417724609375, -0.87127685546875, -0.808135986328125, -0.7449951171875, -0.681854248046875, -0.61871337890625, -0.555572509765625, -0.492431640625, -0.429290771484375, -0.36614990234375, -0.303009033203125, -0.2398681640625, -0.176727294921875, -0.11358642578125, -0.050445556640625, 0.0126953125, 0.075836181640625, 0.13897705078125, 0.202117919921875, 0.2652587890625, 0.328399658203125, 0.39154052734375, 0.454681396484375, 0.517822265625, 0.580963134765625, 0.64410400390625, 0.707244873046875, 0.7703857421875, 0.833526611328125, 0.89666748046875, 0.959808349609375, 1.02294921875, 1.086090087890625, 1.14923095703125, 1.212371826171875, 1.2755126953125, 1.338653564453125, 1.40179443359375, 1.464935302734375, 1.528076171875, 1.591217041015625, 1.65435791015625, 1.717498779296875, 1.7806396484375, 1.843780517578125, 1.90692138671875, 1.970062255859375, 2.033203125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 9.0, 8.0, 8.0, 13.0, 11.0, 8.0, 12.0, 19.0, 15.0, 19.0, 14.0, 23.0, 32.0, 27.0, 36.0, 29.0, 40.0, 37.0, 30.0, 37.0, 41.0, 35.0, 33.0, 43.0, 32.0, 29.0, 25.0, 39.0, 27.0, 21.0, 25.0, 28.0, 26.0, 23.0, 20.0, 20.0, 14.0, 16.0, 15.0, 12.0, 9.0, 9.0, 7.0, 1.0, 9.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.716796875, -1.66448974609375, -1.6121826171875, -1.55987548828125, -1.507568359375, -1.45526123046875, -1.4029541015625, -1.35064697265625, -1.29833984375, -1.24603271484375, -1.1937255859375, -1.14141845703125, -1.089111328125, -1.03680419921875, -0.9844970703125, -0.93218994140625, -0.8798828125, -0.82757568359375, -0.7752685546875, -0.72296142578125, -0.670654296875, -0.61834716796875, -0.5660400390625, -0.51373291015625, -0.46142578125, -0.40911865234375, -0.3568115234375, -0.30450439453125, -0.252197265625, -0.19989013671875, -0.1475830078125, -0.09527587890625, -0.04296875, 0.00933837890625, 0.0616455078125, 0.11395263671875, 0.166259765625, 0.21856689453125, 0.2708740234375, 0.32318115234375, 0.37548828125, 0.42779541015625, 0.4801025390625, 0.53240966796875, 0.584716796875, 0.63702392578125, 0.6893310546875, 0.74163818359375, 0.7939453125, 0.84625244140625, 0.8985595703125, 0.95086669921875, 1.003173828125, 1.05548095703125, 1.1077880859375, 1.16009521484375, 1.21240234375, 1.26470947265625, 1.3170166015625, 1.36932373046875, 1.421630859375, 1.47393798828125, 1.5262451171875, 1.57855224609375, 1.630859375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 11.0, 14.0, 17.0, 40.0, 86.0, 105.0, 167.0, 279.0, 422.0, 730.0, 1154.0, 2061.0, 3396.0, 5667.0, 9379.0, 15524.0, 25357.0, 40040.0, 60773.0, 86530.0, 113300.0, 132039.0, 134892.0, 121972.0, 98041.0, 70846.0, 47234.0, 30604.0, 19060.0, 11476.0, 6904.0, 4156.0, 2483.0, 1509.0, 840.0, 532.0, 378.0, 210.0, 125.0, 64.0, 49.0, 37.0, 27.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.818359375, -1.758148193359375, -1.69793701171875, -1.637725830078125, -1.5775146484375, -1.517303466796875, -1.45709228515625, -1.396881103515625, -1.336669921875, -1.276458740234375, -1.21624755859375, -1.156036376953125, -1.0958251953125, -1.035614013671875, -0.97540283203125, -0.915191650390625, -0.85498046875, -0.794769287109375, -0.73455810546875, -0.674346923828125, -0.6141357421875, -0.553924560546875, -0.49371337890625, -0.433502197265625, -0.373291015625, -0.313079833984375, -0.25286865234375, -0.192657470703125, -0.1324462890625, -0.072235107421875, -0.01202392578125, 0.048187255859375, 0.1083984375, 0.168609619140625, 0.22882080078125, 0.289031982421875, 0.3492431640625, 0.409454345703125, 0.46966552734375, 0.529876708984375, 0.590087890625, 0.650299072265625, 0.71051025390625, 0.770721435546875, 0.8309326171875, 0.891143798828125, 0.95135498046875, 1.011566162109375, 1.07177734375, 1.131988525390625, 1.19219970703125, 1.252410888671875, 1.3126220703125, 1.372833251953125, 1.43304443359375, 1.493255615234375, 1.553466796875, 1.613677978515625, 1.67388916015625, 1.734100341796875, 1.7943115234375, 1.854522705078125, 1.91473388671875, 1.974945068359375, 2.03515625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 4.0, 12.0, 13.0, 11.0, 26.0, 24.0, 23.0, 23.0, 28.0, 30.0, 42.0, 37.0, 32.0, 40.0, 35.0, 30.0, 46.0, 40.0, 45.0, 40.0, 40.0, 35.0, 41.0, 36.0, 28.0, 43.0, 41.0, 24.0, 26.0, 26.0, 7.0, 16.0, 11.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1455078125, -1.1051483154296875, -1.064788818359375, -1.0244293212890625, -0.98406982421875, -0.9437103271484375, -0.903350830078125, -0.8629913330078125, -0.8226318359375, -0.7822723388671875, -0.741912841796875, -0.7015533447265625, -0.66119384765625, -0.6208343505859375, -0.580474853515625, -0.5401153564453125, -0.499755859375, -0.4593963623046875, -0.419036865234375, -0.3786773681640625, -0.33831787109375, -0.2979583740234375, -0.257598876953125, -0.2172393798828125, -0.1768798828125, -0.1365203857421875, -0.096160888671875, -0.0558013916015625, -0.01544189453125, 0.0249176025390625, 0.065277099609375, 0.1056365966796875, 0.14599609375, 0.1863555908203125, 0.226715087890625, 0.2670745849609375, 0.30743408203125, 0.3477935791015625, 0.388153076171875, 0.4285125732421875, 0.4688720703125, 0.5092315673828125, 0.549591064453125, 0.5899505615234375, 0.63031005859375, 0.6706695556640625, 0.711029052734375, 0.7513885498046875, 0.791748046875, 0.8321075439453125, 0.872467041015625, 0.9128265380859375, 0.95318603515625, 0.9935455322265625, 1.033905029296875, 1.0742645263671875, 1.1146240234375, 1.1549835205078125, 1.195343017578125, 1.2357025146484375, 1.27606201171875, 1.3164215087890625, 1.356781005859375, 1.3971405029296875, 1.4375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 6.0, 9.0, 7.0, 15.0, 18.0, 27.0, 42.0, 54.0, 91.0, 132.0, 244.0, 378.0, 561.0, 890.0, 1353.0, 2354.0, 4015.0, 7058.0, 13559.0, 27707.0, 62300.0, 142593.0, 264452.0, 261435.0, 140674.0, 60859.0, 27342.0, 13171.0, 7080.0, 3984.0, 2315.0, 1462.0, 827.0, 512.0, 349.0, 231.0, 150.0, 99.0, 49.0, 41.0, 33.0, 24.0, 20.0, 11.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.85546875, -2.766204833984375, -2.67694091796875, -2.587677001953125, -2.4984130859375, -2.409149169921875, -2.31988525390625, -2.230621337890625, -2.141357421875, -2.052093505859375, -1.96282958984375, -1.873565673828125, -1.7843017578125, -1.695037841796875, -1.60577392578125, -1.516510009765625, -1.42724609375, -1.337982177734375, -1.24871826171875, -1.159454345703125, -1.0701904296875, -0.980926513671875, -0.89166259765625, -0.802398681640625, -0.713134765625, -0.623870849609375, -0.53460693359375, -0.445343017578125, -0.3560791015625, -0.266815185546875, -0.17755126953125, -0.088287353515625, 0.0009765625, 0.090240478515625, 0.17950439453125, 0.268768310546875, 0.3580322265625, 0.447296142578125, 0.53656005859375, 0.625823974609375, 0.715087890625, 0.804351806640625, 0.89361572265625, 0.982879638671875, 1.0721435546875, 1.161407470703125, 1.25067138671875, 1.339935302734375, 1.42919921875, 1.518463134765625, 1.60772705078125, 1.696990966796875, 1.7862548828125, 1.875518798828125, 1.96478271484375, 2.054046630859375, 2.143310546875, 2.232574462890625, 2.32183837890625, 2.411102294921875, 2.5003662109375, 2.589630126953125, 2.67889404296875, 2.768157958984375, 2.857421875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 1.0, 11.0, 12.0, 14.0, 19.0, 25.0, 27.0, 17.0, 26.0, 35.0, 50.0, 51.0, 47.0, 58.0, 64.0, 65.0, 59.0, 50.0, 43.0, 48.0, 37.0, 33.0, 40.0, 16.0, 22.0, 21.0, 11.0, 17.0, 11.0, 5.0, 4.0, 9.0, 4.0, 4.0, 12.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014257431030273438, -0.00013802573084831238, -0.00013347715139389038, -0.00012892857193946838, -0.0001243799924850464, -0.00011983141303062439, -0.00011528283357620239, -0.0001107342541217804, -0.0001061856746673584, -0.0001016370952129364, -9.70885157585144e-05, -9.253993630409241e-05, -8.799135684967041e-05, -8.344277739524841e-05, -7.889419794082642e-05, -7.434561848640442e-05, -6.979703903198242e-05, -6.524845957756042e-05, -6.069988012313843e-05, -5.615130066871643e-05, -5.1602721214294434e-05, -4.7054141759872437e-05, -4.250556230545044e-05, -3.795698285102844e-05, -3.3408403396606445e-05, -2.8859823942184448e-05, -2.431124448776245e-05, -1.9762665033340454e-05, -1.5214085578918457e-05, -1.066550612449646e-05, -6.116926670074463e-06, -1.5683472156524658e-06, 2.9802322387695312e-06, 7.528811693191528e-06, 1.2077391147613525e-05, 1.6625970602035522e-05, 2.117455005645752e-05, 2.5723129510879517e-05, 3.0271708965301514e-05, 3.482028841972351e-05, 3.936886787414551e-05, 4.3917447328567505e-05, 4.84660267829895e-05, 5.30146062374115e-05, 5.7563185691833496e-05, 6.211176514625549e-05, 6.666034460067749e-05, 7.120892405509949e-05, 7.575750350952148e-05, 8.030608296394348e-05, 8.485466241836548e-05, 8.940324187278748e-05, 9.395182132720947e-05, 9.850040078163147e-05, 0.00010304898023605347, 0.00010759755969047546, 0.00011214613914489746, 0.00011669471859931946, 0.00012124329805374146, 0.00012579187750816345, 0.00013034045696258545, 0.00013488903641700745, 0.00013943761587142944, 0.00014398619532585144, 0.00014853477478027344]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 16.0, 19.0, 27.0, 38.0, 75.0, 124.0, 186.0, 275.0, 481.0, 726.0, 1162.0, 1838.0, 3203.0, 5907.0, 11868.0, 25592.0, 61875.0, 151549.0, 284343.0, 266415.0, 133290.0, 53471.0, 22510.0, 10459.0, 5378.0, 3100.0, 1772.0, 1105.0, 631.0, 395.0, 250.0, 179.0, 100.0, 65.0, 41.0, 24.0, 22.0, 18.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.83880615234375, -2.7498779296875, -2.66094970703125, -2.572021484375, -2.48309326171875, -2.3941650390625, -2.30523681640625, -2.21630859375, -2.12738037109375, -2.0384521484375, -1.94952392578125, -1.860595703125, -1.77166748046875, -1.6827392578125, -1.59381103515625, -1.5048828125, -1.41595458984375, -1.3270263671875, -1.23809814453125, -1.149169921875, -1.06024169921875, -0.9713134765625, -0.88238525390625, -0.79345703125, -0.70452880859375, -0.6156005859375, -0.52667236328125, -0.437744140625, -0.34881591796875, -0.2598876953125, -0.17095947265625, -0.08203125, 0.00689697265625, 0.0958251953125, 0.18475341796875, 0.273681640625, 0.36260986328125, 0.4515380859375, 0.54046630859375, 0.62939453125, 0.71832275390625, 0.8072509765625, 0.89617919921875, 0.985107421875, 1.07403564453125, 1.1629638671875, 1.25189208984375, 1.3408203125, 1.42974853515625, 1.5186767578125, 1.60760498046875, 1.696533203125, 1.78546142578125, 1.8743896484375, 1.96331787109375, 2.05224609375, 2.14117431640625, 2.2301025390625, 2.31903076171875, 2.407958984375, 2.49688720703125, 2.5858154296875, 2.67474365234375, 2.763671875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 8.0, 6.0, 7.0, 5.0, 14.0, 15.0, 19.0, 22.0, 31.0, 36.0, 44.0, 55.0, 85.0, 65.0, 89.0, 70.0, 73.0, 63.0, 56.0, 43.0, 39.0, 29.0, 25.0, 31.0, 14.0, 12.0, 12.0, 7.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7353515625, -0.7098464965820312, -0.6843414306640625, -0.6588363647460938, -0.633331298828125, -0.6078262329101562, -0.5823211669921875, -0.5568161010742188, -0.53131103515625, -0.5058059692382812, -0.4803009033203125, -0.45479583740234375, -0.429290771484375, -0.40378570556640625, -0.3782806396484375, -0.35277557373046875, -0.3272705078125, -0.30176544189453125, -0.2762603759765625, -0.25075531005859375, -0.225250244140625, -0.19974517822265625, -0.1742401123046875, -0.14873504638671875, -0.12322998046875, -0.09772491455078125, -0.0722198486328125, -0.04671478271484375, -0.021209716796875, 0.00429534912109375, 0.0298004150390625, 0.05530548095703125, 0.080810546875, 0.10631561279296875, 0.1318206787109375, 0.15732574462890625, 0.182830810546875, 0.20833587646484375, 0.2338409423828125, 0.25934600830078125, 0.28485107421875, 0.31035614013671875, 0.3358612060546875, 0.36136627197265625, 0.386871337890625, 0.41237640380859375, 0.4378814697265625, 0.46338653564453125, 0.4888916015625, 0.5143966674804688, 0.5399017333984375, 0.5654067993164062, 0.590911865234375, 0.6164169311523438, 0.6419219970703125, 0.6674270629882812, 0.69293212890625, 0.7184371948242188, 0.7439422607421875, 0.7694473266601562, 0.794952392578125, 0.8204574584960938, 0.8459625244140625, 0.8714675903320312, 0.89697265625]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 7.0, 22.0, 18.0, 16.0, 25.0, 39.0, 45.0, 47.0, 59.0, 62.0, 77.0, 66.0, 69.0, 51.0, 45.0, 46.0, 53.0, 54.0, 35.0, 26.0, 22.0, 29.0, 19.0, 10.0, 15.0, 7.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564897298812866, -2.4802913665771484, -2.3956854343414307, -2.311079502105713, -2.226473331451416, -2.1418673992156982, -2.0572614669799805, -1.9726555347442627, -1.8880494832992554, -1.8034435510635376, -1.7188374996185303, -1.6342315673828125, -1.5496256351470947, -1.4650195837020874, -1.3804136514663696, -1.2958076000213623, -1.2112016677856445, -1.1265957355499268, -1.0419896841049194, -0.9573837518692017, -0.8727777600288391, -0.7881717681884766, -0.7035658359527588, -0.6189598441123962, -0.5343538522720337, -0.44974786043167114, -0.365141898393631, -0.2805359363555908, -0.19592994451522827, -0.11132395267486572, -0.02671802043914795, 0.0578879714012146, 0.14249420166015625, 0.2271001785993576, 0.31170615553855896, 0.3963121175765991, 0.48091810941696167, 0.5655241012573242, 0.650130033493042, 0.7347360253334045, 0.8193420171737671, 0.9039480090141296, 0.9885540008544922, 1.07315993309021, 1.1577658653259277, 1.242371916770935, 1.3269778490066528, 1.4115839004516602, 1.496189832687378, 1.5807957649230957, 1.665401816368103, 1.7500077486038208, 1.8346138000488281, 1.919219732284546, 2.0038256645202637, 2.0884315967559814, 2.173037528991699, 2.257643461227417, 2.3422493934631348, 2.4268555641174316, 2.5114614963531494, 2.596067428588867, 2.680673360824585, 2.7652792930603027, 2.8498854637145996]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 6.0, 1.0, 7.0, 6.0, 10.0, 10.0, 10.0, 6.0, 13.0, 19.0, 15.0, 18.0, 22.0, 20.0, 23.0, 26.0, 32.0, 37.0, 30.0, 22.0, 34.0, 31.0, 38.0, 39.0, 34.0, 33.0, 35.0, 27.0, 35.0, 37.0, 38.0, 25.0, 19.0, 20.0, 26.0, 24.0, 14.0, 20.0, 24.0, 10.0, 15.0, 10.0, 17.0, 11.0, 10.0, 5.0, 8.0, 10.0, 9.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0], "bins": [-1.6389598846435547, -1.5876710414886475, -1.5363821983337402, -1.485093355178833, -1.4338045120239258, -1.3825156688690186, -1.3312268257141113, -1.279937982559204, -1.2286491394042969, -1.1773602962493896, -1.1260714530944824, -1.0747826099395752, -1.023493766784668, -0.9722049236297607, -0.9209160804748535, -0.8696272373199463, -0.8183384537696838, -0.7670496106147766, -0.7157607674598694, -0.6644719243049622, -0.6131830811500549, -0.5618942975997925, -0.5106054544448853, -0.45931658148765564, -0.4080277383327484, -0.3567388951778412, -0.30545005202293396, -0.2541612386703491, -0.2028723806142807, -0.15158355236053467, -0.10029470920562744, -0.049005866050720215, 0.0022829771041870117, 0.05357181653380394, 0.10486065596342087, 0.1561494916677475, 0.20743833482265472, 0.25872716307640076, 0.310016006231308, 0.3613048493862152, 0.41259369254112244, 0.46388253569602966, 0.5151713490486145, 0.5664601922035217, 0.617749035358429, 0.6690378785133362, 0.7203267216682434, 0.7716155648231506, 0.8229044079780579, 0.8741932511329651, 0.9254820942878723, 0.9767709374427795, 1.028059720993042, 1.0793485641479492, 1.1306374073028564, 1.1819262504577637, 1.233215093612671, 1.2845039367675781, 1.3357927799224854, 1.3870816230773926, 1.4383704662322998, 1.489659309387207, 1.5409481525421143, 1.5922369956970215, 1.6435258388519287]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 11.0, 12.0, 11.0, 28.0, 59.0, 95.0, 174.0, 299.0, 496.0, 850.0, 1501.0, 2740.0, 4621.0, 8159.0, 14452.0, 25672.0, 45516.0, 82119.0, 141962.0, 240000.0, 379876.0, 542413.0, 655204.0, 643477.0, 518130.0, 357821.0, 222909.0, 131684.0, 75607.0, 42503.0, 23913.0, 13638.0, 7811.0, 4365.0, 2568.0, 1522.0, 867.0, 481.0, 291.0, 188.0, 86.0, 65.0, 44.0, 24.0, 7.0, 8.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8125, -1.7557373046875, -1.698974609375, -1.6422119140625, -1.58544921875, -1.5286865234375, -1.471923828125, -1.4151611328125, -1.3583984375, -1.3016357421875, -1.244873046875, -1.1881103515625, -1.13134765625, -1.0745849609375, -1.017822265625, -0.9610595703125, -0.904296875, -0.8475341796875, -0.790771484375, -0.7340087890625, -0.67724609375, -0.6204833984375, -0.563720703125, -0.5069580078125, -0.4501953125, -0.3934326171875, -0.336669921875, -0.2799072265625, -0.22314453125, -0.1663818359375, -0.109619140625, -0.0528564453125, 0.00390625, 0.0606689453125, 0.117431640625, 0.1741943359375, 0.23095703125, 0.2877197265625, 0.344482421875, 0.4012451171875, 0.4580078125, 0.5147705078125, 0.571533203125, 0.6282958984375, 0.68505859375, 0.7418212890625, 0.798583984375, 0.8553466796875, 0.912109375, 0.9688720703125, 1.025634765625, 1.0823974609375, 1.13916015625, 1.1959228515625, 1.252685546875, 1.3094482421875, 1.3662109375, 1.4229736328125, 1.479736328125, 1.5364990234375, 1.59326171875, 1.6500244140625, 1.706787109375, 1.7635498046875, 1.8203125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 3.0, 4.0, 6.0, 3.0, 9.0, 11.0, 14.0, 12.0, 24.0, 19.0, 21.0, 25.0, 24.0, 28.0, 25.0, 29.0, 32.0, 44.0, 45.0, 28.0, 36.0, 37.0, 24.0, 35.0, 37.0, 32.0, 39.0, 40.0, 31.0, 38.0, 17.0, 14.0, 21.0, 32.0, 23.0, 19.0, 15.0, 21.0, 10.0, 15.0, 11.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.092803955078125, -1.05474853515625, -1.016693115234375, -0.9786376953125, -0.940582275390625, -0.90252685546875, -0.864471435546875, -0.826416015625, -0.788360595703125, -0.75030517578125, -0.712249755859375, -0.6741943359375, -0.636138916015625, -0.59808349609375, -0.560028076171875, -0.52197265625, -0.483917236328125, -0.44586181640625, -0.407806396484375, -0.3697509765625, -0.331695556640625, -0.29364013671875, -0.255584716796875, -0.217529296875, -0.179473876953125, -0.14141845703125, -0.103363037109375, -0.0653076171875, -0.027252197265625, 0.01080322265625, 0.048858642578125, 0.0869140625, 0.124969482421875, 0.16302490234375, 0.201080322265625, 0.2391357421875, 0.277191162109375, 0.31524658203125, 0.353302001953125, 0.391357421875, 0.429412841796875, 0.46746826171875, 0.505523681640625, 0.5435791015625, 0.581634521484375, 0.61968994140625, 0.657745361328125, 0.69580078125, 0.733856201171875, 0.77191162109375, 0.809967041015625, 0.8480224609375, 0.886077880859375, 0.92413330078125, 0.962188720703125, 1.000244140625, 1.038299560546875, 1.07635498046875, 1.114410400390625, 1.1524658203125, 1.190521240234375, 1.22857666015625, 1.266632080078125, 1.3046875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 18.0, 20.0, 35.0, 40.0, 83.0, 141.0, 224.0, 346.0, 567.0, 926.0, 1627.0, 2772.0, 4575.0, 7682.0, 13066.0, 21424.0, 35434.0, 57835.0, 90700.0, 141182.0, 207486.0, 296111.0, 388439.0, 470461.0, 511125.0, 492721.0, 423943.0, 332004.0, 241209.0, 164834.0, 108412.0, 69008.0, 43399.0, 26501.0, 16049.0, 9531.0, 5809.0, 3382.0, 2065.0, 1233.0, 721.0, 473.0, 262.0, 159.0, 97.0, 57.0, 37.0, 31.0, 9.0, 9.0, 2.0, 6.0, 2.0, 0.0, 4.0], "bins": [-1.5302734375, -1.48486328125, -1.439453125, -1.39404296875, -1.3486328125, -1.30322265625, -1.2578125, -1.21240234375, -1.1669921875, -1.12158203125, -1.076171875, -1.03076171875, -0.9853515625, -0.93994140625, -0.89453125, -0.84912109375, -0.8037109375, -0.75830078125, -0.712890625, -0.66748046875, -0.6220703125, -0.57666015625, -0.53125, -0.48583984375, -0.4404296875, -0.39501953125, -0.349609375, -0.30419921875, -0.2587890625, -0.21337890625, -0.16796875, -0.12255859375, -0.0771484375, -0.03173828125, 0.013671875, 0.05908203125, 0.1044921875, 0.14990234375, 0.1953125, 0.24072265625, 0.2861328125, 0.33154296875, 0.376953125, 0.42236328125, 0.4677734375, 0.51318359375, 0.55859375, 0.60400390625, 0.6494140625, 0.69482421875, 0.740234375, 0.78564453125, 0.8310546875, 0.87646484375, 0.921875, 0.96728515625, 1.0126953125, 1.05810546875, 1.103515625, 1.14892578125, 1.1943359375, 1.23974609375, 1.28515625, 1.33056640625, 1.3759765625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 2.0, 10.0, 7.0, 7.0, 7.0, 14.0, 18.0, 15.0, 39.0, 41.0, 48.0, 42.0, 50.0, 51.0, 67.0, 84.0, 123.0, 133.0, 134.0, 176.0, 139.0, 160.0, 165.0, 195.0, 203.0, 204.0, 192.0, 195.0, 172.0, 183.0, 155.0, 145.0, 140.0, 136.0, 122.0, 70.0, 75.0, 77.0, 64.0, 46.0, 31.0, 32.0, 27.0, 16.0, 12.0, 12.0, 13.0, 14.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.55126953125, -0.5328826904296875, -0.514495849609375, -0.4961090087890625, -0.47772216796875, -0.4593353271484375, -0.440948486328125, -0.4225616455078125, -0.4041748046875, -0.3857879638671875, -0.367401123046875, -0.3490142822265625, -0.33062744140625, -0.3122406005859375, -0.293853759765625, -0.2754669189453125, -0.257080078125, -0.2386932373046875, -0.220306396484375, -0.2019195556640625, -0.18353271484375, -0.1651458740234375, -0.146759033203125, -0.1283721923828125, -0.1099853515625, -0.0915985107421875, -0.073211669921875, -0.0548248291015625, -0.03643798828125, -0.0180511474609375, 0.000335693359375, 0.0187225341796875, 0.037109375, 0.0554962158203125, 0.073883056640625, 0.0922698974609375, 0.11065673828125, 0.1290435791015625, 0.147430419921875, 0.1658172607421875, 0.1842041015625, 0.2025909423828125, 0.220977783203125, 0.2393646240234375, 0.25775146484375, 0.2761383056640625, 0.294525146484375, 0.3129119873046875, 0.331298828125, 0.3496856689453125, 0.368072509765625, 0.3864593505859375, 0.40484619140625, 0.4232330322265625, 0.441619873046875, 0.4600067138671875, 0.4783935546875, 0.4967803955078125, 0.515167236328125, 0.5335540771484375, 0.55194091796875, 0.5703277587890625, 0.588714599609375, 0.6071014404296875, 0.62548828125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 5.0, 13.0, 11.0, 24.0, 19.0, 20.0, 25.0, 26.0, 34.0, 47.0, 49.0, 48.0, 57.0, 55.0, 50.0, 56.0, 61.0, 58.0, 40.0, 39.0, 50.0, 35.0, 35.0, 24.0, 21.0, 16.0, 15.0, 13.0, 9.0, 5.0, 15.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2901968955993652, -2.22659969329834, -2.1630024909973145, -2.099405288696289, -2.0358080863952637, -1.9722108840942383, -1.9086135625839233, -1.845016360282898, -1.7814191579818726, -1.7178219556808472, -1.6542247533798218, -1.5906275510787964, -1.5270302295684814, -1.463433027267456, -1.3998358249664307, -1.3362386226654053, -1.2726414203643799, -1.2090442180633545, -1.145447015762329, -1.0818498134613037, -1.0182526111602783, -0.9546553492546082, -0.891058087348938, -0.8274608850479126, -0.7638636827468872, -0.7002664804458618, -0.6366692781448364, -0.5730720162391663, -0.5094748139381409, -0.4458776116371155, -0.3822803795337677, -0.3186831474304199, -0.25508618354797363, -0.19148896634578705, -0.12789174914360046, -0.06429453194141388, -0.0006973147392272949, 0.0628998875617981, 0.12649711966514587, 0.19009435176849365, 0.25369155406951904, 0.31728875637054443, 0.3808859884738922, 0.44448322057724, 0.5080804228782654, 0.5716776251792908, 0.6352748870849609, 0.6988720893859863, 0.7624692916870117, 0.8260664939880371, 0.8896636962890625, 0.9532609581947327, 1.0168581008911133, 1.0804553031921387, 1.1440526247024536, 1.207649827003479, 1.2712470293045044, 1.3348442316055298, 1.3984414339065552, 1.4620386362075806, 1.5256359577178955, 1.589233160018921, 1.6528303623199463, 1.7164275646209717, 1.780024766921997]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 5.0, 8.0, 3.0, 7.0, 7.0, 8.0, 17.0, 18.0, 26.0, 24.0, 28.0, 19.0, 25.0, 34.0, 25.0, 25.0, 36.0, 37.0, 44.0, 40.0, 27.0, 42.0, 38.0, 41.0, 35.0, 38.0, 41.0, 32.0, 31.0, 25.0, 19.0, 19.0, 18.0, 25.0, 17.0, 13.0, 23.0, 14.0, 16.0, 6.0, 9.0, 9.0, 5.0, 5.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4026124477386475, -1.3561328649520874, -1.3096531629562378, -1.2631735801696777, -1.2166939973831177, -1.1702144145965576, -1.123734712600708, -1.077255129814148, -1.030775547027588, -0.9842959046363831, -0.937816321849823, -0.8913366794586182, -0.8448570966720581, -0.7983774542808533, -0.7518978118896484, -0.7054182291030884, -0.6589385867118835, -0.6124589443206787, -0.5659793615341187, -0.5194997191429138, -0.47302013635635376, -0.4265404939651489, -0.3800608813762665, -0.33358126878738403, -0.2871016561985016, -0.24062204360961914, -0.1941424310207367, -0.14766280353069305, -0.10118319094181061, -0.05470357835292816, -0.008223950862884521, 0.038255661725997925, 0.08473527431488037, 0.13121488690376282, 0.17769449949264526, 0.2241741269826889, 0.27065372467041016, 0.317133367061615, 0.36361297965049744, 0.4100925922393799, 0.45657220482826233, 0.5030518174171448, 0.5495314598083496, 0.5960110425949097, 0.6424906849861145, 0.6889702677726746, 0.7354499101638794, 0.7819294929504395, 0.8284091353416443, 0.8748887777328491, 0.9213683605194092, 0.967848002910614, 1.0143276453018188, 1.060807228088379, 1.107286810874939, 1.153766393661499, 1.2002460956573486, 1.2467256784439087, 1.2932053804397583, 1.3396849632263184, 1.3861645460128784, 1.4326441287994385, 1.479123830795288, 1.5256034135818481, 1.5720829963684082]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 10.0, 9.0, 11.0, 13.0, 28.0, 29.0, 61.0, 82.0, 121.0, 179.0, 248.0, 435.0, 640.0, 1021.0, 1576.0, 2510.0, 3968.0, 6737.0, 11412.0, 19522.0, 34020.0, 60081.0, 101959.0, 159776.0, 199411.0, 171531.0, 112984.0, 67200.0, 38475.0, 22061.0, 12841.0, 7491.0, 4485.0, 2777.0, 1767.0, 1038.0, 672.0, 470.0, 295.0, 191.0, 129.0, 93.0, 69.0, 46.0, 26.0, 18.0, 15.0, 4.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.78271484375, -0.7579498291015625, -0.733184814453125, -0.7084197998046875, -0.68365478515625, -0.6588897705078125, -0.634124755859375, -0.6093597412109375, -0.5845947265625, -0.5598297119140625, -0.535064697265625, -0.5102996826171875, -0.48553466796875, -0.4607696533203125, -0.436004638671875, -0.4112396240234375, -0.386474609375, -0.3617095947265625, -0.336944580078125, -0.3121795654296875, -0.28741455078125, -0.2626495361328125, -0.237884521484375, -0.2131195068359375, -0.1883544921875, -0.1635894775390625, -0.138824462890625, -0.1140594482421875, -0.08929443359375, -0.0645294189453125, -0.039764404296875, -0.0149993896484375, 0.009765625, 0.0345306396484375, 0.059295654296875, 0.0840606689453125, 0.10882568359375, 0.1335906982421875, 0.158355712890625, 0.1831207275390625, 0.2078857421875, 0.2326507568359375, 0.257415771484375, 0.2821807861328125, 0.30694580078125, 0.3317108154296875, 0.356475830078125, 0.3812408447265625, 0.406005859375, 0.4307708740234375, 0.455535888671875, 0.4803009033203125, 0.50506591796875, 0.5298309326171875, 0.554595947265625, 0.5793609619140625, 0.6041259765625, 0.6288909912109375, 0.653656005859375, 0.6784210205078125, 0.70318603515625, 0.7279510498046875, 0.752716064453125, 0.7774810791015625, 0.80224609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 10.0, 6.0, 11.0, 10.0, 19.0, 20.0, 28.0, 24.0, 26.0, 37.0, 29.0, 26.0, 35.0, 36.0, 40.0, 35.0, 35.0, 41.0, 34.0, 40.0, 39.0, 37.0, 38.0, 36.0, 31.0, 40.0, 25.0, 28.0, 28.0, 10.0, 17.0, 20.0, 17.0, 14.0, 14.0, 8.0, 6.0, 6.0, 9.0, 10.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.46624755859375, -1.4149169921875, -1.36358642578125, -1.312255859375, -1.26092529296875, -1.2095947265625, -1.15826416015625, -1.10693359375, -1.05560302734375, -1.0042724609375, -0.95294189453125, -0.901611328125, -0.85028076171875, -0.7989501953125, -0.74761962890625, -0.6962890625, -0.64495849609375, -0.5936279296875, -0.54229736328125, -0.490966796875, -0.43963623046875, -0.3883056640625, -0.33697509765625, -0.28564453125, -0.23431396484375, -0.1829833984375, -0.13165283203125, -0.080322265625, -0.02899169921875, 0.0223388671875, 0.07366943359375, 0.125, 0.17633056640625, 0.2276611328125, 0.27899169921875, 0.330322265625, 0.38165283203125, 0.4329833984375, 0.48431396484375, 0.53564453125, 0.58697509765625, 0.6383056640625, 0.68963623046875, 0.740966796875, 0.79229736328125, 0.8436279296875, 0.89495849609375, 0.9462890625, 0.99761962890625, 1.0489501953125, 1.10028076171875, 1.151611328125, 1.20294189453125, 1.2542724609375, 1.30560302734375, 1.35693359375, 1.40826416015625, 1.4595947265625, 1.51092529296875, 1.562255859375, 1.61358642578125, 1.6649169921875, 1.71624755859375, 1.767578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 6.0, 7.0, 11.0, 39.0, 44.0, 68.0, 113.0, 178.0, 248.0, 425.0, 684.0, 1098.0, 1796.0, 3009.0, 5298.0, 9575.0, 17182.0, 32353.0, 61138.0, 115634.0, 201279.0, 240623.0, 164357.0, 89781.0, 46939.0, 25070.0, 13530.0, 7438.0, 4281.0, 2435.0, 1492.0, 917.0, 536.0, 357.0, 204.0, 153.0, 88.0, 70.0, 41.0, 27.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9951171875, -0.9669265747070312, -0.9387359619140625, -0.9105453491210938, -0.882354736328125, -0.8541641235351562, -0.8259735107421875, -0.7977828979492188, -0.76959228515625, -0.7414016723632812, -0.7132110595703125, -0.6850204467773438, -0.656829833984375, -0.6286392211914062, -0.6004486083984375, -0.5722579956054688, -0.5440673828125, -0.5158767700195312, -0.4876861572265625, -0.45949554443359375, -0.431304931640625, -0.40311431884765625, -0.3749237060546875, -0.34673309326171875, -0.31854248046875, -0.29035186767578125, -0.2621612548828125, -0.23397064208984375, -0.205780029296875, -0.17758941650390625, -0.1493988037109375, -0.12120819091796875, -0.093017578125, -0.06482696533203125, -0.0366363525390625, -0.00844573974609375, 0.019744873046875, 0.04793548583984375, 0.0761260986328125, 0.10431671142578125, 0.13250732421875, 0.16069793701171875, 0.1888885498046875, 0.21707916259765625, 0.245269775390625, 0.27346038818359375, 0.3016510009765625, 0.32984161376953125, 0.3580322265625, 0.38622283935546875, 0.4144134521484375, 0.44260406494140625, 0.470794677734375, 0.49898529052734375, 0.5271759033203125, 0.5553665161132812, 0.58355712890625, 0.6117477416992188, 0.6399383544921875, 0.6681289672851562, 0.696319580078125, 0.7245101928710938, 0.7527008056640625, 0.7808914184570312, 0.80908203125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 9.0, 6.0, 5.0, 15.0, 11.0, 13.0, 15.0, 14.0, 19.0, 22.0, 37.0, 21.0, 20.0, 32.0, 26.0, 33.0, 34.0, 46.0, 49.0, 53.0, 36.0, 43.0, 47.0, 43.0, 33.0, 41.0, 36.0, 26.0, 29.0, 32.0, 25.0, 22.0, 15.0, 23.0, 14.0, 13.0, 6.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.222137451171875, -1.18548583984375, -1.148834228515625, -1.1121826171875, -1.075531005859375, -1.03887939453125, -1.002227783203125, -0.965576171875, -0.928924560546875, -0.89227294921875, -0.855621337890625, -0.8189697265625, -0.782318115234375, -0.74566650390625, -0.709014892578125, -0.67236328125, -0.635711669921875, -0.59906005859375, -0.562408447265625, -0.5257568359375, -0.489105224609375, -0.45245361328125, -0.415802001953125, -0.379150390625, -0.342498779296875, -0.30584716796875, -0.269195556640625, -0.2325439453125, -0.195892333984375, -0.15924072265625, -0.122589111328125, -0.0859375, -0.049285888671875, -0.01263427734375, 0.024017333984375, 0.0606689453125, 0.097320556640625, 0.13397216796875, 0.170623779296875, 0.207275390625, 0.243927001953125, 0.28057861328125, 0.317230224609375, 0.3538818359375, 0.390533447265625, 0.42718505859375, 0.463836669921875, 0.50048828125, 0.537139892578125, 0.57379150390625, 0.610443115234375, 0.6470947265625, 0.683746337890625, 0.72039794921875, 0.757049560546875, 0.793701171875, 0.830352783203125, 0.86700439453125, 0.903656005859375, 0.9403076171875, 0.976959228515625, 1.01361083984375, 1.050262451171875, 1.0869140625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 15.0, 14.0, 15.0, 28.0, 55.0, 77.0, 57.0, 112.0, 134.0, 196.0, 289.0, 410.0, 652.0, 1003.0, 1492.0, 2554.0, 4423.0, 8168.0, 17700.0, 46551.0, 162096.0, 466474.0, 228420.0, 62504.0, 22321.0, 9739.0, 5028.0, 2895.0, 1729.0, 1072.0, 717.0, 507.0, 328.0, 220.0, 161.0, 104.0, 81.0, 50.0, 57.0, 26.0, 21.0, 14.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4549674987792969, -0.43849945068359375, -0.4220314025878906, -0.4055633544921875, -0.3890953063964844, -0.37262725830078125, -0.3561592102050781, -0.339691162109375, -0.3232231140136719, -0.30675506591796875, -0.2902870178222656, -0.2738189697265625, -0.2573509216308594, -0.24088287353515625, -0.22441482543945312, -0.20794677734375, -0.19147872924804688, -0.17501068115234375, -0.15854263305664062, -0.1420745849609375, -0.12560653686523438, -0.10913848876953125, -0.09267044067382812, -0.076202392578125, -0.059734344482421875, -0.04326629638671875, -0.026798248291015625, -0.0103302001953125, 0.006137847900390625, 0.02260589599609375, 0.039073944091796875, 0.0555419921875, 0.07201004028320312, 0.08847808837890625, 0.10494613647460938, 0.1214141845703125, 0.13788223266601562, 0.15435028076171875, 0.17081832885742188, 0.187286376953125, 0.20375442504882812, 0.22022247314453125, 0.23669052124023438, 0.2531585693359375, 0.2696266174316406, 0.28609466552734375, 0.3025627136230469, 0.31903076171875, 0.3354988098144531, 0.35196685791015625, 0.3684349060058594, 0.3849029541015625, 0.4013710021972656, 0.41783905029296875, 0.4343070983886719, 0.450775146484375, 0.4672431945800781, 0.48371124267578125, 0.5001792907714844, 0.5166473388671875, 0.5331153869628906, 0.5495834350585938, 0.5660514831542969, 0.58251953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 5.0, 4.0, 15.0, 14.0, 21.0, 18.0, 19.0, 26.0, 36.0, 25.0, 35.0, 36.0, 49.0, 42.0, 56.0, 46.0, 60.0, 43.0, 51.0, 63.0, 40.0, 41.0, 31.0, 40.0, 30.0, 23.0, 20.0, 21.0, 16.0, 10.0, 8.0, 9.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.1755695343017578e-05, -2.1083280444145203e-05, -2.0410865545272827e-05, -1.973845064640045e-05, -1.9066035747528076e-05, -1.83936208486557e-05, -1.7721205949783325e-05, -1.704879105091095e-05, -1.6376376152038574e-05, -1.57039612531662e-05, -1.5031546354293823e-05, -1.4359131455421448e-05, -1.3686716556549072e-05, -1.3014301657676697e-05, -1.2341886758804321e-05, -1.1669471859931946e-05, -1.099705696105957e-05, -1.0324642062187195e-05, -9.65222716331482e-06, -8.979812264442444e-06, -8.307397365570068e-06, -7.634982466697693e-06, -6.962567567825317e-06, -6.290152668952942e-06, -5.617737770080566e-06, -4.945322871208191e-06, -4.2729079723358154e-06, -3.60049307346344e-06, -2.9280781745910645e-06, -2.255663275718689e-06, -1.5832483768463135e-06, -9.10833477973938e-07, -2.384185791015625e-07, 4.33996319770813e-07, 1.1064112186431885e-06, 1.778826117515564e-06, 2.4512410163879395e-06, 3.123655915260315e-06, 3.7960708141326904e-06, 4.468485713005066e-06, 5.140900611877441e-06, 5.813315510749817e-06, 6.485730409622192e-06, 7.158145308494568e-06, 7.830560207366943e-06, 8.502975106239319e-06, 9.175390005111694e-06, 9.84780490398407e-06, 1.0520219802856445e-05, 1.119263470172882e-05, 1.1865049600601196e-05, 1.2537464499473572e-05, 1.3209879398345947e-05, 1.3882294297218323e-05, 1.4554709196090698e-05, 1.5227124094963074e-05, 1.589953899383545e-05, 1.6571953892707825e-05, 1.72443687915802e-05, 1.7916783690452576e-05, 1.858919858932495e-05, 1.9261613488197327e-05, 1.9934028387069702e-05, 2.0606443285942078e-05, 2.1278858184814453e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 11.0, 15.0, 10.0, 24.0, 39.0, 77.0, 104.0, 185.0, 273.0, 466.0, 835.0, 1397.0, 2392.0, 4420.0, 8511.0, 17373.0, 36830.0, 82607.0, 186052.0, 306803.0, 216254.0, 98906.0, 43293.0, 20199.0, 9900.0, 5053.0, 2725.0, 1492.0, 913.0, 550.0, 305.0, 206.0, 118.0, 59.0, 57.0, 36.0, 26.0, 13.0, 9.0, 3.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.495361328125, -0.4791755676269531, -0.46298980712890625, -0.4468040466308594, -0.4306182861328125, -0.4144325256347656, -0.39824676513671875, -0.3820610046386719, -0.365875244140625, -0.3496894836425781, -0.33350372314453125, -0.3173179626464844, -0.3011322021484375, -0.2849464416503906, -0.26876068115234375, -0.2525749206542969, -0.23638916015625, -0.22020339965820312, -0.20401763916015625, -0.18783187866210938, -0.1716461181640625, -0.15546035766601562, -0.13927459716796875, -0.12308883666992188, -0.106903076171875, -0.09071731567382812, -0.07453155517578125, -0.058345794677734375, -0.0421600341796875, -0.025974273681640625, -0.00978851318359375, 0.006397247314453125, 0.0225830078125, 0.038768768310546875, 0.05495452880859375, 0.07114028930664062, 0.0873260498046875, 0.10351181030273438, 0.11969757080078125, 0.13588333129882812, 0.152069091796875, 0.16825485229492188, 0.18444061279296875, 0.20062637329101562, 0.2168121337890625, 0.23299789428710938, 0.24918365478515625, 0.2653694152832031, 0.28155517578125, 0.2977409362792969, 0.31392669677734375, 0.3301124572753906, 0.3462982177734375, 0.3624839782714844, 0.37866973876953125, 0.3948554992675781, 0.411041259765625, 0.4272270202636719, 0.44341278076171875, 0.4595985412597656, 0.4757843017578125, 0.4919700622558594, 0.5081558227539062, 0.5243415832519531, 0.54052734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 14.0, 8.0, 7.0, 16.0, 9.0, 20.0, 18.0, 16.0, 24.0, 20.0, 24.0, 35.0, 42.0, 40.0, 65.0, 59.0, 51.0, 59.0, 55.0, 56.0, 54.0, 42.0, 38.0, 25.0, 29.0, 28.0, 19.0, 19.0, 18.0, 13.0, 10.0, 4.0, 9.0, 6.0, 12.0, 6.0, 3.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.097412109375, -0.09454917907714844, -0.09168624877929688, -0.08882331848144531, -0.08596038818359375, -0.08309745788574219, -0.08023452758789062, -0.07737159729003906, -0.0745086669921875, -0.07164573669433594, -0.06878280639648438, -0.06591987609863281, -0.06305694580078125, -0.06019401550292969, -0.057331085205078125, -0.05446815490722656, -0.051605224609375, -0.04874229431152344, -0.045879364013671875, -0.04301643371582031, -0.04015350341796875, -0.03729057312011719, -0.034427642822265625, -0.03156471252441406, -0.0287017822265625, -0.025838851928710938, -0.022975921630859375, -0.020112991333007812, -0.01725006103515625, -0.014387130737304688, -0.011524200439453125, -0.008661270141601562, -0.00579833984375, -0.0029354095458984375, -7.2479248046875e-05, 0.0027904510498046875, 0.00565338134765625, 0.008516311645507812, 0.011379241943359375, 0.014242172241210938, 0.0171051025390625, 0.019968032836914062, 0.022830963134765625, 0.025693893432617188, 0.02855682373046875, 0.03141975402832031, 0.034282684326171875, 0.03714561462402344, 0.040008544921875, 0.04287147521972656, 0.045734405517578125, 0.04859733581542969, 0.05146026611328125, 0.05432319641113281, 0.057186126708984375, 0.06004905700683594, 0.0629119873046875, 0.06577491760253906, 0.06863784790039062, 0.07150077819824219, 0.07436370849609375, 0.07722663879394531, 0.08008956909179688, 0.08295249938964844, 0.0858154296875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 9.0, 8.0, 9.0, 15.0, 21.0, 19.0, 28.0, 26.0, 36.0, 36.0, 31.0, 53.0, 37.0, 65.0, 50.0, 61.0, 55.0, 50.0, 43.0, 54.0, 44.0, 37.0, 43.0, 31.0, 19.0, 21.0, 19.0, 18.0, 11.0, 10.0, 9.0, 6.0, 3.0, 7.0, 1.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1656153202056885, -2.103355646133423, -2.041095733642578, -1.978835940361023, -1.9165761470794678, -1.8543163537979126, -1.7920565605163574, -1.7297967672348022, -1.667536973953247, -1.605277180671692, -1.5430173873901367, -1.4807575941085815, -1.4184978008270264, -1.3562380075454712, -1.293978214263916, -1.2317184209823608, -1.1694586277008057, -1.1071988344192505, -1.0449390411376953, -0.9826792478561401, -0.920419454574585, -0.8581596612930298, -0.7958998680114746, -0.7336400747299194, -0.6713804006576538, -0.6091206073760986, -0.5468608140945435, -0.4846010208129883, -0.4223412275314331, -0.3600814640522003, -0.29782167077064514, -0.23556187748908997, -0.1733020544052124, -0.11104226112365723, -0.04878247529268265, 0.013477310538291931, 0.0757371038198471, 0.1379968822002411, 0.20025667548179626, 0.26251646876335144, 0.3247762620449066, 0.3870360553264618, 0.44929584860801697, 0.5115556120872498, 0.5738154053688049, 0.6360751986503601, 0.6983349919319153, 0.7605947852134705, 0.8228545784950256, 0.8851143717765808, 0.947374165058136, 1.0096338987350464, 1.0718936920166016, 1.1341534852981567, 1.196413278579712, 1.258673071861267, 1.3209328651428223, 1.3831926584243774, 1.4454524517059326, 1.5077122449874878, 1.569972038269043, 1.6322318315505981, 1.6944916248321533, 1.7567514181137085, 1.8190112113952637]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 6.0, 6.0, 5.0, 5.0, 11.0, 12.0, 9.0, 25.0, 27.0, 24.0, 21.0, 21.0, 30.0, 29.0, 28.0, 24.0, 29.0, 42.0, 43.0, 35.0, 32.0, 39.0, 48.0, 37.0, 34.0, 35.0, 42.0, 29.0, 27.0, 23.0, 20.0, 24.0, 22.0, 21.0, 16.0, 15.0, 15.0, 19.0, 13.0, 9.0, 8.0, 11.0, 6.0, 3.0, 4.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3607033491134644, -1.3150500059127808, -1.2693967819213867, -1.2237434387207031, -1.1780900955200195, -1.132436752319336, -1.0867834091186523, -1.0411301851272583, -0.9954768419265747, -0.9498234987258911, -0.9041702151298523, -0.8585169315338135, -0.8128635883331299, -0.7672102451324463, -0.7215569615364075, -0.6759036779403687, -0.6302503347396851, -0.5845969915390015, -0.5389437079429626, -0.49329039454460144, -0.44763708114624023, -0.40198376774787903, -0.3563304543495178, -0.3106771409511566, -0.2650238275527954, -0.2193705141544342, -0.173717200756073, -0.1280638873577118, -0.08241057395935059, -0.03675726056098938, 0.008896052837371826, 0.05454936623573303, 0.10020256042480469, 0.1458558738231659, 0.1915091872215271, 0.2371625006198883, 0.2828158140182495, 0.3284691274166107, 0.3741224408149719, 0.41977575421333313, 0.46542906761169434, 0.5110824108123779, 0.5567356944084167, 0.6023889780044556, 0.6480423212051392, 0.6936956644058228, 0.7393489480018616, 0.7850022315979004, 0.830655574798584, 0.8763089179992676, 0.9219622015953064, 0.9676154851913452, 1.0132688283920288, 1.0589221715927124, 1.1045753955841064, 1.15022873878479, 1.1958820819854736, 1.2415354251861572, 1.2871887683868408, 1.3328419923782349, 1.3784953355789185, 1.424148678779602, 1.469801902770996, 1.5154552459716797, 1.5611085891723633]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 6.0, 10.0, 12.0, 18.0, 23.0, 50.0, 54.0, 87.0, 139.0, 231.0, 361.0, 564.0, 839.0, 1272.0, 1955.0, 3119.0, 4894.0, 7515.0, 11383.0, 17296.0, 25425.0, 36209.0, 50124.0, 67055.0, 84012.0, 99669.0, 108911.0, 109134.0, 100086.0, 85735.0, 67929.0, 50990.0, 36845.0, 25873.0, 17287.0, 11838.0, 7746.0, 4876.0, 3256.0, 2045.0, 1343.0, 849.0, 535.0, 343.0, 226.0, 152.0, 95.0, 41.0, 33.0, 28.0, 28.0, 7.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3173828125, -1.2749176025390625, -1.232452392578125, -1.1899871826171875, -1.14752197265625, -1.1050567626953125, -1.062591552734375, -1.0201263427734375, -0.9776611328125, -0.9351959228515625, -0.892730712890625, -0.8502655029296875, -0.80780029296875, -0.7653350830078125, -0.722869873046875, -0.6804046630859375, -0.637939453125, -0.5954742431640625, -0.553009033203125, -0.5105438232421875, -0.46807861328125, -0.4256134033203125, -0.383148193359375, -0.3406829833984375, -0.2982177734375, -0.2557525634765625, -0.213287353515625, -0.1708221435546875, -0.12835693359375, -0.0858917236328125, -0.043426513671875, -0.0009613037109375, 0.04150390625, 0.0839691162109375, 0.126434326171875, 0.1688995361328125, 0.21136474609375, 0.2538299560546875, 0.296295166015625, 0.3387603759765625, 0.3812255859375, 0.4236907958984375, 0.466156005859375, 0.5086212158203125, 0.55108642578125, 0.5935516357421875, 0.636016845703125, 0.6784820556640625, 0.720947265625, 0.7634124755859375, 0.805877685546875, 0.8483428955078125, 0.89080810546875, 0.9332733154296875, 0.975738525390625, 1.0182037353515625, 1.0606689453125, 1.1031341552734375, 1.145599365234375, 1.1880645751953125, 1.23052978515625, 1.2729949951171875, 1.315460205078125, 1.3579254150390625, 1.400390625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 10.0, 10.0, 9.0, 11.0, 13.0, 15.0, 22.0, 18.0, 20.0, 27.0, 29.0, 26.0, 18.0, 34.0, 25.0, 33.0, 40.0, 38.0, 40.0, 33.0, 48.0, 40.0, 40.0, 46.0, 31.0, 20.0, 27.0, 27.0, 23.0, 31.0, 17.0, 20.0, 24.0, 13.0, 17.0, 19.0, 16.0, 10.0, 8.0, 8.0, 4.0, 6.0, 1.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.5146484375, -1.4691009521484375, -1.423553466796875, -1.3780059814453125, -1.33245849609375, -1.2869110107421875, -1.241363525390625, -1.1958160400390625, -1.1502685546875, -1.1047210693359375, -1.059173583984375, -1.0136260986328125, -0.96807861328125, -0.9225311279296875, -0.876983642578125, -0.8314361572265625, -0.785888671875, -0.7403411865234375, -0.694793701171875, -0.6492462158203125, -0.60369873046875, -0.5581512451171875, -0.512603759765625, -0.4670562744140625, -0.4215087890625, -0.3759613037109375, -0.330413818359375, -0.2848663330078125, -0.23931884765625, -0.1937713623046875, -0.148223876953125, -0.1026763916015625, -0.05712890625, -0.0115814208984375, 0.033966064453125, 0.0795135498046875, 0.12506103515625, 0.1706085205078125, 0.216156005859375, 0.2617034912109375, 0.3072509765625, 0.3527984619140625, 0.398345947265625, 0.4438934326171875, 0.48944091796875, 0.5349884033203125, 0.580535888671875, 0.6260833740234375, 0.671630859375, 0.7171783447265625, 0.762725830078125, 0.8082733154296875, 0.85382080078125, 0.8993682861328125, 0.944915771484375, 0.9904632568359375, 1.0360107421875, 1.0815582275390625, 1.127105712890625, 1.1726531982421875, 1.21820068359375, 1.2637481689453125, 1.309295654296875, 1.3548431396484375, 1.400390625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 7.0, 8.0, 9.0, 15.0, 26.0, 34.0, 64.0, 90.0, 154.0, 214.0, 373.0, 565.0, 886.0, 1422.0, 2326.0, 3504.0, 5587.0, 8588.0, 13287.0, 20391.0, 30099.0, 43180.0, 59122.0, 77582.0, 95084.0, 108012.0, 112504.0, 106995.0, 94487.0, 77092.0, 58695.0, 42529.0, 29508.0, 19641.0, 12991.0, 8564.0, 5412.0, 3494.0, 2273.0, 1331.0, 874.0, 569.0, 356.0, 229.0, 158.0, 90.0, 52.0, 33.0, 24.0, 12.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.40625, -1.3642425537109375, -1.322235107421875, -1.2802276611328125, -1.23822021484375, -1.1962127685546875, -1.154205322265625, -1.1121978759765625, -1.0701904296875, -1.0281829833984375, -0.986175537109375, -0.9441680908203125, -0.90216064453125, -0.8601531982421875, -0.818145751953125, -0.7761383056640625, -0.734130859375, -0.6921234130859375, -0.650115966796875, -0.6081085205078125, -0.56610107421875, -0.5240936279296875, -0.482086181640625, -0.4400787353515625, -0.3980712890625, -0.3560638427734375, -0.314056396484375, -0.2720489501953125, -0.23004150390625, -0.1880340576171875, -0.146026611328125, -0.1040191650390625, -0.06201171875, -0.0200042724609375, 0.022003173828125, 0.0640106201171875, 0.10601806640625, 0.1480255126953125, 0.190032958984375, 0.2320404052734375, 0.2740478515625, 0.3160552978515625, 0.358062744140625, 0.4000701904296875, 0.44207763671875, 0.4840850830078125, 0.526092529296875, 0.5680999755859375, 0.610107421875, 0.6521148681640625, 0.694122314453125, 0.7361297607421875, 0.77813720703125, 0.8201446533203125, 0.862152099609375, 0.9041595458984375, 0.9461669921875, 0.9881744384765625, 1.030181884765625, 1.0721893310546875, 1.11419677734375, 1.1562042236328125, 1.198211669921875, 1.2402191162109375, 1.2822265625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 4.0, 5.0, 2.0, 8.0, 12.0, 5.0, 14.0, 10.0, 12.0, 19.0, 18.0, 16.0, 23.0, 27.0, 13.0, 33.0, 24.0, 30.0, 31.0, 31.0, 31.0, 35.0, 31.0, 33.0, 35.0, 42.0, 42.0, 42.0, 39.0, 21.0, 42.0, 25.0, 30.0, 31.0, 22.0, 23.0, 18.0, 21.0, 17.0, 17.0, 11.0, 9.0, 7.0, 6.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9072265625, -0.8786849975585938, -0.8501434326171875, -0.8216018676757812, -0.793060302734375, -0.7645187377929688, -0.7359771728515625, -0.7074356079101562, -0.67889404296875, -0.6503524780273438, -0.6218109130859375, -0.5932693481445312, -0.564727783203125, -0.5361862182617188, -0.5076446533203125, -0.47910308837890625, -0.4505615234375, -0.42201995849609375, -0.3934783935546875, -0.36493682861328125, -0.336395263671875, -0.30785369873046875, -0.2793121337890625, -0.25077056884765625, -0.22222900390625, -0.19368743896484375, -0.1651458740234375, -0.13660430908203125, -0.108062744140625, -0.07952117919921875, -0.0509796142578125, -0.02243804931640625, 0.006103515625, 0.03464508056640625, 0.0631866455078125, 0.09172821044921875, 0.120269775390625, 0.14881134033203125, 0.1773529052734375, 0.20589447021484375, 0.23443603515625, 0.26297760009765625, 0.2915191650390625, 0.32006072998046875, 0.348602294921875, 0.37714385986328125, 0.4056854248046875, 0.43422698974609375, 0.4627685546875, 0.49131011962890625, 0.5198516845703125, 0.5483932495117188, 0.576934814453125, 0.6054763793945312, 0.6340179443359375, 0.6625595092773438, 0.69110107421875, 0.7196426391601562, 0.7481842041015625, 0.7767257690429688, 0.805267333984375, 0.8338088989257812, 0.8623504638671875, 0.8908920288085938, 0.91943359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 11.0, 8.0, 16.0, 14.0, 24.0, 38.0, 48.0, 80.0, 126.0, 185.0, 286.0, 466.0, 680.0, 1139.0, 1975.0, 3384.0, 5995.0, 11202.0, 21092.0, 39146.0, 73194.0, 124782.0, 182377.0, 200390.0, 159393.0, 100831.0, 55619.0, 30179.0, 15855.0, 8473.0, 4718.0, 2667.0, 1543.0, 925.0, 556.0, 346.0, 246.0, 158.0, 118.0, 61.0, 60.0, 40.0, 27.0, 26.0, 16.0, 6.0, 10.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 4.0], "bins": [-1.2763671875, -1.2368316650390625, -1.197296142578125, -1.1577606201171875, -1.11822509765625, -1.0786895751953125, -1.039154052734375, -0.9996185302734375, -0.9600830078125, -0.9205474853515625, -0.881011962890625, -0.8414764404296875, -0.80194091796875, -0.7624053955078125, -0.722869873046875, -0.6833343505859375, -0.643798828125, -0.6042633056640625, -0.564727783203125, -0.5251922607421875, -0.48565673828125, -0.4461212158203125, -0.406585693359375, -0.3670501708984375, -0.3275146484375, -0.2879791259765625, -0.248443603515625, -0.2089080810546875, -0.16937255859375, -0.1298370361328125, -0.090301513671875, -0.0507659912109375, -0.01123046875, 0.0283050537109375, 0.067840576171875, 0.1073760986328125, 0.14691162109375, 0.1864471435546875, 0.225982666015625, 0.2655181884765625, 0.3050537109375, 0.3445892333984375, 0.384124755859375, 0.4236602783203125, 0.46319580078125, 0.5027313232421875, 0.542266845703125, 0.5818023681640625, 0.621337890625, 0.6608734130859375, 0.700408935546875, 0.7399444580078125, 0.77947998046875, 0.8190155029296875, 0.858551025390625, 0.8980865478515625, 0.9376220703125, 0.9771575927734375, 1.016693115234375, 1.0562286376953125, 1.09576416015625, 1.1352996826171875, 1.174835205078125, 1.2143707275390625, 1.25390625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 3.0, 9.0, 12.0, 12.0, 12.0, 23.0, 34.0, 32.0, 38.0, 44.0, 49.0, 57.0, 48.0, 64.0, 60.0, 44.0, 61.0, 60.0, 52.0, 37.0, 46.0, 33.0, 40.0, 19.0, 19.0, 22.0, 13.0, 19.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010466575622558594, -0.00010150019079446793, -9.833462536334991e-05, -9.51690599322319e-05, -9.200349450111389e-05, -8.883792906999588e-05, -8.567236363887787e-05, -8.250679820775986e-05, -7.934123277664185e-05, -7.617566734552383e-05, -7.301010191440582e-05, -6.984453648328781e-05, -6.66789710521698e-05, -6.351340562105179e-05, -6.034784018993378e-05, -5.7182274758815765e-05, -5.4016709327697754e-05, -5.085114389657974e-05, -4.768557846546173e-05, -4.452001303434372e-05, -4.135444760322571e-05, -3.8188882172107697e-05, -3.5023316740989685e-05, -3.1857751309871674e-05, -2.8692185878753662e-05, -2.552662044763565e-05, -2.236105501651764e-05, -1.9195489585399628e-05, -1.6029924154281616e-05, -1.2864358723163605e-05, -9.698793292045593e-06, -6.533227860927582e-06, -3.3676624298095703e-06, -2.0209699869155884e-07, 2.9634684324264526e-06, 6.129033863544464e-06, 9.294599294662476e-06, 1.2460164725780487e-05, 1.56257301568985e-05, 1.879129558801651e-05, 2.195686101913452e-05, 2.5122426450252533e-05, 2.8287991881370544e-05, 3.1453557312488556e-05, 3.461912274360657e-05, 3.778468817472458e-05, 4.095025360584259e-05, 4.41158190369606e-05, 4.728138446807861e-05, 5.0446949899196625e-05, 5.3612515330314636e-05, 5.677808076143265e-05, 5.994364619255066e-05, 6.310921162366867e-05, 6.627477705478668e-05, 6.94403424859047e-05, 7.26059079170227e-05, 7.577147334814072e-05, 7.893703877925873e-05, 8.210260421037674e-05, 8.526816964149475e-05, 8.843373507261276e-05, 9.159930050373077e-05, 9.476486593484879e-05, 9.79304313659668e-05]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 11.0, 17.0, 17.0, 40.0, 38.0, 42.0, 63.0, 79.0, 145.0, 222.0, 301.0, 461.0, 755.0, 1174.0, 1822.0, 2861.0, 4667.0, 7651.0, 12413.0, 19913.0, 32585.0, 51298.0, 79006.0, 112705.0, 143082.0, 152351.0, 134546.0, 102270.0, 69718.0, 44877.0, 28237.0, 17182.0, 10528.0, 6524.0, 4006.0, 2549.0, 1504.0, 1038.0, 628.0, 403.0, 251.0, 179.0, 107.0, 81.0, 58.0, 49.0, 29.0, 23.0, 13.0, 14.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0], "bins": [-0.9375, -0.9085159301757812, -0.8795318603515625, -0.8505477905273438, -0.821563720703125, -0.7925796508789062, -0.7635955810546875, -0.7346115112304688, -0.70562744140625, -0.6766433715820312, -0.6476593017578125, -0.6186752319335938, -0.589691162109375, -0.5607070922851562, -0.5317230224609375, -0.5027389526367188, -0.4737548828125, -0.44477081298828125, -0.4157867431640625, -0.38680267333984375, -0.357818603515625, -0.32883453369140625, -0.2998504638671875, -0.27086639404296875, -0.24188232421875, -0.21289825439453125, -0.1839141845703125, -0.15493011474609375, -0.125946044921875, -0.09696197509765625, -0.0679779052734375, -0.03899383544921875, -0.010009765625, 0.01897430419921875, 0.0479583740234375, 0.07694244384765625, 0.105926513671875, 0.13491058349609375, 0.1638946533203125, 0.19287872314453125, 0.22186279296875, 0.25084686279296875, 0.2798309326171875, 0.30881500244140625, 0.337799072265625, 0.36678314208984375, 0.3957672119140625, 0.42475128173828125, 0.4537353515625, 0.48271942138671875, 0.5117034912109375, 0.5406875610351562, 0.569671630859375, 0.5986557006835938, 0.6276397705078125, 0.6566238403320312, 0.68560791015625, 0.7145919799804688, 0.7435760498046875, 0.7725601196289062, 0.801544189453125, 0.8305282592773438, 0.8595123291015625, 0.8884963989257812, 0.91748046875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 11.0, 7.0, 4.0, 10.0, 12.0, 20.0, 16.0, 22.0, 31.0, 28.0, 31.0, 32.0, 39.0, 44.0, 50.0, 60.0, 58.0, 63.0, 50.0, 54.0, 55.0, 57.0, 43.0, 35.0, 31.0, 30.0, 30.0, 21.0, 17.0, 11.0, 12.0, 9.0, 8.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49169921875, -0.47867584228515625, -0.4656524658203125, -0.45262908935546875, -0.439605712890625, -0.42658233642578125, -0.4135589599609375, -0.40053558349609375, -0.38751220703125, -0.37448883056640625, -0.3614654541015625, -0.34844207763671875, -0.335418701171875, -0.32239532470703125, -0.3093719482421875, -0.29634857177734375, -0.2833251953125, -0.27030181884765625, -0.2572784423828125, -0.24425506591796875, -0.231231689453125, -0.21820831298828125, -0.2051849365234375, -0.19216156005859375, -0.17913818359375, -0.16611480712890625, -0.1530914306640625, -0.14006805419921875, -0.127044677734375, -0.11402130126953125, -0.1009979248046875, -0.08797454833984375, -0.074951171875, -0.06192779541015625, -0.0489044189453125, -0.03588104248046875, -0.022857666015625, -0.00983428955078125, 0.0031890869140625, 0.01621246337890625, 0.02923583984375, 0.04225921630859375, 0.0552825927734375, 0.06830596923828125, 0.081329345703125, 0.09435272216796875, 0.1073760986328125, 0.12039947509765625, 0.1334228515625, 0.14644622802734375, 0.1594696044921875, 0.17249298095703125, 0.185516357421875, 0.19853973388671875, 0.2115631103515625, 0.22458648681640625, 0.23760986328125, 0.25063323974609375, 0.2636566162109375, 0.27667999267578125, 0.289703369140625, 0.30272674560546875, 0.3157501220703125, 0.32877349853515625, 0.341796875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 13.0, 12.0, 15.0, 9.0, 26.0, 20.0, 29.0, 34.0, 40.0, 39.0, 37.0, 52.0, 46.0, 45.0, 56.0, 49.0, 57.0, 49.0, 38.0, 55.0, 48.0, 31.0, 31.0, 25.0, 20.0, 15.0, 24.0, 11.0, 12.0, 12.0, 8.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8894098997116089, -1.829939365386963, -1.770468831062317, -1.710998296737671, -1.651527762413025, -1.592057228088379, -1.5325868129730225, -1.4731162786483765, -1.4136457443237305, -1.3541752099990845, -1.2947046756744385, -1.2352341413497925, -1.1757636070251465, -1.11629319190979, -1.0568225383758545, -0.997352123260498, -0.9378815293312073, -0.8784109950065613, -0.8189404606819153, -0.7594699859619141, -0.6999994516372681, -0.6405289173126221, -0.5810583829879761, -0.5215878486633301, -0.46211734414100647, -0.4026468098163605, -0.34317630529403687, -0.28370577096939087, -0.22423525154590607, -0.16476473212242126, -0.10529419779777527, -0.04582369327545166, 0.013646841049194336, 0.07311736047267914, 0.13258787989616394, 0.19205841422080994, 0.25152891874313354, 0.31099945306777954, 0.37046998739242554, 0.42994049191474915, 0.48941102623939514, 0.5488815307617188, 0.6083520650863647, 0.6678225994110107, 0.7272931337356567, 0.7867636680603027, 0.8462342023849487, 0.90570467710495, 0.965175211429596, 1.0246456861495972, 1.0841162204742432, 1.1435867547988892, 1.2030572891235352, 1.2625278234481812, 1.3219983577728271, 1.3814688920974731, 1.4409394264221191, 1.5004099607467651, 1.5598804950714111, 1.6193510293960571, 1.6788215637207031, 1.7382919788360596, 1.7977626323699951, 1.8572330474853516, 1.9167035818099976]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 1.0, 8.0, 9.0, 7.0, 12.0, 11.0, 9.0, 12.0, 13.0, 14.0, 35.0, 24.0, 17.0, 29.0, 31.0, 42.0, 30.0, 34.0, 35.0, 27.0, 41.0, 45.0, 41.0, 31.0, 41.0, 38.0, 39.0, 44.0, 29.0, 37.0, 26.0, 17.0, 21.0, 24.0, 21.0, 12.0, 10.0, 13.0, 17.0, 12.0, 10.0, 10.0, 4.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.371199607849121, -1.3224812746047974, -1.2737629413604736, -1.22504460811615, -1.1763262748718262, -1.1276079416275024, -1.0788896083831787, -1.0301713943481445, -0.981453001499176, -0.9327346682548523, -0.8840163350105286, -0.8352980613708496, -0.7865797281265259, -0.7378613948822021, -0.6891430616378784, -0.6404247283935547, -0.591706395149231, -0.5429880619049072, -0.4942697286605835, -0.44555142521858215, -0.3968330919742584, -0.3481147587299347, -0.29939645528793335, -0.2506781220436096, -0.2019597887992859, -0.15324145555496216, -0.10452313721179962, -0.055804818868637085, -0.0070864856243133545, 0.041631847620010376, 0.09035015106201172, 0.13906848430633545, 0.18778681755065918, 0.2365051507949829, 0.28522348403930664, 0.333941787481308, 0.3826601207256317, 0.43137845396995544, 0.4800967574119568, 0.5288150906562805, 0.5775334239006042, 0.626251757144928, 0.6749700903892517, 0.7236883640289307, 0.7724066972732544, 0.8211250305175781, 0.8698433637619019, 0.9185616970062256, 0.9672800302505493, 1.015998363494873, 1.0647166967391968, 1.1134350299835205, 1.1621533632278442, 1.210871696472168, 1.2595899105072021, 1.3083083629608154, 1.3570265769958496, 1.4057449102401733, 1.454463243484497, 1.5031815767288208, 1.5518999099731445, 1.6006182432174683, 1.649336576461792, 1.6980547904968262, 1.7467732429504395]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 12.0, 27.0, 39.0, 49.0, 79.0, 135.0, 225.0, 378.0, 655.0, 1170.0, 1907.0, 3451.0, 5958.0, 10651.0, 19230.0, 33416.0, 58904.0, 103499.0, 176924.0, 289343.0, 440194.0, 593615.0, 663971.0, 602063.0, 453475.0, 300291.0, 184695.0, 107892.0, 61816.0, 35026.0, 19654.0, 11040.0, 6208.0, 3646.0, 2000.0, 1098.0, 603.0, 379.0, 236.0, 125.0, 81.0, 51.0, 27.0, 23.0, 7.0, 10.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.609375, -1.559906005859375, -1.51043701171875, -1.460968017578125, -1.4114990234375, -1.362030029296875, -1.31256103515625, -1.263092041015625, -1.213623046875, -1.164154052734375, -1.11468505859375, -1.065216064453125, -1.0157470703125, -0.966278076171875, -0.91680908203125, -0.867340087890625, -0.81787109375, -0.768402099609375, -0.71893310546875, -0.669464111328125, -0.6199951171875, -0.570526123046875, -0.52105712890625, -0.471588134765625, -0.422119140625, -0.372650146484375, -0.32318115234375, -0.273712158203125, -0.2242431640625, -0.174774169921875, -0.12530517578125, -0.075836181640625, -0.0263671875, 0.023101806640625, 0.07257080078125, 0.122039794921875, 0.1715087890625, 0.220977783203125, 0.27044677734375, 0.319915771484375, 0.369384765625, 0.418853759765625, 0.46832275390625, 0.517791748046875, 0.5672607421875, 0.616729736328125, 0.66619873046875, 0.715667724609375, 0.76513671875, 0.814605712890625, 0.86407470703125, 0.913543701171875, 0.9630126953125, 1.012481689453125, 1.06195068359375, 1.111419677734375, 1.160888671875, 1.210357666015625, 1.25982666015625, 1.309295654296875, 1.3587646484375, 1.408233642578125, 1.45770263671875, 1.507171630859375, 1.556640625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 12.0, 6.0, 7.0, 13.0, 9.0, 13.0, 14.0, 26.0, 23.0, 30.0, 20.0, 35.0, 25.0, 39.0, 36.0, 27.0, 37.0, 35.0, 33.0, 41.0, 34.0, 40.0, 28.0, 40.0, 36.0, 31.0, 33.0, 32.0, 26.0, 22.0, 22.0, 20.0, 11.0, 14.0, 17.0, 21.0, 15.0, 11.0, 7.0, 12.0, 5.0, 5.0, 5.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93505859375, -0.9029006958007812, -0.8707427978515625, -0.8385848999023438, -0.806427001953125, -0.7742691040039062, -0.7421112060546875, -0.7099533081054688, -0.67779541015625, -0.6456375122070312, -0.6134796142578125, -0.5813217163085938, -0.549163818359375, -0.5170059204101562, -0.4848480224609375, -0.45269012451171875, -0.4205322265625, -0.38837432861328125, -0.3562164306640625, -0.32405853271484375, -0.291900634765625, -0.25974273681640625, -0.2275848388671875, -0.19542694091796875, -0.16326904296875, -0.13111114501953125, -0.0989532470703125, -0.06679534912109375, -0.034637451171875, -0.00247955322265625, 0.0296783447265625, 0.06183624267578125, 0.093994140625, 0.12615203857421875, 0.1583099365234375, 0.19046783447265625, 0.222625732421875, 0.25478363037109375, 0.2869415283203125, 0.31909942626953125, 0.35125732421875, 0.38341522216796875, 0.4155731201171875, 0.44773101806640625, 0.479888916015625, 0.5120468139648438, 0.5442047119140625, 0.5763626098632812, 0.6085205078125, 0.6406784057617188, 0.6728363037109375, 0.7049942016601562, 0.737152099609375, 0.7693099975585938, 0.8014678955078125, 0.8336257934570312, 0.86578369140625, 0.8979415893554688, 0.9300994873046875, 0.9622573852539062, 0.994415283203125, 1.0265731811523438, 1.0587310791015625, 1.0908889770507812, 1.123046875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 10.0, 16.0, 18.0, 36.0, 67.0, 119.0, 149.0, 267.0, 470.0, 755.0, 1308.0, 2118.0, 3435.0, 5913.0, 9869.0, 16485.0, 27229.0, 44764.0, 72471.0, 113592.0, 175828.0, 255213.0, 352056.0, 443335.0, 506013.0, 513012.0, 463209.0, 375762.0, 278724.0, 193409.0, 128425.0, 81391.0, 50984.0, 30690.0, 18794.0, 11265.0, 6935.0, 4039.0, 2419.0, 1484.0, 884.0, 508.0, 314.0, 189.0, 113.0, 80.0, 58.0, 30.0, 14.0, 12.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0], "bins": [-1.3486328125, -1.30792236328125, -1.2672119140625, -1.22650146484375, -1.185791015625, -1.14508056640625, -1.1043701171875, -1.06365966796875, -1.02294921875, -0.98223876953125, -0.9415283203125, -0.90081787109375, -0.860107421875, -0.81939697265625, -0.7786865234375, -0.73797607421875, -0.697265625, -0.65655517578125, -0.6158447265625, -0.57513427734375, -0.534423828125, -0.49371337890625, -0.4530029296875, -0.41229248046875, -0.37158203125, -0.33087158203125, -0.2901611328125, -0.24945068359375, -0.208740234375, -0.16802978515625, -0.1273193359375, -0.08660888671875, -0.0458984375, -0.00518798828125, 0.0355224609375, 0.07623291015625, 0.116943359375, 0.15765380859375, 0.1983642578125, 0.23907470703125, 0.27978515625, 0.32049560546875, 0.3612060546875, 0.40191650390625, 0.442626953125, 0.48333740234375, 0.5240478515625, 0.56475830078125, 0.60546875, 0.64617919921875, 0.6868896484375, 0.72760009765625, 0.768310546875, 0.80902099609375, 0.8497314453125, 0.89044189453125, 0.93115234375, 0.97186279296875, 1.0125732421875, 1.05328369140625, 1.093994140625, 1.13470458984375, 1.1754150390625, 1.21612548828125, 1.2568359375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 9.0, 5.0, 8.0, 13.0, 14.0, 28.0, 29.0, 25.0, 44.0, 61.0, 65.0, 83.0, 88.0, 90.0, 108.0, 127.0, 149.0, 176.0, 197.0, 186.0, 208.0, 228.0, 216.0, 199.0, 203.0, 173.0, 185.0, 173.0, 134.0, 138.0, 111.0, 111.0, 101.0, 67.0, 69.0, 46.0, 43.0, 43.0, 33.0, 21.0, 12.0, 13.0, 8.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5517578125, -0.5343780517578125, -0.516998291015625, -0.4996185302734375, -0.48223876953125, -0.4648590087890625, -0.447479248046875, -0.4300994873046875, -0.4127197265625, -0.3953399658203125, -0.377960205078125, -0.3605804443359375, -0.34320068359375, -0.3258209228515625, -0.308441162109375, -0.2910614013671875, -0.273681640625, -0.2563018798828125, -0.238922119140625, -0.2215423583984375, -0.20416259765625, -0.1867828369140625, -0.169403076171875, -0.1520233154296875, -0.1346435546875, -0.1172637939453125, -0.099884033203125, -0.0825042724609375, -0.06512451171875, -0.0477447509765625, -0.030364990234375, -0.0129852294921875, 0.00439453125, 0.0217742919921875, 0.039154052734375, 0.0565338134765625, 0.07391357421875, 0.0912933349609375, 0.108673095703125, 0.1260528564453125, 0.1434326171875, 0.1608123779296875, 0.178192138671875, 0.1955718994140625, 0.21295166015625, 0.2303314208984375, 0.247711181640625, 0.2650909423828125, 0.282470703125, 0.2998504638671875, 0.317230224609375, 0.3346099853515625, 0.35198974609375, 0.3693695068359375, 0.386749267578125, 0.4041290283203125, 0.4215087890625, 0.4388885498046875, 0.456268310546875, 0.4736480712890625, 0.49102783203125, 0.5084075927734375, 0.525787353515625, 0.5431671142578125, 0.560546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 5.0, 8.0, 6.0, 15.0, 15.0, 29.0, 25.0, 38.0, 39.0, 42.0, 46.0, 48.0, 69.0, 72.0, 57.0, 68.0, 53.0, 69.0, 53.0, 46.0, 38.0, 34.0, 21.0, 19.0, 28.0, 11.0, 10.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8024777173995972, -1.7369765043258667, -1.6714752912521362, -1.6059740781784058, -1.5404728651046753, -1.4749716520309448, -1.409470558166504, -1.3439693450927734, -1.278468132019043, -1.2129669189453125, -1.147465705871582, -1.0819644927978516, -1.016463279724121, -0.9509620666503906, -0.8854609131813049, -0.8199597001075745, -0.7544584274291992, -0.6889572143554688, -0.6234560012817383, -0.5579547882080078, -0.49245360493659973, -0.42695239186286926, -0.3614512085914612, -0.2959499955177307, -0.23044878244400024, -0.16494756937026978, -0.0994463711977005, -0.033945173025131226, 0.03155604004859924, 0.09705725312232971, 0.1625584363937378, 0.22805964946746826, 0.2935607433319092, 0.35906195640563965, 0.4245631694793701, 0.4900643527507782, 0.555565595626831, 0.6210668087005615, 0.6865679621696472, 0.7520691752433777, 0.8175703883171082, 0.8830716013908386, 0.9485728144645691, 1.0140739679336548, 1.0795751810073853, 1.1450763940811157, 1.2105776071548462, 1.2760788202285767, 1.3415800333023071, 1.4070812463760376, 1.472582459449768, 1.5380836725234985, 1.603584885597229, 1.6690860986709595, 1.7345871925354004, 1.8000884056091309, 1.8655896186828613, 1.9310908317565918, 1.9965920448303223, 2.0620932579040527, 2.127594470977783, 2.1930956840515137, 2.258596897125244, 2.3240981101989746, 2.389599323272705]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 8.0, 8.0, 4.0, 3.0, 8.0, 8.0, 17.0, 11.0, 10.0, 22.0, 13.0, 21.0, 24.0, 29.0, 29.0, 30.0, 35.0, 30.0, 35.0, 38.0, 29.0, 33.0, 35.0, 43.0, 43.0, 33.0, 40.0, 41.0, 38.0, 33.0, 34.0, 28.0, 24.0, 26.0, 25.0, 17.0, 11.0, 7.0, 12.0, 19.0, 13.0, 10.0, 10.0, 2.0, 8.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.269423007965088, -1.2290480136871338, -1.1886730194091797, -1.1482980251312256, -1.1079230308532715, -1.0675479173660278, -1.0271729230880737, -0.9867979288101196, -0.9464229345321655, -0.9060479402542114, -0.8656729459762573, -0.8252978920936584, -0.7849228978157043, -0.7445479035377502, -0.7041728496551514, -0.6637978553771973, -0.6234228610992432, -0.5830478668212891, -0.542672872543335, -0.5022978186607361, -0.461922824382782, -0.4215478301048279, -0.3811728060245514, -0.3407977819442749, -0.3004227876663208, -0.2600477933883667, -0.2196727693080902, -0.17929776012897491, -0.13892275094985962, -0.09854774177074432, -0.05817273259162903, -0.01779770851135254, 0.022577285766601562, 0.06295229494571686, 0.10332730412483215, 0.14370231330394745, 0.18407732248306274, 0.22445233166217804, 0.26482734084129333, 0.3052023649215698, 0.3455773591995239, 0.385952353477478, 0.4263273775577545, 0.466702401638031, 0.5070773959159851, 0.5474523901939392, 0.5878274440765381, 0.6282024383544922, 0.6685774326324463, 0.7089524269104004, 0.7493274211883545, 0.7897024750709534, 0.8300774693489075, 0.8704524636268616, 0.9108275175094604, 0.9512025117874146, 0.9915775060653687, 1.0319525003433228, 1.0723274946212769, 1.112702488899231, 1.1530776023864746, 1.1934525966644287, 1.2338275909423828, 1.274202585220337, 1.314577579498291]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 9.0, 12.0, 20.0, 43.0, 38.0, 70.0, 96.0, 146.0, 195.0, 279.0, 424.0, 633.0, 875.0, 1368.0, 2180.0, 3483.0, 5805.0, 9731.0, 16791.0, 29913.0, 52774.0, 91020.0, 147701.0, 200017.0, 184602.0, 124050.0, 74536.0, 42984.0, 23994.0, 13773.0, 7985.0, 4761.0, 2828.0, 1706.0, 1259.0, 759.0, 508.0, 339.0, 253.0, 174.0, 131.0, 97.0, 60.0, 36.0, 32.0, 19.0, 14.0, 8.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.72021484375, -0.69891357421875, -0.6776123046875, -0.65631103515625, -0.635009765625, -0.61370849609375, -0.5924072265625, -0.57110595703125, -0.5498046875, -0.52850341796875, -0.5072021484375, -0.48590087890625, -0.464599609375, -0.44329833984375, -0.4219970703125, -0.40069580078125, -0.37939453125, -0.35809326171875, -0.3367919921875, -0.31549072265625, -0.294189453125, -0.27288818359375, -0.2515869140625, -0.23028564453125, -0.208984375, -0.18768310546875, -0.1663818359375, -0.14508056640625, -0.123779296875, -0.10247802734375, -0.0811767578125, -0.05987548828125, -0.03857421875, -0.01727294921875, 0.0040283203125, 0.02532958984375, 0.046630859375, 0.06793212890625, 0.0892333984375, 0.11053466796875, 0.1318359375, 0.15313720703125, 0.1744384765625, 0.19573974609375, 0.217041015625, 0.23834228515625, 0.2596435546875, 0.28094482421875, 0.30224609375, 0.32354736328125, 0.3448486328125, 0.36614990234375, 0.387451171875, 0.40875244140625, 0.4300537109375, 0.45135498046875, 0.47265625, 0.49395751953125, 0.5152587890625, 0.53656005859375, 0.557861328125, 0.57916259765625, 0.6004638671875, 0.62176513671875, 0.64306640625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 9.0, 6.0, 8.0, 13.0, 11.0, 15.0, 17.0, 12.0, 24.0, 24.0, 32.0, 21.0, 30.0, 31.0, 30.0, 37.0, 46.0, 36.0, 34.0, 42.0, 48.0, 31.0, 33.0, 48.0, 36.0, 42.0, 34.0, 32.0, 20.0, 22.0, 25.0, 23.0, 12.0, 24.0, 14.0, 13.0, 14.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.408203125, -1.36297607421875, -1.3177490234375, -1.27252197265625, -1.227294921875, -1.18206787109375, -1.1368408203125, -1.09161376953125, -1.04638671875, -1.00115966796875, -0.9559326171875, -0.91070556640625, -0.865478515625, -0.82025146484375, -0.7750244140625, -0.72979736328125, -0.6845703125, -0.63934326171875, -0.5941162109375, -0.54888916015625, -0.503662109375, -0.45843505859375, -0.4132080078125, -0.36798095703125, -0.32275390625, -0.27752685546875, -0.2322998046875, -0.18707275390625, -0.141845703125, -0.09661865234375, -0.0513916015625, -0.00616455078125, 0.0390625, 0.08428955078125, 0.1295166015625, 0.17474365234375, 0.219970703125, 0.26519775390625, 0.3104248046875, 0.35565185546875, 0.40087890625, 0.44610595703125, 0.4913330078125, 0.53656005859375, 0.581787109375, 0.62701416015625, 0.6722412109375, 0.71746826171875, 0.7626953125, 0.80792236328125, 0.8531494140625, 0.89837646484375, 0.943603515625, 0.98883056640625, 1.0340576171875, 1.07928466796875, 1.12451171875, 1.16973876953125, 1.2149658203125, 1.26019287109375, 1.305419921875, 1.35064697265625, 1.3958740234375, 1.44110107421875, 1.486328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 1.0, 11.0, 12.0, 24.0, 34.0, 52.0, 66.0, 105.0, 138.0, 231.0, 358.0, 622.0, 1085.0, 2223.0, 4879.0, 12454.0, 38183.0, 130315.0, 389692.0, 322990.0, 97387.0, 29203.0, 10148.0, 4073.0, 1819.0, 936.0, 549.0, 348.0, 215.0, 117.0, 93.0, 62.0, 29.0, 31.0, 24.0, 17.0, 9.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4833984375, -1.4396209716796875, -1.395843505859375, -1.3520660400390625, -1.30828857421875, -1.2645111083984375, -1.220733642578125, -1.1769561767578125, -1.1331787109375, -1.0894012451171875, -1.045623779296875, -1.0018463134765625, -0.95806884765625, -0.9142913818359375, -0.870513916015625, -0.8267364501953125, -0.782958984375, -0.7391815185546875, -0.695404052734375, -0.6516265869140625, -0.60784912109375, -0.5640716552734375, -0.520294189453125, -0.4765167236328125, -0.4327392578125, -0.3889617919921875, -0.345184326171875, -0.3014068603515625, -0.25762939453125, -0.2138519287109375, -0.170074462890625, -0.1262969970703125, -0.08251953125, -0.0387420654296875, 0.005035400390625, 0.0488128662109375, 0.09259033203125, 0.1363677978515625, 0.180145263671875, 0.2239227294921875, 0.2677001953125, 0.3114776611328125, 0.355255126953125, 0.3990325927734375, 0.44281005859375, 0.4865875244140625, 0.530364990234375, 0.5741424560546875, 0.617919921875, 0.6616973876953125, 0.705474853515625, 0.7492523193359375, 0.79302978515625, 0.8368072509765625, 0.880584716796875, 0.9243621826171875, 0.9681396484375, 1.0119171142578125, 1.055694580078125, 1.0994720458984375, 1.14324951171875, 1.1870269775390625, 1.230804443359375, 1.2745819091796875, 1.318359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 2.0, 3.0, 8.0, 13.0, 12.0, 13.0, 14.0, 16.0, 14.0, 17.0, 18.0, 27.0, 26.0, 20.0, 33.0, 27.0, 38.0, 45.0, 34.0, 29.0, 35.0, 44.0, 41.0, 46.0, 42.0, 27.0, 27.0, 37.0, 33.0, 25.0, 24.0, 22.0, 19.0, 22.0, 27.0, 19.0, 17.0, 17.0, 11.0, 11.0, 7.0, 5.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9482421875, -0.9193344116210938, -0.8904266357421875, -0.8615188598632812, -0.832611083984375, -0.8037033081054688, -0.7747955322265625, -0.7458877563476562, -0.71697998046875, -0.6880722045898438, -0.6591644287109375, -0.6302566528320312, -0.601348876953125, -0.5724411010742188, -0.5435333251953125, -0.5146255493164062, -0.4857177734375, -0.45680999755859375, -0.4279022216796875, -0.39899444580078125, -0.370086669921875, -0.34117889404296875, -0.3122711181640625, -0.28336334228515625, -0.25445556640625, -0.22554779052734375, -0.1966400146484375, -0.16773223876953125, -0.138824462890625, -0.10991668701171875, -0.0810089111328125, -0.05210113525390625, -0.023193359375, 0.00571441650390625, 0.0346221923828125, 0.06352996826171875, 0.092437744140625, 0.12134552001953125, 0.1502532958984375, 0.17916107177734375, 0.20806884765625, 0.23697662353515625, 0.2658843994140625, 0.29479217529296875, 0.323699951171875, 0.35260772705078125, 0.3815155029296875, 0.41042327880859375, 0.4393310546875, 0.46823883056640625, 0.4971466064453125, 0.5260543823242188, 0.554962158203125, 0.5838699340820312, 0.6127777099609375, 0.6416854858398438, 0.67059326171875, 0.6995010375976562, 0.7284088134765625, 0.7573165893554688, 0.786224365234375, 0.8151321411132812, 0.8440399169921875, 0.8729476928710938, 0.90185546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 9.0, 12.0, 16.0, 23.0, 31.0, 49.0, 56.0, 78.0, 100.0, 157.0, 193.0, 277.0, 382.0, 552.0, 923.0, 1438.0, 2798.0, 6708.0, 28105.0, 601080.0, 371774.0, 21285.0, 5694.0, 2531.0, 1413.0, 835.0, 544.0, 383.0, 292.0, 191.0, 170.0, 102.0, 89.0, 64.0, 48.0, 41.0, 19.0, 23.0, 21.0, 14.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2080078125, -1.1662445068359375, -1.124481201171875, -1.0827178955078125, -1.04095458984375, -0.9991912841796875, -0.957427978515625, -0.9156646728515625, -0.8739013671875, -0.8321380615234375, -0.790374755859375, -0.7486114501953125, -0.70684814453125, -0.6650848388671875, -0.623321533203125, -0.5815582275390625, -0.539794921875, -0.4980316162109375, -0.456268310546875, -0.4145050048828125, -0.37274169921875, -0.3309783935546875, -0.289215087890625, -0.2474517822265625, -0.2056884765625, -0.1639251708984375, -0.122161865234375, -0.0803985595703125, -0.03863525390625, 0.0031280517578125, 0.044891357421875, 0.0866546630859375, 0.12841796875, 0.1701812744140625, 0.211944580078125, 0.2537078857421875, 0.29547119140625, 0.3372344970703125, 0.378997802734375, 0.4207611083984375, 0.4625244140625, 0.5042877197265625, 0.546051025390625, 0.5878143310546875, 0.62957763671875, 0.6713409423828125, 0.713104248046875, 0.7548675537109375, 0.796630859375, 0.8383941650390625, 0.880157470703125, 0.9219207763671875, 0.96368408203125, 1.0054473876953125, 1.047210693359375, 1.0889739990234375, 1.1307373046875, 1.1725006103515625, 1.214263916015625, 1.2560272216796875, 1.29779052734375, 1.3395538330078125, 1.381317138671875, 1.4230804443359375, 1.46484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 10.0, 7.0, 37.0, 166.0, 378.0, 271.0, 90.0, 23.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017905235290527344, -0.00017454568296670914, -0.00017003901302814484, -0.00016553234308958054, -0.00016102567315101624, -0.00015651900321245193, -0.00015201233327388763, -0.00014750566333532333, -0.00014299899339675903, -0.00013849232345819473, -0.00013398565351963043, -0.00012947898358106613, -0.00012497231364250183, -0.00012046564370393753, -0.00011595897376537323, -0.00011145230382680893, -0.00010694563388824463, -0.00010243896394968033, -9.793229401111603e-05, -9.342562407255173e-05, -8.891895413398743e-05, -8.441228419542313e-05, -7.990561425685883e-05, -7.539894431829453e-05, -7.089227437973022e-05, -6.638560444116592e-05, -6.187893450260162e-05, -5.737226456403732e-05, -5.286559462547302e-05, -4.835892468690872e-05, -4.385225474834442e-05, -3.934558480978012e-05, -3.483891487121582e-05, -3.033224493265152e-05, -2.582557499408722e-05, -2.131890505552292e-05, -1.6812235116958618e-05, -1.2305565178394318e-05, -7.798895239830017e-06, -3.2922253012657166e-06, 1.214444637298584e-06, 5.7211145758628845e-06, 1.0227784514427185e-05, 1.4734454452991486e-05, 1.9241124391555786e-05, 2.3747794330120087e-05, 2.8254464268684387e-05, 3.276113420724869e-05, 3.726780414581299e-05, 4.177447408437729e-05, 4.628114402294159e-05, 5.078781396150589e-05, 5.529448390007019e-05, 5.980115383863449e-05, 6.430782377719879e-05, 6.881449371576309e-05, 7.332116365432739e-05, 7.782783359289169e-05, 8.2334503531456e-05, 8.68411734700203e-05, 9.13478434085846e-05, 9.58545133471489e-05, 0.0001003611832857132, 0.0001048678532242775, 0.0001093745231628418]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 7.0, 5.0, 7.0, 13.0, 18.0, 22.0, 33.0, 32.0, 56.0, 84.0, 101.0, 159.0, 233.0, 403.0, 732.0, 1164.0, 2207.0, 4459.0, 10179.0, 27892.0, 102862.0, 413747.0, 356340.0, 85602.0, 24236.0, 9093.0, 3952.0, 2007.0, 1109.0, 622.0, 392.0, 254.0, 155.0, 96.0, 66.0, 53.0, 42.0, 29.0, 25.0, 18.0, 9.0, 5.0, 5.0, 5.0, 5.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.75830078125, -0.7359542846679688, -0.7136077880859375, -0.6912612915039062, -0.668914794921875, -0.6465682983398438, -0.6242218017578125, -0.6018753051757812, -0.57952880859375, -0.5571823120117188, -0.5348358154296875, -0.5124893188476562, -0.490142822265625, -0.46779632568359375, -0.4454498291015625, -0.42310333251953125, -0.4007568359375, -0.37841033935546875, -0.3560638427734375, -0.33371734619140625, -0.311370849609375, -0.28902435302734375, -0.2666778564453125, -0.24433135986328125, -0.22198486328125, -0.19963836669921875, -0.1772918701171875, -0.15494537353515625, -0.132598876953125, -0.11025238037109375, -0.0879058837890625, -0.06555938720703125, -0.043212890625, -0.02086639404296875, 0.0014801025390625, 0.02382659912109375, 0.046173095703125, 0.06851959228515625, 0.0908660888671875, 0.11321258544921875, 0.13555908203125, 0.15790557861328125, 0.1802520751953125, 0.20259857177734375, 0.224945068359375, 0.24729156494140625, 0.2696380615234375, 0.29198455810546875, 0.3143310546875, 0.33667755126953125, 0.3590240478515625, 0.38137054443359375, 0.403717041015625, 0.42606353759765625, 0.4484100341796875, 0.47075653076171875, 0.49310302734375, 0.5154495239257812, 0.5377960205078125, 0.5601425170898438, 0.582489013671875, 0.6048355102539062, 0.6271820068359375, 0.6495285034179688, 0.671875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 15.0, 18.0, 20.0, 35.0, 60.0, 128.0, 212.0, 219.0, 114.0, 70.0, 35.0, 33.0, 12.0, 9.0, 3.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.343505859375, -0.33570098876953125, -0.3278961181640625, -0.32009124755859375, -0.312286376953125, -0.30448150634765625, -0.2966766357421875, -0.28887176513671875, -0.28106689453125, -0.27326202392578125, -0.2654571533203125, -0.25765228271484375, -0.249847412109375, -0.24204254150390625, -0.2342376708984375, -0.22643280029296875, -0.2186279296875, -0.21082305908203125, -0.2030181884765625, -0.19521331787109375, -0.187408447265625, -0.17960357666015625, -0.1717987060546875, -0.16399383544921875, -0.15618896484375, -0.14838409423828125, -0.1405792236328125, -0.13277435302734375, -0.124969482421875, -0.11716461181640625, -0.1093597412109375, -0.10155487060546875, -0.09375, -0.08594512939453125, -0.0781402587890625, -0.07033538818359375, -0.062530517578125, -0.05472564697265625, -0.0469207763671875, -0.03911590576171875, -0.03131103515625, -0.02350616455078125, -0.0157012939453125, -0.00789642333984375, -9.1552734375e-05, 0.00771331787109375, 0.0155181884765625, 0.02332305908203125, 0.0311279296875, 0.03893280029296875, 0.0467376708984375, 0.05454254150390625, 0.062347412109375, 0.07015228271484375, 0.0779571533203125, 0.08576202392578125, 0.09356689453125, 0.10137176513671875, 0.1091766357421875, 0.11698150634765625, 0.124786376953125, 0.13259124755859375, 0.1403961181640625, 0.14820098876953125, 0.156005859375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 2.0, 12.0, 11.0, 11.0, 17.0, 20.0, 25.0, 34.0, 35.0, 37.0, 45.0, 50.0, 59.0, 78.0, 57.0, 64.0, 53.0, 62.0, 65.0, 46.0, 43.0, 33.0, 33.0, 20.0, 15.0, 20.0, 13.0, 8.0, 10.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7161957025527954, -1.6523724794387817, -1.5885493755340576, -1.524726152420044, -1.4609029293060303, -1.3970797061920166, -1.333256483078003, -1.2694333791732788, -1.2056101560592651, -1.1417869329452515, -1.0779638290405273, -1.0141406059265137, -0.9503173828125, -0.8864941596984863, -0.8226709961891174, -0.7588478326797485, -0.6950246095657349, -0.6312013864517212, -0.5673782229423523, -0.5035550594329834, -0.4397318363189697, -0.37590864300727844, -0.31208544969558716, -0.24826225638389587, -0.1844390630722046, -0.1206158697605133, -0.05679267644882202, 0.007030516862869263, 0.07085371017456055, 0.13467690348625183, 0.19850009679794312, 0.2623232901096344, 0.32614636421203613, 0.3899695575237274, 0.4537927508354187, 0.5176159143447876, 0.5814391374588013, 0.6452623605728149, 0.7090855240821838, 0.7729086875915527, 0.8367319107055664, 0.9005551338195801, 0.964378297328949, 1.0282014608383179, 1.0920246839523315, 1.1558479070663452, 1.2196710109710693, 1.283494234085083, 1.3473174571990967, 1.4111406803131104, 1.474963903427124, 1.5387870073318481, 1.6026102304458618, 1.6664334535598755, 1.7302565574645996, 1.7940797805786133, 1.857903003692627, 1.9217262268066406, 1.9855494499206543, 2.049372673034668, 2.1131958961486816, 2.177018880844116, 2.24084210395813, 2.3046653270721436, 2.3684885501861572]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 9.0, 3.0, 4.0, 8.0, 10.0, 14.0, 12.0, 14.0, 15.0, 12.0, 22.0, 29.0, 29.0, 24.0, 28.0, 35.0, 30.0, 38.0, 37.0, 31.0, 33.0, 34.0, 46.0, 40.0, 37.0, 42.0, 38.0, 35.0, 31.0, 35.0, 28.0, 28.0, 21.0, 31.0, 12.0, 13.0, 12.0, 10.0, 16.0, 11.0, 12.0, 10.0, 2.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2592148780822754, -1.2190552949905396, -1.1788957118988037, -1.1387361288070679, -1.098576545715332, -1.0584168434143066, -1.0182572603225708, -0.978097677230835, -0.9379380941390991, -0.8977785110473633, -0.8576189279556274, -0.8174592852592468, -0.777299702167511, -0.7371401190757751, -0.6969804763793945, -0.6568208932876587, -0.6166613101959229, -0.576501727104187, -0.5363421440124512, -0.49618250131607056, -0.4560229182243347, -0.4158633351325989, -0.37570372223854065, -0.3355441093444824, -0.2953845262527466, -0.25522494316101074, -0.21506533026695251, -0.17490573227405548, -0.13474613428115845, -0.09458653628826141, -0.05442693829536438, -0.014267325401306152, 0.025892257690429688, 0.06605185568332672, 0.10621145367622375, 0.1463710516691208, 0.18653064966201782, 0.22669024765491486, 0.2668498456478119, 0.3070094585418701, 0.34716904163360596, 0.3873286247253418, 0.4274882376194, 0.46764785051345825, 0.5078074336051941, 0.5479670166969299, 0.5881266593933105, 0.6282862424850464, 0.6684458255767822, 0.7086054086685181, 0.7487649917602539, 0.7889246344566345, 0.8290842175483704, 0.8692438006401062, 0.9094034433364868, 0.9495630264282227, 0.9897226095199585, 1.0298821926116943, 1.0700417757034302, 1.110201358795166, 1.1503610610961914, 1.1905206441879272, 1.230680227279663, 1.270839810371399, 1.3109993934631348]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 8.0, 10.0, 23.0, 29.0, 54.0, 75.0, 126.0, 178.0, 292.0, 452.0, 695.0, 1067.0, 1650.0, 2535.0, 3781.0, 5759.0, 8684.0, 12999.0, 19103.0, 27869.0, 38388.0, 52981.0, 69031.0, 84784.0, 98282.0, 105789.0, 104631.0, 96323.0, 82034.0, 65992.0, 49762.0, 36587.0, 25666.0, 17795.0, 12116.0, 7964.0, 5170.0, 3386.0, 2239.0, 1430.0, 974.0, 638.0, 414.0, 273.0, 177.0, 131.0, 65.0, 60.0, 36.0, 13.0, 8.0, 10.0, 14.0, 8.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1064453125, -1.0717620849609375, -1.037078857421875, -1.0023956298828125, -0.96771240234375, -0.9330291748046875, -0.898345947265625, -0.8636627197265625, -0.8289794921875, -0.7942962646484375, -0.759613037109375, -0.7249298095703125, -0.69024658203125, -0.6555633544921875, -0.620880126953125, -0.5861968994140625, -0.551513671875, -0.5168304443359375, -0.482147216796875, -0.4474639892578125, -0.41278076171875, -0.3780975341796875, -0.343414306640625, -0.3087310791015625, -0.2740478515625, -0.2393646240234375, -0.204681396484375, -0.1699981689453125, -0.13531494140625, -0.1006317138671875, -0.065948486328125, -0.0312652587890625, 0.00341796875, 0.0381011962890625, 0.072784423828125, 0.1074676513671875, 0.14215087890625, 0.1768341064453125, 0.211517333984375, 0.2462005615234375, 0.2808837890625, 0.3155670166015625, 0.350250244140625, 0.3849334716796875, 0.41961669921875, 0.4542999267578125, 0.488983154296875, 0.5236663818359375, 0.558349609375, 0.5930328369140625, 0.627716064453125, 0.6623992919921875, 0.69708251953125, 0.7317657470703125, 0.766448974609375, 0.8011322021484375, 0.8358154296875, 0.8704986572265625, 0.905181884765625, 0.9398651123046875, 0.97454833984375, 1.0092315673828125, 1.043914794921875, 1.0785980224609375, 1.11328125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 7.0, 2.0, 5.0, 9.0, 7.0, 12.0, 16.0, 8.0, 18.0, 13.0, 18.0, 25.0, 13.0, 33.0, 36.0, 38.0, 26.0, 30.0, 42.0, 38.0, 31.0, 33.0, 33.0, 40.0, 44.0, 33.0, 45.0, 38.0, 28.0, 40.0, 28.0, 30.0, 21.0, 21.0, 25.0, 16.0, 8.0, 19.0, 12.0, 9.0, 10.0, 7.0, 5.0, 7.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2978515625, -1.257110595703125, -1.21636962890625, -1.175628662109375, -1.1348876953125, -1.094146728515625, -1.05340576171875, -1.012664794921875, -0.971923828125, -0.931182861328125, -0.89044189453125, -0.849700927734375, -0.8089599609375, -0.768218994140625, -0.72747802734375, -0.686737060546875, -0.64599609375, -0.605255126953125, -0.56451416015625, -0.523773193359375, -0.4830322265625, -0.442291259765625, -0.40155029296875, -0.360809326171875, -0.320068359375, -0.279327392578125, -0.23858642578125, -0.197845458984375, -0.1571044921875, -0.116363525390625, -0.07562255859375, -0.034881591796875, 0.005859375, 0.046600341796875, 0.08734130859375, 0.128082275390625, 0.1688232421875, 0.209564208984375, 0.25030517578125, 0.291046142578125, 0.331787109375, 0.372528076171875, 0.41326904296875, 0.454010009765625, 0.4947509765625, 0.535491943359375, 0.57623291015625, 0.616973876953125, 0.65771484375, 0.698455810546875, 0.73919677734375, 0.779937744140625, 0.8206787109375, 0.861419677734375, 0.90216064453125, 0.942901611328125, 0.983642578125, 1.024383544921875, 1.06512451171875, 1.105865478515625, 1.1466064453125, 1.187347412109375, 1.22808837890625, 1.268829345703125, 1.3095703125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 10.0, 22.0, 27.0, 39.0, 58.0, 90.0, 129.0, 171.0, 314.0, 443.0, 744.0, 1100.0, 1716.0, 2556.0, 3836.0, 6056.0, 8960.0, 13489.0, 19406.0, 27707.0, 38876.0, 52246.0, 68236.0, 83640.0, 96278.0, 103027.0, 102151.0, 94264.0, 82405.0, 66456.0, 51550.0, 37958.0, 27116.0, 19018.0, 12697.0, 8868.0, 5848.0, 3931.0, 2471.0, 1627.0, 1030.0, 683.0, 464.0, 296.0, 204.0, 121.0, 78.0, 45.0, 48.0, 21.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0], "bins": [-1.1064453125, -1.0728759765625, -1.039306640625, -1.0057373046875, -0.97216796875, -0.9385986328125, -0.905029296875, -0.8714599609375, -0.837890625, -0.8043212890625, -0.770751953125, -0.7371826171875, -0.70361328125, -0.6700439453125, -0.636474609375, -0.6029052734375, -0.5693359375, -0.5357666015625, -0.502197265625, -0.4686279296875, -0.43505859375, -0.4014892578125, -0.367919921875, -0.3343505859375, -0.30078125, -0.2672119140625, -0.233642578125, -0.2000732421875, -0.16650390625, -0.1329345703125, -0.099365234375, -0.0657958984375, -0.0322265625, 0.0013427734375, 0.034912109375, 0.0684814453125, 0.10205078125, 0.1356201171875, 0.169189453125, 0.2027587890625, 0.236328125, 0.2698974609375, 0.303466796875, 0.3370361328125, 0.37060546875, 0.4041748046875, 0.437744140625, 0.4713134765625, 0.5048828125, 0.5384521484375, 0.572021484375, 0.6055908203125, 0.63916015625, 0.6727294921875, 0.706298828125, 0.7398681640625, 0.7734375, 0.8070068359375, 0.840576171875, 0.8741455078125, 0.90771484375, 0.9412841796875, 0.974853515625, 1.0084228515625, 1.0419921875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 10.0, 6.0, 13.0, 15.0, 18.0, 17.0, 12.0, 21.0, 18.0, 22.0, 23.0, 18.0, 36.0, 30.0, 36.0, 39.0, 44.0, 40.0, 34.0, 43.0, 37.0, 35.0, 47.0, 37.0, 43.0, 49.0, 33.0, 30.0, 23.0, 38.0, 14.0, 24.0, 24.0, 14.0, 10.0, 11.0, 10.0, 3.0, 9.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.802734375, -0.7753677368164062, -0.7480010986328125, -0.7206344604492188, -0.693267822265625, -0.6659011840820312, -0.6385345458984375, -0.6111679077148438, -0.58380126953125, -0.5564346313476562, -0.5290679931640625, -0.5017013549804688, -0.474334716796875, -0.44696807861328125, -0.4196014404296875, -0.39223480224609375, -0.3648681640625, -0.33750152587890625, -0.3101348876953125, -0.28276824951171875, -0.255401611328125, -0.22803497314453125, -0.2006683349609375, -0.17330169677734375, -0.14593505859375, -0.11856842041015625, -0.0912017822265625, -0.06383514404296875, -0.036468505859375, -0.00910186767578125, 0.0182647705078125, 0.04563140869140625, 0.072998046875, 0.10036468505859375, 0.1277313232421875, 0.15509796142578125, 0.182464599609375, 0.20983123779296875, 0.2371978759765625, 0.26456451416015625, 0.29193115234375, 0.31929779052734375, 0.3466644287109375, 0.37403106689453125, 0.401397705078125, 0.42876434326171875, 0.4561309814453125, 0.48349761962890625, 0.5108642578125, 0.5382308959960938, 0.5655975341796875, 0.5929641723632812, 0.620330810546875, 0.6476974487304688, 0.6750640869140625, 0.7024307250976562, 0.72979736328125, 0.7571640014648438, 0.7845306396484375, 0.8118972778320312, 0.839263916015625, 0.8666305541992188, 0.8939971923828125, 0.9213638305664062, 0.94873046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 12.0, 9.0, 13.0, 31.0, 42.0, 61.0, 91.0, 178.0, 238.0, 365.0, 583.0, 965.0, 1513.0, 2474.0, 4178.0, 7039.0, 12463.0, 21956.0, 39284.0, 68589.0, 112228.0, 163587.0, 187293.0, 160961.0, 109378.0, 66472.0, 37843.0, 21280.0, 12082.0, 6906.0, 4105.0, 2366.0, 1444.0, 928.0, 562.0, 376.0, 210.0, 155.0, 95.0, 72.0, 41.0, 29.0, 20.0, 12.0, 15.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.92236328125, -0.894805908203125, -0.86724853515625, -0.839691162109375, -0.8121337890625, -0.784576416015625, -0.75701904296875, -0.729461669921875, -0.701904296875, -0.674346923828125, -0.64678955078125, -0.619232177734375, -0.5916748046875, -0.564117431640625, -0.53656005859375, -0.509002685546875, -0.4814453125, -0.453887939453125, -0.42633056640625, -0.398773193359375, -0.3712158203125, -0.343658447265625, -0.31610107421875, -0.288543701171875, -0.260986328125, -0.233428955078125, -0.20587158203125, -0.178314208984375, -0.1507568359375, -0.123199462890625, -0.09564208984375, -0.068084716796875, -0.04052734375, -0.012969970703125, 0.01458740234375, 0.042144775390625, 0.0697021484375, 0.097259521484375, 0.12481689453125, 0.152374267578125, 0.179931640625, 0.207489013671875, 0.23504638671875, 0.262603759765625, 0.2901611328125, 0.317718505859375, 0.34527587890625, 0.372833251953125, 0.400390625, 0.427947998046875, 0.45550537109375, 0.483062744140625, 0.5106201171875, 0.538177490234375, 0.56573486328125, 0.593292236328125, 0.620849609375, 0.648406982421875, 0.67596435546875, 0.703521728515625, 0.7310791015625, 0.758636474609375, 0.78619384765625, 0.813751220703125, 0.84130859375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 12.0, 17.0, 25.0, 27.0, 29.0, 28.0, 27.0, 45.0, 38.0, 42.0, 42.0, 62.0, 62.0, 72.0, 48.0, 51.0, 43.0, 48.0, 47.0, 32.0, 29.0, 33.0, 23.0, 18.0, 14.0, 14.0, 12.0, 8.0, 5.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.390975952148438e-05, -7.155537605285645e-05, -6.920099258422852e-05, -6.684660911560059e-05, -6.449222564697266e-05, -6.213784217834473e-05, -5.97834587097168e-05, -5.742907524108887e-05, -5.507469177246094e-05, -5.272030830383301e-05, -5.036592483520508e-05, -4.801154136657715e-05, -4.565715789794922e-05, -4.330277442932129e-05, -4.094839096069336e-05, -3.859400749206543e-05, -3.62396240234375e-05, -3.388524055480957e-05, -3.153085708618164e-05, -2.917647361755371e-05, -2.682209014892578e-05, -2.446770668029785e-05, -2.2113323211669922e-05, -1.9758939743041992e-05, -1.7404556274414062e-05, -1.5050172805786133e-05, -1.2695789337158203e-05, -1.0341405868530273e-05, -7.987022399902344e-06, -5.632638931274414e-06, -3.2782554626464844e-06, -9.238719940185547e-07, 1.430511474609375e-06, 3.7848949432373047e-06, 6.139278411865234e-06, 8.493661880493164e-06, 1.0848045349121094e-05, 1.3202428817749023e-05, 1.5556812286376953e-05, 1.7911195755004883e-05, 2.0265579223632812e-05, 2.2619962692260742e-05, 2.4974346160888672e-05, 2.73287296295166e-05, 2.968311309814453e-05, 3.203749656677246e-05, 3.439188003540039e-05, 3.674626350402832e-05, 3.910064697265625e-05, 4.145503044128418e-05, 4.380941390991211e-05, 4.616379737854004e-05, 4.851818084716797e-05, 5.08725643157959e-05, 5.322694778442383e-05, 5.558133125305176e-05, 5.793571472167969e-05, 6.029009819030762e-05, 6.264448165893555e-05, 6.499886512756348e-05, 6.73532485961914e-05, 6.970763206481934e-05, 7.206201553344727e-05, 7.44163990020752e-05, 7.677078247070312e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 16.0, 20.0, 27.0, 49.0, 58.0, 104.0, 154.0, 224.0, 366.0, 613.0, 1018.0, 1768.0, 2840.0, 4807.0, 8372.0, 14733.0, 25419.0, 44505.0, 75655.0, 118628.0, 159821.0, 174986.0, 149433.0, 106494.0, 66374.0, 39158.0, 22162.0, 12750.0, 7421.0, 4107.0, 2534.0, 1479.0, 924.0, 536.0, 363.0, 232.0, 154.0, 92.0, 55.0, 35.0, 18.0, 18.0, 13.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.84765625, -0.82147216796875, -0.7952880859375, -0.76910400390625, -0.742919921875, -0.71673583984375, -0.6905517578125, -0.66436767578125, -0.63818359375, -0.61199951171875, -0.5858154296875, -0.55963134765625, -0.533447265625, -0.50726318359375, -0.4810791015625, -0.45489501953125, -0.4287109375, -0.40252685546875, -0.3763427734375, -0.35015869140625, -0.323974609375, -0.29779052734375, -0.2716064453125, -0.24542236328125, -0.21923828125, -0.19305419921875, -0.1668701171875, -0.14068603515625, -0.114501953125, -0.08831787109375, -0.0621337890625, -0.03594970703125, -0.009765625, 0.01641845703125, 0.0426025390625, 0.06878662109375, 0.094970703125, 0.12115478515625, 0.1473388671875, 0.17352294921875, 0.19970703125, 0.22589111328125, 0.2520751953125, 0.27825927734375, 0.304443359375, 0.33062744140625, 0.3568115234375, 0.38299560546875, 0.4091796875, 0.43536376953125, 0.4615478515625, 0.48773193359375, 0.513916015625, 0.54010009765625, 0.5662841796875, 0.59246826171875, 0.61865234375, 0.64483642578125, 0.6710205078125, 0.69720458984375, 0.723388671875, 0.74957275390625, 0.7757568359375, 0.80194091796875, 0.828125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 7.0, 10.0, 17.0, 12.0, 22.0, 25.0, 27.0, 44.0, 46.0, 56.0, 54.0, 65.0, 75.0, 68.0, 78.0, 64.0, 67.0, 43.0, 42.0, 35.0, 27.0, 22.0, 17.0, 22.0, 13.0, 11.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3984375, -0.38722991943359375, -0.3760223388671875, -0.36481475830078125, -0.353607177734375, -0.34239959716796875, -0.3311920166015625, -0.31998443603515625, -0.30877685546875, -0.29756927490234375, -0.2863616943359375, -0.27515411376953125, -0.263946533203125, -0.25273895263671875, -0.2415313720703125, -0.23032379150390625, -0.2191162109375, -0.20790863037109375, -0.1967010498046875, -0.18549346923828125, -0.174285888671875, -0.16307830810546875, -0.1518707275390625, -0.14066314697265625, -0.12945556640625, -0.11824798583984375, -0.1070404052734375, -0.09583282470703125, -0.084625244140625, -0.07341766357421875, -0.0622100830078125, -0.05100250244140625, -0.039794921875, -0.02858734130859375, -0.0173797607421875, -0.00617218017578125, 0.005035400390625, 0.01624298095703125, 0.0274505615234375, 0.03865814208984375, 0.04986572265625, 0.06107330322265625, 0.0722808837890625, 0.08348846435546875, 0.094696044921875, 0.10590362548828125, 0.1171112060546875, 0.12831878662109375, 0.1395263671875, 0.15073394775390625, 0.1619415283203125, 0.17314910888671875, 0.184356689453125, 0.19556427001953125, 0.2067718505859375, 0.21797943115234375, 0.22918701171875, 0.24039459228515625, 0.2516021728515625, 0.26280975341796875, 0.274017333984375, 0.28522491455078125, 0.2964324951171875, 0.30764007568359375, 0.31884765625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 11.0, 7.0, 12.0, 19.0, 26.0, 30.0, 35.0, 33.0, 33.0, 57.0, 59.0, 64.0, 63.0, 70.0, 61.0, 64.0, 71.0, 52.0, 47.0, 38.0, 30.0, 23.0, 17.0, 18.0, 23.0, 9.0, 4.0, 11.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.96602463722229, -1.89926016330719, -1.8324956893920898, -1.7657313346862793, -1.6989668607711792, -1.632202386856079, -1.5654380321502686, -1.4986735582351685, -1.4319090843200684, -1.3651446104049683, -1.2983801364898682, -1.2316157817840576, -1.1648513078689575, -1.0980868339538574, -1.0313224792480469, -0.9645580053329468, -0.8977935314178467, -0.8310290575027466, -0.7642646431922913, -0.6975002288818359, -0.6307357549667358, -0.5639712810516357, -0.4972068667411804, -0.4304424226284027, -0.363677978515625, -0.2969135344028473, -0.23014909029006958, -0.16338464617729187, -0.09662020206451416, -0.02985575795173645, 0.03690868616104126, 0.10367313027381897, 0.17043781280517578, 0.2372022569179535, 0.3039667010307312, 0.3707311451435089, 0.4374955892562866, 0.5042600631713867, 0.571024477481842, 0.6377888917922974, 0.7045533657073975, 0.7713178396224976, 0.8380822539329529, 0.9048466682434082, 0.9716111421585083, 1.0383756160736084, 1.105139970779419, 1.171904444694519, 1.2386689186096191, 1.3054333925247192, 1.3721978664398193, 1.4389622211456299, 1.50572669506073, 1.57249116897583, 1.6392555236816406, 1.7060199975967407, 1.7727844715118408, 1.839548945426941, 1.906313419342041, 1.9730777740478516, 2.039842128753662, 2.1066067218780518, 2.1733710765838623, 2.240135669708252, 2.3069000244140625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 1.0, 5.0, 2.0, 9.0, 7.0, 7.0, 7.0, 3.0, 4.0, 9.0, 8.0, 12.0, 9.0, 14.0, 17.0, 17.0, 29.0, 22.0, 20.0, 30.0, 22.0, 25.0, 29.0, 36.0, 37.0, 30.0, 24.0, 41.0, 46.0, 43.0, 31.0, 30.0, 40.0, 40.0, 33.0, 32.0, 33.0, 18.0, 14.0, 23.0, 16.0, 25.0, 13.0, 12.0, 16.0, 10.0, 12.0, 9.0, 9.0, 4.0, 7.0, 6.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1299009323120117, -1.0913114547729492, -1.0527218580245972, -1.0141323804855347, -0.9755429029464722, -0.9369533658027649, -0.8983638286590576, -0.8597743511199951, -0.8211848139762878, -0.7825952768325806, -0.7440057992935181, -0.7054162621498108, -0.6668267250061035, -0.628237247467041, -0.5896477103233337, -0.5510581731796265, -0.512468695640564, -0.4738791882991791, -0.4352896809577942, -0.3967001438140869, -0.358110636472702, -0.31952112913131714, -0.28093159198760986, -0.24234208464622498, -0.2037525773048401, -0.1651630699634552, -0.12657354772090912, -0.08798403292894363, -0.04939451813697815, -0.010805010795593262, 0.02778451144695282, 0.0663740336894989, 0.10496342182159424, 0.14355292916297913, 0.1821424514055252, 0.2207319736480713, 0.2593214809894562, 0.29791098833084106, 0.33650052547454834, 0.3750900328159332, 0.4136795401573181, 0.452269047498703, 0.4908585548400879, 0.5294480919837952, 0.5680376291275024, 0.6066271066665649, 0.6452166438102722, 0.6838061809539795, 0.722395658493042, 0.7609851956367493, 0.7995746731758118, 0.838164210319519, 0.8767536878585815, 0.9153432250022888, 0.9539327621459961, 0.9925222396850586, 1.031111717224121, 1.0697011947631836, 1.1082907915115356, 1.1468802690505981, 1.1854697465896606, 1.2240593433380127, 1.2626488208770752, 1.3012382984161377, 1.3398278951644897]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 10.0, 11.0, 22.0, 35.0, 56.0, 97.0, 163.0, 267.0, 412.0, 617.0, 1047.0, 1675.0, 2741.0, 4423.0, 7275.0, 11679.0, 19559.0, 31746.0, 52151.0, 84917.0, 136164.0, 215054.0, 320890.0, 445944.0, 551682.0, 584934.0, 526040.0, 409265.0, 287414.0, 189352.0, 119317.0, 73346.0, 45020.0, 27438.0, 16638.0, 10245.0, 6144.0, 3970.0, 2380.0, 1519.0, 949.0, 625.0, 398.0, 268.0, 156.0, 81.0, 64.0, 39.0, 22.0, 18.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.083984375, -1.0457611083984375, -1.007537841796875, -0.9693145751953125, -0.93109130859375, -0.8928680419921875, -0.854644775390625, -0.8164215087890625, -0.7781982421875, -0.7399749755859375, -0.701751708984375, -0.6635284423828125, -0.62530517578125, -0.5870819091796875, -0.548858642578125, -0.5106353759765625, -0.472412109375, -0.4341888427734375, -0.395965576171875, -0.3577423095703125, -0.31951904296875, -0.2812957763671875, -0.243072509765625, -0.2048492431640625, -0.1666259765625, -0.1284027099609375, -0.090179443359375, -0.0519561767578125, -0.01373291015625, 0.0244903564453125, 0.062713623046875, 0.1009368896484375, 0.13916015625, 0.1773834228515625, 0.215606689453125, 0.2538299560546875, 0.29205322265625, 0.3302764892578125, 0.368499755859375, 0.4067230224609375, 0.4449462890625, 0.4831695556640625, 0.521392822265625, 0.5596160888671875, 0.59783935546875, 0.6360626220703125, 0.674285888671875, 0.7125091552734375, 0.750732421875, 0.7889556884765625, 0.827178955078125, 0.8654022216796875, 0.90362548828125, 0.9418487548828125, 0.980072021484375, 1.0182952880859375, 1.0565185546875, 1.0947418212890625, 1.132965087890625, 1.1711883544921875, 1.20941162109375, 1.2476348876953125, 1.285858154296875, 1.3240814208984375, 1.3623046875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 13.0, 10.0, 11.0, 17.0, 21.0, 18.0, 16.0, 24.0, 27.0, 33.0, 26.0, 30.0, 40.0, 44.0, 41.0, 32.0, 40.0, 50.0, 46.0, 38.0, 39.0, 36.0, 48.0, 39.0, 33.0, 31.0, 18.0, 24.0, 22.0, 20.0, 21.0, 19.0, 12.0, 8.0, 5.0, 9.0, 11.0, 4.0, 5.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0205078125, -0.987518310546875, -0.95452880859375, -0.921539306640625, -0.8885498046875, -0.855560302734375, -0.82257080078125, -0.789581298828125, -0.756591796875, -0.723602294921875, -0.69061279296875, -0.657623291015625, -0.6246337890625, -0.591644287109375, -0.55865478515625, -0.525665283203125, -0.49267578125, -0.459686279296875, -0.42669677734375, -0.393707275390625, -0.3607177734375, -0.327728271484375, -0.29473876953125, -0.261749267578125, -0.228759765625, -0.195770263671875, -0.16278076171875, -0.129791259765625, -0.0968017578125, -0.063812255859375, -0.03082275390625, 0.002166748046875, 0.03515625, 0.068145751953125, 0.10113525390625, 0.134124755859375, 0.1671142578125, 0.200103759765625, 0.23309326171875, 0.266082763671875, 0.299072265625, 0.332061767578125, 0.36505126953125, 0.398040771484375, 0.4310302734375, 0.464019775390625, 0.49700927734375, 0.529998779296875, 0.56298828125, 0.595977783203125, 0.62896728515625, 0.661956787109375, 0.6949462890625, 0.727935791015625, 0.76092529296875, 0.793914794921875, 0.826904296875, 0.859893798828125, 0.89288330078125, 0.925872802734375, 0.9588623046875, 0.991851806640625, 1.02484130859375, 1.057830810546875, 1.0908203125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 3.0, 7.0, 8.0, 10.0, 21.0, 33.0, 42.0, 81.0, 86.0, 161.0, 251.0, 405.0, 686.0, 1126.0, 1752.0, 2789.0, 4616.0, 7535.0, 12585.0, 20347.0, 33214.0, 53900.0, 85864.0, 132855.0, 197985.0, 282884.0, 376772.0, 460876.0, 508345.0, 497358.0, 434073.0, 344207.0, 251626.0, 174302.0, 115185.0, 73336.0, 45993.0, 28355.0, 17249.0, 10592.0, 6422.0, 3939.0, 2386.0, 1518.0, 959.0, 563.0, 398.0, 211.0, 131.0, 89.0, 68.0, 40.0, 15.0, 19.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.070556640625, -1.03466796875, -0.998779296875, -0.962890625, -0.927001953125, -0.89111328125, -0.855224609375, -0.8193359375, -0.783447265625, -0.74755859375, -0.711669921875, -0.67578125, -0.639892578125, -0.60400390625, -0.568115234375, -0.5322265625, -0.496337890625, -0.46044921875, -0.424560546875, -0.388671875, -0.352783203125, -0.31689453125, -0.281005859375, -0.2451171875, -0.209228515625, -0.17333984375, -0.137451171875, -0.1015625, -0.065673828125, -0.02978515625, 0.006103515625, 0.0419921875, 0.077880859375, 0.11376953125, 0.149658203125, 0.185546875, 0.221435546875, 0.25732421875, 0.293212890625, 0.3291015625, 0.364990234375, 0.40087890625, 0.436767578125, 0.47265625, 0.508544921875, 0.54443359375, 0.580322265625, 0.6162109375, 0.652099609375, 0.68798828125, 0.723876953125, 0.759765625, 0.795654296875, 0.83154296875, 0.867431640625, 0.9033203125, 0.939208984375, 0.97509765625, 1.010986328125, 1.046875, 1.082763671875, 1.11865234375, 1.154541015625, 1.1904296875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 4.0, 10.0, 6.0, 11.0, 12.0, 17.0, 34.0, 34.0, 33.0, 42.0, 49.0, 46.0, 72.0, 80.0, 107.0, 120.0, 154.0, 151.0, 166.0, 190.0, 192.0, 201.0, 213.0, 230.0, 240.0, 201.0, 206.0, 165.0, 164.0, 153.0, 132.0, 119.0, 100.0, 88.0, 67.0, 49.0, 58.0, 34.0, 23.0, 25.0, 18.0, 9.0, 10.0, 12.0, 11.0, 9.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.480224609375, -0.4644126892089844, -0.44860076904296875, -0.4327888488769531, -0.4169769287109375, -0.4011650085449219, -0.38535308837890625, -0.3695411682128906, -0.353729248046875, -0.3379173278808594, -0.32210540771484375, -0.3062934875488281, -0.2904815673828125, -0.2746696472167969, -0.25885772705078125, -0.24304580688476562, -0.22723388671875, -0.21142196655273438, -0.19561004638671875, -0.17979812622070312, -0.1639862060546875, -0.14817428588867188, -0.13236236572265625, -0.11655044555664062, -0.100738525390625, -0.08492660522460938, -0.06911468505859375, -0.053302764892578125, -0.0374908447265625, -0.021678924560546875, -0.00586700439453125, 0.009944915771484375, 0.0257568359375, 0.041568756103515625, 0.05738067626953125, 0.07319259643554688, 0.0890045166015625, 0.10481643676757812, 0.12062835693359375, 0.13644027709960938, 0.152252197265625, 0.16806411743164062, 0.18387603759765625, 0.19968795776367188, 0.2154998779296875, 0.23131179809570312, 0.24712371826171875, 0.2629356384277344, 0.27874755859375, 0.2945594787597656, 0.31037139892578125, 0.3261833190917969, 0.3419952392578125, 0.3578071594238281, 0.37361907958984375, 0.3894309997558594, 0.405242919921875, 0.4210548400878906, 0.43686676025390625, 0.4526786804199219, 0.4684906005859375, 0.4843025207519531, 0.5001144409179688, 0.5159263610839844, 0.53173828125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 5.0, 7.0, 9.0, 9.0, 10.0, 14.0, 18.0, 24.0, 23.0, 32.0, 37.0, 44.0, 46.0, 51.0, 66.0, 67.0, 52.0, 71.0, 53.0, 52.0, 37.0, 42.0, 38.0, 35.0, 31.0, 27.0, 20.0, 14.0, 14.0, 13.0, 6.0, 5.0, 4.0, 4.0, 8.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5019704103469849, -1.4478763341903687, -1.393782377243042, -1.3396883010864258, -1.2855942249298096, -1.231500267982483, -1.1774061918258667, -1.12331223487854, -1.0692181587219238, -1.0151240825653076, -0.961030125617981, -0.9069360494613647, -0.8528420329093933, -0.7987480163574219, -0.7446539402008057, -0.6905599236488342, -0.6364659070968628, -0.5823718905448914, -0.5282778739929199, -0.4741837978363037, -0.4200897812843323, -0.36599576473236084, -0.311901718378067, -0.2578076720237732, -0.20371365547180176, -0.14961962401866913, -0.0955255925655365, -0.04143156111240387, 0.01266247034072876, 0.0667564868927002, 0.12085053324699402, 0.17494457960128784, 0.22903847694396973, 0.28313249349594116, 0.337226539850235, 0.3913205862045288, 0.44541460275650024, 0.4995086193084717, 0.5536026954650879, 0.6076967120170593, 0.6617907285690308, 0.7158847451210022, 0.7699787616729736, 0.8240728378295898, 0.8781668543815613, 0.9322608709335327, 0.9863549470901489, 1.0404489040374756, 1.0945429801940918, 1.148637056350708, 1.2027310132980347, 1.2568250894546509, 1.3109190464019775, 1.3650131225585938, 1.41910719871521, 1.4732012748718262, 1.5272952318191528, 1.581389307975769, 1.6354832649230957, 1.689577341079712, 1.7436714172363281, 1.7977653741836548, 1.851859450340271, 1.9059534072875977, 1.9600474834442139]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 14.0, 12.0, 4.0, 7.0, 9.0, 20.0, 15.0, 15.0, 21.0, 20.0, 38.0, 21.0, 32.0, 28.0, 28.0, 35.0, 37.0, 38.0, 42.0, 44.0, 29.0, 30.0, 35.0, 37.0, 34.0, 27.0, 29.0, 34.0, 34.0, 22.0, 25.0, 23.0, 23.0, 20.0, 11.0, 15.0, 16.0, 17.0, 16.0, 6.0, 6.0, 4.0, 8.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.111849308013916, -1.0768101215362549, -1.0417709350585938, -1.0067317485809326, -0.9716925621032715, -0.9366533756256104, -0.9016141295433044, -0.8665749430656433, -0.8315357565879822, -0.796496570110321, -0.7614573836326599, -0.7264181971549988, -0.6913789510726929, -0.6563397645950317, -0.6213005781173706, -0.5862613916397095, -0.5512222051620483, -0.5161830186843872, -0.4811438322067261, -0.44610461592674255, -0.4110654294490814, -0.3760262429714203, -0.34098702669143677, -0.30594784021377563, -0.2709086537361145, -0.23586946725845337, -0.20083026587963104, -0.16579106450080872, -0.13075187802314758, -0.09571269154548645, -0.060673490166664124, -0.025634288787841797, 0.009405016899108887, 0.044444210827350616, 0.07948340475559235, 0.11452259868383408, 0.1495617926120758, 0.18460097908973694, 0.21964018046855927, 0.2546793818473816, 0.2897185683250427, 0.32475775480270386, 0.359796941280365, 0.3948361575603485, 0.42987534403800964, 0.4649145305156708, 0.4999537467956543, 0.5349929332733154, 0.5700321197509766, 0.6050713062286377, 0.6401104927062988, 0.67514967918396, 0.7101888656616211, 0.7452280521392822, 0.7802672982215881, 0.8153064846992493, 0.8503456711769104, 0.8853848576545715, 0.9204240441322327, 0.9554632306098938, 0.9905024766921997, 1.0255416631698608, 1.060580849647522, 1.095620036125183, 1.1306592226028442]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 1.0, 10.0, 8.0, 15.0, 21.0, 24.0, 22.0, 54.0, 63.0, 88.0, 141.0, 198.0, 277.0, 439.0, 731.0, 1047.0, 1769.0, 2715.0, 4535.0, 7041.0, 11846.0, 19658.0, 32748.0, 53931.0, 87933.0, 135080.0, 176522.0, 173044.0, 127677.0, 82773.0, 50333.0, 30352.0, 18346.0, 11088.0, 6773.0, 4067.0, 2531.0, 1661.0, 1032.0, 662.0, 406.0, 300.0, 183.0, 128.0, 91.0, 45.0, 59.0, 29.0, 19.0, 11.0, 9.0, 10.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.416748046875, -0.40234375, -0.387939453125, -0.37353515625, -0.359130859375, -0.3447265625, -0.330322265625, -0.31591796875, -0.301513671875, -0.287109375, -0.272705078125, -0.25830078125, -0.243896484375, -0.2294921875, -0.215087890625, -0.20068359375, -0.186279296875, -0.171875, -0.157470703125, -0.14306640625, -0.128662109375, -0.1142578125, -0.099853515625, -0.08544921875, -0.071044921875, -0.056640625, -0.042236328125, -0.02783203125, -0.013427734375, 0.0009765625, 0.015380859375, 0.02978515625, 0.044189453125, 0.05859375, 0.072998046875, 0.08740234375, 0.101806640625, 0.1162109375, 0.130615234375, 0.14501953125, 0.159423828125, 0.173828125, 0.188232421875, 0.20263671875, 0.217041015625, 0.2314453125, 0.245849609375, 0.26025390625, 0.274658203125, 0.2890625, 0.303466796875, 0.31787109375, 0.332275390625, 0.3466796875, 0.361083984375, 0.37548828125, 0.389892578125, 0.404296875, 0.418701171875, 0.43310546875, 0.447509765625, 0.4619140625, 0.476318359375, 0.49072265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 3.0, 3.0, 11.0, 12.0, 14.0, 10.0, 16.0, 12.0, 18.0, 33.0, 23.0, 27.0, 36.0, 27.0, 27.0, 46.0, 35.0, 41.0, 43.0, 40.0, 38.0, 45.0, 30.0, 42.0, 42.0, 36.0, 31.0, 25.0, 32.0, 23.0, 31.0, 20.0, 24.0, 12.0, 19.0, 11.0, 13.0, 7.0, 13.0, 6.0, 2.0, 5.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2998046875, -1.2594757080078125, -1.219146728515625, -1.1788177490234375, -1.13848876953125, -1.0981597900390625, -1.057830810546875, -1.0175018310546875, -0.9771728515625, -0.9368438720703125, -0.896514892578125, -0.8561859130859375, -0.81585693359375, -0.7755279541015625, -0.735198974609375, -0.6948699951171875, -0.654541015625, -0.6142120361328125, -0.573883056640625, -0.5335540771484375, -0.49322509765625, -0.4528961181640625, -0.412567138671875, -0.3722381591796875, -0.3319091796875, -0.2915802001953125, -0.251251220703125, -0.2109222412109375, -0.17059326171875, -0.1302642822265625, -0.089935302734375, -0.0496063232421875, -0.00927734375, 0.0310516357421875, 0.071380615234375, 0.1117095947265625, 0.15203857421875, 0.1923675537109375, 0.232696533203125, 0.2730255126953125, 0.3133544921875, 0.3536834716796875, 0.394012451171875, 0.4343414306640625, 0.47467041015625, 0.5149993896484375, 0.555328369140625, 0.5956573486328125, 0.635986328125, 0.6763153076171875, 0.716644287109375, 0.7569732666015625, 0.79730224609375, 0.8376312255859375, 0.877960205078125, 0.9182891845703125, 0.9586181640625, 0.9989471435546875, 1.039276123046875, 1.0796051025390625, 1.11993408203125, 1.1602630615234375, 1.200592041015625, 1.2409210205078125, 1.28125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 7.0, 10.0, 10.0, 20.0, 36.0, 42.0, 66.0, 105.0, 174.0, 210.0, 367.0, 569.0, 1026.0, 1787.0, 3248.0, 6200.0, 11638.0, 23402.0, 47637.0, 96681.0, 184208.0, 259963.0, 198395.0, 106425.0, 52593.0, 25850.0, 12901.0, 6659.0, 3507.0, 1894.0, 1119.0, 631.0, 464.0, 264.0, 163.0, 99.0, 68.0, 48.0, 26.0, 20.0, 14.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6123046875, -0.593505859375, -0.57470703125, -0.555908203125, -0.537109375, -0.518310546875, -0.49951171875, -0.480712890625, -0.4619140625, -0.443115234375, -0.42431640625, -0.405517578125, -0.38671875, -0.367919921875, -0.34912109375, -0.330322265625, -0.3115234375, -0.292724609375, -0.27392578125, -0.255126953125, -0.236328125, -0.217529296875, -0.19873046875, -0.179931640625, -0.1611328125, -0.142333984375, -0.12353515625, -0.104736328125, -0.0859375, -0.067138671875, -0.04833984375, -0.029541015625, -0.0107421875, 0.008056640625, 0.02685546875, 0.045654296875, 0.064453125, 0.083251953125, 0.10205078125, 0.120849609375, 0.1396484375, 0.158447265625, 0.17724609375, 0.196044921875, 0.21484375, 0.233642578125, 0.25244140625, 0.271240234375, 0.2900390625, 0.308837890625, 0.32763671875, 0.346435546875, 0.365234375, 0.384033203125, 0.40283203125, 0.421630859375, 0.4404296875, 0.459228515625, 0.47802734375, 0.496826171875, 0.515625, 0.534423828125, 0.55322265625, 0.572021484375, 0.5908203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 10.0, 14.0, 12.0, 7.0, 17.0, 19.0, 17.0, 26.0, 31.0, 35.0, 34.0, 29.0, 32.0, 39.0, 34.0, 40.0, 41.0, 42.0, 47.0, 42.0, 37.0, 44.0, 51.0, 30.0, 34.0, 34.0, 32.0, 23.0, 18.0, 17.0, 17.0, 21.0, 16.0, 11.0, 7.0, 14.0, 2.0, 7.0, 5.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7228012084960938, -0.6951141357421875, -0.6674270629882812, -0.639739990234375, -0.6120529174804688, -0.5843658447265625, -0.5566787719726562, -0.52899169921875, -0.5013046264648438, -0.4736175537109375, -0.44593048095703125, -0.418243408203125, -0.39055633544921875, -0.3628692626953125, -0.33518218994140625, -0.3074951171875, -0.27980804443359375, -0.2521209716796875, -0.22443389892578125, -0.196746826171875, -0.16905975341796875, -0.1413726806640625, -0.11368560791015625, -0.08599853515625, -0.05831146240234375, -0.0306243896484375, -0.00293731689453125, 0.024749755859375, 0.05243682861328125, 0.0801239013671875, 0.10781097412109375, 0.135498046875, 0.16318511962890625, 0.1908721923828125, 0.21855926513671875, 0.246246337890625, 0.27393341064453125, 0.3016204833984375, 0.32930755615234375, 0.35699462890625, 0.38468170166015625, 0.4123687744140625, 0.44005584716796875, 0.467742919921875, 0.49542999267578125, 0.5231170654296875, 0.5508041381835938, 0.5784912109375, 0.6061782836914062, 0.6338653564453125, 0.6615524291992188, 0.689239501953125, 0.7169265747070312, 0.7446136474609375, 0.7723007202148438, 0.79998779296875, 0.8276748657226562, 0.8553619384765625, 0.8830490112304688, 0.910736083984375, 0.9384231567382812, 0.9661102294921875, 0.9937973022460938, 1.021484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 11.0, 18.0, 21.0, 29.0, 32.0, 45.0, 78.0, 123.0, 131.0, 184.0, 244.0, 346.0, 439.0, 569.0, 871.0, 1205.0, 1694.0, 2662.0, 3800.0, 5977.0, 9812.0, 16993.0, 31692.0, 65999.0, 149403.0, 301991.0, 238409.0, 105710.0, 48787.0, 24321.0, 13262.0, 8045.0, 5030.0, 3163.0, 2192.0, 1452.0, 1065.0, 732.0, 555.0, 368.0, 308.0, 209.0, 185.0, 84.0, 92.0, 64.0, 43.0, 29.0, 26.0, 19.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0], "bins": [-0.2322998046875, -0.22542572021484375, -0.2185516357421875, -0.21167755126953125, -0.204803466796875, -0.19792938232421875, -0.1910552978515625, -0.18418121337890625, -0.17730712890625, -0.17043304443359375, -0.1635589599609375, -0.15668487548828125, -0.149810791015625, -0.14293670654296875, -0.1360626220703125, -0.12918853759765625, -0.122314453125, -0.11544036865234375, -0.1085662841796875, -0.10169219970703125, -0.094818115234375, -0.08794403076171875, -0.0810699462890625, -0.07419586181640625, -0.06732177734375, -0.06044769287109375, -0.0535736083984375, -0.04669952392578125, -0.039825439453125, -0.03295135498046875, -0.0260772705078125, -0.01920318603515625, -0.0123291015625, -0.00545501708984375, 0.0014190673828125, 0.00829315185546875, 0.015167236328125, 0.02204132080078125, 0.0289154052734375, 0.03578948974609375, 0.04266357421875, 0.04953765869140625, 0.0564117431640625, 0.06328582763671875, 0.070159912109375, 0.07703399658203125, 0.0839080810546875, 0.09078216552734375, 0.09765625, 0.10453033447265625, 0.1114044189453125, 0.11827850341796875, 0.125152587890625, 0.13202667236328125, 0.1389007568359375, 0.14577484130859375, 0.15264892578125, 0.15952301025390625, 0.1663970947265625, 0.17327117919921875, 0.180145263671875, 0.18701934814453125, 0.1938934326171875, 0.20076751708984375, 0.2076416015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 9.0, 13.0, 5.0, 13.0, 19.0, 15.0, 26.0, 30.0, 31.0, 39.0, 70.0, 64.0, 76.0, 85.0, 82.0, 72.0, 78.0, 62.0, 53.0, 24.0, 27.0, 24.0, 15.0, 17.0, 10.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.2709369659423828e-05, -2.2079795598983765e-05, -2.14502215385437e-05, -2.0820647478103638e-05, -2.0191073417663574e-05, -1.956149935722351e-05, -1.8931925296783447e-05, -1.8302351236343384e-05, -1.767277717590332e-05, -1.7043203115463257e-05, -1.6413629055023193e-05, -1.578405499458313e-05, -1.5154480934143066e-05, -1.4524906873703003e-05, -1.389533281326294e-05, -1.3265758752822876e-05, -1.2636184692382812e-05, -1.2006610631942749e-05, -1.1377036571502686e-05, -1.0747462511062622e-05, -1.0117888450622559e-05, -9.488314390182495e-06, -8.858740329742432e-06, -8.229166269302368e-06, -7.599592208862305e-06, -6.970018148422241e-06, -6.340444087982178e-06, -5.710870027542114e-06, -5.081295967102051e-06, -4.451721906661987e-06, -3.822147846221924e-06, -3.1925737857818604e-06, -2.562999725341797e-06, -1.9334256649017334e-06, -1.30385160446167e-06, -6.742775440216064e-07, -4.470348358154297e-08, 5.848705768585205e-07, 1.214444637298584e-06, 1.8440186977386475e-06, 2.473592758178711e-06, 3.1031668186187744e-06, 3.732740879058838e-06, 4.362314939498901e-06, 4.991888999938965e-06, 5.621463060379028e-06, 6.251037120819092e-06, 6.880611181259155e-06, 7.510185241699219e-06, 8.139759302139282e-06, 8.769333362579346e-06, 9.39890742301941e-06, 1.0028481483459473e-05, 1.0658055543899536e-05, 1.12876296043396e-05, 1.1917203664779663e-05, 1.2546777725219727e-05, 1.317635178565979e-05, 1.3805925846099854e-05, 1.4435499906539917e-05, 1.506507396697998e-05, 1.5694648027420044e-05, 1.6324222087860107e-05, 1.695379614830017e-05, 1.7583370208740234e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 3.0, 18.0, 12.0, 25.0, 32.0, 40.0, 72.0, 115.0, 160.0, 248.0, 414.0, 642.0, 935.0, 1456.0, 2144.0, 3403.0, 5216.0, 8202.0, 13302.0, 21351.0, 34753.0, 58266.0, 99458.0, 161448.0, 206357.0, 166801.0, 104936.0, 61770.0, 36595.0, 22115.0, 13847.0, 8758.0, 5522.0, 3507.0, 2361.0, 1517.0, 1005.0, 611.0, 377.0, 267.0, 154.0, 114.0, 73.0, 40.0, 38.0, 21.0, 28.0, 7.0, 7.0, 10.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.2200927734375, -0.21372222900390625, -0.2073516845703125, -0.20098114013671875, -0.194610595703125, -0.18824005126953125, -0.1818695068359375, -0.17549896240234375, -0.16912841796875, -0.16275787353515625, -0.1563873291015625, -0.15001678466796875, -0.143646240234375, -0.13727569580078125, -0.1309051513671875, -0.12453460693359375, -0.1181640625, -0.11179351806640625, -0.1054229736328125, -0.09905242919921875, -0.092681884765625, -0.08631134033203125, -0.0799407958984375, -0.07357025146484375, -0.06719970703125, -0.06082916259765625, -0.0544586181640625, -0.04808807373046875, -0.041717529296875, -0.03534698486328125, -0.0289764404296875, -0.02260589599609375, -0.0162353515625, -0.00986480712890625, -0.0034942626953125, 0.00287628173828125, 0.009246826171875, 0.01561737060546875, 0.0219879150390625, 0.02835845947265625, 0.03472900390625, 0.04109954833984375, 0.0474700927734375, 0.05384063720703125, 0.060211181640625, 0.06658172607421875, 0.0729522705078125, 0.07932281494140625, 0.085693359375, 0.09206390380859375, 0.0984344482421875, 0.10480499267578125, 0.111175537109375, 0.11754608154296875, 0.1239166259765625, 0.13028717041015625, 0.13665771484375, 0.14302825927734375, 0.1493988037109375, 0.15576934814453125, 0.162139892578125, 0.16851043701171875, 0.1748809814453125, 0.18125152587890625, 0.1876220703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 6.0, 14.0, 12.0, 14.0, 26.0, 34.0, 25.0, 36.0, 58.0, 62.0, 73.0, 79.0, 84.0, 93.0, 54.0, 63.0, 51.0, 29.0, 42.0, 37.0, 29.0, 17.0, 16.0, 7.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0675048828125, -0.0648794174194336, -0.06225395202636719, -0.05962848663330078, -0.057003021240234375, -0.05437755584716797, -0.05175209045410156, -0.049126625061035156, -0.04650115966796875, -0.043875694274902344, -0.04125022888183594, -0.03862476348876953, -0.035999298095703125, -0.03337383270263672, -0.030748367309570312, -0.028122901916503906, -0.0254974365234375, -0.022871971130371094, -0.020246505737304688, -0.01762104034423828, -0.014995574951171875, -0.012370109558105469, -0.009744644165039062, -0.007119178771972656, -0.00449371337890625, -0.0018682479858398438, 0.0007572174072265625, 0.0033826828002929688, 0.006008148193359375, 0.008633613586425781, 0.011259078979492188, 0.013884544372558594, 0.016510009765625, 0.019135475158691406, 0.021760940551757812, 0.02438640594482422, 0.027011871337890625, 0.02963733673095703, 0.03226280212402344, 0.034888267517089844, 0.03751373291015625, 0.040139198303222656, 0.04276466369628906, 0.04539012908935547, 0.048015594482421875, 0.05064105987548828, 0.05326652526855469, 0.055891990661621094, 0.0585174560546875, 0.061142921447753906, 0.06376838684082031, 0.06639385223388672, 0.06901931762695312, 0.07164478302001953, 0.07427024841308594, 0.07689571380615234, 0.07952117919921875, 0.08214664459228516, 0.08477210998535156, 0.08739757537841797, 0.09002304077148438, 0.09264850616455078, 0.09527397155761719, 0.0978994369506836, 0.10052490234375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 10.0, 11.0, 11.0, 19.0, 22.0, 29.0, 35.0, 22.0, 51.0, 42.0, 63.0, 50.0, 69.0, 59.0, 54.0, 65.0, 42.0, 47.0, 49.0, 36.0, 25.0, 34.0, 28.0, 21.0, 16.0, 18.0, 10.0, 11.0, 2.0, 4.0, 3.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4869941473007202, -1.433651328086853, -1.3803086280822754, -1.3269658088684082, -1.273622989654541, -1.2202801704406738, -1.1669373512268066, -1.113594651222229, -1.0602518320083618, -1.0069090127944946, -0.9535662531852722, -0.9002234935760498, -0.8468806743621826, -0.7935378551483154, -0.740195095539093, -0.6868523359298706, -0.6335095167160034, -0.5801666975021362, -0.5268239378929138, -0.473481148481369, -0.4201383590698242, -0.3667955696582794, -0.3134527802467346, -0.2601099908351898, -0.20676720142364502, -0.15342441201210022, -0.10008162260055542, -0.04673883318901062, 0.00660395622253418, 0.05994674563407898, 0.11328953504562378, 0.16663232445716858, 0.21997511386871338, 0.2733179032802582, 0.326660692691803, 0.3800034821033478, 0.4333462715148926, 0.4866890609264374, 0.5400318503379822, 0.5933746099472046, 0.6467174291610718, 0.700060248374939, 0.7534030079841614, 0.8067457675933838, 0.860088586807251, 0.9134314060211182, 0.9667741656303406, 1.020116925239563, 1.0734597444534302, 1.1268025636672974, 1.180145263671875, 1.2334880828857422, 1.2868309020996094, 1.3401737213134766, 1.3935165405273438, 1.4468592405319214, 1.5002020597457886, 1.5535448789596558, 1.6068875789642334, 1.6602303981781006, 1.7135732173919678, 1.766916036605835, 1.8202588558197021, 1.8736015558242798, 1.926944375038147]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 4.0, 12.0, 13.0, 5.0, 8.0, 7.0, 17.0, 17.0, 19.0, 17.0, 24.0, 28.0, 29.0, 26.0, 30.0, 36.0, 35.0, 33.0, 40.0, 43.0, 30.0, 45.0, 29.0, 37.0, 36.0, 32.0, 22.0, 34.0, 33.0, 36.0, 23.0, 21.0, 26.0, 21.0, 17.0, 16.0, 12.0, 23.0, 10.0, 16.0, 7.0, 5.0, 7.0, 2.0, 5.0, 2.0, 8.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.1195793151855469, -1.0842653512954712, -1.048951506614685, -1.0136375427246094, -0.9783235788345337, -0.9430096745491028, -0.9076957702636719, -0.8723818063735962, -0.8370679020881653, -0.8017539978027344, -0.7664400339126587, -0.7311261296272278, -0.6958122253417969, -0.6604982614517212, -0.6251843571662903, -0.5898704528808594, -0.5545564889907837, -0.5192425847053528, -0.4839286208152771, -0.4486147165298462, -0.4133007824420929, -0.3779868483543396, -0.3426729440689087, -0.3073590099811554, -0.2720450758934021, -0.2367311418056488, -0.2014172226190567, -0.1661033034324646, -0.1307893693447113, -0.09547543525695801, -0.060161516070365906, -0.024847596883773804, 0.010466217994689941, 0.04578014463186264, 0.08109407126903534, 0.11640799790620804, 0.15172192454338074, 0.18703585863113403, 0.22234977781772614, 0.25766369700431824, 0.29297763109207153, 0.32829156517982483, 0.3636054992675781, 0.39891940355300903, 0.43423333764076233, 0.4695472717285156, 0.5048611760139465, 0.5401750802993774, 0.5754890441894531, 0.610802948474884, 0.6461169123649597, 0.6814308166503906, 0.7167447805404663, 0.7520586848258972, 0.7873725891113281, 0.8226865530014038, 0.8580004572868347, 0.8933143615722656, 0.9286283254623413, 0.9639422297477722, 0.9992561340332031, 1.0345700979232788, 1.0698840618133545, 1.1051979064941406, 1.1405118703842163]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 7.0, 4.0, 9.0, 9.0, 21.0, 23.0, 26.0, 35.0, 58.0, 78.0, 145.0, 182.0, 279.0, 420.0, 617.0, 833.0, 1273.0, 1946.0, 2980.0, 4437.0, 6468.0, 9511.0, 14122.0, 20150.0, 28597.0, 39687.0, 52228.0, 67427.0, 81790.0, 93884.0, 100042.0, 99973.0, 92837.0, 81267.0, 66285.0, 51557.0, 38564.0, 28347.0, 19676.0, 13907.0, 9248.0, 6521.0, 4258.0, 2877.0, 1954.0, 1284.0, 899.0, 561.0, 425.0, 268.0, 168.0, 130.0, 77.0, 68.0, 40.0, 37.0, 20.0, 12.0, 11.0, 10.0, 2.0, 0.0, 2.0], "bins": [-0.9580078125, -0.9280471801757812, -0.8980865478515625, -0.8681259155273438, -0.838165283203125, -0.8082046508789062, -0.7782440185546875, -0.7482833862304688, -0.71832275390625, -0.6883621215820312, -0.6584014892578125, -0.6284408569335938, -0.598480224609375, -0.5685195922851562, -0.5385589599609375, -0.5085983276367188, -0.4786376953125, -0.44867706298828125, -0.4187164306640625, -0.38875579833984375, -0.358795166015625, -0.32883453369140625, -0.2988739013671875, -0.26891326904296875, -0.23895263671875, -0.20899200439453125, -0.1790313720703125, -0.14907073974609375, -0.119110107421875, -0.08914947509765625, -0.0591888427734375, -0.02922821044921875, 0.000732421875, 0.03069305419921875, 0.0606536865234375, 0.09061431884765625, 0.120574951171875, 0.15053558349609375, 0.1804962158203125, 0.21045684814453125, 0.24041748046875, 0.27037811279296875, 0.3003387451171875, 0.33029937744140625, 0.360260009765625, 0.39022064208984375, 0.4201812744140625, 0.45014190673828125, 0.4801025390625, 0.5100631713867188, 0.5400238037109375, 0.5699844360351562, 0.599945068359375, 0.6299057006835938, 0.6598663330078125, 0.6898269653320312, 0.71978759765625, 0.7497482299804688, 0.7797088623046875, 0.8096694946289062, 0.839630126953125, 0.8695907592773438, 0.8995513916015625, 0.9295120239257812, 0.95947265625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 9.0, 15.0, 9.0, 14.0, 18.0, 16.0, 18.0, 32.0, 18.0, 27.0, 27.0, 35.0, 32.0, 39.0, 38.0, 42.0, 42.0, 35.0, 45.0, 34.0, 30.0, 40.0, 39.0, 31.0, 31.0, 29.0, 32.0, 36.0, 20.0, 22.0, 28.0, 14.0, 24.0, 15.0, 13.0, 6.0, 7.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.271484375, -1.2323455810546875, -1.193206787109375, -1.1540679931640625, -1.11492919921875, -1.0757904052734375, -1.036651611328125, -0.9975128173828125, -0.9583740234375, -0.9192352294921875, -0.880096435546875, -0.8409576416015625, -0.80181884765625, -0.7626800537109375, -0.723541259765625, -0.6844024658203125, -0.645263671875, -0.6061248779296875, -0.566986083984375, -0.5278472900390625, -0.48870849609375, -0.4495697021484375, -0.410430908203125, -0.3712921142578125, -0.3321533203125, -0.2930145263671875, -0.253875732421875, -0.2147369384765625, -0.17559814453125, -0.1364593505859375, -0.097320556640625, -0.0581817626953125, -0.01904296875, 0.0200958251953125, 0.059234619140625, 0.0983734130859375, 0.13751220703125, 0.1766510009765625, 0.215789794921875, 0.2549285888671875, 0.2940673828125, 0.3332061767578125, 0.372344970703125, 0.4114837646484375, 0.45062255859375, 0.4897613525390625, 0.528900146484375, 0.5680389404296875, 0.607177734375, 0.6463165283203125, 0.685455322265625, 0.7245941162109375, 0.76373291015625, 0.8028717041015625, 0.842010498046875, 0.8811492919921875, 0.9202880859375, 0.9594268798828125, 0.998565673828125, 1.0377044677734375, 1.07684326171875, 1.1159820556640625, 1.155120849609375, 1.1942596435546875, 1.2333984375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 10.0, 8.0, 11.0, 22.0, 29.0, 68.0, 67.0, 119.0, 184.0, 317.0, 494.0, 762.0, 1152.0, 2022.0, 3092.0, 4905.0, 8088.0, 12717.0, 20001.0, 30216.0, 44584.0, 62767.0, 83348.0, 102451.0, 116277.0, 118908.0, 110914.0, 93998.0, 73122.0, 53166.0, 37010.0, 24681.0, 15944.0, 10088.0, 6514.0, 3982.0, 2479.0, 1537.0, 959.0, 526.0, 366.0, 207.0, 155.0, 102.0, 67.0, 40.0, 28.0, 19.0, 9.0, 14.0, 6.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.1669921875, -1.13189697265625, -1.0968017578125, -1.06170654296875, -1.026611328125, -0.99151611328125, -0.9564208984375, -0.92132568359375, -0.88623046875, -0.85113525390625, -0.8160400390625, -0.78094482421875, -0.745849609375, -0.71075439453125, -0.6756591796875, -0.64056396484375, -0.60546875, -0.57037353515625, -0.5352783203125, -0.50018310546875, -0.465087890625, -0.42999267578125, -0.3948974609375, -0.35980224609375, -0.32470703125, -0.28961181640625, -0.2545166015625, -0.21942138671875, -0.184326171875, -0.14923095703125, -0.1141357421875, -0.07904052734375, -0.0439453125, -0.00885009765625, 0.0262451171875, 0.06134033203125, 0.096435546875, 0.13153076171875, 0.1666259765625, 0.20172119140625, 0.23681640625, 0.27191162109375, 0.3070068359375, 0.34210205078125, 0.377197265625, 0.41229248046875, 0.4473876953125, 0.48248291015625, 0.517578125, 0.55267333984375, 0.5877685546875, 0.62286376953125, 0.657958984375, 0.69305419921875, 0.7281494140625, 0.76324462890625, 0.79833984375, 0.83343505859375, 0.8685302734375, 0.90362548828125, 0.938720703125, 0.97381591796875, 1.0089111328125, 1.04400634765625, 1.0791015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 8.0, 11.0, 11.0, 8.0, 17.0, 23.0, 19.0, 23.0, 29.0, 28.0, 30.0, 29.0, 28.0, 31.0, 34.0, 40.0, 48.0, 45.0, 29.0, 33.0, 38.0, 35.0, 42.0, 32.0, 40.0, 26.0, 29.0, 29.0, 31.0, 19.0, 22.0, 13.0, 16.0, 16.0, 13.0, 17.0, 3.0, 14.0, 11.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.701171875, -0.6784591674804688, -0.6557464599609375, -0.6330337524414062, -0.610321044921875, -0.5876083374023438, -0.5648956298828125, -0.5421829223632812, -0.51947021484375, -0.49675750732421875, -0.4740447998046875, -0.45133209228515625, -0.428619384765625, -0.40590667724609375, -0.3831939697265625, -0.36048126220703125, -0.3377685546875, -0.31505584716796875, -0.2923431396484375, -0.26963043212890625, -0.246917724609375, -0.22420501708984375, -0.2014923095703125, -0.17877960205078125, -0.15606689453125, -0.13335418701171875, -0.1106414794921875, -0.08792877197265625, -0.065216064453125, -0.04250335693359375, -0.0197906494140625, 0.00292205810546875, 0.025634765625, 0.04834747314453125, 0.0710601806640625, 0.09377288818359375, 0.116485595703125, 0.13919830322265625, 0.1619110107421875, 0.18462371826171875, 0.20733642578125, 0.23004913330078125, 0.2527618408203125, 0.27547454833984375, 0.298187255859375, 0.32089996337890625, 0.3436126708984375, 0.36632537841796875, 0.3890380859375, 0.41175079345703125, 0.4344635009765625, 0.45717620849609375, 0.479888916015625, 0.5026016235351562, 0.5253143310546875, 0.5480270385742188, 0.57073974609375, 0.5934524536132812, 0.6161651611328125, 0.6388778686523438, 0.661590576171875, 0.6843032836914062, 0.7070159912109375, 0.7297286987304688, 0.75244140625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 3.0, 9.0, 7.0, 13.0, 16.0, 29.0, 39.0, 43.0, 82.0, 137.0, 235.0, 319.0, 584.0, 978.0, 1580.0, 2731.0, 4820.0, 8641.0, 16403.0, 31157.0, 58939.0, 107061.0, 169935.0, 206219.0, 179453.0, 117424.0, 66069.0, 34905.0, 18197.0, 9790.0, 5309.0, 2977.0, 1718.0, 1037.0, 649.0, 366.0, 227.0, 145.0, 88.0, 66.0, 43.0, 32.0, 20.0, 18.0, 11.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.98583984375, -0.95733642578125, -0.9288330078125, -0.90032958984375, -0.871826171875, -0.84332275390625, -0.8148193359375, -0.78631591796875, -0.7578125, -0.72930908203125, -0.7008056640625, -0.67230224609375, -0.643798828125, -0.61529541015625, -0.5867919921875, -0.55828857421875, -0.52978515625, -0.50128173828125, -0.4727783203125, -0.44427490234375, -0.415771484375, -0.38726806640625, -0.3587646484375, -0.33026123046875, -0.3017578125, -0.27325439453125, -0.2447509765625, -0.21624755859375, -0.187744140625, -0.15924072265625, -0.1307373046875, -0.10223388671875, -0.07373046875, -0.04522705078125, -0.0167236328125, 0.01177978515625, 0.040283203125, 0.06878662109375, 0.0972900390625, 0.12579345703125, 0.154296875, 0.18280029296875, 0.2113037109375, 0.23980712890625, 0.268310546875, 0.29681396484375, 0.3253173828125, 0.35382080078125, 0.38232421875, 0.41082763671875, 0.4393310546875, 0.46783447265625, 0.496337890625, 0.52484130859375, 0.5533447265625, 0.58184814453125, 0.6103515625, 0.63885498046875, 0.6673583984375, 0.69586181640625, 0.724365234375, 0.75286865234375, 0.7813720703125, 0.80987548828125, 0.83837890625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 8.0, 20.0, 14.0, 20.0, 22.0, 32.0, 29.0, 37.0, 50.0, 51.0, 50.0, 70.0, 48.0, 48.0, 61.0, 46.0, 69.0, 51.0, 41.0, 33.0, 38.0, 27.0, 18.0, 13.0, 19.0, 12.0, 14.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.426738739013672e-05, -7.211044430732727e-05, -6.995350122451782e-05, -6.779655814170837e-05, -6.563961505889893e-05, -6.348267197608948e-05, -6.132572889328003e-05, -5.916878581047058e-05, -5.701184272766113e-05, -5.4854899644851685e-05, -5.2697956562042236e-05, -5.054101347923279e-05, -4.838407039642334e-05, -4.622712731361389e-05, -4.407018423080444e-05, -4.1913241147994995e-05, -3.975629806518555e-05, -3.75993549823761e-05, -3.544241189956665e-05, -3.32854688167572e-05, -3.1128525733947754e-05, -2.8971582651138306e-05, -2.6814639568328857e-05, -2.465769648551941e-05, -2.250075340270996e-05, -2.0343810319900513e-05, -1.8186867237091064e-05, -1.6029924154281616e-05, -1.3872981071472168e-05, -1.171603798866272e-05, -9.559094905853271e-06, -7.402151823043823e-06, -5.245208740234375e-06, -3.0882656574249268e-06, -9.313225746154785e-07, 1.2256205081939697e-06, 3.382563591003418e-06, 5.539506673812866e-06, 7.696449756622314e-06, 9.853392839431763e-06, 1.2010335922241211e-05, 1.416727900505066e-05, 1.6324222087860107e-05, 1.8481165170669556e-05, 2.0638108253479004e-05, 2.2795051336288452e-05, 2.49519944190979e-05, 2.710893750190735e-05, 2.9265880584716797e-05, 3.1422823667526245e-05, 3.357976675033569e-05, 3.573670983314514e-05, 3.789365291595459e-05, 4.005059599876404e-05, 4.2207539081573486e-05, 4.4364482164382935e-05, 4.652142524719238e-05, 4.867836833000183e-05, 5.083531141281128e-05, 5.299225449562073e-05, 5.5149197578430176e-05, 5.7306140661239624e-05, 5.946308374404907e-05, 6.162002682685852e-05, 6.377696990966797e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 12.0, 15.0, 23.0, 36.0, 44.0, 74.0, 99.0, 142.0, 203.0, 282.0, 478.0, 713.0, 1120.0, 1600.0, 2595.0, 3883.0, 6021.0, 9513.0, 15378.0, 24343.0, 37686.0, 56452.0, 82289.0, 110634.0, 132661.0, 137119.0, 123755.0, 98314.0, 70054.0, 47818.0, 30862.0, 19866.0, 12479.0, 7609.0, 5040.0, 3219.0, 2080.0, 1329.0, 904.0, 634.0, 387.0, 257.0, 175.0, 117.0, 75.0, 63.0, 32.0, 24.0, 13.0, 12.0, 7.0, 12.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.59130859375, -0.5724029541015625, -0.553497314453125, -0.5345916748046875, -0.51568603515625, -0.4967803955078125, -0.477874755859375, -0.4589691162109375, -0.4400634765625, -0.4211578369140625, -0.402252197265625, -0.3833465576171875, -0.36444091796875, -0.3455352783203125, -0.326629638671875, -0.3077239990234375, -0.288818359375, -0.2699127197265625, -0.251007080078125, -0.2321014404296875, -0.21319580078125, -0.1942901611328125, -0.175384521484375, -0.1564788818359375, -0.1375732421875, -0.1186676025390625, -0.099761962890625, -0.0808563232421875, -0.06195068359375, -0.0430450439453125, -0.024139404296875, -0.0052337646484375, 0.013671875, 0.0325775146484375, 0.051483154296875, 0.0703887939453125, 0.08929443359375, 0.1082000732421875, 0.127105712890625, 0.1460113525390625, 0.1649169921875, 0.1838226318359375, 0.202728271484375, 0.2216339111328125, 0.24053955078125, 0.2594451904296875, 0.278350830078125, 0.2972564697265625, 0.316162109375, 0.3350677490234375, 0.353973388671875, 0.3728790283203125, 0.39178466796875, 0.4106903076171875, 0.429595947265625, 0.4485015869140625, 0.4674072265625, 0.4863128662109375, 0.505218505859375, 0.5241241455078125, 0.54302978515625, 0.5619354248046875, 0.580841064453125, 0.5997467041015625, 0.61865234375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 9.0, 3.0, 10.0, 7.0, 6.0, 5.0, 12.0, 18.0, 18.0, 29.0, 26.0, 26.0, 40.0, 30.0, 51.0, 35.0, 58.0, 45.0, 55.0, 52.0, 60.0, 53.0, 48.0, 51.0, 38.0, 40.0, 39.0, 19.0, 19.0, 23.0, 13.0, 16.0, 10.0, 11.0, 10.0, 4.0, 8.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2357177734375, -0.22766685485839844, -0.21961593627929688, -0.2115650177001953, -0.20351409912109375, -0.1954631805419922, -0.18741226196289062, -0.17936134338378906, -0.1713104248046875, -0.16325950622558594, -0.15520858764648438, -0.1471576690673828, -0.13910675048828125, -0.1310558319091797, -0.12300491333007812, -0.11495399475097656, -0.106903076171875, -0.09885215759277344, -0.09080123901367188, -0.08275032043457031, -0.07469940185546875, -0.06664848327636719, -0.058597564697265625, -0.05054664611816406, -0.0424957275390625, -0.03444480895996094, -0.026393890380859375, -0.018342971801757812, -0.01029205322265625, -0.0022411346435546875, 0.005809783935546875, 0.013860702514648438, 0.02191162109375, 0.029962539672851562, 0.038013458251953125, 0.04606437683105469, 0.05411529541015625, 0.06216621398925781, 0.07021713256835938, 0.07826805114746094, 0.0863189697265625, 0.09436988830566406, 0.10242080688476562, 0.11047172546386719, 0.11852264404296875, 0.1265735626220703, 0.13462448120117188, 0.14267539978027344, 0.150726318359375, 0.15877723693847656, 0.16682815551757812, 0.1748790740966797, 0.18292999267578125, 0.1909809112548828, 0.19903182983398438, 0.20708274841308594, 0.2151336669921875, 0.22318458557128906, 0.23123550415039062, 0.2392864227294922, 0.24733734130859375, 0.2553882598876953, 0.2634391784667969, 0.27149009704589844, 0.279541015625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 9.0, 5.0, 6.0, 7.0, 16.0, 15.0, 21.0, 23.0, 38.0, 29.0, 47.0, 48.0, 44.0, 52.0, 50.0, 56.0, 71.0, 50.0, 58.0, 47.0, 43.0, 42.0, 35.0, 32.0, 27.0, 22.0, 22.0, 16.0, 13.0, 5.0, 12.0, 7.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4840911626815796, -1.4314384460449219, -1.3787857294082642, -1.3261330127716064, -1.2734804153442383, -1.2208276987075806, -1.1681749820709229, -1.1155222654342651, -1.0628695487976074, -1.0102168321609497, -0.9575641751289368, -0.904911458492279, -0.8522588014602661, -0.7996060848236084, -0.7469533681869507, -0.694300651550293, -0.6416480541229248, -0.5889953374862671, -0.5363426804542542, -0.48368996381759644, -0.4310372769832611, -0.3783845901489258, -0.32573187351226807, -0.27307918667793274, -0.2204264998435974, -0.16777381300926208, -0.11512111127376556, -0.06246840953826904, -0.009815722703933716, 0.04283696413040161, 0.09548968076705933, 0.14814236760139465, 0.20079493522644043, 0.25344762206077576, 0.3061003088951111, 0.3587530255317688, 0.4114057123661041, 0.46405839920043945, 0.5167111158370972, 0.5693638324737549, 0.6220164895057678, 0.6746692061424255, 0.7273218631744385, 0.7799745798110962, 0.8326272964477539, 0.8852799534797668, 0.9379326701164246, 0.9905853271484375, 1.0432380437850952, 1.095890760421753, 1.1485434770584106, 1.2011961936950684, 1.2538487911224365, 1.3065015077590942, 1.359154224395752, 1.4118069410324097, 1.4644596576690674, 1.517112374305725, 1.5697650909423828, 1.622417688369751, 1.6750704050064087, 1.7277231216430664, 1.7803758382797241, 1.8330285549163818, 1.88568115234375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 17.0, 8.0, 13.0, 18.0, 16.0, 12.0, 27.0, 26.0, 29.0, 25.0, 37.0, 28.0, 26.0, 41.0, 37.0, 37.0, 37.0, 42.0, 36.0, 30.0, 32.0, 38.0, 39.0, 31.0, 26.0, 25.0, 30.0, 23.0, 27.0, 26.0, 17.0, 14.0, 14.0, 13.0, 13.0, 11.0, 12.0, 15.0, 4.0, 6.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0], "bins": [-1.2504222393035889, -1.2146520614624023, -1.1788820028305054, -1.1431118249893188, -1.1073417663574219, -1.0715715885162354, -1.0358015298843384, -1.0000313520431519, -0.9642612934112549, -0.9284911751747131, -0.8927210569381714, -0.8569509387016296, -0.8211808204650879, -0.7854107022285461, -0.7496405839920044, -0.7138704061508179, -0.6781002879142761, -0.6423301696777344, -0.6065600514411926, -0.5707899332046509, -0.5350198149681091, -0.4992496967315674, -0.46347954869270325, -0.4277094304561615, -0.39193931221961975, -0.356169193983078, -0.32039907574653625, -0.2846289277076721, -0.24885882437229156, -0.21308870613574982, -0.17731857299804688, -0.14154845476150513, -0.10577833652496338, -0.07000821828842163, -0.034238092601299286, 0.001532033085823059, 0.03730215132236481, 0.07307226955890656, 0.1088424026966095, 0.14461252093315125, 0.180382639169693, 0.21615275740623474, 0.2519228756427765, 0.2876930236816406, 0.3234631419181824, 0.3592332601547241, 0.39500337839126587, 0.4307734966278076, 0.46654361486434937, 0.5023137331008911, 0.5380838513374329, 0.5738539695739746, 0.6096240878105164, 0.6453942060470581, 0.6811643838882446, 0.7169344425201416, 0.7527046203613281, 0.7884747385978699, 0.8242448568344116, 0.8600149750709534, 0.8957850933074951, 0.9315552115440369, 0.9673253297805786, 1.0030955076217651, 1.038865566253662]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 27.0, 51.0, 55.0, 87.0, 141.0, 202.0, 342.0, 526.0, 773.0, 1209.0, 1954.0, 3154.0, 5054.0, 8268.0, 13544.0, 22511.0, 37272.0, 62087.0, 102599.0, 165864.0, 261436.0, 385996.0, 514907.0, 595147.0, 580517.0, 478583.0, 348549.0, 230901.0, 146224.0, 89542.0, 53929.0, 32804.0, 19336.0, 11745.0, 7175.0, 4370.0, 2751.0, 1632.0, 1050.0, 640.0, 454.0, 287.0, 210.0, 126.0, 83.0, 46.0, 35.0, 22.0, 13.0, 6.0, 9.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0], "bins": [-1.1181640625, -1.0819244384765625, -1.045684814453125, -1.0094451904296875, -0.97320556640625, -0.9369659423828125, -0.900726318359375, -0.8644866943359375, -0.8282470703125, -0.7920074462890625, -0.755767822265625, -0.7195281982421875, -0.68328857421875, -0.6470489501953125, -0.610809326171875, -0.5745697021484375, -0.538330078125, -0.5020904541015625, -0.465850830078125, -0.4296112060546875, -0.39337158203125, -0.3571319580078125, -0.320892333984375, -0.2846527099609375, -0.2484130859375, -0.2121734619140625, -0.175933837890625, -0.1396942138671875, -0.10345458984375, -0.0672149658203125, -0.030975341796875, 0.0052642822265625, 0.04150390625, 0.0777435302734375, 0.113983154296875, 0.1502227783203125, 0.18646240234375, 0.2227020263671875, 0.258941650390625, 0.2951812744140625, 0.3314208984375, 0.3676605224609375, 0.403900146484375, 0.4401397705078125, 0.47637939453125, 0.5126190185546875, 0.548858642578125, 0.5850982666015625, 0.621337890625, 0.6575775146484375, 0.693817138671875, 0.7300567626953125, 0.76629638671875, 0.8025360107421875, 0.838775634765625, 0.8750152587890625, 0.9112548828125, 0.9474945068359375, 0.983734130859375, 1.0199737548828125, 1.05621337890625, 1.0924530029296875, 1.128692626953125, 1.1649322509765625, 1.201171875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 3.0, 13.0, 10.0, 10.0, 11.0, 10.0, 17.0, 22.0, 17.0, 31.0, 25.0, 39.0, 40.0, 33.0, 28.0, 37.0, 26.0, 43.0, 40.0, 39.0, 29.0, 39.0, 39.0, 39.0, 26.0, 35.0, 31.0, 33.0, 25.0, 28.0, 16.0, 23.0, 23.0, 18.0, 11.0, 11.0, 12.0, 16.0, 11.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.86962890625, -0.842926025390625, -0.81622314453125, -0.789520263671875, -0.7628173828125, -0.736114501953125, -0.70941162109375, -0.682708740234375, -0.656005859375, -0.629302978515625, -0.60260009765625, -0.575897216796875, -0.5491943359375, -0.522491455078125, -0.49578857421875, -0.469085693359375, -0.4423828125, -0.415679931640625, -0.38897705078125, -0.362274169921875, -0.3355712890625, -0.308868408203125, -0.28216552734375, -0.255462646484375, -0.228759765625, -0.202056884765625, -0.17535400390625, -0.148651123046875, -0.1219482421875, -0.095245361328125, -0.06854248046875, -0.041839599609375, -0.01513671875, 0.011566162109375, 0.03826904296875, 0.064971923828125, 0.0916748046875, 0.118377685546875, 0.14508056640625, 0.171783447265625, 0.198486328125, 0.225189208984375, 0.25189208984375, 0.278594970703125, 0.3052978515625, 0.332000732421875, 0.35870361328125, 0.385406494140625, 0.412109375, 0.438812255859375, 0.46551513671875, 0.492218017578125, 0.5189208984375, 0.545623779296875, 0.57232666015625, 0.599029541015625, 0.625732421875, 0.652435302734375, 0.67913818359375, 0.705841064453125, 0.7325439453125, 0.759246826171875, 0.78594970703125, 0.812652587890625, 0.83935546875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 6.0, 2.0, 10.0, 18.0, 27.0, 53.0, 75.0, 140.0, 176.0, 299.0, 464.0, 772.0, 1244.0, 2035.0, 3147.0, 5348.0, 8621.0, 14054.0, 23110.0, 37565.0, 58740.0, 92549.0, 141389.0, 208076.0, 289879.0, 379392.0, 455817.0, 496042.0, 482191.0, 420586.0, 337083.0, 247941.0, 173525.0, 115371.0, 75168.0, 47425.0, 29394.0, 18006.0, 11169.0, 6637.0, 4120.0, 2539.0, 1571.0, 950.0, 580.0, 356.0, 231.0, 139.0, 93.0, 60.0, 42.0, 26.0, 20.0, 9.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.001953125, -0.9693756103515625, -0.936798095703125, -0.9042205810546875, -0.87164306640625, -0.8390655517578125, -0.806488037109375, -0.7739105224609375, -0.7413330078125, -0.7087554931640625, -0.676177978515625, -0.6436004638671875, -0.61102294921875, -0.5784454345703125, -0.545867919921875, -0.5132904052734375, -0.480712890625, -0.4481353759765625, -0.415557861328125, -0.3829803466796875, -0.35040283203125, -0.3178253173828125, -0.285247802734375, -0.2526702880859375, -0.2200927734375, -0.1875152587890625, -0.154937744140625, -0.1223602294921875, -0.08978271484375, -0.0572052001953125, -0.024627685546875, 0.0079498291015625, 0.04052734375, 0.0731048583984375, 0.105682373046875, 0.1382598876953125, 0.17083740234375, 0.2034149169921875, 0.235992431640625, 0.2685699462890625, 0.3011474609375, 0.3337249755859375, 0.366302490234375, 0.3988800048828125, 0.43145751953125, 0.4640350341796875, 0.496612548828125, 0.5291900634765625, 0.561767578125, 0.5943450927734375, 0.626922607421875, 0.6595001220703125, 0.69207763671875, 0.7246551513671875, 0.757232666015625, 0.7898101806640625, 0.8223876953125, 0.8549652099609375, 0.887542724609375, 0.9201202392578125, 0.95269775390625, 0.9852752685546875, 1.017852783203125, 1.0504302978515625, 1.0830078125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 8.0, 10.0, 21.0, 28.0, 31.0, 37.0, 62.0, 68.0, 64.0, 92.0, 124.0, 139.0, 153.0, 184.0, 233.0, 217.0, 261.0, 220.0, 245.0, 226.0, 217.0, 203.0, 190.0, 163.0, 163.0, 134.0, 131.0, 121.0, 73.0, 54.0, 43.0, 46.0, 23.0, 18.0, 19.0, 12.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5153656005859375, -0.499481201171875, -0.4835968017578125, -0.46771240234375, -0.4518280029296875, -0.435943603515625, -0.4200592041015625, -0.4041748046875, -0.3882904052734375, -0.372406005859375, -0.3565216064453125, -0.34063720703125, -0.3247528076171875, -0.308868408203125, -0.2929840087890625, -0.277099609375, -0.2612152099609375, -0.245330810546875, -0.2294464111328125, -0.21356201171875, -0.1976776123046875, -0.181793212890625, -0.1659088134765625, -0.1500244140625, -0.1341400146484375, -0.118255615234375, -0.1023712158203125, -0.08648681640625, -0.0706024169921875, -0.054718017578125, -0.0388336181640625, -0.02294921875, -0.0070648193359375, 0.008819580078125, 0.0247039794921875, 0.04058837890625, 0.0564727783203125, 0.072357177734375, 0.0882415771484375, 0.1041259765625, 0.1200103759765625, 0.135894775390625, 0.1517791748046875, 0.16766357421875, 0.1835479736328125, 0.199432373046875, 0.2153167724609375, 0.231201171875, 0.2470855712890625, 0.262969970703125, 0.2788543701171875, 0.29473876953125, 0.3106231689453125, 0.326507568359375, 0.3423919677734375, 0.3582763671875, 0.3741607666015625, 0.390045166015625, 0.4059295654296875, 0.42181396484375, 0.4376983642578125, 0.453582763671875, 0.4694671630859375, 0.4853515625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 9.0, 8.0, 18.0, 17.0, 25.0, 29.0, 38.0, 34.0, 45.0, 47.0, 45.0, 56.0, 63.0, 65.0, 61.0, 46.0, 63.0, 40.0, 35.0, 31.0, 29.0, 30.0, 31.0, 18.0, 23.0, 22.0, 7.0, 7.0, 10.0, 6.0, 3.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7404402494430542, -1.6902867555618286, -1.6401333808898926, -1.589979887008667, -1.5398263931274414, -1.4896728992462158, -1.4395195245742798, -1.3893660306930542, -1.3392125368118286, -1.289059042930603, -1.238905668258667, -1.1887521743774414, -1.1385986804962158, -1.0884451866149902, -1.0382918119430542, -0.9881383180618286, -0.9379848837852478, -0.887831449508667, -0.8376779556274414, -0.7875245213508606, -0.737371027469635, -0.6872175931930542, -0.6370640993118286, -0.5869106650352478, -0.536757230758667, -0.4866037666797638, -0.4364503026008606, -0.3862968683242798, -0.3361433744430542, -0.2859899401664734, -0.2358364760875702, -0.185683012008667, -0.1355295181274414, -0.08537605404853821, -0.03522259742021561, 0.014930859208106995, 0.06508432328701019, 0.1152377724647522, 0.1653912365436554, 0.2155447006225586, 0.2656981647014618, 0.315851628780365, 0.3660050928592682, 0.4161585569381714, 0.4663119912147522, 0.516465425491333, 0.5666189193725586, 0.6167724132537842, 0.666925847530365, 0.7170792818069458, 0.7672327756881714, 0.8173862099647522, 0.8675397038459778, 0.9176931381225586, 0.9678466320037842, 1.0180001258850098, 1.0681535005569458, 1.1183069944381714, 1.1684603691101074, 1.218613862991333, 1.2687673568725586, 1.3189208507537842, 1.3690742254257202, 1.4192277193069458, 1.4693812131881714]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 9.0, 12.0, 17.0, 19.0, 21.0, 29.0, 33.0, 31.0, 49.0, 32.0, 43.0, 33.0, 42.0, 45.0, 38.0, 41.0, 46.0, 48.0, 35.0, 43.0, 32.0, 41.0, 34.0, 29.0, 22.0, 29.0, 18.0, 22.0, 18.0, 18.0, 10.0, 13.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1312960386276245, -1.0931018590927124, -1.0549076795578003, -1.0167135000228882, -0.9785193204879761, -0.940325140953064, -0.9021309614181519, -0.8639367818832397, -0.8257426023483276, -0.7875484228134155, -0.7493542432785034, -0.7111600637435913, -0.6729658842086792, -0.6347717046737671, -0.596577525138855, -0.5583833456039429, -0.520189106464386, -0.4819949269294739, -0.44380074739456177, -0.40560656785964966, -0.36741238832473755, -0.32921820878982544, -0.29102399945259094, -0.25282981991767883, -0.21463564038276672, -0.17644146084785461, -0.1382472813129425, -0.1000530868768692, -0.06185890734195709, -0.023664727807044983, 0.01452946662902832, 0.05272364616394043, 0.09091782569885254, 0.12911200523376465, 0.16730618476867676, 0.20550037920475006, 0.24369455873966217, 0.2818887233734131, 0.3200829327106476, 0.3582771122455597, 0.3964712917804718, 0.4346654713153839, 0.472859650850296, 0.5110538601875305, 0.5492480397224426, 0.5874422192573547, 0.6256363987922668, 0.663830578327179, 0.7020247578620911, 0.7402189373970032, 0.7784131169319153, 0.8166072964668274, 0.8548014760017395, 0.8929956555366516, 0.9311898946762085, 0.9693840742111206, 1.0075782537460327, 1.0457724332809448, 1.083966612815857, 1.122160792350769, 1.1603549718856812, 1.1985491514205933, 1.2367433309555054, 1.2749375104904175, 1.3131316900253296]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 11.0, 22.0, 16.0, 46.0, 63.0, 92.0, 134.0, 198.0, 265.0, 442.0, 722.0, 1011.0, 1595.0, 2449.0, 3737.0, 5824.0, 8756.0, 13578.0, 20997.0, 32060.0, 48982.0, 73299.0, 105470.0, 140775.0, 155347.0, 133909.0, 99948.0, 68504.0, 45225.0, 29942.0, 19296.0, 12498.0, 8209.0, 5180.0, 3422.0, 2184.0, 1536.0, 928.0, 632.0, 396.0, 281.0, 194.0, 134.0, 76.0, 51.0, 37.0, 31.0, 26.0, 8.0, 7.0, 3.0, 6.0, 2.0], "bins": [-0.358642578125, -0.3485145568847656, -0.33838653564453125, -0.3282585144042969, -0.3181304931640625, -0.3080024719238281, -0.29787445068359375, -0.2877464294433594, -0.277618408203125, -0.2674903869628906, -0.25736236572265625, -0.24723434448242188, -0.2371063232421875, -0.22697830200195312, -0.21685028076171875, -0.20672225952148438, -0.19659423828125, -0.18646621704101562, -0.17633819580078125, -0.16621017456054688, -0.1560821533203125, -0.14595413208007812, -0.13582611083984375, -0.12569808959960938, -0.115570068359375, -0.10544204711914062, -0.09531402587890625, -0.08518600463867188, -0.0750579833984375, -0.06492996215820312, -0.05480194091796875, -0.044673919677734375, -0.0345458984375, -0.024417877197265625, -0.01428985595703125, -0.004161834716796875, 0.0059661865234375, 0.016094207763671875, 0.02622222900390625, 0.036350250244140625, 0.046478271484375, 0.056606292724609375, 0.06673431396484375, 0.07686233520507812, 0.0869903564453125, 0.09711837768554688, 0.10724639892578125, 0.11737442016601562, 0.12750244140625, 0.13763046264648438, 0.14775848388671875, 0.15788650512695312, 0.1680145263671875, 0.17814254760742188, 0.18827056884765625, 0.19839859008789062, 0.208526611328125, 0.21865463256835938, 0.22878265380859375, 0.23891067504882812, 0.2490386962890625, 0.2591667175292969, 0.26929473876953125, 0.2794227600097656, 0.28955078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 11.0, 5.0, 8.0, 5.0, 8.0, 10.0, 13.0, 9.0, 18.0, 18.0, 27.0, 19.0, 31.0, 35.0, 35.0, 35.0, 29.0, 52.0, 31.0, 33.0, 46.0, 38.0, 42.0, 42.0, 45.0, 38.0, 40.0, 38.0, 26.0, 26.0, 32.0, 22.0, 31.0, 13.0, 18.0, 14.0, 10.0, 13.0, 7.0, 6.0, 6.0, 7.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0791015625, -1.0423736572265625, -1.005645751953125, -0.9689178466796875, -0.93218994140625, -0.8954620361328125, -0.858734130859375, -0.8220062255859375, -0.7852783203125, -0.7485504150390625, -0.711822509765625, -0.6750946044921875, -0.63836669921875, -0.6016387939453125, -0.564910888671875, -0.5281829833984375, -0.491455078125, -0.4547271728515625, -0.417999267578125, -0.3812713623046875, -0.34454345703125, -0.3078155517578125, -0.271087646484375, -0.2343597412109375, -0.1976318359375, -0.1609039306640625, -0.124176025390625, -0.0874481201171875, -0.05072021484375, -0.0139923095703125, 0.022735595703125, 0.0594635009765625, 0.09619140625, 0.1329193115234375, 0.169647216796875, 0.2063751220703125, 0.24310302734375, 0.2798309326171875, 0.316558837890625, 0.3532867431640625, 0.3900146484375, 0.4267425537109375, 0.463470458984375, 0.5001983642578125, 0.53692626953125, 0.5736541748046875, 0.610382080078125, 0.6471099853515625, 0.683837890625, 0.7205657958984375, 0.757293701171875, 0.7940216064453125, 0.83074951171875, 0.8674774169921875, 0.904205322265625, 0.9409332275390625, 0.9776611328125, 1.0143890380859375, 1.051116943359375, 1.0878448486328125, 1.12457275390625, 1.1613006591796875, 1.198028564453125, 1.2347564697265625, 1.271484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 20.0, 13.0, 23.0, 29.0, 55.0, 75.0, 119.0, 169.0, 306.0, 486.0, 820.0, 1418.0, 2535.0, 4501.0, 8335.0, 16166.0, 31751.0, 62708.0, 120147.0, 204119.0, 236822.0, 167482.0, 92455.0, 47155.0, 23902.0, 12360.0, 6375.0, 3495.0, 1908.0, 1073.0, 645.0, 373.0, 215.0, 137.0, 120.0, 68.0, 51.0, 33.0, 17.0, 12.0, 14.0, 5.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.50390625, -0.48876953125, -0.4736328125, -0.45849609375, -0.443359375, -0.42822265625, -0.4130859375, -0.39794921875, -0.3828125, -0.36767578125, -0.3525390625, -0.33740234375, -0.322265625, -0.30712890625, -0.2919921875, -0.27685546875, -0.26171875, -0.24658203125, -0.2314453125, -0.21630859375, -0.201171875, -0.18603515625, -0.1708984375, -0.15576171875, -0.140625, -0.12548828125, -0.1103515625, -0.09521484375, -0.080078125, -0.06494140625, -0.0498046875, -0.03466796875, -0.01953125, -0.00439453125, 0.0107421875, 0.02587890625, 0.041015625, 0.05615234375, 0.0712890625, 0.08642578125, 0.1015625, 0.11669921875, 0.1318359375, 0.14697265625, 0.162109375, 0.17724609375, 0.1923828125, 0.20751953125, 0.22265625, 0.23779296875, 0.2529296875, 0.26806640625, 0.283203125, 0.29833984375, 0.3134765625, 0.32861328125, 0.34375, 0.35888671875, 0.3740234375, 0.38916015625, 0.404296875, 0.41943359375, 0.4345703125, 0.44970703125, 0.46484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 6.0, 7.0, 4.0, 7.0, 7.0, 13.0, 13.0, 25.0, 18.0, 19.0, 25.0, 24.0, 26.0, 45.0, 29.0, 31.0, 34.0, 42.0, 34.0, 33.0, 38.0, 32.0, 39.0, 35.0, 33.0, 28.0, 29.0, 28.0, 31.0, 28.0, 29.0, 23.0, 29.0, 19.0, 23.0, 21.0, 14.0, 14.0, 16.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.6994247436523438, -0.6766815185546875, -0.6539382934570312, -0.631195068359375, -0.6084518432617188, -0.5857086181640625, -0.5629653930664062, -0.54022216796875, -0.5174789428710938, -0.4947357177734375, -0.47199249267578125, -0.449249267578125, -0.42650604248046875, -0.4037628173828125, -0.38101959228515625, -0.3582763671875, -0.33553314208984375, -0.3127899169921875, -0.29004669189453125, -0.267303466796875, -0.24456024169921875, -0.2218170166015625, -0.19907379150390625, -0.17633056640625, -0.15358734130859375, -0.1308441162109375, -0.10810089111328125, -0.085357666015625, -0.06261444091796875, -0.0398712158203125, -0.01712799072265625, 0.005615234375, 0.02835845947265625, 0.0511016845703125, 0.07384490966796875, 0.096588134765625, 0.11933135986328125, 0.1420745849609375, 0.16481781005859375, 0.18756103515625, 0.21030426025390625, 0.2330474853515625, 0.25579071044921875, 0.278533935546875, 0.30127716064453125, 0.3240203857421875, 0.34676361083984375, 0.3695068359375, 0.39225006103515625, 0.4149932861328125, 0.43773651123046875, 0.460479736328125, 0.48322296142578125, 0.5059661865234375, 0.5287094116210938, 0.55145263671875, 0.5741958618164062, 0.5969390869140625, 0.6196823120117188, 0.642425537109375, 0.6651687622070312, 0.6879119873046875, 0.7106552124023438, 0.7333984375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 15.0, 19.0, 26.0, 30.0, 53.0, 92.0, 94.0, 129.0, 178.0, 271.0, 372.0, 490.0, 724.0, 1016.0, 1391.0, 2200.0, 3264.0, 5237.0, 8778.0, 16545.0, 32888.0, 73867.0, 178310.0, 335355.0, 214488.0, 88057.0, 38656.0, 18903.0, 9985.0, 5853.0, 3593.0, 2335.0, 1601.0, 1055.0, 700.0, 542.0, 389.0, 279.0, 215.0, 158.0, 110.0, 77.0, 58.0, 36.0, 25.0, 26.0, 14.0, 15.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.19970703125, -0.1933879852294922, -0.18706893920898438, -0.18074989318847656, -0.17443084716796875, -0.16811180114746094, -0.16179275512695312, -0.1554737091064453, -0.1491546630859375, -0.1428356170654297, -0.13651657104492188, -0.13019752502441406, -0.12387847900390625, -0.11755943298339844, -0.11124038696289062, -0.10492134094238281, -0.098602294921875, -0.09228324890136719, -0.08596420288085938, -0.07964515686035156, -0.07332611083984375, -0.06700706481933594, -0.060688018798828125, -0.05436897277832031, -0.0480499267578125, -0.04173088073730469, -0.035411834716796875, -0.029092788696289062, -0.02277374267578125, -0.016454696655273438, -0.010135650634765625, -0.0038166046142578125, 0.00250244140625, 0.008821487426757812, 0.015140533447265625, 0.021459579467773438, 0.02777862548828125, 0.03409767150878906, 0.040416717529296875, 0.04673576354980469, 0.0530548095703125, 0.05937385559082031, 0.06569290161132812, 0.07201194763183594, 0.07833099365234375, 0.08465003967285156, 0.09096908569335938, 0.09728813171386719, 0.103607177734375, 0.10992622375488281, 0.11624526977539062, 0.12256431579589844, 0.12888336181640625, 0.13520240783691406, 0.14152145385742188, 0.1478404998779297, 0.1541595458984375, 0.1604785919189453, 0.16679763793945312, 0.17311668395996094, 0.17943572998046875, 0.18575477600097656, 0.19207382202148438, 0.1983928680419922, 0.2047119140625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 10.0, 2.0, 7.0, 17.0, 15.0, 16.0, 17.0, 30.0, 33.0, 58.0, 68.0, 59.0, 72.0, 71.0, 74.0, 83.0, 72.0, 62.0, 52.0, 38.0, 43.0, 20.0, 23.0, 12.0, 16.0, 9.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4483928680419922e-05, -1.3930723071098328e-05, -1.3377517461776733e-05, -1.282431185245514e-05, -1.2271106243133545e-05, -1.171790063381195e-05, -1.1164695024490356e-05, -1.0611489415168762e-05, -1.0058283805847168e-05, -9.505078196525574e-06, -8.95187258720398e-06, -8.398666977882385e-06, -7.845461368560791e-06, -7.292255759239197e-06, -6.7390501499176025e-06, -6.185844540596008e-06, -5.632638931274414e-06, -5.07943332195282e-06, -4.526227712631226e-06, -3.973022103309631e-06, -3.419816493988037e-06, -2.866610884666443e-06, -2.3134052753448486e-06, -1.7601996660232544e-06, -1.2069940567016602e-06, -6.537884473800659e-07, -1.0058283805847168e-07, 4.5262277126312256e-07, 1.0058283805847168e-06, 1.559033989906311e-06, 2.1122395992279053e-06, 2.6654452085494995e-06, 3.2186508178710938e-06, 3.771856427192688e-06, 4.325062036514282e-06, 4.8782676458358765e-06, 5.431473255157471e-06, 5.984678864479065e-06, 6.537884473800659e-06, 7.091090083122253e-06, 7.644295692443848e-06, 8.197501301765442e-06, 8.750706911087036e-06, 9.30391252040863e-06, 9.857118129730225e-06, 1.0410323739051819e-05, 1.0963529348373413e-05, 1.1516734957695007e-05, 1.2069940567016602e-05, 1.2623146176338196e-05, 1.317635178565979e-05, 1.3729557394981384e-05, 1.4282763004302979e-05, 1.4835968613624573e-05, 1.5389174222946167e-05, 1.594237983226776e-05, 1.6495585441589355e-05, 1.704879105091095e-05, 1.7601996660232544e-05, 1.8155202269554138e-05, 1.8708407878875732e-05, 1.9261613488197327e-05, 1.981481909751892e-05, 2.0368024706840515e-05, 2.092123031616211e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 4.0, 15.0, 24.0, 26.0, 34.0, 50.0, 94.0, 146.0, 233.0, 368.0, 577.0, 898.0, 1420.0, 2468.0, 3811.0, 6526.0, 11684.0, 21027.0, 39899.0, 75922.0, 139346.0, 220519.0, 220420.0, 138690.0, 75217.0, 39763.0, 20831.0, 11654.0, 6795.0, 3905.0, 2368.0, 1410.0, 832.0, 564.0, 334.0, 217.0, 133.0, 123.0, 55.0, 35.0, 43.0, 23.0, 15.0, 13.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1708984375, -0.16500473022460938, -0.15911102294921875, -0.15321731567382812, -0.1473236083984375, -0.14142990112304688, -0.13553619384765625, -0.12964248657226562, -0.123748779296875, -0.11785507202148438, -0.11196136474609375, -0.10606765747070312, -0.1001739501953125, -0.09428024291992188, -0.08838653564453125, -0.08249282836914062, -0.07659912109375, -0.07070541381835938, -0.06481170654296875, -0.058917999267578125, -0.0530242919921875, -0.047130584716796875, -0.04123687744140625, -0.035343170166015625, -0.029449462890625, -0.023555755615234375, -0.01766204833984375, -0.011768341064453125, -0.0058746337890625, 1.9073486328125e-05, 0.00591278076171875, 0.011806488037109375, 0.0177001953125, 0.023593902587890625, 0.02948760986328125, 0.035381317138671875, 0.0412750244140625, 0.047168731689453125, 0.05306243896484375, 0.058956146240234375, 0.064849853515625, 0.07074356079101562, 0.07663726806640625, 0.08253097534179688, 0.0884246826171875, 0.09431838989257812, 0.10021209716796875, 0.10610580444335938, 0.11199951171875, 0.11789321899414062, 0.12378692626953125, 0.12968063354492188, 0.1355743408203125, 0.14146804809570312, 0.14736175537109375, 0.15325546264648438, 0.159149169921875, 0.16504287719726562, 0.17093658447265625, 0.17683029174804688, 0.1827239990234375, 0.18861770629882812, 0.19451141357421875, 0.20040512084960938, 0.206298828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 8.0, 6.0, 5.0, 9.0, 5.0, 4.0, 18.0, 15.0, 20.0, 21.0, 20.0, 21.0, 30.0, 32.0, 31.0, 49.0, 52.0, 58.0, 52.0, 51.0, 58.0, 55.0, 56.0, 43.0, 37.0, 33.0, 40.0, 26.0, 34.0, 22.0, 19.0, 14.0, 6.0, 15.0, 3.0, 11.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037353515625, -0.03614616394042969, -0.034938812255859375, -0.03373146057128906, -0.03252410888671875, -0.03131675720214844, -0.030109405517578125, -0.028902053833007812, -0.0276947021484375, -0.026487350463867188, -0.025279998779296875, -0.024072647094726562, -0.02286529541015625, -0.021657943725585938, -0.020450592041015625, -0.019243240356445312, -0.018035888671875, -0.016828536987304688, -0.015621185302734375, -0.014413833618164062, -0.01320648193359375, -0.011999130249023438, -0.010791778564453125, -0.009584426879882812, -0.0083770751953125, -0.0071697235107421875, -0.005962371826171875, -0.0047550201416015625, -0.00354766845703125, -0.0023403167724609375, -0.001132965087890625, 7.43865966796875e-05, 0.00128173828125, 0.0024890899658203125, 0.003696441650390625, 0.0049037933349609375, 0.00611114501953125, 0.0073184967041015625, 0.008525848388671875, 0.009733200073242188, 0.0109405517578125, 0.012147903442382812, 0.013355255126953125, 0.014562606811523438, 0.01576995849609375, 0.016977310180664062, 0.018184661865234375, 0.019392013549804688, 0.020599365234375, 0.021806716918945312, 0.023014068603515625, 0.024221420288085938, 0.02542877197265625, 0.026636123657226562, 0.027843475341796875, 0.029050827026367188, 0.0302581787109375, 0.03146553039550781, 0.032672882080078125, 0.03388023376464844, 0.03508758544921875, 0.03629493713378906, 0.037502288818359375, 0.03870964050292969, 0.0399169921875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 8.0, 16.0, 19.0, 25.0, 28.0, 39.0, 41.0, 36.0, 45.0, 47.0, 68.0, 58.0, 65.0, 56.0, 54.0, 53.0, 37.0, 33.0, 34.0, 24.0, 37.0, 28.0, 29.0, 18.0, 18.0, 10.0, 4.0, 8.0, 8.0, 4.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8160393238067627, -1.7665389776229858, -1.717038631439209, -1.6675382852554321, -1.6180379390716553, -1.5685375928878784, -1.5190372467041016, -1.4695369005203247, -1.4200365543365479, -1.370536208152771, -1.3210358619689941, -1.2715355157852173, -1.2220351696014404, -1.1725348234176636, -1.1230344772338867, -1.0735341310501099, -1.024033784866333, -0.9745334386825562, -0.9250330924987793, -0.8755327463150024, -0.8260324001312256, -0.7765320539474487, -0.7270317077636719, -0.677531361579895, -0.6280310153961182, -0.5785306692123413, -0.5290303230285645, -0.4795299768447876, -0.43002963066101074, -0.3805292844772339, -0.33102893829345703, -0.2815285921096802, -0.23202836513519287, -0.18252801895141602, -0.13302767276763916, -0.0835273265838623, -0.03402698040008545, 0.015473365783691406, 0.06497371196746826, 0.11447405815124512, 0.16397440433502197, 0.21347475051879883, 0.2629750967025757, 0.31247544288635254, 0.3619757890701294, 0.41147613525390625, 0.4609764814376831, 0.51047682762146, 0.5599771738052368, 0.6094775199890137, 0.6589778661727905, 0.7084782123565674, 0.7579785585403442, 0.8074789047241211, 0.856979250907898, 0.9064795970916748, 0.9559799432754517, 1.0054802894592285, 1.0549806356430054, 1.1044809818267822, 1.153981328010559, 1.203481674194336, 1.2529820203781128, 1.3024823665618896, 1.3519827127456665]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 7.0, 9.0, 15.0, 18.0, 16.0, 24.0, 37.0, 28.0, 43.0, 36.0, 39.0, 40.0, 34.0, 42.0, 44.0, 35.0, 42.0, 51.0, 42.0, 36.0, 42.0, 31.0, 41.0, 35.0, 26.0, 28.0, 22.0, 20.0, 20.0, 21.0, 14.0, 10.0, 14.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1101436614990234, -1.0721240043640137, -1.0341042280197144, -0.9960845112800598, -0.9580647945404053, -0.9200450778007507, -0.8820253610610962, -0.8440056443214417, -0.8059859275817871, -0.7679662108421326, -0.729946494102478, -0.6919267773628235, -0.653907060623169, -0.6158873438835144, -0.5778676271438599, -0.5398479104042053, -0.5018281936645508, -0.46380847692489624, -0.4257887601852417, -0.38776904344558716, -0.3497493267059326, -0.3117296099662781, -0.27370989322662354, -0.235690176486969, -0.19767045974731445, -0.1596507430076599, -0.12163102626800537, -0.08361130952835083, -0.04559159278869629, -0.007571876049041748, 0.030447840690612793, 0.06846755743026733, 0.10648727416992188, 0.14450699090957642, 0.18252670764923096, 0.2205464243888855, 0.25856614112854004, 0.2965858578681946, 0.3346055746078491, 0.37262529134750366, 0.4106450080871582, 0.44866472482681274, 0.4866844415664673, 0.5247041583061218, 0.5627238750457764, 0.6007435917854309, 0.6387633085250854, 0.67678302526474, 0.7148027420043945, 0.7528224587440491, 0.7908421754837036, 0.8288618922233582, 0.8668816089630127, 0.9049013257026672, 0.9429210424423218, 0.9809407591819763, 1.0189604759216309, 1.0569801330566406, 1.09499990940094, 1.1330196857452393, 1.171039342880249, 1.2090590000152588, 1.247078776359558, 1.2850985527038574, 1.3231182098388672]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 5.0, 26.0, 32.0, 50.0, 89.0, 123.0, 213.0, 307.0, 545.0, 957.0, 1324.0, 2135.0, 3391.0, 5303.0, 8356.0, 12820.0, 19623.0, 28643.0, 41411.0, 56893.0, 74877.0, 91945.0, 104753.0, 111172.0, 106640.0, 95520.0, 79605.0, 61970.0, 45297.0, 32077.0, 21696.0, 14627.0, 9602.0, 6132.0, 3790.0, 2364.0, 1580.0, 979.0, 593.0, 399.0, 286.0, 143.0, 86.0, 69.0, 29.0, 27.0, 21.0, 11.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.94384765625, -0.9149322509765625, -0.886016845703125, -0.8571014404296875, -0.82818603515625, -0.7992706298828125, -0.770355224609375, -0.7414398193359375, -0.7125244140625, -0.6836090087890625, -0.654693603515625, -0.6257781982421875, -0.59686279296875, -0.5679473876953125, -0.539031982421875, -0.5101165771484375, -0.481201171875, -0.4522857666015625, -0.423370361328125, -0.3944549560546875, -0.36553955078125, -0.3366241455078125, -0.307708740234375, -0.2787933349609375, -0.2498779296875, -0.2209625244140625, -0.192047119140625, -0.1631317138671875, -0.13421630859375, -0.1053009033203125, -0.076385498046875, -0.0474700927734375, -0.0185546875, 0.0103607177734375, 0.039276123046875, 0.0681915283203125, 0.09710693359375, 0.1260223388671875, 0.154937744140625, 0.1838531494140625, 0.2127685546875, 0.2416839599609375, 0.270599365234375, 0.2995147705078125, 0.32843017578125, 0.3573455810546875, 0.386260986328125, 0.4151763916015625, 0.444091796875, 0.4730072021484375, 0.501922607421875, 0.5308380126953125, 0.55975341796875, 0.5886688232421875, 0.617584228515625, 0.6464996337890625, 0.6754150390625, 0.7043304443359375, 0.733245849609375, 0.7621612548828125, 0.79107666015625, 0.8199920654296875, 0.848907470703125, 0.8778228759765625, 0.90673828125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 9.0, 16.0, 11.0, 19.0, 17.0, 34.0, 24.0, 28.0, 44.0, 40.0, 36.0, 35.0, 45.0, 46.0, 40.0, 49.0, 59.0, 46.0, 45.0, 35.0, 36.0, 32.0, 34.0, 42.0, 31.0, 20.0, 20.0, 15.0, 20.0, 15.0, 14.0, 6.0, 12.0, 8.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.0507049560546875, -1.008636474609375, -0.9665679931640625, -0.92449951171875, -0.8824310302734375, -0.840362548828125, -0.7982940673828125, -0.7562255859375, -0.7141571044921875, -0.672088623046875, -0.6300201416015625, -0.58795166015625, -0.5458831787109375, -0.503814697265625, -0.4617462158203125, -0.419677734375, -0.3776092529296875, -0.335540771484375, -0.2934722900390625, -0.25140380859375, -0.2093353271484375, -0.167266845703125, -0.1251983642578125, -0.0831298828125, -0.0410614013671875, 0.001007080078125, 0.0430755615234375, 0.08514404296875, 0.1272125244140625, 0.169281005859375, 0.2113494873046875, 0.25341796875, 0.2954864501953125, 0.337554931640625, 0.3796234130859375, 0.42169189453125, 0.4637603759765625, 0.505828857421875, 0.5478973388671875, 0.5899658203125, 0.6320343017578125, 0.674102783203125, 0.7161712646484375, 0.75823974609375, 0.8003082275390625, 0.842376708984375, 0.8844451904296875, 0.926513671875, 0.9685821533203125, 1.010650634765625, 1.0527191162109375, 1.09478759765625, 1.1368560791015625, 1.178924560546875, 1.2209930419921875, 1.2630615234375, 1.3051300048828125, 1.347198486328125, 1.3892669677734375, 1.43133544921875, 1.4734039306640625, 1.515472412109375, 1.5575408935546875, 1.599609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 8.0, 11.0, 20.0, 30.0, 46.0, 59.0, 118.0, 220.0, 298.0, 528.0, 846.0, 1370.0, 2109.0, 3427.0, 5542.0, 8731.0, 13722.0, 20852.0, 31190.0, 44331.0, 61992.0, 80846.0, 97880.0, 110067.0, 113781.0, 106870.0, 93017.0, 74861.0, 56971.0, 40357.0, 27822.0, 18451.0, 12064.0, 7561.0, 4733.0, 2944.0, 1789.0, 1118.0, 739.0, 457.0, 305.0, 193.0, 100.0, 69.0, 30.0, 30.0, 15.0, 14.0, 8.0, 6.0, 3.0, 7.0, 0.0, 0.0, 2.0], "bins": [-0.994140625, -0.9643325805664062, -0.9345245361328125, -0.9047164916992188, -0.874908447265625, -0.8451004028320312, -0.8152923583984375, -0.7854843139648438, -0.75567626953125, -0.7258682250976562, -0.6960601806640625, -0.6662521362304688, -0.636444091796875, -0.6066360473632812, -0.5768280029296875, -0.5470199584960938, -0.5172119140625, -0.48740386962890625, -0.4575958251953125, -0.42778778076171875, -0.397979736328125, -0.36817169189453125, -0.3383636474609375, -0.30855560302734375, -0.27874755859375, -0.24893951416015625, -0.2191314697265625, -0.18932342529296875, -0.159515380859375, -0.12970733642578125, -0.0998992919921875, -0.07009124755859375, -0.040283203125, -0.01047515869140625, 0.0193328857421875, 0.04914093017578125, 0.078948974609375, 0.10875701904296875, 0.1385650634765625, 0.16837310791015625, 0.19818115234375, 0.22798919677734375, 0.2577972412109375, 0.28760528564453125, 0.317413330078125, 0.34722137451171875, 0.3770294189453125, 0.40683746337890625, 0.4366455078125, 0.46645355224609375, 0.4962615966796875, 0.5260696411132812, 0.555877685546875, 0.5856857299804688, 0.6154937744140625, 0.6453018188476562, 0.67510986328125, 0.7049179077148438, 0.7347259521484375, 0.7645339965820312, 0.794342041015625, 0.8241500854492188, 0.8539581298828125, 0.8837661743164062, 0.91357421875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 11.0, 7.0, 15.0, 15.0, 13.0, 21.0, 20.0, 18.0, 36.0, 26.0, 24.0, 36.0, 28.0, 25.0, 32.0, 38.0, 37.0, 47.0, 38.0, 49.0, 39.0, 31.0, 40.0, 36.0, 32.0, 33.0, 33.0, 20.0, 23.0, 31.0, 22.0, 14.0, 22.0, 16.0, 18.0, 8.0, 7.0, 10.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64013671875, -0.6192398071289062, -0.5983428955078125, -0.5774459838867188, -0.556549072265625, -0.5356521606445312, -0.5147552490234375, -0.49385833740234375, -0.47296142578125, -0.45206451416015625, -0.4311676025390625, -0.41027069091796875, -0.389373779296875, -0.36847686767578125, -0.3475799560546875, -0.32668304443359375, -0.3057861328125, -0.28488922119140625, -0.2639923095703125, -0.24309539794921875, -0.222198486328125, -0.20130157470703125, -0.1804046630859375, -0.15950775146484375, -0.13861083984375, -0.11771392822265625, -0.0968170166015625, -0.07592010498046875, -0.055023193359375, -0.03412628173828125, -0.0132293701171875, 0.00766754150390625, 0.028564453125, 0.04946136474609375, 0.0703582763671875, 0.09125518798828125, 0.112152099609375, 0.13304901123046875, 0.1539459228515625, 0.17484283447265625, 0.19573974609375, 0.21663665771484375, 0.2375335693359375, 0.25843048095703125, 0.279327392578125, 0.30022430419921875, 0.3211212158203125, 0.34201812744140625, 0.3629150390625, 0.38381195068359375, 0.4047088623046875, 0.42560577392578125, 0.446502685546875, 0.46739959716796875, 0.4882965087890625, 0.5091934204101562, 0.53009033203125, 0.5509872436523438, 0.5718841552734375, 0.5927810668945312, 0.613677978515625, 0.6345748901367188, 0.6554718017578125, 0.6763687133789062, 0.697265625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 1.0, 7.0, 9.0, 13.0, 28.0, 39.0, 57.0, 80.0, 105.0, 176.0, 293.0, 362.0, 572.0, 869.0, 1393.0, 2049.0, 3130.0, 4786.0, 7342.0, 11471.0, 17431.0, 26727.0, 40727.0, 60185.0, 85102.0, 109918.0, 128765.0, 131837.0, 117383.0, 93379.0, 68122.0, 46839.0, 31012.0, 20376.0, 13225.0, 8566.0, 5604.0, 3639.0, 2322.0, 1581.0, 1031.0, 674.0, 448.0, 314.0, 190.0, 130.0, 89.0, 53.0, 45.0, 26.0, 14.0, 9.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4667091369628906, -0.45124053955078125, -0.4357719421386719, -0.4203033447265625, -0.4048347473144531, -0.38936614990234375, -0.3738975524902344, -0.358428955078125, -0.3429603576660156, -0.32749176025390625, -0.3120231628417969, -0.2965545654296875, -0.2810859680175781, -0.26561737060546875, -0.2501487731933594, -0.23468017578125, -0.21921157836914062, -0.20374298095703125, -0.18827438354492188, -0.1728057861328125, -0.15733718872070312, -0.14186859130859375, -0.12639999389648438, -0.110931396484375, -0.09546279907226562, -0.07999420166015625, -0.06452560424804688, -0.0490570068359375, -0.033588409423828125, -0.01811981201171875, -0.002651214599609375, 0.0128173828125, 0.028285980224609375, 0.04375457763671875, 0.059223175048828125, 0.0746917724609375, 0.09016036987304688, 0.10562896728515625, 0.12109756469726562, 0.136566162109375, 0.15203475952148438, 0.16750335693359375, 0.18297195434570312, 0.1984405517578125, 0.21390914916992188, 0.22937774658203125, 0.24484634399414062, 0.26031494140625, 0.2757835388183594, 0.29125213623046875, 0.3067207336425781, 0.3221893310546875, 0.3376579284667969, 0.35312652587890625, 0.3685951232910156, 0.384063720703125, 0.3995323181152344, 0.41500091552734375, 0.4304695129394531, 0.4459381103515625, 0.4614067077636719, 0.47687530517578125, 0.4923439025878906, 0.5078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 2.0, 9.0, 12.0, 16.0, 12.0, 15.0, 31.0, 29.0, 23.0, 29.0, 22.0, 39.0, 46.0, 54.0, 41.0, 65.0, 65.0, 37.0, 56.0, 56.0, 42.0, 33.0, 39.0, 30.0, 32.0, 28.0, 24.0, 16.0, 13.0, 20.0, 7.0, 5.0, 7.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.251169204711914e-05, -5.0866976380348206e-05, -4.922226071357727e-05, -4.7577545046806335e-05, -4.59328293800354e-05, -4.4288113713264465e-05, -4.264339804649353e-05, -4.0998682379722595e-05, -3.935396671295166e-05, -3.7709251046180725e-05, -3.606453537940979e-05, -3.4419819712638855e-05, -3.277510404586792e-05, -3.1130388379096985e-05, -2.948567271232605e-05, -2.7840957045555115e-05, -2.619624137878418e-05, -2.4551525712013245e-05, -2.290681004524231e-05, -2.1262094378471375e-05, -1.961737871170044e-05, -1.7972663044929504e-05, -1.632794737815857e-05, -1.4683231711387634e-05, -1.30385160446167e-05, -1.1393800377845764e-05, -9.749084711074829e-06, -8.104369044303894e-06, -6.459653377532959e-06, -4.814937710762024e-06, -3.170222043991089e-06, -1.5255063772201538e-06, 1.1920928955078125e-07, 1.7639249563217163e-06, 3.4086406230926514e-06, 5.0533562898635864e-06, 6.6980719566345215e-06, 8.342787623405457e-06, 9.987503290176392e-06, 1.1632218956947327e-05, 1.3276934623718262e-05, 1.4921650290489197e-05, 1.6566365957260132e-05, 1.8211081624031067e-05, 1.9855797290802002e-05, 2.1500512957572937e-05, 2.3145228624343872e-05, 2.4789944291114807e-05, 2.6434659957885742e-05, 2.8079375624656677e-05, 2.9724091291427612e-05, 3.136880695819855e-05, 3.301352262496948e-05, 3.465823829174042e-05, 3.630295395851135e-05, 3.794766962528229e-05, 3.959238529205322e-05, 4.123710095882416e-05, 4.288181662559509e-05, 4.452653229236603e-05, 4.617124795913696e-05, 4.78159636259079e-05, 4.946067929267883e-05, 5.110539495944977e-05, 5.27501106262207e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 8.0, 16.0, 39.0, 50.0, 65.0, 134.0, 187.0, 283.0, 476.0, 726.0, 1181.0, 1872.0, 2903.0, 4727.0, 7476.0, 11813.0, 18170.0, 29183.0, 44470.0, 66653.0, 92804.0, 118968.0, 135421.0, 133745.0, 115551.0, 86846.0, 61254.0, 40689.0, 26670.0, 17076.0, 10621.0, 6882.0, 4290.0, 2694.0, 1713.0, 1105.0, 652.0, 429.0, 271.0, 167.0, 97.0, 64.0, 44.0, 27.0, 12.0, 11.0, 7.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.490478515625, -0.4746055603027344, -0.45873260498046875, -0.4428596496582031, -0.4269866943359375, -0.4111137390136719, -0.39524078369140625, -0.3793678283691406, -0.363494873046875, -0.3476219177246094, -0.33174896240234375, -0.3158760070800781, -0.3000030517578125, -0.2841300964355469, -0.26825714111328125, -0.2523841857910156, -0.23651123046875, -0.22063827514648438, -0.20476531982421875, -0.18889236450195312, -0.1730194091796875, -0.15714645385742188, -0.14127349853515625, -0.12540054321289062, -0.109527587890625, -0.09365463256835938, -0.07778167724609375, -0.061908721923828125, -0.0460357666015625, -0.030162811279296875, -0.01428985595703125, 0.001583099365234375, 0.0174560546875, 0.033329010009765625, 0.04920196533203125, 0.06507492065429688, 0.0809478759765625, 0.09682083129882812, 0.11269378662109375, 0.12856674194335938, 0.144439697265625, 0.16031265258789062, 0.17618560791015625, 0.19205856323242188, 0.2079315185546875, 0.22380447387695312, 0.23967742919921875, 0.2555503845214844, 0.27142333984375, 0.2872962951660156, 0.30316925048828125, 0.3190422058105469, 0.3349151611328125, 0.3507881164550781, 0.36666107177734375, 0.3825340270996094, 0.398406982421875, 0.4142799377441406, 0.43015289306640625, 0.4460258483886719, 0.4618988037109375, 0.4777717590332031, 0.49364471435546875, 0.5095176696777344, 0.525390625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 2.0, 14.0, 13.0, 24.0, 11.0, 17.0, 27.0, 24.0, 21.0, 28.0, 42.0, 51.0, 46.0, 50.0, 50.0, 59.0, 42.0, 53.0, 42.0, 57.0, 41.0, 32.0, 41.0, 28.0, 20.0, 30.0, 23.0, 22.0, 15.0, 10.0, 11.0, 11.0, 7.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16259765625, -0.15713119506835938, -0.15166473388671875, -0.14619827270507812, -0.1407318115234375, -0.13526535034179688, -0.12979888916015625, -0.12433242797851562, -0.118865966796875, -0.11339950561523438, -0.10793304443359375, -0.10246658325195312, -0.0970001220703125, -0.09153366088867188, -0.08606719970703125, -0.08060073852539062, -0.07513427734375, -0.06966781616210938, -0.06420135498046875, -0.058734893798828125, -0.0532684326171875, -0.047801971435546875, -0.04233551025390625, -0.036869049072265625, -0.031402587890625, -0.025936126708984375, -0.02046966552734375, -0.015003204345703125, -0.0095367431640625, -0.004070281982421875, 0.00139617919921875, 0.006862640380859375, 0.0123291015625, 0.017795562744140625, 0.02326202392578125, 0.028728485107421875, 0.0341949462890625, 0.039661407470703125, 0.04512786865234375, 0.050594329833984375, 0.056060791015625, 0.061527252197265625, 0.06699371337890625, 0.07246017456054688, 0.0779266357421875, 0.08339309692382812, 0.08885955810546875, 0.09432601928710938, 0.09979248046875, 0.10525894165039062, 0.11072540283203125, 0.11619186401367188, 0.1216583251953125, 0.12712478637695312, 0.13259124755859375, 0.13805770874023438, 0.143524169921875, 0.14899063110351562, 0.15445709228515625, 0.15992355346679688, 0.1653900146484375, 0.17085647583007812, 0.17632293701171875, 0.18178939819335938, 0.187255859375]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 5.0, 10.0, 9.0, 17.0, 16.0, 14.0, 26.0, 29.0, 39.0, 40.0, 32.0, 54.0, 54.0, 50.0, 51.0, 63.0, 69.0, 47.0, 55.0, 34.0, 36.0, 35.0, 30.0, 34.0, 20.0, 19.0, 16.0, 15.0, 16.0, 10.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.7850890159606934, -1.737668514251709, -1.6902481317520142, -1.6428276300430298, -1.5954071283340454, -1.5479867458343506, -1.5005662441253662, -1.4531457424163818, -1.4057252407073975, -1.358304738998413, -1.3108843564987183, -1.2634638547897339, -1.2160433530807495, -1.1686229705810547, -1.1212024688720703, -1.073781967163086, -1.0263615846633911, -0.9789411425590515, -0.9315206408500671, -0.8841001987457275, -0.8366796970367432, -0.7892592549324036, -0.741838812828064, -0.6944183111190796, -0.64699786901474, -0.5995774269104004, -0.552156925201416, -0.5047364830970764, -0.45731601119041443, -0.40989553928375244, -0.36247509717941284, -0.31505462527275085, -0.2676340341567993, -0.22021356225013733, -0.17279310524463654, -0.12537264823913574, -0.07795217633247375, -0.030531704425811768, 0.016888737678527832, 0.06430920958518982, 0.1117296814918518, 0.1591501533985138, 0.2065706104040146, 0.2539910674095154, 0.30141153931617737, 0.34883201122283936, 0.39625245332717896, 0.44367292523384094, 0.49109339714050293, 0.5385138392448425, 0.5859343409538269, 0.6333547830581665, 0.6807752847671509, 0.7281957268714905, 0.7756161689758301, 0.8230366706848145, 0.870457112789154, 0.9178775548934937, 0.965298056602478, 1.0127184391021729, 1.0601389408111572, 1.1075594425201416, 1.154979944229126, 1.2024003267288208, 1.2498208284378052]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 4.0, 13.0, 13.0, 15.0, 23.0, 22.0, 22.0, 45.0, 25.0, 33.0, 36.0, 41.0, 47.0, 27.0, 28.0, 49.0, 44.0, 39.0, 46.0, 38.0, 50.0, 39.0, 27.0, 35.0, 34.0, 28.0, 18.0, 20.0, 23.0, 17.0, 17.0, 21.0, 14.0, 9.0, 8.0, 6.0, 5.0, 1.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1418660879135132, -1.1035720109939575, -1.0652778148651123, -1.0269837379455566, -0.988689661026001, -0.9503955841064453, -0.9121014475822449, -0.8738073110580444, -0.8355132341384888, -0.7972191572189331, -0.7589250206947327, -0.7206308841705322, -0.6823368072509766, -0.6440427303314209, -0.6057485938072205, -0.56745445728302, -0.5291603803634644, -0.4908662736415863, -0.45257216691970825, -0.4142780601978302, -0.37598395347595215, -0.3376898467540741, -0.29939574003219604, -0.261101633310318, -0.22280752658843994, -0.1845134198665619, -0.14621931314468384, -0.10792520642280579, -0.06963109970092773, -0.03133699297904968, 0.006957113742828369, 0.04525122046470642, 0.08354544639587402, 0.12183955311775208, 0.16013365983963013, 0.19842776656150818, 0.23672187328338623, 0.2750159800052643, 0.31331008672714233, 0.3516041934490204, 0.38989830017089844, 0.4281924068927765, 0.46648651361465454, 0.504780650138855, 0.5430747270584106, 0.5813688039779663, 0.6196629405021667, 0.6579570770263672, 0.6962511539459229, 0.7345452308654785, 0.772839367389679, 0.8111335039138794, 0.8494275808334351, 0.8877216577529907, 0.9260157942771912, 0.9643099308013916, 1.0026040077209473, 1.040898084640503, 1.0791921615600586, 1.1174863576889038, 1.1557804346084595, 1.1940745115280151, 1.2323687076568604, 1.270662784576416, 1.3089568614959717]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 12.0, 19.0, 27.0, 56.0, 92.0, 177.0, 259.0, 522.0, 890.0, 1499.0, 2833.0, 5345.0, 9825.0, 18294.0, 34720.0, 65267.0, 122446.0, 224053.0, 385772.0, 589798.0, 738902.0, 710247.0, 533755.0, 335285.0, 191041.0, 104108.0, 55782.0, 29337.0, 15295.0, 8283.0, 4550.0, 2502.0, 1361.0, 812.0, 426.0, 246.0, 168.0, 84.0, 74.0, 40.0, 26.0, 17.0, 20.0, 2.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.4482421875, -1.405487060546875, -1.36273193359375, -1.319976806640625, -1.2772216796875, -1.234466552734375, -1.19171142578125, -1.148956298828125, -1.106201171875, -1.063446044921875, -1.02069091796875, -0.977935791015625, -0.9351806640625, -0.892425537109375, -0.84967041015625, -0.806915283203125, -0.76416015625, -0.721405029296875, -0.67864990234375, -0.635894775390625, -0.5931396484375, -0.550384521484375, -0.50762939453125, -0.464874267578125, -0.422119140625, -0.379364013671875, -0.33660888671875, -0.293853759765625, -0.2510986328125, -0.208343505859375, -0.16558837890625, -0.122833251953125, -0.080078125, -0.037322998046875, 0.00543212890625, 0.048187255859375, 0.0909423828125, 0.133697509765625, 0.17645263671875, 0.219207763671875, 0.261962890625, 0.304718017578125, 0.34747314453125, 0.390228271484375, 0.4329833984375, 0.475738525390625, 0.51849365234375, 0.561248779296875, 0.60400390625, 0.646759033203125, 0.68951416015625, 0.732269287109375, 0.7750244140625, 0.817779541015625, 0.86053466796875, 0.903289794921875, 0.946044921875, 0.988800048828125, 1.03155517578125, 1.074310302734375, 1.1170654296875, 1.159820556640625, 1.20257568359375, 1.245330810546875, 1.2880859375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 4.0, 7.0, 15.0, 17.0, 25.0, 27.0, 21.0, 19.0, 21.0, 32.0, 40.0, 38.0, 42.0, 29.0, 26.0, 51.0, 42.0, 52.0, 33.0, 46.0, 47.0, 39.0, 43.0, 25.0, 31.0, 29.0, 31.0, 20.0, 20.0, 29.0, 21.0, 7.0, 18.0, 10.0, 10.0, 5.0, 1.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.91796875, -0.8899612426757812, -0.8619537353515625, -0.8339462280273438, -0.805938720703125, -0.7779312133789062, -0.7499237060546875, -0.7219161987304688, -0.69390869140625, -0.6659011840820312, -0.6378936767578125, -0.6098861694335938, -0.581878662109375, -0.5538711547851562, -0.5258636474609375, -0.49785614013671875, -0.4698486328125, -0.44184112548828125, -0.4138336181640625, -0.38582611083984375, -0.357818603515625, -0.32981109619140625, -0.3018035888671875, -0.27379608154296875, -0.24578857421875, -0.21778106689453125, -0.1897735595703125, -0.16176605224609375, -0.133758544921875, -0.10575103759765625, -0.0777435302734375, -0.04973602294921875, -0.021728515625, 0.00627899169921875, 0.0342864990234375, 0.06229400634765625, 0.090301513671875, 0.11830902099609375, 0.1463165283203125, 0.17432403564453125, 0.20233154296875, 0.23033905029296875, 0.2583465576171875, 0.28635406494140625, 0.314361572265625, 0.34236907958984375, 0.3703765869140625, 0.39838409423828125, 0.4263916015625, 0.45439910888671875, 0.4824066162109375, 0.5104141235351562, 0.538421630859375, 0.5664291381835938, 0.5944366455078125, 0.6224441528320312, 0.65045166015625, 0.6784591674804688, 0.7064666748046875, 0.7344741821289062, 0.762481689453125, 0.7904891967773438, 0.8184967041015625, 0.8465042114257812, 0.87451171875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 4.0, 7.0, 18.0, 25.0, 51.0, 72.0, 67.0, 141.0, 243.0, 335.0, 561.0, 1030.0, 1663.0, 2766.0, 4650.0, 8010.0, 13360.0, 22186.0, 37924.0, 62782.0, 101553.0, 160775.0, 241775.0, 344058.0, 448981.0, 525655.0, 539371.0, 487189.0, 392118.0, 285105.0, 193315.0, 124145.0, 77481.0, 47066.0, 28337.0, 16965.0, 9878.0, 5880.0, 3423.0, 2081.0, 1253.0, 748.0, 466.0, 281.0, 191.0, 98.0, 94.0, 32.0, 29.0, 17.0, 9.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0810546875, -1.0475006103515625, -1.013946533203125, -0.9803924560546875, -0.94683837890625, -0.9132843017578125, -0.879730224609375, -0.8461761474609375, -0.8126220703125, -0.7790679931640625, -0.745513916015625, -0.7119598388671875, -0.67840576171875, -0.6448516845703125, -0.611297607421875, -0.5777435302734375, -0.544189453125, -0.5106353759765625, -0.477081298828125, -0.4435272216796875, -0.40997314453125, -0.3764190673828125, -0.342864990234375, -0.3093109130859375, -0.2757568359375, -0.2422027587890625, -0.208648681640625, -0.1750946044921875, -0.14154052734375, -0.1079864501953125, -0.074432373046875, -0.0408782958984375, -0.00732421875, 0.0262298583984375, 0.059783935546875, 0.0933380126953125, 0.12689208984375, 0.1604461669921875, 0.194000244140625, 0.2275543212890625, 0.2611083984375, 0.2946624755859375, 0.328216552734375, 0.3617706298828125, 0.39532470703125, 0.4288787841796875, 0.462432861328125, 0.4959869384765625, 0.529541015625, 0.5630950927734375, 0.596649169921875, 0.6302032470703125, 0.66375732421875, 0.6973114013671875, 0.730865478515625, 0.7644195556640625, 0.7979736328125, 0.8315277099609375, 0.865081787109375, 0.8986358642578125, 0.93218994140625, 0.9657440185546875, 0.999298095703125, 1.0328521728515625, 1.06640625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 8.0, 10.0, 9.0, 17.0, 16.0, 21.0, 24.0, 41.0, 53.0, 59.0, 85.0, 88.0, 123.0, 118.0, 134.0, 151.0, 188.0, 166.0, 209.0, 222.0, 229.0, 237.0, 239.0, 211.0, 209.0, 209.0, 158.0, 149.0, 123.0, 124.0, 94.0, 85.0, 55.0, 47.0, 40.0, 32.0, 26.0, 10.0, 19.0, 13.0, 7.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42724609375, -0.4130363464355469, -0.39882659912109375, -0.3846168518066406, -0.3704071044921875, -0.3561973571777344, -0.34198760986328125, -0.3277778625488281, -0.313568115234375, -0.2993583679199219, -0.28514862060546875, -0.2709388732910156, -0.2567291259765625, -0.24251937866210938, -0.22830963134765625, -0.21409988403320312, -0.19989013671875, -0.18568038940429688, -0.17147064208984375, -0.15726089477539062, -0.1430511474609375, -0.12884140014648438, -0.11463165283203125, -0.10042190551757812, -0.086212158203125, -0.07200241088867188, -0.05779266357421875, -0.043582916259765625, -0.0293731689453125, -0.015163421630859375, -0.00095367431640625, 0.013256072998046875, 0.0274658203125, 0.041675567626953125, 0.05588531494140625, 0.07009506225585938, 0.0843048095703125, 0.09851455688476562, 0.11272430419921875, 0.12693405151367188, 0.141143798828125, 0.15535354614257812, 0.16956329345703125, 0.18377304077148438, 0.1979827880859375, 0.21219253540039062, 0.22640228271484375, 0.24061203002929688, 0.25482177734375, 0.2690315246582031, 0.28324127197265625, 0.2974510192871094, 0.3116607666015625, 0.3258705139160156, 0.34008026123046875, 0.3542900085449219, 0.368499755859375, 0.3827095031738281, 0.39691925048828125, 0.4111289978027344, 0.4253387451171875, 0.4395484924316406, 0.45375823974609375, 0.4679679870605469, 0.482177734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 11.0, 9.0, 14.0, 20.0, 25.0, 24.0, 28.0, 39.0, 43.0, 30.0, 36.0, 57.0, 52.0, 59.0, 59.0, 58.0, 53.0, 52.0, 48.0, 29.0, 37.0, 35.0, 20.0, 32.0, 22.0, 15.0, 15.0, 14.0, 7.0, 9.0, 6.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.469054102897644, -1.4224615097045898, -1.3758689165115356, -1.3292763233184814, -1.2826837301254272, -1.236091136932373, -1.1894984245300293, -1.1429059505462646, -1.096313238143921, -1.0497206449508667, -1.0031280517578125, -0.9565354585647583, -0.9099428653717041, -0.8633502721786499, -0.8167576193809509, -0.7701650261878967, -0.7235724925994873, -0.6769798994064331, -0.6303873062133789, -0.5837947130203247, -0.5372021198272705, -0.4906094968318939, -0.44401687383651733, -0.39742428064346313, -0.35083168745040894, -0.30423909425735474, -0.25764650106430054, -0.21105387806892395, -0.16446128487586975, -0.11786869168281555, -0.07127606868743896, -0.024683475494384766, 0.021908998489379883, 0.06850159913301468, 0.11509419977664948, 0.16168680787086487, 0.20827940106391907, 0.25487199425697327, 0.30146461725234985, 0.34805721044540405, 0.39464980363845825, 0.44124239683151245, 0.48783499002456665, 0.5344276428222656, 0.5810202360153198, 0.627612829208374, 0.6742054224014282, 0.7207980155944824, 0.7673906087875366, 0.8139832019805908, 0.860575795173645, 0.9071683883666992, 0.9537609815597534, 1.0003535747528076, 1.0469462871551514, 1.093538761138916, 1.1401314735412598, 1.186724066734314, 1.2333166599273682, 1.2799092531204224, 1.3265018463134766, 1.3730944395065308, 1.419687032699585, 1.4662797451019287, 1.5128722190856934]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 3.0, 4.0, 7.0, 10.0, 17.0, 10.0, 19.0, 20.0, 32.0, 23.0, 33.0, 33.0, 26.0, 35.0, 41.0, 45.0, 48.0, 43.0, 38.0, 35.0, 42.0, 29.0, 45.0, 32.0, 40.0, 36.0, 29.0, 24.0, 29.0, 20.0, 24.0, 19.0, 24.0, 12.0, 9.0, 11.0, 8.0, 13.0, 9.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.993068277835846, -0.9603825807571411, -0.927696943283081, -0.8950112462043762, -0.8623255491256714, -0.8296399116516113, -0.7969542145729065, -0.7642685174942017, -0.7315828800201416, -0.6988971829414368, -0.6662115454673767, -0.6335258483886719, -0.6008402109146118, -0.568154513835907, -0.5354688167572021, -0.5027831792831421, -0.47009748220443726, -0.4374118149280548, -0.40472614765167236, -0.37204045057296753, -0.3393547832965851, -0.30666911602020264, -0.2739834189414978, -0.24129775166511536, -0.2086120843887329, -0.17592641711235046, -0.14324073493480682, -0.11055506020784378, -0.07786938548088074, -0.04518371820449829, -0.012498036026954651, 0.02018764615058899, 0.05287337303161621, 0.08555904775857925, 0.1182447224855423, 0.15093040466308594, 0.18361607193946838, 0.21630173921585083, 0.24898742139339447, 0.2816731035709381, 0.31435877084732056, 0.347044438123703, 0.37973010540008545, 0.4124158024787903, 0.44510146975517273, 0.4777871370315552, 0.51047283411026, 0.5431585311889648, 0.5758441686630249, 0.6085298657417297, 0.6412155032157898, 0.6739012002944946, 0.7065868377685547, 0.7392725348472595, 0.7719582319259644, 0.8046438694000244, 0.8373295664787292, 0.8700152635574341, 0.9027009010314941, 0.935386598110199, 0.9680722951889038, 1.0007579326629639, 1.033443570137024, 1.0661293268203735, 1.0988149642944336]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 8.0, 11.0, 8.0, 12.0, 21.0, 21.0, 49.0, 48.0, 90.0, 155.0, 191.0, 355.0, 591.0, 955.0, 1472.0, 2410.0, 4068.0, 6547.0, 10696.0, 17770.0, 29482.0, 48878.0, 79344.0, 122158.0, 168576.0, 177988.0, 138252.0, 91985.0, 57556.0, 34994.0, 21108.0, 12825.0, 7760.0, 4588.0, 2954.0, 1733.0, 1023.0, 651.0, 440.0, 287.0, 167.0, 119.0, 69.0, 50.0, 25.0, 24.0, 16.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.315673828125, -0.3061561584472656, -0.29663848876953125, -0.2871208190917969, -0.2776031494140625, -0.2680854797363281, -0.25856781005859375, -0.24905014038085938, -0.239532470703125, -0.23001480102539062, -0.22049713134765625, -0.21097946166992188, -0.2014617919921875, -0.19194412231445312, -0.18242645263671875, -0.17290878295898438, -0.16339111328125, -0.15387344360351562, -0.14435577392578125, -0.13483810424804688, -0.1253204345703125, -0.11580276489257812, -0.10628509521484375, -0.09676742553710938, -0.087249755859375, -0.07773208618164062, -0.06821441650390625, -0.058696746826171875, -0.0491790771484375, -0.039661407470703125, -0.03014373779296875, -0.020626068115234375, -0.0111083984375, -0.001590728759765625, 0.00792694091796875, 0.017444610595703125, 0.0269622802734375, 0.036479949951171875, 0.04599761962890625, 0.055515289306640625, 0.065032958984375, 0.07455062866210938, 0.08406829833984375, 0.09358596801757812, 0.1031036376953125, 0.11262130737304688, 0.12213897705078125, 0.13165664672851562, 0.14117431640625, 0.15069198608398438, 0.16020965576171875, 0.16972732543945312, 0.1792449951171875, 0.18876266479492188, 0.19828033447265625, 0.20779800415039062, 0.217315673828125, 0.22683334350585938, 0.23635101318359375, 0.24586868286132812, 0.2553863525390625, 0.2649040222167969, 0.27442169189453125, 0.2839393615722656, 0.29345703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 5.0, 10.0, 5.0, 11.0, 23.0, 14.0, 18.0, 18.0, 30.0, 24.0, 38.0, 27.0, 50.0, 61.0, 48.0, 46.0, 41.0, 48.0, 55.0, 45.0, 42.0, 39.0, 41.0, 37.0, 36.0, 32.0, 21.0, 23.0, 19.0, 19.0, 11.0, 11.0, 15.0, 5.0, 8.0, 7.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.275390625, -1.23504638671875, -1.1947021484375, -1.15435791015625, -1.114013671875, -1.07366943359375, -1.0333251953125, -0.99298095703125, -0.95263671875, -0.91229248046875, -0.8719482421875, -0.83160400390625, -0.791259765625, -0.75091552734375, -0.7105712890625, -0.67022705078125, -0.6298828125, -0.58953857421875, -0.5491943359375, -0.50885009765625, -0.468505859375, -0.42816162109375, -0.3878173828125, -0.34747314453125, -0.30712890625, -0.26678466796875, -0.2264404296875, -0.18609619140625, -0.145751953125, -0.10540771484375, -0.0650634765625, -0.02471923828125, 0.015625, 0.05596923828125, 0.0963134765625, 0.13665771484375, 0.177001953125, 0.21734619140625, 0.2576904296875, 0.29803466796875, 0.33837890625, 0.37872314453125, 0.4190673828125, 0.45941162109375, 0.499755859375, 0.54010009765625, 0.5804443359375, 0.62078857421875, 0.6611328125, 0.70147705078125, 0.7418212890625, 0.78216552734375, 0.822509765625, 0.86285400390625, 0.9031982421875, 0.94354248046875, 0.98388671875, 1.02423095703125, 1.0645751953125, 1.10491943359375, 1.145263671875, 1.18560791015625, 1.2259521484375, 1.26629638671875, 1.306640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 6.0, 6.0, 20.0, 21.0, 41.0, 53.0, 90.0, 135.0, 224.0, 344.0, 597.0, 1046.0, 1847.0, 3292.0, 6116.0, 11655.0, 22439.0, 44921.0, 88282.0, 165038.0, 245352.0, 209021.0, 120249.0, 62166.0, 31260.0, 15929.0, 8079.0, 4618.0, 2368.0, 1313.0, 770.0, 460.0, 283.0, 157.0, 109.0, 81.0, 48.0, 30.0, 17.0, 10.0, 9.0, 10.0, 4.0, 7.0, 6.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.4267578125, -0.4141082763671875, -0.401458740234375, -0.3888092041015625, -0.37615966796875, -0.3635101318359375, -0.350860595703125, -0.3382110595703125, -0.3255615234375, -0.3129119873046875, -0.300262451171875, -0.2876129150390625, -0.27496337890625, -0.2623138427734375, -0.249664306640625, -0.2370147705078125, -0.224365234375, -0.2117156982421875, -0.199066162109375, -0.1864166259765625, -0.17376708984375, -0.1611175537109375, -0.148468017578125, -0.1358184814453125, -0.1231689453125, -0.1105194091796875, -0.097869873046875, -0.0852203369140625, -0.07257080078125, -0.0599212646484375, -0.047271728515625, -0.0346221923828125, -0.02197265625, -0.0093231201171875, 0.003326416015625, 0.0159759521484375, 0.02862548828125, 0.0412750244140625, 0.053924560546875, 0.0665740966796875, 0.0792236328125, 0.0918731689453125, 0.104522705078125, 0.1171722412109375, 0.12982177734375, 0.1424713134765625, 0.155120849609375, 0.1677703857421875, 0.180419921875, 0.1930694580078125, 0.205718994140625, 0.2183685302734375, 0.23101806640625, 0.2436676025390625, 0.256317138671875, 0.2689666748046875, 0.2816162109375, 0.2942657470703125, 0.306915283203125, 0.3195648193359375, 0.33221435546875, 0.3448638916015625, 0.357513427734375, 0.3701629638671875, 0.3828125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 5.0, 1.0, 4.0, 5.0, 9.0, 11.0, 10.0, 10.0, 14.0, 23.0, 16.0, 19.0, 23.0, 21.0, 26.0, 28.0, 26.0, 37.0, 38.0, 40.0, 47.0, 38.0, 41.0, 49.0, 32.0, 43.0, 33.0, 35.0, 32.0, 42.0, 35.0, 23.0, 25.0, 19.0, 16.0, 30.0, 10.0, 18.0, 12.0, 14.0, 7.0, 5.0, 5.0, 3.0, 3.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6044921875, -0.5842742919921875, -0.564056396484375, -0.5438385009765625, -0.52362060546875, -0.5034027099609375, -0.483184814453125, -0.4629669189453125, -0.4427490234375, -0.4225311279296875, -0.402313232421875, -0.3820953369140625, -0.36187744140625, -0.3416595458984375, -0.321441650390625, -0.3012237548828125, -0.281005859375, -0.2607879638671875, -0.240570068359375, -0.2203521728515625, -0.20013427734375, -0.1799163818359375, -0.159698486328125, -0.1394805908203125, -0.1192626953125, -0.0990447998046875, -0.078826904296875, -0.0586090087890625, -0.03839111328125, -0.0181732177734375, 0.002044677734375, 0.0222625732421875, 0.04248046875, 0.0626983642578125, 0.082916259765625, 0.1031341552734375, 0.12335205078125, 0.1435699462890625, 0.163787841796875, 0.1840057373046875, 0.2042236328125, 0.2244415283203125, 0.244659423828125, 0.2648773193359375, 0.28509521484375, 0.3053131103515625, 0.325531005859375, 0.3457489013671875, 0.365966796875, 0.3861846923828125, 0.406402587890625, 0.4266204833984375, 0.44683837890625, 0.4670562744140625, 0.487274169921875, 0.5074920654296875, 0.5277099609375, 0.5479278564453125, 0.568145751953125, 0.5883636474609375, 0.60858154296875, 0.6287994384765625, 0.649017333984375, 0.6692352294921875, 0.689453125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 12.0, 19.0, 18.0, 40.0, 40.0, 82.0, 99.0, 191.0, 249.0, 411.0, 609.0, 887.0, 1549.0, 2450.0, 4303.0, 7593.0, 15093.0, 32191.0, 78715.0, 214299.0, 377292.0, 185032.0, 67972.0, 28689.0, 13487.0, 7011.0, 3928.0, 2280.0, 1451.0, 886.0, 561.0, 391.0, 219.0, 154.0, 104.0, 63.0, 66.0, 41.0, 14.0, 18.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.19189453125, -0.18615341186523438, -0.18041229248046875, -0.17467117309570312, -0.1689300537109375, -0.16318893432617188, -0.15744781494140625, -0.15170669555664062, -0.145965576171875, -0.14022445678710938, -0.13448333740234375, -0.12874221801757812, -0.1230010986328125, -0.11725997924804688, -0.11151885986328125, -0.10577774047851562, -0.10003662109375, -0.09429550170898438, -0.08855438232421875, -0.08281326293945312, -0.0770721435546875, -0.07133102416992188, -0.06558990478515625, -0.059848785400390625, -0.054107666015625, -0.048366546630859375, -0.04262542724609375, -0.036884307861328125, -0.0311431884765625, -0.025402069091796875, -0.01966094970703125, -0.013919830322265625, -0.0081787109375, -0.002437591552734375, 0.00330352783203125, 0.009044647216796875, 0.0147857666015625, 0.020526885986328125, 0.02626800537109375, 0.032009124755859375, 0.037750244140625, 0.043491363525390625, 0.04923248291015625, 0.054973602294921875, 0.0607147216796875, 0.06645584106445312, 0.07219696044921875, 0.07793807983398438, 0.08367919921875, 0.08942031860351562, 0.09516143798828125, 0.10090255737304688, 0.1066436767578125, 0.11238479614257812, 0.11812591552734375, 0.12386703491210938, 0.129608154296875, 0.13534927368164062, 0.14109039306640625, 0.14683151245117188, 0.1525726318359375, 0.15831375122070312, 0.16405487060546875, 0.16979598999023438, 0.175537109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 6.0, 3.0, 14.0, 12.0, 21.0, 24.0, 33.0, 28.0, 30.0, 38.0, 42.0, 46.0, 45.0, 51.0, 39.0, 55.0, 46.0, 45.0, 64.0, 40.0, 55.0, 32.0, 24.0, 25.0, 22.0, 18.0, 19.0, 23.0, 17.0, 13.0, 12.0, 7.0, 3.0, 3.0, 7.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.298324584960938e-06, -8.977949619293213e-06, -8.657574653625488e-06, -8.337199687957764e-06, -8.016824722290039e-06, -7.696449756622314e-06, -7.37607479095459e-06, -7.055699825286865e-06, -6.735324859619141e-06, -6.414949893951416e-06, -6.094574928283691e-06, -5.774199962615967e-06, -5.453824996948242e-06, -5.133450031280518e-06, -4.813075065612793e-06, -4.492700099945068e-06, -4.172325134277344e-06, -3.851950168609619e-06, -3.5315752029418945e-06, -3.21120023727417e-06, -2.8908252716064453e-06, -2.5704503059387207e-06, -2.250075340270996e-06, -1.9297003746032715e-06, -1.6093254089355469e-06, -1.2889504432678223e-06, -9.685754776000977e-07, -6.48200511932373e-07, -3.2782554626464844e-07, -7.450580596923828e-09, 3.129243850708008e-07, 6.332993507385254e-07, 9.5367431640625e-07, 1.2740492820739746e-06, 1.5944242477416992e-06, 1.914799213409424e-06, 2.2351741790771484e-06, 2.555549144744873e-06, 2.8759241104125977e-06, 3.1962990760803223e-06, 3.516674041748047e-06, 3.8370490074157715e-06, 4.157423973083496e-06, 4.477798938751221e-06, 4.798173904418945e-06, 5.11854887008667e-06, 5.4389238357543945e-06, 5.759298801422119e-06, 6.079673767089844e-06, 6.400048732757568e-06, 6.720423698425293e-06, 7.040798664093018e-06, 7.361173629760742e-06, 7.681548595428467e-06, 8.001923561096191e-06, 8.322298526763916e-06, 8.64267349243164e-06, 8.963048458099365e-06, 9.28342342376709e-06, 9.603798389434814e-06, 9.924173355102539e-06, 1.0244548320770264e-05, 1.0564923286437988e-05, 1.0885298252105713e-05, 1.1205673217773438e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 10.0, 15.0, 33.0, 26.0, 45.0, 79.0, 95.0, 147.0, 187.0, 331.0, 554.0, 788.0, 1247.0, 2113.0, 3588.0, 6208.0, 10415.0, 18253.0, 31186.0, 56630.0, 100991.0, 169169.0, 219709.0, 177462.0, 108321.0, 60437.0, 34049.0, 19150.0, 11045.0, 6387.0, 3707.0, 2269.0, 1410.0, 887.0, 534.0, 371.0, 254.0, 142.0, 105.0, 65.0, 45.0, 22.0, 23.0, 24.0, 9.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1256103515625, -0.12136077880859375, -0.1171112060546875, -0.11286163330078125, -0.108612060546875, -0.10436248779296875, -0.1001129150390625, -0.09586334228515625, -0.09161376953125, -0.08736419677734375, -0.0831146240234375, -0.07886505126953125, -0.074615478515625, -0.07036590576171875, -0.0661163330078125, -0.06186676025390625, -0.0576171875, -0.05336761474609375, -0.0491180419921875, -0.04486846923828125, -0.040618896484375, -0.03636932373046875, -0.0321197509765625, -0.02787017822265625, -0.02362060546875, -0.01937103271484375, -0.0151214599609375, -0.01087188720703125, -0.006622314453125, -0.00237274169921875, 0.0018768310546875, 0.00612640380859375, 0.0103759765625, 0.01462554931640625, 0.0188751220703125, 0.02312469482421875, 0.027374267578125, 0.03162384033203125, 0.0358734130859375, 0.04012298583984375, 0.04437255859375, 0.04862213134765625, 0.0528717041015625, 0.05712127685546875, 0.061370849609375, 0.06562042236328125, 0.0698699951171875, 0.07411956787109375, 0.078369140625, 0.08261871337890625, 0.0868682861328125, 0.09111785888671875, 0.095367431640625, 0.09961700439453125, 0.1038665771484375, 0.10811614990234375, 0.11236572265625, 0.11661529541015625, 0.1208648681640625, 0.12511444091796875, 0.129364013671875, 0.13361358642578125, 0.1378631591796875, 0.14211273193359375, 0.1463623046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 6.0, 2.0, 3.0, 6.0, 6.0, 13.0, 4.0, 16.0, 12.0, 15.0, 17.0, 14.0, 14.0, 24.0, 30.0, 33.0, 31.0, 36.0, 45.0, 53.0, 70.0, 78.0, 55.0, 48.0, 44.0, 42.0, 44.0, 35.0, 35.0, 30.0, 31.0, 8.0, 21.0, 16.0, 11.0, 11.0, 5.0, 6.0, 2.0, 8.0, 5.0, 5.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0284576416015625, -0.027442216873168945, -0.02642679214477539, -0.025411367416381836, -0.02439594268798828, -0.023380517959594727, -0.022365093231201172, -0.021349668502807617, -0.020334243774414062, -0.019318819046020508, -0.018303394317626953, -0.0172879695892334, -0.016272544860839844, -0.015257120132446289, -0.014241695404052734, -0.01322627067565918, -0.012210845947265625, -0.01119542121887207, -0.010179996490478516, -0.009164571762084961, -0.008149147033691406, -0.0071337223052978516, -0.006118297576904297, -0.005102872848510742, -0.0040874481201171875, -0.003072023391723633, -0.002056598663330078, -0.0010411739349365234, -2.574920654296875e-05, 0.000989675521850586, 0.0020051002502441406, 0.0030205249786376953, 0.00403594970703125, 0.005051374435424805, 0.006066799163818359, 0.007082223892211914, 0.008097648620605469, 0.009113073348999023, 0.010128498077392578, 0.011143922805786133, 0.012159347534179688, 0.013174772262573242, 0.014190196990966797, 0.015205621719360352, 0.016221046447753906, 0.01723647117614746, 0.018251895904541016, 0.01926732063293457, 0.020282745361328125, 0.02129817008972168, 0.022313594818115234, 0.02332901954650879, 0.024344444274902344, 0.0253598690032959, 0.026375293731689453, 0.027390718460083008, 0.028406143188476562, 0.029421567916870117, 0.030436992645263672, 0.03145241737365723, 0.03246784210205078, 0.033483266830444336, 0.03449869155883789, 0.035514116287231445, 0.036529541015625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 4.0, 15.0, 8.0, 9.0, 23.0, 11.0, 28.0, 19.0, 31.0, 46.0, 32.0, 34.0, 35.0, 60.0, 57.0, 57.0, 56.0, 55.0, 57.0, 46.0, 49.0, 28.0, 33.0, 34.0, 23.0, 26.0, 28.0, 16.0, 17.0, 11.0, 11.0, 5.0, 5.0, 7.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.437822937965393, -1.3920657634735107, -1.3463085889816284, -1.300551414489746, -1.2547943592071533, -1.209037184715271, -1.1632800102233887, -1.1175228357315063, -1.071765661239624, -1.0260084867477417, -0.9802513718605042, -0.9344941973686218, -0.8887370824813843, -0.842979907989502, -0.7972227334976196, -0.7514655590057373, -0.7057085037231445, -0.6599513292312622, -0.6141942143440247, -0.5684370398521423, -0.5226799249649048, -0.47692275047302246, -0.43116557598114014, -0.3854084312915802, -0.33965128660202026, -0.2938941419124603, -0.2481369823217392, -0.20237982273101807, -0.15662267804145813, -0.1108655333518982, -0.06510835886001587, -0.019351214170455933, 0.026405811309814453, 0.07216296344995499, 0.11792011559009552, 0.16367727518081665, 0.2094344198703766, 0.2551915645599365, 0.30094873905181885, 0.3467058837413788, 0.3924630284309387, 0.43822017312049866, 0.4839773178100586, 0.5297344923019409, 0.5754916667938232, 0.6212487816810608, 0.6670059561729431, 0.7127630710601807, 0.758520245552063, 0.8042774200439453, 0.8500345349311829, 0.8957917094230652, 0.9415488243103027, 0.9873059988021851, 1.0330631732940674, 1.0788203477859497, 1.124577522277832, 1.1703346967697144, 1.2160918712615967, 1.2618489265441895, 1.3076061010360718, 1.353363275527954, 1.3991204500198364, 1.4448776245117188, 1.4906346797943115]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 1.0, 5.0, 3.0, 8.0, 13.0, 13.0, 14.0, 16.0, 22.0, 29.0, 23.0, 38.0, 32.0, 24.0, 34.0, 47.0, 47.0, 46.0, 38.0, 39.0, 40.0, 38.0, 26.0, 45.0, 36.0, 36.0, 41.0, 28.0, 27.0, 22.0, 21.0, 28.0, 21.0, 19.0, 9.0, 13.0, 12.0, 5.0, 12.0, 11.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9932097792625427, -0.960573136806488, -0.9279365539550781, -0.8952999114990234, -0.8626633286476135, -0.8300266861915588, -0.7973901033401489, -0.7647534608840942, -0.7321168184280396, -0.6994801759719849, -0.666843593120575, -0.6342069506645203, -0.6015703678131104, -0.5689337253570557, -0.536297082901001, -0.5036605000495911, -0.47102391719818115, -0.43838730454444885, -0.40575069189071655, -0.37311404943466187, -0.34047746658325195, -0.30784082412719727, -0.27520421147346497, -0.24256759881973267, -0.20993098616600037, -0.17729437351226807, -0.14465776085853577, -0.11202113330364227, -0.07938452064990997, -0.04674790799617767, -0.01411128044128418, 0.01852533221244812, 0.051161885261535645, 0.08379849791526794, 0.11643511801958084, 0.14907173812389374, 0.18170835077762604, 0.21434496343135834, 0.24698159098625183, 0.27961820363998413, 0.31225481629371643, 0.34489142894744873, 0.37752804160118103, 0.41016465425491333, 0.442801296710968, 0.47543787956237793, 0.5080745220184326, 0.5407111644744873, 0.5733477473258972, 0.6059843897819519, 0.6386209726333618, 0.6712576150894165, 0.7038941979408264, 0.7365308403968811, 0.769167423248291, 0.8018040657043457, 0.8344407081604004, 0.8670773506164551, 0.899713933467865, 0.9323505759239197, 0.9649871587753296, 0.9976238012313843, 1.030260443687439, 1.062896966934204, 1.0955336093902588]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 15.0, 25.0, 37.0, 39.0, 78.0, 130.0, 287.0, 484.0, 746.0, 1330.0, 2261.0, 3887.0, 6577.0, 11004.0, 18470.0, 30062.0, 46316.0, 69047.0, 95066.0, 118543.0, 132622.0, 130941.0, 114651.0, 89790.0, 64373.0, 42822.0, 27180.0, 17338.0, 9994.0, 6031.0, 3485.0, 2028.0, 1248.0, 667.0, 382.0, 222.0, 145.0, 84.0, 57.0, 37.0, 17.0, 11.0, 9.0, 4.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.107421875, -1.0747604370117188, -1.0420989990234375, -1.0094375610351562, -0.976776123046875, -0.9441146850585938, -0.9114532470703125, -0.8787918090820312, -0.84613037109375, -0.8134689331054688, -0.7808074951171875, -0.7481460571289062, -0.715484619140625, -0.6828231811523438, -0.6501617431640625, -0.6175003051757812, -0.5848388671875, -0.5521774291992188, -0.5195159912109375, -0.48685455322265625, -0.454193115234375, -0.42153167724609375, -0.3888702392578125, -0.35620880126953125, -0.32354736328125, -0.29088592529296875, -0.2582244873046875, -0.22556304931640625, -0.192901611328125, -0.16024017333984375, -0.1275787353515625, -0.09491729736328125, -0.062255859375, -0.02959442138671875, 0.0030670166015625, 0.03572845458984375, 0.068389892578125, 0.10105133056640625, 0.1337127685546875, 0.16637420654296875, 0.19903564453125, 0.23169708251953125, 0.2643585205078125, 0.29701995849609375, 0.329681396484375, 0.36234283447265625, 0.3950042724609375, 0.42766571044921875, 0.4603271484375, 0.49298858642578125, 0.5256500244140625, 0.5583114624023438, 0.590972900390625, 0.6236343383789062, 0.6562957763671875, 0.6889572143554688, 0.72161865234375, 0.7542800903320312, 0.7869415283203125, 0.8196029663085938, 0.852264404296875, 0.8849258422851562, 0.9175872802734375, 0.9502487182617188, 0.98291015625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 4.0, 5.0, 10.0, 7.0, 11.0, 12.0, 12.0, 32.0, 19.0, 39.0, 37.0, 38.0, 31.0, 39.0, 42.0, 59.0, 56.0, 54.0, 39.0, 58.0, 41.0, 41.0, 33.0, 47.0, 28.0, 29.0, 27.0, 28.0, 25.0, 15.0, 17.0, 14.0, 19.0, 6.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.11480712890625, -1.0753173828125, -1.03582763671875, -0.996337890625, -0.95684814453125, -0.9173583984375, -0.87786865234375, -0.83837890625, -0.79888916015625, -0.7593994140625, -0.71990966796875, -0.680419921875, -0.64093017578125, -0.6014404296875, -0.56195068359375, -0.5224609375, -0.48297119140625, -0.4434814453125, -0.40399169921875, -0.364501953125, -0.32501220703125, -0.2855224609375, -0.24603271484375, -0.20654296875, -0.16705322265625, -0.1275634765625, -0.08807373046875, -0.048583984375, -0.00909423828125, 0.0303955078125, 0.06988525390625, 0.109375, 0.14886474609375, 0.1883544921875, 0.22784423828125, 0.267333984375, 0.30682373046875, 0.3463134765625, 0.38580322265625, 0.42529296875, 0.46478271484375, 0.5042724609375, 0.54376220703125, 0.583251953125, 0.62274169921875, 0.6622314453125, 0.70172119140625, 0.7412109375, 0.78070068359375, 0.8201904296875, 0.85968017578125, 0.899169921875, 0.93865966796875, 0.9781494140625, 1.01763916015625, 1.05712890625, 1.09661865234375, 1.1361083984375, 1.17559814453125, 1.215087890625, 1.25457763671875, 1.2940673828125, 1.33355712890625, 1.373046875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 15.0, 15.0, 25.0, 46.0, 61.0, 101.0, 151.0, 245.0, 404.0, 648.0, 984.0, 1589.0, 2513.0, 3897.0, 6072.0, 9312.0, 14391.0, 21976.0, 31910.0, 45404.0, 61562.0, 79713.0, 96118.0, 107680.0, 111343.0, 105211.0, 91511.0, 74286.0, 56345.0, 41036.0, 28749.0, 19406.0, 12786.0, 8361.0, 5350.0, 3397.0, 2147.0, 1382.0, 871.0, 543.0, 364.0, 248.0, 153.0, 76.0, 62.0, 38.0, 17.0, 13.0, 14.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.847564697265625, -0.81964111328125, -0.791717529296875, -0.7637939453125, -0.735870361328125, -0.70794677734375, -0.680023193359375, -0.652099609375, -0.624176025390625, -0.59625244140625, -0.568328857421875, -0.5404052734375, -0.512481689453125, -0.48455810546875, -0.456634521484375, -0.4287109375, -0.400787353515625, -0.37286376953125, -0.344940185546875, -0.3170166015625, -0.289093017578125, -0.26116943359375, -0.233245849609375, -0.205322265625, -0.177398681640625, -0.14947509765625, -0.121551513671875, -0.0936279296875, -0.065704345703125, -0.03778076171875, -0.009857177734375, 0.01806640625, 0.045989990234375, 0.07391357421875, 0.101837158203125, 0.1297607421875, 0.157684326171875, 0.18560791015625, 0.213531494140625, 0.241455078125, 0.269378662109375, 0.29730224609375, 0.325225830078125, 0.3531494140625, 0.381072998046875, 0.40899658203125, 0.436920166015625, 0.46484375, 0.492767333984375, 0.52069091796875, 0.548614501953125, 0.5765380859375, 0.604461669921875, 0.63238525390625, 0.660308837890625, 0.688232421875, 0.716156005859375, 0.74407958984375, 0.772003173828125, 0.7999267578125, 0.827850341796875, 0.85577392578125, 0.883697509765625, 0.91162109375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 9.0, 12.0, 16.0, 20.0, 13.0, 32.0, 40.0, 31.0, 24.0, 45.0, 52.0, 52.0, 51.0, 56.0, 42.0, 44.0, 47.0, 48.0, 56.0, 41.0, 33.0, 50.0, 33.0, 26.0, 29.0, 24.0, 13.0, 11.0, 11.0, 11.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6833038330078125, -0.657623291015625, -0.6319427490234375, -0.60626220703125, -0.5805816650390625, -0.554901123046875, -0.5292205810546875, -0.5035400390625, -0.4778594970703125, -0.452178955078125, -0.4264984130859375, -0.40081787109375, -0.3751373291015625, -0.349456787109375, -0.3237762451171875, -0.298095703125, -0.2724151611328125, -0.246734619140625, -0.2210540771484375, -0.19537353515625, -0.1696929931640625, -0.144012451171875, -0.1183319091796875, -0.0926513671875, -0.0669708251953125, -0.041290283203125, -0.0156097412109375, 0.01007080078125, 0.0357513427734375, 0.061431884765625, 0.0871124267578125, 0.11279296875, 0.1384735107421875, 0.164154052734375, 0.1898345947265625, 0.21551513671875, 0.2411956787109375, 0.266876220703125, 0.2925567626953125, 0.3182373046875, 0.3439178466796875, 0.369598388671875, 0.3952789306640625, 0.42095947265625, 0.4466400146484375, 0.472320556640625, 0.4980010986328125, 0.523681640625, 0.5493621826171875, 0.575042724609375, 0.6007232666015625, 0.62640380859375, 0.6520843505859375, 0.677764892578125, 0.7034454345703125, 0.7291259765625, 0.7548065185546875, 0.780487060546875, 0.8061676025390625, 0.83184814453125, 0.8575286865234375, 0.883209228515625, 0.9088897705078125, 0.9345703125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 9.0, 4.0, 9.0, 19.0, 29.0, 30.0, 37.0, 56.0, 82.0, 124.0, 215.0, 246.0, 403.0, 587.0, 869.0, 1309.0, 1976.0, 3057.0, 4616.0, 7145.0, 11384.0, 17593.0, 27230.0, 42210.0, 62524.0, 88929.0, 116502.0, 134577.0, 136402.0, 116924.0, 89630.0, 63299.0, 42319.0, 27685.0, 17843.0, 11367.0, 7256.0, 4924.0, 3130.0, 1965.0, 1289.0, 882.0, 565.0, 374.0, 276.0, 205.0, 132.0, 97.0, 66.0, 48.0, 39.0, 23.0, 21.0, 8.0, 11.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.46142578125, -0.44605255126953125, -0.4306793212890625, -0.41530609130859375, -0.399932861328125, -0.38455963134765625, -0.3691864013671875, -0.35381317138671875, -0.33843994140625, -0.32306671142578125, -0.3076934814453125, -0.29232025146484375, -0.276947021484375, -0.26157379150390625, -0.2462005615234375, -0.23082733154296875, -0.2154541015625, -0.20008087158203125, -0.1847076416015625, -0.16933441162109375, -0.153961181640625, -0.13858795166015625, -0.1232147216796875, -0.10784149169921875, -0.09246826171875, -0.07709503173828125, -0.0617218017578125, -0.04634857177734375, -0.030975341796875, -0.01560211181640625, -0.0002288818359375, 0.01514434814453125, 0.030517578125, 0.04589080810546875, 0.0612640380859375, 0.07663726806640625, 0.092010498046875, 0.10738372802734375, 0.1227569580078125, 0.13813018798828125, 0.15350341796875, 0.16887664794921875, 0.1842498779296875, 0.19962310791015625, 0.214996337890625, 0.23036956787109375, 0.2457427978515625, 0.26111602783203125, 0.2764892578125, 0.29186248779296875, 0.3072357177734375, 0.32260894775390625, 0.337982177734375, 0.35335540771484375, 0.3687286376953125, 0.38410186767578125, 0.39947509765625, 0.41484832763671875, 0.4302215576171875, 0.44559478759765625, 0.460968017578125, 0.47634124755859375, 0.4917144775390625, 0.5070877075195312, 0.5224609375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 9.0, 16.0, 22.0, 25.0, 28.0, 40.0, 35.0, 52.0, 48.0, 61.0, 59.0, 68.0, 65.0, 69.0, 50.0, 56.0, 50.0, 29.0, 46.0, 27.0, 16.0, 21.0, 16.0, 16.0, 13.0, 3.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.340576171875e-05, -5.150400102138519e-05, -4.9602240324020386e-05, -4.770047962665558e-05, -4.579871892929077e-05, -4.3896958231925964e-05, -4.199519753456116e-05, -4.009343683719635e-05, -3.819167613983154e-05, -3.6289915442466736e-05, -3.438815474510193e-05, -3.248639404773712e-05, -3.0584633350372314e-05, -2.8682872653007507e-05, -2.67811119556427e-05, -2.4879351258277893e-05, -2.2977590560913086e-05, -2.107582986354828e-05, -1.917406916618347e-05, -1.7272308468818665e-05, -1.5370547771453857e-05, -1.346878707408905e-05, -1.1567026376724243e-05, -9.665265679359436e-06, -7.763504981994629e-06, -5.861744284629822e-06, -3.959983587265015e-06, -2.0582228899002075e-06, -1.564621925354004e-07, 1.7452985048294067e-06, 3.647059202194214e-06, 5.548819899559021e-06, 7.450580596923828e-06, 9.352341294288635e-06, 1.1254101991653442e-05, 1.315586268901825e-05, 1.5057623386383057e-05, 1.6959384083747864e-05, 1.886114478111267e-05, 2.0762905478477478e-05, 2.2664666175842285e-05, 2.4566426873207092e-05, 2.64681875705719e-05, 2.8369948267936707e-05, 3.0271708965301514e-05, 3.217346966266632e-05, 3.407523036003113e-05, 3.5976991057395935e-05, 3.787875175476074e-05, 3.978051245212555e-05, 4.1682273149490356e-05, 4.3584033846855164e-05, 4.548579454421997e-05, 4.738755524158478e-05, 4.9289315938949585e-05, 5.119107663631439e-05, 5.30928373336792e-05, 5.4994598031044006e-05, 5.6896358728408813e-05, 5.879811942577362e-05, 6.069988012313843e-05, 6.260164082050323e-05, 6.450340151786804e-05, 6.640516221523285e-05, 6.830692291259766e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 12.0, 8.0, 18.0, 28.0, 35.0, 41.0, 74.0, 106.0, 182.0, 280.0, 517.0, 771.0, 1402.0, 2447.0, 4601.0, 8304.0, 15893.0, 30309.0, 56366.0, 98206.0, 150535.0, 190416.0, 179239.0, 131875.0, 80131.0, 45044.0, 24030.0, 12518.0, 6665.0, 3629.0, 2037.0, 1047.0, 704.0, 403.0, 240.0, 147.0, 87.0, 85.0, 35.0, 31.0, 17.0, 20.0, 6.0, 3.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5986328125, -0.5778579711914062, -0.5570831298828125, -0.5363082885742188, -0.515533447265625, -0.49475860595703125, -0.4739837646484375, -0.45320892333984375, -0.43243408203125, -0.41165924072265625, -0.3908843994140625, -0.37010955810546875, -0.349334716796875, -0.32855987548828125, -0.3077850341796875, -0.28701019287109375, -0.2662353515625, -0.24546051025390625, -0.2246856689453125, -0.20391082763671875, -0.183135986328125, -0.16236114501953125, -0.1415863037109375, -0.12081146240234375, -0.10003662109375, -0.07926177978515625, -0.0584869384765625, -0.03771209716796875, -0.016937255859375, 0.00383758544921875, 0.0246124267578125, 0.04538726806640625, 0.066162109375, 0.08693695068359375, 0.1077117919921875, 0.12848663330078125, 0.149261474609375, 0.17003631591796875, 0.1908111572265625, 0.21158599853515625, 0.23236083984375, 0.25313568115234375, 0.2739105224609375, 0.29468536376953125, 0.315460205078125, 0.33623504638671875, 0.3570098876953125, 0.37778472900390625, 0.3985595703125, 0.41933441162109375, 0.4401092529296875, 0.46088409423828125, 0.481658935546875, 0.5024337768554688, 0.5232086181640625, 0.5439834594726562, 0.56475830078125, 0.5855331420898438, 0.6063079833984375, 0.6270828247070312, 0.647857666015625, 0.6686325073242188, 0.6894073486328125, 0.7101821899414062, 0.73095703125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 15.0, 8.0, 13.0, 12.0, 20.0, 18.0, 25.0, 31.0, 37.0, 31.0, 28.0, 35.0, 34.0, 39.0, 44.0, 48.0, 59.0, 45.0, 46.0, 36.0, 47.0, 43.0, 39.0, 35.0, 25.0, 24.0, 28.0, 15.0, 16.0, 15.0, 14.0, 7.0, 13.0, 11.0, 8.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.154296875, -0.14919281005859375, -0.1440887451171875, -0.13898468017578125, -0.133880615234375, -0.12877655029296875, -0.1236724853515625, -0.11856842041015625, -0.11346435546875, -0.10836029052734375, -0.1032562255859375, -0.09815216064453125, -0.093048095703125, -0.08794403076171875, -0.0828399658203125, -0.07773590087890625, -0.0726318359375, -0.06752777099609375, -0.0624237060546875, -0.05731964111328125, -0.052215576171875, -0.04711151123046875, -0.0420074462890625, -0.03690338134765625, -0.03179931640625, -0.02669525146484375, -0.0215911865234375, -0.01648712158203125, -0.011383056640625, -0.00627899169921875, -0.0011749267578125, 0.00392913818359375, 0.009033203125, 0.01413726806640625, 0.0192413330078125, 0.02434539794921875, 0.029449462890625, 0.03455352783203125, 0.0396575927734375, 0.04476165771484375, 0.04986572265625, 0.05496978759765625, 0.0600738525390625, 0.06517791748046875, 0.070281982421875, 0.07538604736328125, 0.0804901123046875, 0.08559417724609375, 0.0906982421875, 0.09580230712890625, 0.1009063720703125, 0.10601043701171875, 0.111114501953125, 0.11621856689453125, 0.1213226318359375, 0.12642669677734375, 0.13153076171875, 0.13663482666015625, 0.1417388916015625, 0.14684295654296875, 0.151947021484375, 0.15705108642578125, 0.1621551513671875, 0.16725921630859375, 0.17236328125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 16.0, 6.0, 15.0, 20.0, 18.0, 33.0, 39.0, 30.0, 43.0, 39.0, 54.0, 55.0, 60.0, 48.0, 60.0, 65.0, 46.0, 48.0, 45.0, 50.0, 34.0, 18.0, 22.0, 22.0, 19.0, 14.0, 14.0, 21.0, 7.0, 4.0, 6.0, 1.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.6769119501113892, -1.6277453899383545, -1.5785787105560303, -1.5294121503829956, -1.4802454710006714, -1.4310789108276367, -1.3819122314453125, -1.3327456712722778, -1.2835791110992432, -1.2344125509262085, -1.1852458715438843, -1.1360793113708496, -1.0869126319885254, -1.0377460718154907, -0.9885794520378113, -0.9394128322601318, -0.8902461528778076, -0.8410795331001282, -0.7919129133224487, -0.7427463531494141, -0.6935796737670898, -0.6444131135940552, -0.5952464938163757, -0.5460798740386963, -0.49691325426101685, -0.4477466344833374, -0.39858001470565796, -0.3494134247303009, -0.30024680495262146, -0.251080185174942, -0.20191359519958496, -0.15274697542190552, -0.10358047485351562, -0.05441386252641678, -0.005247250199317932, 0.04391935467720032, 0.09308597445487976, 0.1422525942325592, 0.19141918420791626, 0.2405858039855957, 0.28975242376327515, 0.3389190435409546, 0.38808566331863403, 0.4372522532939911, 0.48641887307167053, 0.5355855226516724, 0.584752082824707, 0.6339187026023865, 0.6830853223800659, 0.7322519421577454, 0.7814185619354248, 0.8305851221084595, 0.8797518014907837, 0.9289183616638184, 0.9780849814414978, 1.0272516012191772, 1.076418161392212, 1.1255847215652466, 1.1747514009475708, 1.2239179611206055, 1.2730846405029297, 1.3222512006759644, 1.371417760848999, 1.4205844402313232, 1.4697511196136475]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 14.0, 9.0, 22.0, 16.0, 26.0, 21.0, 23.0, 30.0, 30.0, 41.0, 38.0, 37.0, 39.0, 51.0, 48.0, 35.0, 56.0, 37.0, 38.0, 33.0, 31.0, 28.0, 35.0, 27.0, 34.0, 31.0, 28.0, 27.0, 19.0, 11.0, 7.0, 16.0, 11.0, 10.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.144634485244751, -1.109297513961792, -1.073960542678833, -1.0386236906051636, -1.0032867193222046, -0.9679497480392456, -0.9326127767562866, -0.8972758054733276, -0.8619388937950134, -0.8266019225120544, -0.7912650108337402, -0.7559280395507812, -0.7205910682678223, -0.6852541565895081, -0.6499171853065491, -0.6145802736282349, -0.5792433023452759, -0.5439063310623169, -0.5085694193840027, -0.4732324481010437, -0.4378955066204071, -0.4025585651397705, -0.3672215938568115, -0.3318846523761749, -0.29654771089553833, -0.26121076941490173, -0.22587381303310394, -0.19053685665130615, -0.15519991517066956, -0.11986297369003296, -0.08452601730823517, -0.04918906092643738, -0.013852119445800781, 0.021484829485416412, 0.056821778416633606, 0.0921587273478508, 0.127495676279068, 0.1628326177597046, 0.19816957414150238, 0.23350653052330017, 0.26884347200393677, 0.30418041348457336, 0.33951735496520996, 0.37485432624816895, 0.41019126772880554, 0.44552820920944214, 0.4808651804924011, 0.5162020921707153, 0.5515390634536743, 0.5868760347366333, 0.6222129464149475, 0.6575499176979065, 0.6928868293762207, 0.7282238006591797, 0.7635607719421387, 0.7988977432250977, 0.8342346549034119, 0.8695716261863708, 0.9049085378646851, 0.940245509147644, 0.975582480430603, 1.0109193325042725, 1.0462563037872314, 1.0815932750701904, 1.1169302463531494]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 13.0, 11.0, 15.0, 41.0, 46.0, 109.0, 174.0, 333.0, 568.0, 1207.0, 2272.0, 4708.0, 9716.0, 20627.0, 44025.0, 95672.0, 203285.0, 409970.0, 706146.0, 909909.0, 798348.0, 501046.0, 258374.0, 121932.0, 55986.0, 25905.0, 12256.0, 5804.0, 2836.0, 1409.0, 723.0, 384.0, 184.0, 94.0, 64.0, 39.0, 19.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.755859375, -1.7052001953125, -1.654541015625, -1.6038818359375, -1.55322265625, -1.5025634765625, -1.451904296875, -1.4012451171875, -1.3505859375, -1.2999267578125, -1.249267578125, -1.1986083984375, -1.14794921875, -1.0972900390625, -1.046630859375, -0.9959716796875, -0.9453125, -0.8946533203125, -0.843994140625, -0.7933349609375, -0.74267578125, -0.6920166015625, -0.641357421875, -0.5906982421875, -0.5400390625, -0.4893798828125, -0.438720703125, -0.3880615234375, -0.33740234375, -0.2867431640625, -0.236083984375, -0.1854248046875, -0.134765625, -0.0841064453125, -0.033447265625, 0.0172119140625, 0.06787109375, 0.1185302734375, 0.169189453125, 0.2198486328125, 0.2705078125, 0.3211669921875, 0.371826171875, 0.4224853515625, 0.47314453125, 0.5238037109375, 0.574462890625, 0.6251220703125, 0.67578125, 0.7264404296875, 0.777099609375, 0.8277587890625, 0.87841796875, 0.9290771484375, 0.979736328125, 1.0303955078125, 1.0810546875, 1.1317138671875, 1.182373046875, 1.2330322265625, 1.28369140625, 1.3343505859375, 1.385009765625, 1.4356689453125, 1.486328125]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 14.0, 8.0, 4.0, 13.0, 9.0, 12.0, 10.0, 19.0, 31.0, 30.0, 29.0, 26.0, 49.0, 33.0, 41.0, 45.0, 49.0, 38.0, 35.0, 40.0, 45.0, 37.0, 43.0, 29.0, 45.0, 33.0, 27.0, 30.0, 25.0, 16.0, 29.0, 25.0, 18.0, 17.0, 10.0, 7.0, 7.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81396484375, -0.787078857421875, -0.76019287109375, -0.733306884765625, -0.7064208984375, -0.679534912109375, -0.65264892578125, -0.625762939453125, -0.598876953125, -0.571990966796875, -0.54510498046875, -0.518218994140625, -0.4913330078125, -0.464447021484375, -0.43756103515625, -0.410675048828125, -0.3837890625, -0.356903076171875, -0.33001708984375, -0.303131103515625, -0.2762451171875, -0.249359130859375, -0.22247314453125, -0.195587158203125, -0.168701171875, -0.141815185546875, -0.11492919921875, -0.088043212890625, -0.0611572265625, -0.034271240234375, -0.00738525390625, 0.019500732421875, 0.04638671875, 0.073272705078125, 0.10015869140625, 0.127044677734375, 0.1539306640625, 0.180816650390625, 0.20770263671875, 0.234588623046875, 0.261474609375, 0.288360595703125, 0.31524658203125, 0.342132568359375, 0.3690185546875, 0.395904541015625, 0.42279052734375, 0.449676513671875, 0.4765625, 0.503448486328125, 0.53033447265625, 0.557220458984375, 0.5841064453125, 0.610992431640625, 0.63787841796875, 0.664764404296875, 0.691650390625, 0.718536376953125, 0.74542236328125, 0.772308349609375, 0.7991943359375, 0.826080322265625, 0.85296630859375, 0.879852294921875, 0.90673828125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 13.0, 15.0, 24.0, 32.0, 52.0, 98.0, 134.0, 218.0, 400.0, 645.0, 1104.0, 1712.0, 2976.0, 4915.0, 8323.0, 14300.0, 23989.0, 40635.0, 68420.0, 112730.0, 179049.0, 273481.0, 385726.0, 496175.0, 562167.0, 549921.0, 468452.0, 354587.0, 243655.0, 158411.0, 97473.0, 59054.0, 34842.0, 20728.0, 12034.0, 7288.0, 4193.0, 2548.0, 1474.0, 897.0, 544.0, 323.0, 208.0, 126.0, 71.0, 49.0, 17.0, 19.0, 16.0, 3.0, 3.0, 2.0, 5.0], "bins": [-1.2412109375, -1.2065963745117188, -1.1719818115234375, -1.1373672485351562, -1.102752685546875, -1.0681381225585938, -1.0335235595703125, -0.9989089965820312, -0.96429443359375, -0.9296798706054688, -0.8950653076171875, -0.8604507446289062, -0.825836181640625, -0.7912216186523438, -0.7566070556640625, -0.7219924926757812, -0.6873779296875, -0.6527633666992188, -0.6181488037109375, -0.5835342407226562, -0.548919677734375, -0.5143051147460938, -0.4796905517578125, -0.44507598876953125, -0.41046142578125, -0.37584686279296875, -0.3412322998046875, -0.30661773681640625, -0.272003173828125, -0.23738861083984375, -0.2027740478515625, -0.16815948486328125, -0.133544921875, -0.09893035888671875, -0.0643157958984375, -0.02970123291015625, 0.004913330078125, 0.03952789306640625, 0.0741424560546875, 0.10875701904296875, 0.14337158203125, 0.17798614501953125, 0.2126007080078125, 0.24721527099609375, 0.281829833984375, 0.31644439697265625, 0.3510589599609375, 0.38567352294921875, 0.4202880859375, 0.45490264892578125, 0.4895172119140625, 0.5241317749023438, 0.558746337890625, 0.5933609008789062, 0.6279754638671875, 0.6625900268554688, 0.69720458984375, 0.7318191528320312, 0.7664337158203125, 0.8010482788085938, 0.835662841796875, 0.8702774047851562, 0.9048919677734375, 0.9395065307617188, 0.97412109375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 4.0, 13.0, 10.0, 15.0, 11.0, 25.0, 26.0, 24.0, 32.0, 44.0, 62.0, 72.0, 77.0, 112.0, 123.0, 109.0, 142.0, 148.0, 164.0, 194.0, 216.0, 214.0, 193.0, 221.0, 194.0, 202.0, 178.0, 155.0, 176.0, 144.0, 127.0, 103.0, 82.0, 92.0, 73.0, 59.0, 41.0, 50.0, 29.0, 26.0, 17.0, 14.0, 13.0, 8.0, 10.0, 3.0, 5.0, 5.0, 2.0, 6.0, 1.0, 3.0, 2.0], "bins": [-0.425048828125, -0.4124870300292969, -0.39992523193359375, -0.3873634338378906, -0.3748016357421875, -0.3622398376464844, -0.34967803955078125, -0.3371162414550781, -0.324554443359375, -0.3119926452636719, -0.29943084716796875, -0.2868690490722656, -0.2743072509765625, -0.2617454528808594, -0.24918365478515625, -0.23662185668945312, -0.22406005859375, -0.21149826049804688, -0.19893646240234375, -0.18637466430664062, -0.1738128662109375, -0.16125106811523438, -0.14868927001953125, -0.13612747192382812, -0.123565673828125, -0.11100387573242188, -0.09844207763671875, -0.08588027954101562, -0.0733184814453125, -0.060756683349609375, -0.04819488525390625, -0.035633087158203125, -0.0230712890625, -0.010509490966796875, 0.00205230712890625, 0.014614105224609375, 0.0271759033203125, 0.039737701416015625, 0.05229949951171875, 0.06486129760742188, 0.077423095703125, 0.08998489379882812, 0.10254669189453125, 0.11510848999023438, 0.1276702880859375, 0.14023208618164062, 0.15279388427734375, 0.16535568237304688, 0.17791748046875, 0.19047927856445312, 0.20304107666015625, 0.21560287475585938, 0.2281646728515625, 0.24072647094726562, 0.25328826904296875, 0.2658500671386719, 0.278411865234375, 0.2909736633300781, 0.30353546142578125, 0.3160972595214844, 0.3286590576171875, 0.3412208557128906, 0.35378265380859375, 0.3663444519042969, 0.37890625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 6.0, 14.0, 20.0, 21.0, 23.0, 32.0, 42.0, 41.0, 47.0, 55.0, 63.0, 73.0, 64.0, 59.0, 70.0, 55.0, 55.0, 47.0, 50.0, 23.0, 22.0, 22.0, 17.0, 15.0, 12.0, 9.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7150763273239136, -1.6594101190567017, -1.6037440299987793, -1.5480778217315674, -1.4924116134643555, -1.4367454051971436, -1.3810791969299316, -1.3254131078720093, -1.2697468996047974, -1.2140806913375854, -1.158414602279663, -1.1027483940124512, -1.0470821857452393, -0.9914159774780273, -0.9357498288154602, -0.8800836801528931, -0.8244174718856812, -0.7687512636184692, -0.7130851149559021, -0.657418966293335, -0.601752758026123, -0.5460865497589111, -0.490420401096344, -0.43475422263145447, -0.37908804416656494, -0.3234218657016754, -0.2677556872367859, -0.21208950877189636, -0.15642333030700684, -0.10075715184211731, -0.04509097337722778, 0.010575205087661743, 0.06624150276184082, 0.12190768122673035, 0.17757385969161987, 0.2332400381565094, 0.2889062166213989, 0.34457239508628845, 0.400238573551178, 0.4559047520160675, 0.511570930480957, 0.567237138748169, 0.6229032874107361, 0.6785694360733032, 0.7342356443405151, 0.789901852607727, 0.8455680012702942, 0.9012341499328613, 0.9569003582000732, 1.0125665664672852, 1.068232774734497, 1.1238988637924194, 1.1795650720596313, 1.2352312803268433, 1.2908973693847656, 1.3465635776519775, 1.4022297859191895, 1.4578959941864014, 1.5135622024536133, 1.5692282915115356, 1.6248944997787476, 1.6805607080459595, 1.7362267971038818, 1.7918930053710938, 1.8475592136383057]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 7.0, 12.0, 9.0, 17.0, 12.0, 14.0, 25.0, 23.0, 24.0, 23.0, 38.0, 36.0, 38.0, 33.0, 33.0, 38.0, 52.0, 30.0, 51.0, 30.0, 50.0, 43.0, 42.0, 31.0, 35.0, 34.0, 33.0, 28.0, 11.0, 27.0, 16.0, 11.0, 14.0, 10.0, 5.0, 9.0, 11.0, 8.0, 9.0, 8.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0477453470230103, -1.0165857076644897, -0.9854260087013245, -0.9542663097381592, -0.9231066703796387, -0.8919470310211182, -0.8607873320579529, -0.8296276330947876, -0.7984679937362671, -0.7673083543777466, -0.7361486554145813, -0.704988956451416, -0.6738293170928955, -0.642669677734375, -0.6115099787712097, -0.5803502798080444, -0.5491906404495239, -0.5180310010910034, -0.48687130212783813, -0.45571163296699524, -0.42455196380615234, -0.39339229464530945, -0.36223262548446655, -0.33107295632362366, -0.29991328716278076, -0.26875361800193787, -0.23759394884109497, -0.20643427968025208, -0.17527461051940918, -0.14411494135856628, -0.11295527219772339, -0.0817956030368805, -0.0506359338760376, -0.019476264715194702, 0.011683404445648193, 0.04284307360649109, 0.07400274276733398, 0.10516241192817688, 0.13632208108901978, 0.16748175024986267, 0.19864141941070557, 0.22980108857154846, 0.26096075773239136, 0.29212042689323425, 0.32328009605407715, 0.35443976521492004, 0.38559943437576294, 0.41675910353660583, 0.44791877269744873, 0.4790784418582916, 0.5102381110191345, 0.5413978099822998, 0.5725574493408203, 0.6037170886993408, 0.6348767876625061, 0.6660364866256714, 0.6971961259841919, 0.7283557653427124, 0.7595154643058777, 0.790675163269043, 0.8218348026275635, 0.852994441986084, 0.8841541409492493, 0.9153138399124146, 0.9464734792709351]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 7.0, 8.0, 17.0, 33.0, 33.0, 74.0, 89.0, 155.0, 243.0, 405.0, 644.0, 1115.0, 1781.0, 2826.0, 4627.0, 7473.0, 12351.0, 20138.0, 33082.0, 53694.0, 83657.0, 124547.0, 163936.0, 168373.0, 130924.0, 89435.0, 57114.0, 35471.0, 22043.0, 13466.0, 8199.0, 4824.0, 2978.0, 1825.0, 1112.0, 689.0, 447.0, 265.0, 164.0, 106.0, 72.0, 49.0, 38.0, 14.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21484375, -0.20660400390625, -0.1983642578125, -0.19012451171875, -0.181884765625, -0.17364501953125, -0.1654052734375, -0.15716552734375, -0.14892578125, -0.14068603515625, -0.1324462890625, -0.12420654296875, -0.115966796875, -0.10772705078125, -0.0994873046875, -0.09124755859375, -0.0830078125, -0.07476806640625, -0.0665283203125, -0.05828857421875, -0.050048828125, -0.04180908203125, -0.0335693359375, -0.02532958984375, -0.01708984375, -0.00885009765625, -0.0006103515625, 0.00762939453125, 0.015869140625, 0.02410888671875, 0.0323486328125, 0.04058837890625, 0.048828125, 0.05706787109375, 0.0653076171875, 0.07354736328125, 0.081787109375, 0.09002685546875, 0.0982666015625, 0.10650634765625, 0.11474609375, 0.12298583984375, 0.1312255859375, 0.13946533203125, 0.147705078125, 0.15594482421875, 0.1641845703125, 0.17242431640625, 0.1806640625, 0.18890380859375, 0.1971435546875, 0.20538330078125, 0.213623046875, 0.22186279296875, 0.2301025390625, 0.23834228515625, 0.24658203125, 0.25482177734375, 0.2630615234375, 0.27130126953125, 0.279541015625, 0.28778076171875, 0.2960205078125, 0.30426025390625, 0.3125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 5.0, 7.0, 16.0, 18.0, 14.0, 16.0, 22.0, 27.0, 31.0, 33.0, 41.0, 35.0, 36.0, 30.0, 44.0, 47.0, 42.0, 51.0, 44.0, 45.0, 31.0, 40.0, 37.0, 31.0, 27.0, 35.0, 14.0, 32.0, 27.0, 26.0, 8.0, 12.0, 15.0, 8.0, 5.0, 6.0, 7.0, 6.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.09375, -1.0586395263671875, -1.023529052734375, -0.9884185791015625, -0.95330810546875, -0.9181976318359375, -0.883087158203125, -0.8479766845703125, -0.8128662109375, -0.7777557373046875, -0.742645263671875, -0.7075347900390625, -0.67242431640625, -0.6373138427734375, -0.602203369140625, -0.5670928955078125, -0.531982421875, -0.4968719482421875, -0.461761474609375, -0.4266510009765625, -0.39154052734375, -0.3564300537109375, -0.321319580078125, -0.2862091064453125, -0.2510986328125, -0.2159881591796875, -0.180877685546875, -0.1457672119140625, -0.11065673828125, -0.0755462646484375, -0.040435791015625, -0.0053253173828125, 0.02978515625, 0.0648956298828125, 0.100006103515625, 0.1351165771484375, 0.17022705078125, 0.2053375244140625, 0.240447998046875, 0.2755584716796875, 0.3106689453125, 0.3457794189453125, 0.380889892578125, 0.4160003662109375, 0.45111083984375, 0.4862213134765625, 0.521331787109375, 0.5564422607421875, 0.591552734375, 0.6266632080078125, 0.661773681640625, 0.6968841552734375, 0.73199462890625, 0.7671051025390625, 0.802215576171875, 0.8373260498046875, 0.8724365234375, 0.9075469970703125, 0.942657470703125, 0.9777679443359375, 1.01287841796875, 1.0479888916015625, 1.083099365234375, 1.1182098388671875, 1.1533203125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 4.0, 16.0, 21.0, 26.0, 44.0, 65.0, 100.0, 151.0, 321.0, 527.0, 1001.0, 1953.0, 3783.0, 7899.0, 16429.0, 34407.0, 72623.0, 143544.0, 232116.0, 237087.0, 149841.0, 76474.0, 36324.0, 17294.0, 8163.0, 4082.0, 1903.0, 1014.0, 571.0, 291.0, 193.0, 83.0, 63.0, 48.0, 22.0, 25.0, 14.0, 8.0, 7.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.437255859375, -0.424407958984375, -0.41156005859375, -0.398712158203125, -0.3858642578125, -0.373016357421875, -0.36016845703125, -0.347320556640625, -0.33447265625, -0.321624755859375, -0.30877685546875, -0.295928955078125, -0.2830810546875, -0.270233154296875, -0.25738525390625, -0.244537353515625, -0.231689453125, -0.218841552734375, -0.20599365234375, -0.193145751953125, -0.1802978515625, -0.167449951171875, -0.15460205078125, -0.141754150390625, -0.12890625, -0.116058349609375, -0.10321044921875, -0.090362548828125, -0.0775146484375, -0.064666748046875, -0.05181884765625, -0.038970947265625, -0.026123046875, -0.013275146484375, -0.00042724609375, 0.012420654296875, 0.0252685546875, 0.038116455078125, 0.05096435546875, 0.063812255859375, 0.07666015625, 0.089508056640625, 0.10235595703125, 0.115203857421875, 0.1280517578125, 0.140899658203125, 0.15374755859375, 0.166595458984375, 0.179443359375, 0.192291259765625, 0.20513916015625, 0.217987060546875, 0.2308349609375, 0.243682861328125, 0.25653076171875, 0.269378662109375, 0.2822265625, 0.295074462890625, 0.30792236328125, 0.320770263671875, 0.3336181640625, 0.346466064453125, 0.35931396484375, 0.372161865234375, 0.385009765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 6.0, 9.0, 11.0, 10.0, 22.0, 23.0, 25.0, 25.0, 32.0, 25.0, 40.0, 36.0, 36.0, 37.0, 44.0, 35.0, 36.0, 34.0, 47.0, 40.0, 39.0, 47.0, 42.0, 43.0, 25.0, 43.0, 29.0, 27.0, 31.0, 15.0, 14.0, 13.0, 12.0, 8.0, 8.0, 6.0, 4.0, 5.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.748046875, -0.7252426147460938, -0.7024383544921875, -0.6796340942382812, -0.656829833984375, -0.6340255737304688, -0.6112213134765625, -0.5884170532226562, -0.56561279296875, -0.5428085327148438, -0.5200042724609375, -0.49720001220703125, -0.474395751953125, -0.45159149169921875, -0.4287872314453125, -0.40598297119140625, -0.3831787109375, -0.36037445068359375, -0.3375701904296875, -0.31476593017578125, -0.291961669921875, -0.26915740966796875, -0.2463531494140625, -0.22354888916015625, -0.20074462890625, -0.17794036865234375, -0.1551361083984375, -0.13233184814453125, -0.109527587890625, -0.08672332763671875, -0.0639190673828125, -0.04111480712890625, -0.018310546875, 0.00449371337890625, 0.0272979736328125, 0.05010223388671875, 0.072906494140625, 0.09571075439453125, 0.1185150146484375, 0.14131927490234375, 0.16412353515625, 0.18692779541015625, 0.2097320556640625, 0.23253631591796875, 0.255340576171875, 0.27814483642578125, 0.3009490966796875, 0.32375335693359375, 0.3465576171875, 0.36936187744140625, 0.3921661376953125, 0.41497039794921875, 0.437774658203125, 0.46057891845703125, 0.4833831787109375, 0.5061874389648438, 0.52899169921875, 0.5517959594726562, 0.5746002197265625, 0.5974044799804688, 0.620208740234375, 0.6430130004882812, 0.6658172607421875, 0.6886215209960938, 0.71142578125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 7.0, 15.0, 20.0, 30.0, 33.0, 39.0, 80.0, 106.0, 159.0, 253.0, 363.0, 540.0, 882.0, 1338.0, 2145.0, 3523.0, 5848.0, 10449.0, 19765.0, 42676.0, 104117.0, 275394.0, 334154.0, 138400.0, 53669.0, 24343.0, 12486.0, 6746.0, 4049.0, 2498.0, 1514.0, 985.0, 650.0, 397.0, 284.0, 186.0, 112.0, 71.0, 69.0, 46.0, 28.0, 23.0, 22.0, 12.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1417236328125, -0.13717269897460938, -0.13262176513671875, -0.12807083129882812, -0.1235198974609375, -0.11896896362304688, -0.11441802978515625, -0.10986709594726562, -0.105316162109375, -0.10076522827148438, -0.09621429443359375, -0.09166336059570312, -0.0871124267578125, -0.08256149291992188, -0.07801055908203125, -0.07345962524414062, -0.06890869140625, -0.06435775756835938, -0.05980682373046875, -0.055255889892578125, -0.0507049560546875, -0.046154022216796875, -0.04160308837890625, -0.037052154541015625, -0.032501220703125, -0.027950286865234375, -0.02339935302734375, -0.018848419189453125, -0.0142974853515625, -0.009746551513671875, -0.00519561767578125, -0.000644683837890625, 0.00390625, 0.008457183837890625, 0.01300811767578125, 0.017559051513671875, 0.0221099853515625, 0.026660919189453125, 0.03121185302734375, 0.035762786865234375, 0.040313720703125, 0.044864654541015625, 0.04941558837890625, 0.053966522216796875, 0.0585174560546875, 0.06306838989257812, 0.06761932373046875, 0.07217025756835938, 0.07672119140625, 0.08127212524414062, 0.08582305908203125, 0.09037399291992188, 0.0949249267578125, 0.09947586059570312, 0.10402679443359375, 0.10857772827148438, 0.113128662109375, 0.11767959594726562, 0.12223052978515625, 0.12678146362304688, 0.1313323974609375, 0.13588333129882812, 0.14043426513671875, 0.14498519897460938, 0.1495361328125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 6.0, 4.0, 8.0, 12.0, 15.0, 12.0, 30.0, 30.0, 31.0, 34.0, 43.0, 42.0, 46.0, 42.0, 64.0, 59.0, 59.0, 50.0, 56.0, 43.0, 51.0, 38.0, 39.0, 29.0, 30.0, 27.0, 21.0, 10.0, 9.0, 11.0, 10.0, 7.0, 4.0, 6.0, 5.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0132789611816406e-05, -9.812414646148682e-06, -9.492039680480957e-06, -9.171664714813232e-06, -8.851289749145508e-06, -8.530914783477783e-06, -8.210539817810059e-06, -7.890164852142334e-06, -7.569789886474609e-06, -7.249414920806885e-06, -6.92903995513916e-06, -6.6086649894714355e-06, -6.288290023803711e-06, -5.967915058135986e-06, -5.647540092468262e-06, -5.327165126800537e-06, -5.0067901611328125e-06, -4.686415195465088e-06, -4.366040229797363e-06, -4.045665264129639e-06, -3.725290298461914e-06, -3.4049153327941895e-06, -3.084540367126465e-06, -2.7641654014587402e-06, -2.4437904357910156e-06, -2.123415470123291e-06, -1.8030405044555664e-06, -1.4826655387878418e-06, -1.1622905731201172e-06, -8.419156074523926e-07, -5.21540641784668e-07, -2.0116567611694336e-07, 1.1920928955078125e-07, 4.3958425521850586e-07, 7.599592208862305e-07, 1.080334186553955e-06, 1.4007091522216797e-06, 1.7210841178894043e-06, 2.041459083557129e-06, 2.3618340492248535e-06, 2.682209014892578e-06, 3.0025839805603027e-06, 3.3229589462280273e-06, 3.643333911895752e-06, 3.9637088775634766e-06, 4.284083843231201e-06, 4.604458808898926e-06, 4.92483377456665e-06, 5.245208740234375e-06, 5.5655837059021e-06, 5.885958671569824e-06, 6.206333637237549e-06, 6.5267086029052734e-06, 6.847083568572998e-06, 7.167458534240723e-06, 7.487833499908447e-06, 7.808208465576172e-06, 8.128583431243896e-06, 8.448958396911621e-06, 8.769333362579346e-06, 9.08970832824707e-06, 9.410083293914795e-06, 9.73045825958252e-06, 1.0050833225250244e-05, 1.0371208190917969e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 2.0, 0.0, 7.0, 18.0, 19.0, 27.0, 53.0, 80.0, 119.0, 212.0, 291.0, 476.0, 824.0, 1382.0, 2432.0, 4030.0, 7078.0, 12623.0, 23080.0, 43206.0, 84580.0, 157625.0, 234993.0, 210404.0, 124752.0, 64491.0, 33679.0, 18115.0, 10100.0, 5688.0, 3372.0, 1835.0, 1180.0, 700.0, 384.0, 259.0, 164.0, 100.0, 64.0, 42.0, 20.0, 19.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.111572265625, -0.1075592041015625, -0.103546142578125, -0.0995330810546875, -0.09552001953125, -0.0915069580078125, -0.087493896484375, -0.0834808349609375, -0.0794677734375, -0.0754547119140625, -0.071441650390625, -0.0674285888671875, -0.06341552734375, -0.0594024658203125, -0.055389404296875, -0.0513763427734375, -0.04736328125, -0.0433502197265625, -0.039337158203125, -0.0353240966796875, -0.03131103515625, -0.0272979736328125, -0.023284912109375, -0.0192718505859375, -0.0152587890625, -0.0112457275390625, -0.007232666015625, -0.0032196044921875, 0.00079345703125, 0.0048065185546875, 0.008819580078125, 0.0128326416015625, 0.016845703125, 0.0208587646484375, 0.024871826171875, 0.0288848876953125, 0.03289794921875, 0.0369110107421875, 0.040924072265625, 0.0449371337890625, 0.0489501953125, 0.0529632568359375, 0.056976318359375, 0.0609893798828125, 0.06500244140625, 0.0690155029296875, 0.073028564453125, 0.0770416259765625, 0.0810546875, 0.0850677490234375, 0.089080810546875, 0.0930938720703125, 0.09710693359375, 0.1011199951171875, 0.105133056640625, 0.1091461181640625, 0.1131591796875, 0.1171722412109375, 0.121185302734375, 0.1251983642578125, 0.12921142578125, 0.1332244873046875, 0.137237548828125, 0.1412506103515625, 0.145263671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 6.0, 8.0, 6.0, 9.0, 17.0, 23.0, 31.0, 40.0, 47.0, 59.0, 60.0, 76.0, 96.0, 70.0, 84.0, 81.0, 55.0, 50.0, 42.0, 27.0, 22.0, 19.0, 7.0, 9.0, 8.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029632568359375, -0.028400421142578125, -0.02716827392578125, -0.025936126708984375, -0.0247039794921875, -0.023471832275390625, -0.02223968505859375, -0.021007537841796875, -0.019775390625, -0.018543243408203125, -0.01731109619140625, -0.016078948974609375, -0.0148468017578125, -0.013614654541015625, -0.01238250732421875, -0.011150360107421875, -0.009918212890625, -0.008686065673828125, -0.00745391845703125, -0.006221771240234375, -0.0049896240234375, -0.003757476806640625, -0.00252532958984375, -0.001293182373046875, -6.103515625e-05, 0.001171112060546875, 0.00240325927734375, 0.003635406494140625, 0.0048675537109375, 0.006099700927734375, 0.00733184814453125, 0.008563995361328125, 0.009796142578125, 0.011028289794921875, 0.01226043701171875, 0.013492584228515625, 0.0147247314453125, 0.015956878662109375, 0.01718902587890625, 0.018421173095703125, 0.0196533203125, 0.020885467529296875, 0.02211761474609375, 0.023349761962890625, 0.0245819091796875, 0.025814056396484375, 0.02704620361328125, 0.028278350830078125, 0.029510498046875, 0.030742645263671875, 0.03197479248046875, 0.033206939697265625, 0.0344390869140625, 0.035671234130859375, 0.03690338134765625, 0.038135528564453125, 0.03936767578125, 0.040599822998046875, 0.04183197021484375, 0.043064117431640625, 0.0442962646484375, 0.045528411865234375, 0.04676055908203125, 0.047992706298828125, 0.049224853515625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 7.0, 6.0, 6.0, 9.0, 10.0, 16.0, 19.0, 20.0, 28.0, 48.0, 30.0, 45.0, 46.0, 66.0, 55.0, 71.0, 69.0, 54.0, 70.0, 52.0, 47.0, 43.0, 45.0, 25.0, 23.0, 18.0, 18.0, 15.0, 9.0, 10.0, 10.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.644814133644104, -1.5906760692596436, -1.5365378856658936, -1.482399821281433, -1.428261637687683, -1.3741235733032227, -1.3199853897094727, -1.2658473253250122, -1.2117092609405518, -1.1575711965560913, -1.1034330129623413, -1.0492949485778809, -0.9951568245887756, -0.9410187005996704, -0.8868805766105652, -0.83274245262146, -0.7786043286323547, -0.7244662046432495, -0.6703280806541443, -0.6161899566650391, -0.5620518922805786, -0.5079137682914734, -0.45377564430236816, -0.3996375501155853, -0.3454994261264801, -0.2913613021373749, -0.23722320795059204, -0.18308508396148682, -0.12894697487354279, -0.07480886578559875, -0.02067074179649353, 0.03346735239028931, 0.08760547637939453, 0.14174358546733856, 0.1958816945552826, 0.2500198185443878, 0.30415791273117065, 0.3582960367202759, 0.4124341607093811, 0.46657225489616394, 0.5207103490829468, 0.574848473072052, 0.6289865970611572, 0.6831246614456177, 0.7372627854347229, 0.7914009094238281, 0.8455390334129333, 0.8996771574020386, 0.9538152813911438, 1.007953405380249, 1.0620914697647095, 1.1162296533584595, 1.17036771774292, 1.22450590133667, 1.2786439657211304, 1.3327820301055908, 1.3869202136993408, 1.4410582780838013, 1.4951964616775513, 1.5493345260620117, 1.6034727096557617, 1.6576107740402222, 1.7117488384246826, 1.7658870220184326, 1.820025086402893]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 16.0, 11.0, 14.0, 17.0, 27.0, 20.0, 24.0, 28.0, 41.0, 36.0, 33.0, 33.0, 37.0, 41.0, 44.0, 40.0, 41.0, 35.0, 49.0, 46.0, 33.0, 39.0, 36.0, 29.0, 29.0, 26.0, 14.0, 24.0, 15.0, 13.0, 12.0, 8.0, 7.0, 10.0, 9.0, 12.0, 6.0, 6.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0365345478057861, -1.0054458379745483, -0.9743571877479553, -0.9432684779167175, -0.9121797680854797, -0.8810911178588867, -0.8500024080276489, -0.8189136981964111, -0.7878249883651733, -0.7567362785339355, -0.7256476283073425, -0.6945589184761047, -0.6634702086448669, -0.6323815584182739, -0.6012928485870361, -0.5702041387557983, -0.5391154289245605, -0.5080267190933228, -0.47693803906440735, -0.44584935903549194, -0.41476064920425415, -0.38367196917533875, -0.35258328914642334, -0.32149457931518555, -0.29040592908859253, -0.2593172490596771, -0.22822853922843933, -0.19713985919952393, -0.16605114936828613, -0.13496246933937073, -0.10387377440929413, -0.07278507947921753, -0.041696369647979736, -0.010607676580548286, 0.020481016486883163, 0.051569707691669464, 0.08265840262174606, 0.11374709010124207, 0.14483578503131866, 0.17592447996139526, 0.20701317489147186, 0.23810186982154846, 0.26919054985046387, 0.30027925968170166, 0.33136793971061707, 0.36245661973953247, 0.39354532957077026, 0.42463403940200806, 0.45572271943092346, 0.48681139945983887, 0.5179001092910767, 0.5489888191223145, 0.5800774693489075, 0.6111661791801453, 0.6422548890113831, 0.6733435392379761, 0.7044322490692139, 0.7355209589004517, 0.7666096091270447, 0.7976983189582825, 0.8287870287895203, 0.8598756790161133, 0.8909643888473511, 0.9220530986785889, 0.9531418085098267]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 15.0, 13.0, 24.0, 35.0, 67.0, 98.0, 133.0, 251.0, 436.0, 672.0, 1159.0, 2024.0, 3361.0, 5546.0, 9478.0, 15526.0, 24875.0, 38559.0, 57642.0, 80537.0, 104299.0, 122948.0, 129396.0, 121257.0, 101697.0, 77271.0, 54921.0, 37020.0, 23107.0, 14401.0, 8788.0, 5247.0, 3018.0, 1896.0, 1153.0, 637.0, 369.0, 241.0, 147.0, 106.0, 59.0, 37.0, 27.0, 21.0, 11.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 6.0], "bins": [-1.0537109375, -1.0231094360351562, -0.9925079345703125, -0.9619064331054688, -0.931304931640625, -0.9007034301757812, -0.8701019287109375, -0.8395004272460938, -0.80889892578125, -0.7782974243164062, -0.7476959228515625, -0.7170944213867188, -0.686492919921875, -0.6558914184570312, -0.6252899169921875, -0.5946884155273438, -0.5640869140625, -0.5334854125976562, -0.5028839111328125, -0.47228240966796875, -0.441680908203125, -0.41107940673828125, -0.3804779052734375, -0.34987640380859375, -0.31927490234375, -0.28867340087890625, -0.2580718994140625, -0.22747039794921875, -0.196868896484375, -0.16626739501953125, -0.1356658935546875, -0.10506439208984375, -0.074462890625, -0.04386138916015625, -0.0132598876953125, 0.01734161376953125, 0.047943115234375, 0.07854461669921875, 0.1091461181640625, 0.13974761962890625, 0.17034912109375, 0.20095062255859375, 0.2315521240234375, 0.26215362548828125, 0.292755126953125, 0.32335662841796875, 0.3539581298828125, 0.38455963134765625, 0.4151611328125, 0.44576263427734375, 0.4763641357421875, 0.5069656372070312, 0.537567138671875, 0.5681686401367188, 0.5987701416015625, 0.6293716430664062, 0.65997314453125, 0.6905746459960938, 0.7211761474609375, 0.7517776489257812, 0.782379150390625, 0.8129806518554688, 0.8435821533203125, 0.8741836547851562, 0.90478515625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 7.0, 6.0, 12.0, 5.0, 14.0, 16.0, 11.0, 23.0, 35.0, 22.0, 33.0, 31.0, 30.0, 44.0, 49.0, 44.0, 60.0, 49.0, 53.0, 52.0, 37.0, 45.0, 44.0, 43.0, 30.0, 25.0, 28.0, 29.0, 25.0, 8.0, 16.0, 11.0, 15.0, 16.0, 9.0, 7.0, 8.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.263671875, -1.22607421875, -1.1884765625, -1.15087890625, -1.11328125, -1.07568359375, -1.0380859375, -1.00048828125, -0.962890625, -0.92529296875, -0.8876953125, -0.85009765625, -0.8125, -0.77490234375, -0.7373046875, -0.69970703125, -0.662109375, -0.62451171875, -0.5869140625, -0.54931640625, -0.51171875, -0.47412109375, -0.4365234375, -0.39892578125, -0.361328125, -0.32373046875, -0.2861328125, -0.24853515625, -0.2109375, -0.17333984375, -0.1357421875, -0.09814453125, -0.060546875, -0.02294921875, 0.0146484375, 0.05224609375, 0.08984375, 0.12744140625, 0.1650390625, 0.20263671875, 0.240234375, 0.27783203125, 0.3154296875, 0.35302734375, 0.390625, 0.42822265625, 0.4658203125, 0.50341796875, 0.541015625, 0.57861328125, 0.6162109375, 0.65380859375, 0.69140625, 0.72900390625, 0.7666015625, 0.80419921875, 0.841796875, 0.87939453125, 0.9169921875, 0.95458984375, 0.9921875, 1.02978515625, 1.0673828125, 1.10498046875, 1.142578125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 4.0, 5.0, 13.0, 18.0, 27.0, 37.0, 68.0, 94.0, 179.0, 303.0, 486.0, 819.0, 1395.0, 2398.0, 3926.0, 6242.0, 10014.0, 16372.0, 25509.0, 38498.0, 55605.0, 75921.0, 97229.0, 114464.0, 121588.0, 117499.0, 101670.0, 80640.0, 59727.0, 42282.0, 27995.0, 18212.0, 11424.0, 6979.0, 4390.0, 2663.0, 1530.0, 971.0, 557.0, 339.0, 179.0, 129.0, 59.0, 41.0, 23.0, 12.0, 13.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.97216796875, -0.9423599243164062, -0.9125518798828125, -0.8827438354492188, -0.852935791015625, -0.8231277465820312, -0.7933197021484375, -0.7635116577148438, -0.73370361328125, -0.7038955688476562, -0.6740875244140625, -0.6442794799804688, -0.614471435546875, -0.5846633911132812, -0.5548553466796875, -0.5250473022460938, -0.4952392578125, -0.46543121337890625, -0.4356231689453125, -0.40581512451171875, -0.376007080078125, -0.34619903564453125, -0.3163909912109375, -0.28658294677734375, -0.25677490234375, -0.22696685791015625, -0.1971588134765625, -0.16735076904296875, -0.137542724609375, -0.10773468017578125, -0.0779266357421875, -0.04811859130859375, -0.018310546875, 0.01149749755859375, 0.0413055419921875, 0.07111358642578125, 0.100921630859375, 0.13072967529296875, 0.1605377197265625, 0.19034576416015625, 0.22015380859375, 0.24996185302734375, 0.2797698974609375, 0.30957794189453125, 0.339385986328125, 0.36919403076171875, 0.3990020751953125, 0.42881011962890625, 0.4586181640625, 0.48842620849609375, 0.5182342529296875, 0.5480422973632812, 0.577850341796875, 0.6076583862304688, 0.6374664306640625, 0.6672744750976562, 0.69708251953125, 0.7268905639648438, 0.7566986083984375, 0.7865066528320312, 0.816314697265625, 0.8461227416992188, 0.8759307861328125, 0.9057388305664062, 0.935546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 10.0, 6.0, 7.0, 16.0, 12.0, 29.0, 22.0, 21.0, 28.0, 25.0, 44.0, 31.0, 42.0, 53.0, 47.0, 40.0, 41.0, 30.0, 41.0, 34.0, 44.0, 47.0, 38.0, 46.0, 28.0, 32.0, 26.0, 22.0, 23.0, 26.0, 18.0, 23.0, 10.0, 9.0, 8.0, 2.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5962295532226562, -0.5747833251953125, -0.5533370971679688, -0.531890869140625, -0.5104446411132812, -0.4889984130859375, -0.46755218505859375, -0.44610595703125, -0.42465972900390625, -0.4032135009765625, -0.38176727294921875, -0.360321044921875, -0.33887481689453125, -0.3174285888671875, -0.29598236083984375, -0.2745361328125, -0.25308990478515625, -0.2316436767578125, -0.21019744873046875, -0.188751220703125, -0.16730499267578125, -0.1458587646484375, -0.12441253662109375, -0.10296630859375, -0.08152008056640625, -0.0600738525390625, -0.03862762451171875, -0.017181396484375, 0.00426483154296875, 0.0257110595703125, 0.04715728759765625, 0.068603515625, 0.09004974365234375, 0.1114959716796875, 0.13294219970703125, 0.154388427734375, 0.17583465576171875, 0.1972808837890625, 0.21872711181640625, 0.24017333984375, 0.26161956787109375, 0.2830657958984375, 0.30451202392578125, 0.325958251953125, 0.34740447998046875, 0.3688507080078125, 0.39029693603515625, 0.4117431640625, 0.43318939208984375, 0.4546356201171875, 0.47608184814453125, 0.497528076171875, 0.5189743041992188, 0.5404205322265625, 0.5618667602539062, 0.58331298828125, 0.6047592163085938, 0.6262054443359375, 0.6476516723632812, 0.669097900390625, 0.6905441284179688, 0.7119903564453125, 0.7334365844726562, 0.7548828125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 13.0, 21.0, 26.0, 52.0, 71.0, 107.0, 147.0, 193.0, 351.0, 498.0, 812.0, 1331.0, 2348.0, 4114.0, 7777.0, 14953.0, 29138.0, 56813.0, 104569.0, 168142.0, 209219.0, 184407.0, 121519.0, 67684.0, 35248.0, 17903.0, 9201.0, 4971.0, 2733.0, 1586.0, 945.0, 573.0, 352.0, 242.0, 158.0, 103.0, 59.0, 48.0, 39.0, 21.0, 18.0, 15.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.70123291015625, -0.6783447265625, -0.65545654296875, -0.632568359375, -0.60968017578125, -0.5867919921875, -0.56390380859375, -0.541015625, -0.51812744140625, -0.4952392578125, -0.47235107421875, -0.449462890625, -0.42657470703125, -0.4036865234375, -0.38079833984375, -0.35791015625, -0.33502197265625, -0.3121337890625, -0.28924560546875, -0.266357421875, -0.24346923828125, -0.2205810546875, -0.19769287109375, -0.1748046875, -0.15191650390625, -0.1290283203125, -0.10614013671875, -0.083251953125, -0.06036376953125, -0.0374755859375, -0.01458740234375, 0.00830078125, 0.03118896484375, 0.0540771484375, 0.07696533203125, 0.099853515625, 0.12274169921875, 0.1456298828125, 0.16851806640625, 0.19140625, 0.21429443359375, 0.2371826171875, 0.26007080078125, 0.282958984375, 0.30584716796875, 0.3287353515625, 0.35162353515625, 0.37451171875, 0.39739990234375, 0.4202880859375, 0.44317626953125, 0.466064453125, 0.48895263671875, 0.5118408203125, 0.53472900390625, 0.5576171875, 0.58050537109375, 0.6033935546875, 0.62628173828125, 0.649169921875, 0.67205810546875, 0.6949462890625, 0.71783447265625, 0.74072265625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 1.0, 5.0, 11.0, 7.0, 11.0, 15.0, 17.0, 24.0, 22.0, 23.0, 27.0, 45.0, 39.0, 34.0, 52.0, 51.0, 62.0, 47.0, 40.0, 69.0, 48.0, 53.0, 48.0, 52.0, 32.0, 32.0, 36.0, 17.0, 11.0, 18.0, 8.0, 8.0, 5.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.357099533081055e-05, -4.1943974792957306e-05, -4.0316954255104065e-05, -3.8689933717250824e-05, -3.706291317939758e-05, -3.543589264154434e-05, -3.38088721036911e-05, -3.218185156583786e-05, -3.055483102798462e-05, -2.8927810490131378e-05, -2.7300789952278137e-05, -2.5673769414424896e-05, -2.4046748876571655e-05, -2.2419728338718414e-05, -2.0792707800865173e-05, -1.9165687263011932e-05, -1.753866672515869e-05, -1.591164618730545e-05, -1.428462564945221e-05, -1.2657605111598969e-05, -1.1030584573745728e-05, -9.403564035892487e-06, -7.776543498039246e-06, -6.149522960186005e-06, -4.522502422332764e-06, -2.8954818844795227e-06, -1.2684613466262817e-06, 3.5855919122695923e-07, 1.9855797290802e-06, 3.612600266933441e-06, 5.239620804786682e-06, 6.866641342639923e-06, 8.493661880493164e-06, 1.0120682418346405e-05, 1.1747702956199646e-05, 1.3374723494052887e-05, 1.5001744031906128e-05, 1.662876456975937e-05, 1.825578510761261e-05, 1.988280564546585e-05, 2.1509826183319092e-05, 2.3136846721172333e-05, 2.4763867259025574e-05, 2.6390887796878815e-05, 2.8017908334732056e-05, 2.9644928872585297e-05, 3.127194941043854e-05, 3.289896994829178e-05, 3.452599048614502e-05, 3.615301102399826e-05, 3.77800315618515e-05, 3.940705209970474e-05, 4.1034072637557983e-05, 4.2661093175411224e-05, 4.4288113713264465e-05, 4.5915134251117706e-05, 4.754215478897095e-05, 4.916917532682419e-05, 5.079619586467743e-05, 5.242321640253067e-05, 5.405023694038391e-05, 5.567725747823715e-05, 5.730427801609039e-05, 5.8931298553943634e-05, 6.0558319091796875e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 3.0, 11.0, 9.0, 17.0, 30.0, 54.0, 70.0, 127.0, 189.0, 283.0, 545.0, 880.0, 1416.0, 2431.0, 3994.0, 6661.0, 11224.0, 19066.0, 31131.0, 49666.0, 75383.0, 106676.0, 134235.0, 147185.0, 136659.0, 108893.0, 78643.0, 51342.0, 32335.0, 19917.0, 11936.0, 7034.0, 4096.0, 2517.0, 1515.0, 903.0, 569.0, 323.0, 218.0, 131.0, 84.0, 63.0, 30.0, 29.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0], "bins": [-0.580078125, -0.5642051696777344, -0.5483322143554688, -0.5324592590332031, -0.5165863037109375, -0.5007133483886719, -0.48484039306640625, -0.4689674377441406, -0.453094482421875, -0.4372215270996094, -0.42134857177734375, -0.4054756164550781, -0.3896026611328125, -0.3737297058105469, -0.35785675048828125, -0.3419837951660156, -0.32611083984375, -0.3102378845214844, -0.29436492919921875, -0.2784919738769531, -0.2626190185546875, -0.24674606323242188, -0.23087310791015625, -0.21500015258789062, -0.199127197265625, -0.18325424194335938, -0.16738128662109375, -0.15150833129882812, -0.1356353759765625, -0.11976242065429688, -0.10388946533203125, -0.08801651000976562, -0.0721435546875, -0.056270599365234375, -0.04039764404296875, -0.024524688720703125, -0.0086517333984375, 0.007221221923828125, 0.02309417724609375, 0.038967132568359375, 0.054840087890625, 0.07071304321289062, 0.08658599853515625, 0.10245895385742188, 0.1183319091796875, 0.13420486450195312, 0.15007781982421875, 0.16595077514648438, 0.18182373046875, 0.19769668579101562, 0.21356964111328125, 0.22944259643554688, 0.2453155517578125, 0.2611885070800781, 0.27706146240234375, 0.2929344177246094, 0.308807373046875, 0.3246803283691406, 0.34055328369140625, 0.3564262390136719, 0.3722991943359375, 0.3881721496582031, 0.40404510498046875, 0.4199180603027344, 0.435791015625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 9.0, 3.0, 6.0, 10.0, 10.0, 8.0, 13.0, 10.0, 17.0, 22.0, 15.0, 29.0, 32.0, 36.0, 39.0, 46.0, 40.0, 43.0, 30.0, 46.0, 46.0, 45.0, 40.0, 42.0, 40.0, 37.0, 33.0, 33.0, 30.0, 23.0, 21.0, 27.0, 21.0, 19.0, 20.0, 9.0, 10.0, 9.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12152099609375, -0.11739253997802734, -0.11326408386230469, -0.10913562774658203, -0.10500717163085938, -0.10087871551513672, -0.09675025939941406, -0.0926218032836914, -0.08849334716796875, -0.0843648910522461, -0.08023643493652344, -0.07610797882080078, -0.07197952270507812, -0.06785106658935547, -0.06372261047363281, -0.059594154357910156, -0.0554656982421875, -0.051337242126464844, -0.04720878601074219, -0.04308032989501953, -0.038951873779296875, -0.03482341766357422, -0.030694961547851562, -0.026566505432128906, -0.02243804931640625, -0.018309593200683594, -0.014181137084960938, -0.010052680969238281, -0.005924224853515625, -0.0017957687377929688, 0.0023326873779296875, 0.006461143493652344, 0.010589599609375, 0.014718055725097656, 0.018846511840820312, 0.02297496795654297, 0.027103424072265625, 0.03123188018798828, 0.03536033630371094, 0.039488792419433594, 0.04361724853515625, 0.047745704650878906, 0.05187416076660156, 0.05600261688232422, 0.060131072998046875, 0.06425952911376953, 0.06838798522949219, 0.07251644134521484, 0.0766448974609375, 0.08077335357666016, 0.08490180969238281, 0.08903026580810547, 0.09315872192382812, 0.09728717803955078, 0.10141563415527344, 0.1055440902709961, 0.10967254638671875, 0.1138010025024414, 0.11792945861816406, 0.12205791473388672, 0.12618637084960938, 0.13031482696533203, 0.1344432830810547, 0.13857173919677734, 0.1427001953125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 10.0, 11.0, 14.0, 16.0, 22.0, 26.0, 35.0, 49.0, 46.0, 52.0, 66.0, 55.0, 63.0, 78.0, 63.0, 65.0, 57.0, 39.0, 32.0, 34.0, 38.0, 17.0, 22.0, 22.0, 15.0, 10.0, 5.0, 6.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5396769046783447, -1.4855743646621704, -1.4314717054367065, -1.3773691654205322, -1.3232665061950684, -1.269163966178894, -1.2150613069534302, -1.1609587669372559, -1.106856107711792, -1.0527535676956177, -0.9986509084701538, -0.9445483088493347, -0.8904457092285156, -0.8363431692123413, -0.7822405099868774, -0.7281379699707031, -0.674035370349884, -0.6199327707290649, -0.5658301711082458, -0.5117275714874268, -0.45762497186660767, -0.40352240204811096, -0.34941980242729187, -0.2953172028064728, -0.2412146031856537, -0.1871120035648346, -0.1330094039440155, -0.0789068192243576, -0.024804219603538513, 0.029298365116119385, 0.08340096473693848, 0.13750356435775757, 0.19160616397857666, 0.24570876359939575, 0.29981136322021484, 0.35391396284103394, 0.408016562461853, 0.46211913228034973, 0.5162217617034912, 0.5703243017196655, 0.6244269609451294, 0.6785295605659485, 0.7326321601867676, 0.7867347598075867, 0.8408373594284058, 0.8949398994445801, 0.949042558670044, 1.0031450986862183, 1.0572476387023926, 1.111350178718567, 1.1654528379440308, 1.219555377960205, 1.273658037185669, 1.3277605772018433, 1.3818632364273071, 1.4359657764434814, 1.4900684356689453, 1.5441709756851196, 1.5982736349105835, 1.6523761749267578, 1.7064788341522217, 1.760581374168396, 1.8146840333938599, 1.8687865734100342, 1.922889232635498]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 5.0, 5.0, 12.0, 9.0, 14.0, 19.0, 21.0, 19.0, 30.0, 30.0, 31.0, 31.0, 48.0, 46.0, 24.0, 34.0, 41.0, 45.0, 34.0, 45.0, 47.0, 44.0, 46.0, 36.0, 42.0, 37.0, 23.0, 16.0, 24.0, 22.0, 16.0, 13.0, 15.0, 11.0, 7.0, 12.0, 6.0, 10.0, 10.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0716361999511719, -1.0388997793197632, -1.006163239479065, -0.9734268188476562, -0.9406903386116028, -0.9079538583755493, -0.8752174377441406, -0.8424809575080872, -0.8097444772720337, -0.7770079970359802, -0.7442715167999268, -0.7115350961685181, -0.6787986159324646, -0.6460621356964111, -0.6133257150650024, -0.580589234828949, -0.5478527545928955, -0.515116274356842, -0.48237982392311096, -0.4496433734893799, -0.4169068932533264, -0.38417041301727295, -0.35143396258354187, -0.3186975121498108, -0.2859610319137573, -0.25322455167770386, -0.22048810124397278, -0.1877516359090805, -0.15501517057418823, -0.12227870523929596, -0.08954223990440369, -0.056805774569511414, -0.02406930923461914, 0.008667156100273132, 0.041403621435165405, 0.07414008677005768, 0.10687655210494995, 0.13961301743984222, 0.1723494827747345, 0.20508594810962677, 0.23782241344451904, 0.2705588936805725, 0.3032953441143036, 0.33603179454803467, 0.36876827478408813, 0.4015047550201416, 0.4342412054538727, 0.46697765588760376, 0.4997141361236572, 0.5324506163597107, 0.5651870965957642, 0.5979235172271729, 0.6306599974632263, 0.6633964776992798, 0.6961328983306885, 0.7288693785667419, 0.7616058588027954, 0.7943423390388489, 0.8270788192749023, 0.859815239906311, 0.8925517201423645, 0.925288200378418, 0.9580246210098267, 0.9907611012458801, 1.0234975814819336]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 12.0, 17.0, 36.0, 48.0, 96.0, 103.0, 175.0, 266.0, 446.0, 790.0, 1303.0, 2120.0, 3750.0, 6345.0, 11120.0, 19382.0, 34501.0, 62484.0, 111686.0, 196831.0, 326758.0, 499138.0, 653865.0, 691305.0, 579542.0, 404078.0, 250541.0, 146391.0, 82448.0, 46626.0, 26247.0, 14894.0, 8594.0, 4901.0, 2963.0, 1765.0, 1074.0, 615.0, 380.0, 226.0, 160.0, 99.0, 52.0, 43.0, 27.0, 11.0, 7.0, 3.0, 10.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1010284423828125, -1.063385009765625, -1.0257415771484375, -0.98809814453125, -0.9504547119140625, -0.912811279296875, -0.8751678466796875, -0.8375244140625, -0.7998809814453125, -0.762237548828125, -0.7245941162109375, -0.68695068359375, -0.6493072509765625, -0.611663818359375, -0.5740203857421875, -0.536376953125, -0.4987335205078125, -0.461090087890625, -0.4234466552734375, -0.38580322265625, -0.3481597900390625, -0.310516357421875, -0.2728729248046875, -0.2352294921875, -0.1975860595703125, -0.159942626953125, -0.1222991943359375, -0.08465576171875, -0.0470123291015625, -0.009368896484375, 0.0282745361328125, 0.06591796875, 0.1035614013671875, 0.141204833984375, 0.1788482666015625, 0.21649169921875, 0.2541351318359375, 0.291778564453125, 0.3294219970703125, 0.3670654296875, 0.4047088623046875, 0.442352294921875, 0.4799957275390625, 0.51763916015625, 0.5552825927734375, 0.592926025390625, 0.6305694580078125, 0.668212890625, 0.7058563232421875, 0.743499755859375, 0.7811431884765625, 0.81878662109375, 0.8564300537109375, 0.894073486328125, 0.9317169189453125, 0.9693603515625, 1.0070037841796875, 1.044647216796875, 1.0822906494140625, 1.11993408203125, 1.1575775146484375, 1.195220947265625, 1.2328643798828125, 1.2705078125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 10.0, 8.0, 10.0, 15.0, 15.0, 9.0, 16.0, 29.0, 29.0, 26.0, 34.0, 27.0, 38.0, 44.0, 47.0, 34.0, 48.0, 49.0, 42.0, 40.0, 39.0, 43.0, 32.0, 32.0, 36.0, 33.0, 28.0, 23.0, 21.0, 21.0, 23.0, 18.0, 11.0, 15.0, 8.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.806640625, -0.7824478149414062, -0.7582550048828125, -0.7340621948242188, -0.709869384765625, -0.6856765747070312, -0.6614837646484375, -0.6372909545898438, -0.61309814453125, -0.5889053344726562, -0.5647125244140625, -0.5405197143554688, -0.516326904296875, -0.49213409423828125, -0.4679412841796875, -0.44374847412109375, -0.4195556640625, -0.39536285400390625, -0.3711700439453125, -0.34697723388671875, -0.322784423828125, -0.29859161376953125, -0.2743988037109375, -0.25020599365234375, -0.22601318359375, -0.20182037353515625, -0.1776275634765625, -0.15343475341796875, -0.129241943359375, -0.10504913330078125, -0.0808563232421875, -0.05666351318359375, -0.032470703125, -0.00827789306640625, 0.0159149169921875, 0.04010772705078125, 0.064300537109375, 0.08849334716796875, 0.1126861572265625, 0.13687896728515625, 0.16107177734375, 0.18526458740234375, 0.2094573974609375, 0.23365020751953125, 0.257843017578125, 0.28203582763671875, 0.3062286376953125, 0.33042144775390625, 0.3546142578125, 0.37880706787109375, 0.4029998779296875, 0.42719268798828125, 0.451385498046875, 0.47557830810546875, 0.4997711181640625, 0.5239639282226562, 0.54815673828125, 0.5723495483398438, 0.5965423583984375, 0.6207351684570312, 0.644927978515625, 0.6691207885742188, 0.6933135986328125, 0.7175064086914062, 0.74169921875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [6.0, 3.0, 7.0, 13.0, 11.0, 26.0, 38.0, 66.0, 103.0, 191.0, 282.0, 464.0, 703.0, 1231.0, 1892.0, 3184.0, 5404.0, 8628.0, 14278.0, 23079.0, 38163.0, 62887.0, 99300.0, 157117.0, 236270.0, 334758.0, 440439.0, 517329.0, 536276.0, 490242.0, 395143.0, 289910.0, 198909.0, 128821.0, 81100.0, 50081.0, 30506.0, 18710.0, 11388.0, 6685.0, 4119.0, 2481.0, 1566.0, 985.0, 567.0, 362.0, 205.0, 140.0, 78.0, 60.0, 40.0, 20.0, 16.0, 9.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92919921875, -0.8963394165039062, -0.8634796142578125, -0.8306198120117188, -0.797760009765625, -0.7649002075195312, -0.7320404052734375, -0.6991806030273438, -0.66632080078125, -0.6334609985351562, -0.6006011962890625, -0.5677413940429688, -0.534881591796875, -0.5020217895507812, -0.4691619873046875, -0.43630218505859375, -0.4034423828125, -0.37058258056640625, -0.3377227783203125, -0.30486297607421875, -0.272003173828125, -0.23914337158203125, -0.2062835693359375, -0.17342376708984375, -0.14056396484375, -0.10770416259765625, -0.0748443603515625, -0.04198455810546875, -0.009124755859375, 0.02373504638671875, 0.0565948486328125, 0.08945465087890625, 0.122314453125, 0.15517425537109375, 0.1880340576171875, 0.22089385986328125, 0.253753662109375, 0.28661346435546875, 0.3194732666015625, 0.35233306884765625, 0.38519287109375, 0.41805267333984375, 0.4509124755859375, 0.48377227783203125, 0.516632080078125, 0.5494918823242188, 0.5823516845703125, 0.6152114868164062, 0.6480712890625, 0.6809310913085938, 0.7137908935546875, 0.7466506958007812, 0.779510498046875, 0.8123703002929688, 0.8452301025390625, 0.8780899047851562, 0.91094970703125, 0.9438095092773438, 0.9766693115234375, 1.0095291137695312, 1.042388916015625, 1.0752487182617188, 1.1081085205078125, 1.1409683227539062, 1.173828125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 6.0, 6.0, 15.0, 13.0, 14.0, 22.0, 28.0, 33.0, 45.0, 52.0, 67.0, 71.0, 84.0, 81.0, 112.0, 126.0, 145.0, 147.0, 154.0, 193.0, 200.0, 202.0, 189.0, 207.0, 213.0, 185.0, 194.0, 183.0, 155.0, 141.0, 136.0, 101.0, 89.0, 79.0, 82.0, 57.0, 49.0, 28.0, 42.0, 23.0, 22.0, 10.0, 15.0, 13.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.38671875, -0.374908447265625, -0.36309814453125, -0.351287841796875, -0.3394775390625, -0.327667236328125, -0.31585693359375, -0.304046630859375, -0.292236328125, -0.280426025390625, -0.26861572265625, -0.256805419921875, -0.2449951171875, -0.233184814453125, -0.22137451171875, -0.209564208984375, -0.19775390625, -0.185943603515625, -0.17413330078125, -0.162322998046875, -0.1505126953125, -0.138702392578125, -0.12689208984375, -0.115081787109375, -0.103271484375, -0.091461181640625, -0.07965087890625, -0.067840576171875, -0.0560302734375, -0.044219970703125, -0.03240966796875, -0.020599365234375, -0.0087890625, 0.003021240234375, 0.01483154296875, 0.026641845703125, 0.0384521484375, 0.050262451171875, 0.06207275390625, 0.073883056640625, 0.085693359375, 0.097503662109375, 0.10931396484375, 0.121124267578125, 0.1329345703125, 0.144744873046875, 0.15655517578125, 0.168365478515625, 0.18017578125, 0.191986083984375, 0.20379638671875, 0.215606689453125, 0.2274169921875, 0.239227294921875, 0.25103759765625, 0.262847900390625, 0.274658203125, 0.286468505859375, 0.29827880859375, 0.310089111328125, 0.3218994140625, 0.333709716796875, 0.34552001953125, 0.357330322265625, 0.369140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 13.0, 13.0, 10.0, 20.0, 14.0, 20.0, 19.0, 37.0, 42.0, 42.0, 52.0, 44.0, 60.0, 63.0, 63.0, 52.0, 53.0, 43.0, 56.0, 47.0, 41.0, 34.0, 29.0, 22.0, 25.0, 24.0, 10.0, 7.0, 12.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6071772575378418, -1.5585997104644775, -1.5100221633911133, -1.461444616317749, -1.4128670692443848, -1.3642895221710205, -1.3157119750976562, -1.267134428024292, -1.2185568809509277, -1.1699793338775635, -1.1214017868041992, -1.072824239730835, -1.0242466926574707, -0.9756691455841064, -0.927091658115387, -0.8785141110420227, -0.8299366235733032, -0.781359076499939, -0.7327815294265747, -0.6842039823532104, -0.6356264352798462, -0.5870488882064819, -0.5384714007377625, -0.4898938536643982, -0.44131630659103394, -0.3927387595176697, -0.3441612124443054, -0.29558369517326355, -0.2470061480998993, -0.19842860102653503, -0.14985108375549316, -0.1012735366821289, -0.0526958703994751, -0.004118330776691437, 0.044459208846092224, 0.09303674101829529, 0.14161428809165955, 0.1901918351650238, 0.23876935243606567, 0.28734689950942993, 0.3359244465827942, 0.38450199365615845, 0.4330795407295227, 0.4816570580005646, 0.5302345752716064, 0.5788121223449707, 0.627389669418335, 0.6759672164916992, 0.7245447635650635, 0.7731223106384277, 0.821699857711792, 0.8702774047851562, 0.9188549518585205, 0.9674324989318848, 1.016010046005249, 1.0645875930786133, 1.1131651401519775, 1.1617426872253418, 1.210320234298706, 1.2588977813720703, 1.3074753284454346, 1.3560528755187988, 1.404630422592163, 1.4532079696655273, 1.501785397529602]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 9.0, 6.0, 11.0, 14.0, 18.0, 20.0, 20.0, 26.0, 32.0, 26.0, 32.0, 43.0, 39.0, 31.0, 38.0, 31.0, 41.0, 42.0, 40.0, 43.0, 40.0, 42.0, 36.0, 47.0, 33.0, 29.0, 16.0, 34.0, 27.0, 15.0, 19.0, 10.0, 16.0, 12.0, 11.0, 10.0, 3.0, 10.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.025536060333252, -0.9957210421562195, -0.9659060835838318, -0.9360910654067993, -0.9062761068344116, -0.8764610886573792, -0.8466460704803467, -0.816831111907959, -0.7870160937309265, -0.757201075553894, -0.7273861169815063, -0.6975710988044739, -0.6677560806274414, -0.6379411220550537, -0.6081261038780212, -0.5783110857009888, -0.5484961271286011, -0.5186811089515686, -0.4888661503791809, -0.45905113220214844, -0.42923614382743835, -0.39942115545272827, -0.3696061372756958, -0.3397911489009857, -0.30997616052627563, -0.28016117215156555, -0.25034618377685547, -0.220531165599823, -0.19071617722511292, -0.16090118885040283, -0.13108618557453156, -0.10127118229866028, -0.0714561939239502, -0.041641198098659515, -0.011826202273368835, 0.017988793551921844, 0.047803789377212524, 0.07761877775192261, 0.10743378102779388, 0.13724878430366516, 0.16706377267837524, 0.19687876105308533, 0.2266937643289566, 0.2565087676048279, 0.28632375597953796, 0.31613874435424805, 0.3459537625312805, 0.3757687509059906, 0.4055837392807007, 0.43539872765541077, 0.46521371603012085, 0.4950287342071533, 0.524843692779541, 0.5546587109565735, 0.584473729133606, 0.6142886877059937, 0.6441037058830261, 0.6739187240600586, 0.7037336826324463, 0.7335487008094788, 0.7633637189865112, 0.7931786775588989, 0.8229936957359314, 0.8528087139129639, 0.8826236724853516]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 4.0, 15.0, 21.0, 27.0, 36.0, 40.0, 75.0, 102.0, 178.0, 234.0, 318.0, 522.0, 750.0, 1180.0, 1866.0, 2999.0, 4865.0, 8342.0, 14639.0, 26880.0, 50211.0, 94159.0, 166844.0, 231184.0, 192673.0, 114023.0, 60994.0, 32664.0, 17614.0, 9820.0, 5576.0, 3467.0, 2112.0, 1335.0, 899.0, 600.0, 390.0, 272.0, 192.0, 129.0, 86.0, 59.0, 41.0, 35.0, 23.0, 18.0, 13.0, 9.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.390869140625, -0.3785209655761719, -0.36617279052734375, -0.3538246154785156, -0.3414764404296875, -0.3291282653808594, -0.31678009033203125, -0.3044319152832031, -0.292083740234375, -0.2797355651855469, -0.26738739013671875, -0.2550392150878906, -0.2426910400390625, -0.23034286499023438, -0.21799468994140625, -0.20564651489257812, -0.19329833984375, -0.18095016479492188, -0.16860198974609375, -0.15625381469726562, -0.1439056396484375, -0.13155746459960938, -0.11920928955078125, -0.10686111450195312, -0.094512939453125, -0.08216476440429688, -0.06981658935546875, -0.057468414306640625, -0.0451202392578125, -0.032772064208984375, -0.02042388916015625, -0.008075714111328125, 0.0042724609375, 0.016620635986328125, 0.02896881103515625, 0.041316986083984375, 0.0536651611328125, 0.06601333618164062, 0.07836151123046875, 0.09070968627929688, 0.103057861328125, 0.11540603637695312, 0.12775421142578125, 0.14010238647460938, 0.1524505615234375, 0.16479873657226562, 0.17714691162109375, 0.18949508666992188, 0.20184326171875, 0.21419143676757812, 0.22653961181640625, 0.23888778686523438, 0.2512359619140625, 0.2635841369628906, 0.27593231201171875, 0.2882804870605469, 0.300628662109375, 0.3129768371582031, 0.32532501220703125, 0.3376731872558594, 0.3500213623046875, 0.3623695373535156, 0.37471771240234375, 0.3870658874511719, 0.3994140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 7.0, 4.0, 4.0, 9.0, 6.0, 10.0, 12.0, 18.0, 15.0, 26.0, 19.0, 22.0, 19.0, 26.0, 39.0, 41.0, 37.0, 38.0, 48.0, 30.0, 41.0, 48.0, 40.0, 34.0, 30.0, 38.0, 36.0, 41.0, 29.0, 31.0, 20.0, 25.0, 23.0, 25.0, 18.0, 12.0, 5.0, 12.0, 12.0, 11.0, 5.0, 4.0, 10.0, 5.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0673828125, -1.0360031127929688, -1.0046234130859375, -0.9732437133789062, -0.941864013671875, -0.9104843139648438, -0.8791046142578125, -0.8477249145507812, -0.81634521484375, -0.7849655151367188, -0.7535858154296875, -0.7222061157226562, -0.690826416015625, -0.6594467163085938, -0.6280670166015625, -0.5966873168945312, -0.5653076171875, -0.5339279174804688, -0.5025482177734375, -0.47116851806640625, -0.439788818359375, -0.40840911865234375, -0.3770294189453125, -0.34564971923828125, -0.31427001953125, -0.28289031982421875, -0.2515106201171875, -0.22013092041015625, -0.188751220703125, -0.15737152099609375, -0.1259918212890625, -0.09461212158203125, -0.063232421875, -0.03185272216796875, -0.0004730224609375, 0.03090667724609375, 0.062286376953125, 0.09366607666015625, 0.1250457763671875, 0.15642547607421875, 0.18780517578125, 0.21918487548828125, 0.2505645751953125, 0.28194427490234375, 0.313323974609375, 0.34470367431640625, 0.3760833740234375, 0.40746307373046875, 0.4388427734375, 0.47022247314453125, 0.5016021728515625, 0.5329818725585938, 0.564361572265625, 0.5957412719726562, 0.6271209716796875, 0.6585006713867188, 0.68988037109375, 0.7212600708007812, 0.7526397705078125, 0.7840194702148438, 0.815399169921875, 0.8467788696289062, 0.8781585693359375, 0.9095382690429688, 0.94091796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 12.0, 16.0, 27.0, 53.0, 40.0, 76.0, 128.0, 191.0, 313.0, 408.0, 645.0, 1009.0, 1678.0, 3093.0, 6303.0, 13032.0, 30344.0, 75614.0, 189844.0, 330399.0, 231462.0, 94277.0, 37567.0, 15860.0, 7191.0, 3695.0, 2024.0, 1168.0, 682.0, 465.0, 307.0, 181.0, 135.0, 108.0, 64.0, 31.0, 36.0, 13.0, 9.0, 11.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5771484375, -0.5599822998046875, -0.542816162109375, -0.5256500244140625, -0.50848388671875, -0.4913177490234375, -0.474151611328125, -0.4569854736328125, -0.4398193359375, -0.4226531982421875, -0.405487060546875, -0.3883209228515625, -0.37115478515625, -0.3539886474609375, -0.336822509765625, -0.3196563720703125, -0.302490234375, -0.2853240966796875, -0.268157958984375, -0.2509918212890625, -0.23382568359375, -0.2166595458984375, -0.199493408203125, -0.1823272705078125, -0.1651611328125, -0.1479949951171875, -0.130828857421875, -0.1136627197265625, -0.09649658203125, -0.0793304443359375, -0.062164306640625, -0.0449981689453125, -0.02783203125, -0.0106658935546875, 0.006500244140625, 0.0236663818359375, 0.04083251953125, 0.0579986572265625, 0.075164794921875, 0.0923309326171875, 0.1094970703125, 0.1266632080078125, 0.143829345703125, 0.1609954833984375, 0.17816162109375, 0.1953277587890625, 0.212493896484375, 0.2296600341796875, 0.246826171875, 0.2639923095703125, 0.281158447265625, 0.2983245849609375, 0.31549072265625, 0.3326568603515625, 0.349822998046875, 0.3669891357421875, 0.3841552734375, 0.4013214111328125, 0.418487548828125, 0.4356536865234375, 0.45281982421875, 0.4699859619140625, 0.487152099609375, 0.5043182373046875, 0.521484375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 8.0, 6.0, 10.0, 11.0, 11.0, 16.0, 14.0, 19.0, 20.0, 26.0, 30.0, 29.0, 39.0, 47.0, 46.0, 39.0, 42.0, 38.0, 37.0, 45.0, 46.0, 38.0, 40.0, 40.0, 42.0, 45.0, 31.0, 39.0, 14.0, 19.0, 17.0, 24.0, 14.0, 6.0, 10.0, 7.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6826171875, -0.66143798828125, -0.6402587890625, -0.61907958984375, -0.597900390625, -0.57672119140625, -0.5555419921875, -0.53436279296875, -0.51318359375, -0.49200439453125, -0.4708251953125, -0.44964599609375, -0.428466796875, -0.40728759765625, -0.3861083984375, -0.36492919921875, -0.34375, -0.32257080078125, -0.3013916015625, -0.28021240234375, -0.259033203125, -0.23785400390625, -0.2166748046875, -0.19549560546875, -0.17431640625, -0.15313720703125, -0.1319580078125, -0.11077880859375, -0.089599609375, -0.06842041015625, -0.0472412109375, -0.02606201171875, -0.0048828125, 0.01629638671875, 0.0374755859375, 0.05865478515625, 0.079833984375, 0.10101318359375, 0.1221923828125, 0.14337158203125, 0.16455078125, 0.18572998046875, 0.2069091796875, 0.22808837890625, 0.249267578125, 0.27044677734375, 0.2916259765625, 0.31280517578125, 0.333984375, 0.35516357421875, 0.3763427734375, 0.39752197265625, 0.418701171875, 0.43988037109375, 0.4610595703125, 0.48223876953125, 0.50341796875, 0.52459716796875, 0.5457763671875, 0.56695556640625, 0.588134765625, 0.60931396484375, 0.6304931640625, 0.65167236328125, 0.6728515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 8.0, 13.0, 7.0, 14.0, 19.0, 19.0, 42.0, 45.0, 62.0, 102.0, 152.0, 202.0, 311.0, 483.0, 709.0, 1112.0, 2138.0, 3962.0, 9292.0, 33561.0, 534818.0, 414011.0, 29973.0, 8666.0, 3581.0, 1907.0, 1158.0, 675.0, 459.0, 317.0, 209.0, 165.0, 94.0, 73.0, 51.0, 48.0, 31.0, 18.0, 14.0, 13.0, 10.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.552734375, -0.5329666137695312, -0.5131988525390625, -0.49343109130859375, -0.473663330078125, -0.45389556884765625, -0.4341278076171875, -0.41436004638671875, -0.39459228515625, -0.37482452392578125, -0.3550567626953125, -0.33528900146484375, -0.315521240234375, -0.29575347900390625, -0.2759857177734375, -0.25621795654296875, -0.2364501953125, -0.21668243408203125, -0.1969146728515625, -0.17714691162109375, -0.157379150390625, -0.13761138916015625, -0.1178436279296875, -0.09807586669921875, -0.07830810546875, -0.05854034423828125, -0.0387725830078125, -0.01900482177734375, 0.000762939453125, 0.02053070068359375, 0.0402984619140625, 0.06006622314453125, 0.079833984375, 0.09960174560546875, 0.1193695068359375, 0.13913726806640625, 0.158905029296875, 0.17867279052734375, 0.1984405517578125, 0.21820831298828125, 0.23797607421875, 0.25774383544921875, 0.2775115966796875, 0.29727935791015625, 0.317047119140625, 0.33681488037109375, 0.3565826416015625, 0.37635040283203125, 0.3961181640625, 0.41588592529296875, 0.4356536865234375, 0.45542144775390625, 0.475189208984375, 0.49495697021484375, 0.5147247314453125, 0.5344924926757812, 0.55426025390625, 0.5740280151367188, 0.5937957763671875, 0.6135635375976562, 0.633331298828125, 0.6530990600585938, 0.6728668212890625, 0.6926345825195312, 0.71240234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 7.0, 6.0, 11.0, 17.0, 37.0, 71.0, 66.0, 130.0, 157.0, 140.0, 105.0, 87.0, 61.0, 30.0, 18.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0517578125e-05, -2.946518361568451e-05, -2.841278910636902e-05, -2.7360394597053528e-05, -2.6308000087738037e-05, -2.5255605578422546e-05, -2.4203211069107056e-05, -2.3150816559791565e-05, -2.2098422050476074e-05, -2.1046027541160583e-05, -1.9993633031845093e-05, -1.8941238522529602e-05, -1.788884401321411e-05, -1.683644950389862e-05, -1.578405499458313e-05, -1.473166048526764e-05, -1.3679265975952148e-05, -1.2626871466636658e-05, -1.1574476957321167e-05, -1.0522082448005676e-05, -9.469687938690186e-06, -8.417293429374695e-06, -7.364898920059204e-06, -6.312504410743713e-06, -5.260109901428223e-06, -4.207715392112732e-06, -3.155320882797241e-06, -2.1029263734817505e-06, -1.0505318641662598e-06, 1.862645149230957e-09, 1.0542571544647217e-06, 2.1066516637802124e-06, 3.159046173095703e-06, 4.211440682411194e-06, 5.2638351917266846e-06, 6.316229701042175e-06, 7.368624210357666e-06, 8.421018719673157e-06, 9.473413228988647e-06, 1.0525807738304138e-05, 1.1578202247619629e-05, 1.263059675693512e-05, 1.368299126625061e-05, 1.4735385775566101e-05, 1.5787780284881592e-05, 1.6840174794197083e-05, 1.7892569303512573e-05, 1.8944963812828064e-05, 1.9997358322143555e-05, 2.1049752831459045e-05, 2.2102147340774536e-05, 2.3154541850090027e-05, 2.4206936359405518e-05, 2.5259330868721008e-05, 2.63117253780365e-05, 2.736411988735199e-05, 2.841651439666748e-05, 2.946890890598297e-05, 3.052130341529846e-05, 3.157369792461395e-05, 3.262609243392944e-05, 3.3678486943244934e-05, 3.4730881452560425e-05, 3.5783275961875916e-05, 3.6835670471191406e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 4.0, 17.0, 14.0, 18.0, 39.0, 40.0, 62.0, 55.0, 96.0, 145.0, 179.0, 267.0, 332.0, 432.0, 644.0, 936.0, 1340.0, 2043.0, 3175.0, 4984.0, 8638.0, 16254.0, 38430.0, 140454.0, 507221.0, 222042.0, 53205.0, 20443.0, 10299.0, 5884.0, 3522.0, 2204.0, 1464.0, 1079.0, 701.0, 518.0, 394.0, 233.0, 200.0, 126.0, 96.0, 81.0, 64.0, 50.0, 30.0, 26.0, 18.0, 15.0, 10.0, 7.0, 10.0, 7.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.35888671875, -0.34789276123046875, -0.3368988037109375, -0.32590484619140625, -0.314910888671875, -0.30391693115234375, -0.2929229736328125, -0.28192901611328125, -0.27093505859375, -0.25994110107421875, -0.2489471435546875, -0.23795318603515625, -0.226959228515625, -0.21596527099609375, -0.2049713134765625, -0.19397735595703125, -0.1829833984375, -0.17198944091796875, -0.1609954833984375, -0.15000152587890625, -0.139007568359375, -0.12801361083984375, -0.1170196533203125, -0.10602569580078125, -0.09503173828125, -0.08403778076171875, -0.0730438232421875, -0.06204986572265625, -0.051055908203125, -0.04006195068359375, -0.0290679931640625, -0.01807403564453125, -0.007080078125, 0.00391387939453125, 0.0149078369140625, 0.02590179443359375, 0.036895751953125, 0.04788970947265625, 0.0588836669921875, 0.06987762451171875, 0.08087158203125, 0.09186553955078125, 0.1028594970703125, 0.11385345458984375, 0.124847412109375, 0.13584136962890625, 0.1468353271484375, 0.15782928466796875, 0.1688232421875, 0.17981719970703125, 0.1908111572265625, 0.20180511474609375, 0.212799072265625, 0.22379302978515625, 0.2347869873046875, 0.24578094482421875, 0.25677490234375, 0.26776885986328125, 0.2787628173828125, 0.28975677490234375, 0.300750732421875, 0.31174468994140625, 0.3227386474609375, 0.33373260498046875, 0.3447265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 9.0, 6.0, 9.0, 9.0, 18.0, 20.0, 34.0, 45.0, 97.0, 220.0, 235.0, 124.0, 65.0, 31.0, 28.0, 16.0, 11.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1512451171875, -0.14694595336914062, -0.14264678955078125, -0.13834762573242188, -0.1340484619140625, -0.12974929809570312, -0.12545013427734375, -0.12115097045898438, -0.116851806640625, -0.11255264282226562, -0.10825347900390625, -0.10395431518554688, -0.0996551513671875, -0.09535598754882812, -0.09105682373046875, -0.08675765991210938, -0.08245849609375, -0.07815933227539062, -0.07386016845703125, -0.06956100463867188, -0.0652618408203125, -0.060962677001953125, -0.05666351318359375, -0.052364349365234375, -0.048065185546875, -0.043766021728515625, -0.03946685791015625, -0.035167694091796875, -0.0308685302734375, -0.026569366455078125, -0.02227020263671875, -0.017971038818359375, -0.013671875, -0.009372711181640625, -0.00507354736328125, -0.000774383544921875, 0.0035247802734375, 0.007823944091796875, 0.01212310791015625, 0.016422271728515625, 0.020721435546875, 0.025020599365234375, 0.02931976318359375, 0.033618927001953125, 0.0379180908203125, 0.042217254638671875, 0.04651641845703125, 0.050815582275390625, 0.05511474609375, 0.059413909912109375, 0.06371307373046875, 0.06801223754882812, 0.0723114013671875, 0.07661056518554688, 0.08090972900390625, 0.08520889282226562, 0.089508056640625, 0.09380722045898438, 0.09810638427734375, 0.10240554809570312, 0.1067047119140625, 0.11100387573242188, 0.11530303955078125, 0.11960220336914062, 0.1239013671875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 9.0, 10.0, 11.0, 21.0, 10.0, 20.0, 22.0, 33.0, 29.0, 44.0, 48.0, 51.0, 52.0, 64.0, 59.0, 46.0, 58.0, 54.0, 46.0, 49.0, 41.0, 42.0, 37.0, 21.0, 23.0, 23.0, 18.0, 10.0, 12.0, 10.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5663504600524902, -1.518341064453125, -1.4703317880630493, -1.422322392463684, -1.3743131160736084, -1.3263037204742432, -1.2782944440841675, -1.2302850484848022, -1.1822757720947266, -1.1342663764953613, -1.0862571001052856, -1.0382477045059204, -0.9902384281158447, -0.9422290921211243, -0.8942197561264038, -0.8462103605270386, -0.7982010245323181, -0.7501916885375977, -0.7021823525428772, -0.6541730165481567, -0.6061636805534363, -0.5581543445587158, -0.5101449489593506, -0.4621356427669525, -0.41412630677223206, -0.3661169707775116, -0.31810763478279114, -0.2700982689857483, -0.22208894789218903, -0.17407961189746857, -0.12607026100158691, -0.07806092500686646, -0.030051589012145996, 0.01795775070786476, 0.06596709042787552, 0.11397643387317657, 0.16198576986789703, 0.2099951058626175, 0.25800445675849915, 0.3060137927532196, 0.35402312874794006, 0.4020324647426605, 0.450041800737381, 0.49805116653442383, 0.5460605025291443, 0.5940698385238647, 0.6420791745185852, 0.6900885105133057, 0.7380978465080261, 0.7861071825027466, 0.834116518497467, 0.8821258544921875, 0.930135190486908, 0.9781445264816284, 1.0261539220809937, 1.0741631984710693, 1.1221725940704346, 1.1701819896697998, 1.2181912660598755, 1.2662006616592407, 1.3142099380493164, 1.3622193336486816, 1.4102286100387573, 1.4582380056381226, 1.5062472820281982]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 4.0, 12.0, 5.0, 12.0, 14.0, 18.0, 22.0, 23.0, 23.0, 29.0, 28.0, 34.0, 39.0, 43.0, 34.0, 30.0, 35.0, 38.0, 45.0, 41.0, 39.0, 34.0, 40.0, 43.0, 40.0, 36.0, 28.0, 18.0, 34.0, 23.0, 12.0, 23.0, 14.0, 10.0, 14.0, 15.0, 8.0, 4.0, 7.0, 11.0, 7.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.999873161315918, -0.9706754088401794, -0.9414777159690857, -0.9122799634933472, -0.8830822706222534, -0.8538845181465149, -0.8246867656707764, -0.7954890727996826, -0.7662913799285889, -0.7370936274528503, -0.7078959345817566, -0.6786981821060181, -0.6495004892349243, -0.6203027367591858, -0.5911049842834473, -0.5619072914123535, -0.532709538936615, -0.5035117864608765, -0.4743140935897827, -0.4451163411140442, -0.41591864824295044, -0.3867208957672119, -0.3575231730937958, -0.32832545042037964, -0.2991277277469635, -0.26993000507354736, -0.24073228240013123, -0.2115345448255539, -0.18233682215213776, -0.15313909947872162, -0.12394136190414429, -0.09474363923072815, -0.06554597616195679, -0.03634824976325035, -0.007150523364543915, 0.02204720675945282, 0.05124492943286896, 0.0804426521062851, 0.10964038968086243, 0.13883811235427856, 0.1680358350276947, 0.19723355770111084, 0.22643128037452698, 0.2556290030479431, 0.28482675552368164, 0.3140244483947754, 0.3432222008705139, 0.37241992354393005, 0.4016176462173462, 0.43081536889076233, 0.46001309156417847, 0.489210844039917, 0.5184085369110107, 0.5476062893867493, 0.5768040418624878, 0.6060017347335815, 0.6351994276046753, 0.6643971800804138, 0.6935948729515076, 0.7227926254272461, 0.7519903182983398, 0.7811880707740784, 0.8103858232498169, 0.8395835161209106, 0.8687812685966492]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 10.0, 11.0, 23.0, 48.0, 76.0, 86.0, 154.0, 228.0, 424.0, 616.0, 877.0, 1482.0, 2232.0, 3495.0, 5394.0, 8185.0, 12522.0, 18719.0, 26972.0, 38317.0, 52104.0, 68538.0, 84633.0, 98160.0, 105484.0, 106325.0, 97266.0, 83393.0, 66853.0, 50854.0, 37206.0, 25735.0, 17828.0, 11861.0, 7833.0, 5104.0, 3333.0, 2149.0, 1460.0, 932.0, 580.0, 362.0, 280.0, 153.0, 89.0, 65.0, 35.0, 29.0, 13.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.81005859375, -0.7847061157226562, -0.7593536376953125, -0.7340011596679688, -0.708648681640625, -0.6832962036132812, -0.6579437255859375, -0.6325912475585938, -0.60723876953125, -0.5818862915039062, -0.5565338134765625, -0.5311813354492188, -0.505828857421875, -0.48047637939453125, -0.4551239013671875, -0.42977142333984375, -0.4044189453125, -0.37906646728515625, -0.3537139892578125, -0.32836151123046875, -0.303009033203125, -0.27765655517578125, -0.2523040771484375, -0.22695159912109375, -0.20159912109375, -0.17624664306640625, -0.1508941650390625, -0.12554168701171875, -0.100189208984375, -0.07483673095703125, -0.0494842529296875, -0.02413177490234375, 0.001220703125, 0.02657318115234375, 0.0519256591796875, 0.07727813720703125, 0.102630615234375, 0.12798309326171875, 0.1533355712890625, 0.17868804931640625, 0.20404052734375, 0.22939300537109375, 0.2547454833984375, 0.28009796142578125, 0.305450439453125, 0.33080291748046875, 0.3561553955078125, 0.38150787353515625, 0.4068603515625, 0.43221282958984375, 0.4575653076171875, 0.48291778564453125, 0.508270263671875, 0.5336227416992188, 0.5589752197265625, 0.5843276977539062, 0.60968017578125, 0.6350326538085938, 0.6603851318359375, 0.6857376098632812, 0.711090087890625, 0.7364425659179688, 0.7617950439453125, 0.7871475219726562, 0.8125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 7.0, 14.0, 11.0, 13.0, 17.0, 17.0, 22.0, 19.0, 26.0, 24.0, 36.0, 34.0, 36.0, 34.0, 41.0, 37.0, 41.0, 41.0, 28.0, 54.0, 39.0, 34.0, 39.0, 49.0, 29.0, 28.0, 27.0, 20.0, 22.0, 24.0, 23.0, 15.0, 16.0, 10.0, 13.0, 14.0, 10.0, 8.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0791015625, -1.04779052734375, -1.0164794921875, -0.98516845703125, -0.953857421875, -0.92254638671875, -0.8912353515625, -0.85992431640625, -0.82861328125, -0.79730224609375, -0.7659912109375, -0.73468017578125, -0.703369140625, -0.67205810546875, -0.6407470703125, -0.60943603515625, -0.578125, -0.54681396484375, -0.5155029296875, -0.48419189453125, -0.452880859375, -0.42156982421875, -0.3902587890625, -0.35894775390625, -0.32763671875, -0.29632568359375, -0.2650146484375, -0.23370361328125, -0.202392578125, -0.17108154296875, -0.1397705078125, -0.10845947265625, -0.0771484375, -0.04583740234375, -0.0145263671875, 0.01678466796875, 0.048095703125, 0.07940673828125, 0.1107177734375, 0.14202880859375, 0.17333984375, 0.20465087890625, 0.2359619140625, 0.26727294921875, 0.298583984375, 0.32989501953125, 0.3612060546875, 0.39251708984375, 0.423828125, 0.45513916015625, 0.4864501953125, 0.51776123046875, 0.549072265625, 0.58038330078125, 0.6116943359375, 0.64300537109375, 0.67431640625, 0.70562744140625, 0.7369384765625, 0.76824951171875, 0.799560546875, 0.83087158203125, 0.8621826171875, 0.89349365234375, 0.9248046875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 11.0, 13.0, 20.0, 29.0, 44.0, 67.0, 101.0, 148.0, 276.0, 357.0, 662.0, 1004.0, 1583.0, 2454.0, 4004.0, 6099.0, 9600.0, 15093.0, 22473.0, 32911.0, 46223.0, 62955.0, 80810.0, 97359.0, 108282.0, 110793.0, 103765.0, 90898.0, 73331.0, 55579.0, 40128.0, 28018.0, 18925.0, 12409.0, 8120.0, 5110.0, 3319.0, 2035.0, 1259.0, 846.0, 519.0, 318.0, 219.0, 143.0, 86.0, 58.0, 45.0, 18.0, 13.0, 11.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.87939453125, -0.8521575927734375, -0.824920654296875, -0.7976837158203125, -0.77044677734375, -0.7432098388671875, -0.715972900390625, -0.6887359619140625, -0.6614990234375, -0.6342620849609375, -0.607025146484375, -0.5797882080078125, -0.55255126953125, -0.5253143310546875, -0.498077392578125, -0.4708404541015625, -0.443603515625, -0.4163665771484375, -0.389129638671875, -0.3618927001953125, -0.33465576171875, -0.3074188232421875, -0.280181884765625, -0.2529449462890625, -0.2257080078125, -0.1984710693359375, -0.171234130859375, -0.1439971923828125, -0.11676025390625, -0.0895233154296875, -0.062286376953125, -0.0350494384765625, -0.0078125, 0.0194244384765625, 0.046661376953125, 0.0738983154296875, 0.10113525390625, 0.1283721923828125, 0.155609130859375, 0.1828460693359375, 0.2100830078125, 0.2373199462890625, 0.264556884765625, 0.2917938232421875, 0.31903076171875, 0.3462677001953125, 0.373504638671875, 0.4007415771484375, 0.427978515625, 0.4552154541015625, 0.482452392578125, 0.5096893310546875, 0.53692626953125, 0.5641632080078125, 0.591400146484375, 0.6186370849609375, 0.6458740234375, 0.6731109619140625, 0.700347900390625, 0.7275848388671875, 0.75482177734375, 0.7820587158203125, 0.809295654296875, 0.8365325927734375, 0.86376953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 12.0, 17.0, 12.0, 17.0, 18.0, 12.0, 18.0, 21.0, 23.0, 33.0, 25.0, 30.0, 18.0, 29.0, 42.0, 31.0, 35.0, 46.0, 48.0, 29.0, 45.0, 41.0, 33.0, 28.0, 36.0, 31.0, 30.0, 30.0, 33.0, 26.0, 22.0, 17.0, 19.0, 15.0, 9.0, 12.0, 4.0, 4.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.546875, -0.5294418334960938, -0.5120086669921875, -0.49457550048828125, -0.477142333984375, -0.45970916748046875, -0.4422760009765625, -0.42484283447265625, -0.40740966796875, -0.38997650146484375, -0.3725433349609375, -0.35511016845703125, -0.337677001953125, -0.32024383544921875, -0.3028106689453125, -0.28537750244140625, -0.2679443359375, -0.25051116943359375, -0.2330780029296875, -0.21564483642578125, -0.198211669921875, -0.18077850341796875, -0.1633453369140625, -0.14591217041015625, -0.12847900390625, -0.11104583740234375, -0.0936126708984375, -0.07617950439453125, -0.058746337890625, -0.04131317138671875, -0.0238800048828125, -0.00644683837890625, 0.010986328125, 0.02841949462890625, 0.0458526611328125, 0.06328582763671875, 0.080718994140625, 0.09815216064453125, 0.1155853271484375, 0.13301849365234375, 0.15045166015625, 0.16788482666015625, 0.1853179931640625, 0.20275115966796875, 0.220184326171875, 0.23761749267578125, 0.2550506591796875, 0.27248382568359375, 0.2899169921875, 0.30735015869140625, 0.3247833251953125, 0.34221649169921875, 0.359649658203125, 0.37708282470703125, 0.3945159912109375, 0.41194915771484375, 0.42938232421875, 0.44681549072265625, 0.4642486572265625, 0.48168182373046875, 0.499114990234375, 0.5165481567382812, 0.5339813232421875, 0.5514144897460938, 0.56884765625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 12.0, 23.0, 47.0, 69.0, 102.0, 148.0, 236.0, 362.0, 641.0, 980.0, 1418.0, 2274.0, 3591.0, 5607.0, 8773.0, 13739.0, 21428.0, 32919.0, 49663.0, 71792.0, 96924.0, 120999.0, 132617.0, 127312.0, 107304.0, 81767.0, 57413.0, 38751.0, 25680.0, 16575.0, 10579.0, 6772.0, 4415.0, 2838.0, 1642.0, 1159.0, 706.0, 486.0, 295.0, 164.0, 128.0, 68.0, 59.0, 26.0, 19.0, 11.0, 11.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468017578125, -0.45325469970703125, -0.4384918212890625, -0.42372894287109375, -0.408966064453125, -0.39420318603515625, -0.3794403076171875, -0.36467742919921875, -0.34991455078125, -0.33515167236328125, -0.3203887939453125, -0.30562591552734375, -0.290863037109375, -0.27610015869140625, -0.2613372802734375, -0.24657440185546875, -0.2318115234375, -0.21704864501953125, -0.2022857666015625, -0.18752288818359375, -0.172760009765625, -0.15799713134765625, -0.1432342529296875, -0.12847137451171875, -0.11370849609375, -0.09894561767578125, -0.0841827392578125, -0.06941986083984375, -0.054656982421875, -0.03989410400390625, -0.0251312255859375, -0.01036834716796875, 0.00439453125, 0.01915740966796875, 0.0339202880859375, 0.04868316650390625, 0.063446044921875, 0.07820892333984375, 0.0929718017578125, 0.10773468017578125, 0.12249755859375, 0.13726043701171875, 0.1520233154296875, 0.16678619384765625, 0.181549072265625, 0.19631195068359375, 0.2110748291015625, 0.22583770751953125, 0.2406005859375, 0.25536346435546875, 0.2701263427734375, 0.28488922119140625, 0.299652099609375, 0.31441497802734375, 0.3291778564453125, 0.34394073486328125, 0.35870361328125, 0.37346649169921875, 0.3882293701171875, 0.40299224853515625, 0.417755126953125, 0.43251800537109375, 0.4472808837890625, 0.46204376220703125, 0.476806640625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 12.0, 7.0, 8.0, 3.0, 14.0, 16.0, 24.0, 21.0, 35.0, 26.0, 43.0, 54.0, 50.0, 47.0, 54.0, 48.0, 53.0, 57.0, 50.0, 47.0, 45.0, 49.0, 34.0, 37.0, 35.0, 26.0, 25.0, 18.0, 17.0, 8.0, 8.0, 7.0, 1.0, 3.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.739927291870117e-05, -5.577225238084793e-05, -5.414523184299469e-05, -5.251821130514145e-05, -5.089119076728821e-05, -4.926417022943497e-05, -4.7637149691581726e-05, -4.6010129153728485e-05, -4.4383108615875244e-05, -4.2756088078022e-05, -4.112906754016876e-05, -3.950204700231552e-05, -3.787502646446228e-05, -3.624800592660904e-05, -3.46209853887558e-05, -3.299396485090256e-05, -3.1366944313049316e-05, -2.9739923775196075e-05, -2.8112903237342834e-05, -2.6485882699489594e-05, -2.4858862161636353e-05, -2.323184162378311e-05, -2.160482108592987e-05, -1.997780054807663e-05, -1.835078001022339e-05, -1.6723759472370148e-05, -1.5096738934516907e-05, -1.3469718396663666e-05, -1.1842697858810425e-05, -1.0215677320957184e-05, -8.588656783103943e-06, -6.961636245250702e-06, -5.334615707397461e-06, -3.70759516954422e-06, -2.080574631690979e-06, -4.5355409383773804e-07, 1.173466444015503e-06, 2.800486981868744e-06, 4.427507519721985e-06, 6.054528057575226e-06, 7.681548595428467e-06, 9.308569133281708e-06, 1.0935589671134949e-05, 1.256261020898819e-05, 1.418963074684143e-05, 1.581665128469467e-05, 1.7443671822547913e-05, 1.9070692360401154e-05, 2.0697712898254395e-05, 2.2324733436107635e-05, 2.3951753973960876e-05, 2.5578774511814117e-05, 2.720579504966736e-05, 2.88328155875206e-05, 3.045983612537384e-05, 3.208685666322708e-05, 3.371387720108032e-05, 3.534089773893356e-05, 3.6967918276786804e-05, 3.8594938814640045e-05, 4.0221959352493286e-05, 4.184897989034653e-05, 4.347600042819977e-05, 4.510302096605301e-05, 4.673004150390625e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 11.0, 15.0, 14.0, 27.0, 46.0, 61.0, 116.0, 195.0, 314.0, 435.0, 773.0, 1214.0, 2107.0, 3487.0, 5866.0, 9935.0, 16769.0, 27183.0, 43301.0, 66628.0, 94840.0, 123548.0, 142199.0, 140680.0, 118615.0, 88658.0, 60800.0, 39430.0, 24270.0, 14941.0, 8973.0, 5110.0, 3178.0, 1855.0, 1107.0, 713.0, 447.0, 244.0, 173.0, 109.0, 62.0, 42.0, 34.0, 17.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.50927734375, -0.49330902099609375, -0.4773406982421875, -0.46137237548828125, -0.445404052734375, -0.42943572998046875, -0.4134674072265625, -0.39749908447265625, -0.38153076171875, -0.36556243896484375, -0.3495941162109375, -0.33362579345703125, -0.317657470703125, -0.30168914794921875, -0.2857208251953125, -0.26975250244140625, -0.2537841796875, -0.23781585693359375, -0.2218475341796875, -0.20587921142578125, -0.189910888671875, -0.17394256591796875, -0.1579742431640625, -0.14200592041015625, -0.12603759765625, -0.11006927490234375, -0.0941009521484375, -0.07813262939453125, -0.062164306640625, -0.04619598388671875, -0.0302276611328125, -0.01425933837890625, 0.001708984375, 0.01767730712890625, 0.0336456298828125, 0.04961395263671875, 0.065582275390625, 0.08155059814453125, 0.0975189208984375, 0.11348724365234375, 0.12945556640625, 0.14542388916015625, 0.1613922119140625, 0.17736053466796875, 0.193328857421875, 0.20929718017578125, 0.2252655029296875, 0.24123382568359375, 0.2572021484375, 0.27317047119140625, 0.2891387939453125, 0.30510711669921875, 0.321075439453125, 0.33704376220703125, 0.3530120849609375, 0.36898040771484375, 0.38494873046875, 0.40091705322265625, 0.4168853759765625, 0.43285369873046875, 0.448822021484375, 0.46479034423828125, 0.4807586669921875, 0.49672698974609375, 0.5126953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 17.0, 9.0, 11.0, 12.0, 19.0, 17.0, 23.0, 29.0, 24.0, 37.0, 37.0, 33.0, 32.0, 41.0, 34.0, 43.0, 53.0, 50.0, 48.0, 50.0, 45.0, 54.0, 36.0, 32.0, 28.0, 24.0, 26.0, 17.0, 20.0, 15.0, 11.0, 13.0, 14.0, 6.0, 7.0, 8.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1593017578125, -0.1547374725341797, -0.15017318725585938, -0.14560890197753906, -0.14104461669921875, -0.13648033142089844, -0.13191604614257812, -0.1273517608642578, -0.1227874755859375, -0.11822319030761719, -0.11365890502929688, -0.10909461975097656, -0.10453033447265625, -0.09996604919433594, -0.09540176391601562, -0.09083747863769531, -0.086273193359375, -0.08170890808105469, -0.07714462280273438, -0.07258033752441406, -0.06801605224609375, -0.06345176696777344, -0.058887481689453125, -0.05432319641113281, -0.0497589111328125, -0.04519462585449219, -0.040630340576171875, -0.03606605529785156, -0.03150177001953125, -0.026937484741210938, -0.022373199462890625, -0.017808914184570312, -0.01324462890625, -0.008680343627929688, -0.004116058349609375, 0.0004482269287109375, 0.00501251220703125, 0.009576797485351562, 0.014141082763671875, 0.018705368041992188, 0.0232696533203125, 0.027833938598632812, 0.032398223876953125, 0.03696250915527344, 0.04152679443359375, 0.04609107971191406, 0.050655364990234375, 0.05521965026855469, 0.059783935546875, 0.06434822082519531, 0.06891250610351562, 0.07347679138183594, 0.07804107666015625, 0.08260536193847656, 0.08716964721679688, 0.09173393249511719, 0.0962982177734375, 0.10086250305175781, 0.10542678833007812, 0.10999107360839844, 0.11455535888671875, 0.11911964416503906, 0.12368392944335938, 0.1282482147216797, 0.1328125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 7.0, 8.0, 6.0, 11.0, 11.0, 18.0, 17.0, 22.0, 28.0, 35.0, 44.0, 45.0, 47.0, 43.0, 42.0, 49.0, 56.0, 61.0, 54.0, 46.0, 47.0, 38.0, 41.0, 40.0, 34.0, 27.0, 24.0, 23.0, 13.0, 15.0, 10.0, 6.0, 9.0, 5.0, 5.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-1.5691479444503784, -1.5247411727905273, -1.4803344011306763, -1.4359276294708252, -1.3915208578109741, -1.347114086151123, -1.302707314491272, -1.258300542831421, -1.2138937711715698, -1.1694869995117188, -1.1250802278518677, -1.0806734561920166, -1.0362666845321655, -0.9918599128723145, -0.9474531412124634, -0.9030463695526123, -0.858639657497406, -0.8142328858375549, -0.7698261141777039, -0.7254193425178528, -0.6810125708580017, -0.6366057991981506, -0.5921990871429443, -0.5477923154830933, -0.5033855438232422, -0.4589787721633911, -0.41457200050354004, -0.37016522884368896, -0.3257584571838379, -0.2813516855239868, -0.23694494366645813, -0.19253817200660706, -0.1481313705444336, -0.10372459888458252, -0.05931783467531204, -0.014911070466041565, 0.02949570119380951, 0.07390247285366058, 0.11830922961235046, 0.16271600127220154, 0.2071227729320526, 0.2515295445919037, 0.29593631625175476, 0.34034305810928345, 0.3847498297691345, 0.4291566014289856, 0.47356337308883667, 0.5179701447486877, 0.5623769164085388, 0.6067836880683899, 0.651190459728241, 0.695597231388092, 0.7400040030479431, 0.7844107747077942, 0.8288174867630005, 0.8732242584228516, 0.9176310300827026, 0.9620378017425537, 1.0064445734024048, 1.0508513450622559, 1.095258116722107, 1.139664888381958, 1.184071660041809, 1.2284784317016602, 1.2728852033615112]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 3.0, 1.0, 11.0, 7.0, 14.0, 14.0, 17.0, 23.0, 14.0, 32.0, 18.0, 27.0, 26.0, 38.0, 34.0, 32.0, 37.0, 31.0, 40.0, 43.0, 31.0, 47.0, 36.0, 26.0, 32.0, 33.0, 23.0, 25.0, 33.0, 29.0, 31.0, 23.0, 21.0, 28.0, 21.0, 19.0, 6.0, 7.0, 6.0, 10.0, 5.0, 9.0, 8.0, 8.0, 5.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8512454032897949, -0.823173463344574, -0.795101523399353, -0.7670295834541321, -0.7389576435089111, -0.7108856439590454, -0.6828137040138245, -0.6547417640686035, -0.6266698241233826, -0.5985978841781616, -0.5705259442329407, -0.5424540042877197, -0.514382004737854, -0.48631009459495544, -0.4582381248474121, -0.43016618490219116, -0.4020942449569702, -0.37402230501174927, -0.3459503650665283, -0.317878395318985, -0.28980645537376404, -0.2617345154285431, -0.23366256058216095, -0.2055906057357788, -0.17751866579055786, -0.14944672584533691, -0.12137477099895477, -0.09330282360315323, -0.06523087620735168, -0.03715893626213074, -0.009086981415748596, 0.018984973430633545, 0.04705685377120972, 0.07512880116701126, 0.1032007485628128, 0.13127270340919495, 0.1593446433544159, 0.18741658329963684, 0.21548853814601898, 0.24356049299240112, 0.27163243293762207, 0.299704372882843, 0.32777631282806396, 0.3558482825756073, 0.38392022252082825, 0.4119921624660492, 0.44006413221359253, 0.4681360721588135, 0.4962080121040344, 0.5242799520492554, 0.5523518919944763, 0.5804238319396973, 0.608495831489563, 0.6365677118301392, 0.6646397113800049, 0.6927116513252258, 0.7207835912704468, 0.7488555312156677, 0.7769274711608887, 0.8049994111061096, 0.8330713510513306, 0.8611433506011963, 0.8892152905464172, 0.9172872304916382, 0.9453591704368591]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 9.0, 14.0, 13.0, 21.0, 48.0, 64.0, 116.0, 182.0, 321.0, 636.0, 1056.0, 1945.0, 3825.0, 7265.0, 14544.0, 28719.0, 57960.0, 116626.0, 230718.0, 419027.0, 664369.0, 820548.0, 738583.0, 502134.0, 286032.0, 149223.0, 74702.0, 37259.0, 18699.0, 9440.0, 4701.0, 2513.0, 1301.0, 746.0, 417.0, 191.0, 134.0, 85.0, 44.0, 21.0, 17.0, 7.0, 6.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5625, -1.5160980224609375, -1.469696044921875, -1.4232940673828125, -1.37689208984375, -1.3304901123046875, -1.284088134765625, -1.2376861572265625, -1.1912841796875, -1.1448822021484375, -1.098480224609375, -1.0520782470703125, -1.00567626953125, -0.9592742919921875, -0.912872314453125, -0.8664703369140625, -0.820068359375, -0.7736663818359375, -0.727264404296875, -0.6808624267578125, -0.63446044921875, -0.5880584716796875, -0.541656494140625, -0.4952545166015625, -0.4488525390625, -0.4024505615234375, -0.356048583984375, -0.3096466064453125, -0.26324462890625, -0.2168426513671875, -0.170440673828125, -0.1240386962890625, -0.07763671875, -0.0312347412109375, 0.015167236328125, 0.0615692138671875, 0.10797119140625, 0.1543731689453125, 0.200775146484375, 0.2471771240234375, 0.2935791015625, 0.3399810791015625, 0.386383056640625, 0.4327850341796875, 0.47918701171875, 0.5255889892578125, 0.571990966796875, 0.6183929443359375, 0.664794921875, 0.7111968994140625, 0.757598876953125, 0.8040008544921875, 0.85040283203125, 0.8968048095703125, 0.943206787109375, 0.9896087646484375, 1.0360107421875, 1.0824127197265625, 1.128814697265625, 1.1752166748046875, 1.22161865234375, 1.2680206298828125, 1.314422607421875, 1.3608245849609375, 1.4072265625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 3.0, 5.0, 12.0, 14.0, 13.0, 15.0, 18.0, 37.0, 25.0, 29.0, 32.0, 29.0, 33.0, 33.0, 42.0, 39.0, 47.0, 38.0, 48.0, 35.0, 49.0, 52.0, 39.0, 34.0, 36.0, 28.0, 29.0, 32.0, 18.0, 22.0, 17.0, 14.0, 12.0, 8.0, 12.0, 14.0, 4.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.75732421875, -0.73187255859375, -0.7064208984375, -0.68096923828125, -0.655517578125, -0.63006591796875, -0.6046142578125, -0.57916259765625, -0.5537109375, -0.52825927734375, -0.5028076171875, -0.47735595703125, -0.451904296875, -0.42645263671875, -0.4010009765625, -0.37554931640625, -0.35009765625, -0.32464599609375, -0.2991943359375, -0.27374267578125, -0.248291015625, -0.22283935546875, -0.1973876953125, -0.17193603515625, -0.146484375, -0.12103271484375, -0.0955810546875, -0.07012939453125, -0.044677734375, -0.01922607421875, 0.0062255859375, 0.03167724609375, 0.05712890625, 0.08258056640625, 0.1080322265625, 0.13348388671875, 0.158935546875, 0.18438720703125, 0.2098388671875, 0.23529052734375, 0.2607421875, 0.28619384765625, 0.3116455078125, 0.33709716796875, 0.362548828125, 0.38800048828125, 0.4134521484375, 0.43890380859375, 0.46435546875, 0.48980712890625, 0.5152587890625, 0.54071044921875, 0.566162109375, 0.59161376953125, 0.6170654296875, 0.64251708984375, 0.66796875, 0.69342041015625, 0.7188720703125, 0.74432373046875, 0.769775390625, 0.79522705078125, 0.8206787109375, 0.84613037109375, 0.87158203125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 10.0, 15.0, 29.0, 49.0, 59.0, 101.0, 147.0, 208.0, 345.0, 565.0, 924.0, 1485.0, 2386.0, 3765.0, 5901.0, 9598.0, 15752.0, 25186.0, 39861.0, 63095.0, 98882.0, 148523.0, 217341.0, 302422.0, 391982.0, 468376.0, 502358.0, 479228.0, 411582.0, 320062.0, 232448.0, 160558.0, 105881.0, 69419.0, 43298.0, 27452.0, 16920.0, 10505.0, 6654.0, 4075.0, 2620.0, 1543.0, 991.0, 646.0, 381.0, 258.0, 134.0, 80.0, 75.0, 29.0, 29.0, 21.0, 10.0, 7.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.97314453125, -0.9413375854492188, -0.9095306396484375, -0.8777236938476562, -0.845916748046875, -0.8141098022460938, -0.7823028564453125, -0.7504959106445312, -0.71868896484375, -0.6868820190429688, -0.6550750732421875, -0.6232681274414062, -0.591461181640625, -0.5596542358398438, -0.5278472900390625, -0.49604034423828125, -0.4642333984375, -0.43242645263671875, -0.4006195068359375, -0.36881256103515625, -0.337005615234375, -0.30519866943359375, -0.2733917236328125, -0.24158477783203125, -0.20977783203125, -0.17797088623046875, -0.1461639404296875, -0.11435699462890625, -0.082550048828125, -0.05074310302734375, -0.0189361572265625, 0.01287078857421875, 0.044677734375, 0.07648468017578125, 0.1082916259765625, 0.14009857177734375, 0.171905517578125, 0.20371246337890625, 0.2355194091796875, 0.26732635498046875, 0.29913330078125, 0.33094024658203125, 0.3627471923828125, 0.39455413818359375, 0.426361083984375, 0.45816802978515625, 0.4899749755859375, 0.5217819213867188, 0.5535888671875, 0.5853958129882812, 0.6172027587890625, 0.6490097045898438, 0.680816650390625, 0.7126235961914062, 0.7444305419921875, 0.7762374877929688, 0.80804443359375, 0.8398513793945312, 0.8716583251953125, 0.9034652709960938, 0.935272216796875, 0.9670791625976562, 0.9988861083984375, 1.0306930541992188, 1.0625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 6.0, 8.0, 24.0, 16.0, 21.0, 33.0, 30.0, 47.0, 66.0, 62.0, 90.0, 85.0, 91.0, 122.0, 112.0, 157.0, 172.0, 160.0, 202.0, 196.0, 209.0, 175.0, 189.0, 207.0, 182.0, 204.0, 166.0, 154.0, 135.0, 126.0, 108.0, 84.0, 69.0, 65.0, 54.0, 41.0, 54.0, 28.0, 40.0, 20.0, 11.0, 9.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.392578125, -0.3801116943359375, -0.367645263671875, -0.3551788330078125, -0.34271240234375, -0.3302459716796875, -0.317779541015625, -0.3053131103515625, -0.2928466796875, -0.2803802490234375, -0.267913818359375, -0.2554473876953125, -0.24298095703125, -0.2305145263671875, -0.218048095703125, -0.2055816650390625, -0.193115234375, -0.1806488037109375, -0.168182373046875, -0.1557159423828125, -0.14324951171875, -0.1307830810546875, -0.118316650390625, -0.1058502197265625, -0.0933837890625, -0.0809173583984375, -0.068450927734375, -0.0559844970703125, -0.04351806640625, -0.0310516357421875, -0.018585205078125, -0.0061187744140625, 0.00634765625, 0.0188140869140625, 0.031280517578125, 0.0437469482421875, 0.05621337890625, 0.0686798095703125, 0.081146240234375, 0.0936126708984375, 0.1060791015625, 0.1185455322265625, 0.131011962890625, 0.1434783935546875, 0.15594482421875, 0.1684112548828125, 0.180877685546875, 0.1933441162109375, 0.205810546875, 0.2182769775390625, 0.230743408203125, 0.2432098388671875, 0.25567626953125, 0.2681427001953125, 0.280609130859375, 0.2930755615234375, 0.3055419921875, 0.3180084228515625, 0.330474853515625, 0.3429412841796875, 0.35540771484375, 0.3678741455078125, 0.380340576171875, 0.3928070068359375, 0.4052734375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 6.0, 5.0, 9.0, 9.0, 15.0, 17.0, 18.0, 20.0, 17.0, 32.0, 32.0, 19.0, 50.0, 41.0, 49.0, 57.0, 63.0, 61.0, 41.0, 55.0, 33.0, 43.0, 47.0, 27.0, 34.0, 34.0, 30.0, 18.0, 13.0, 19.0, 16.0, 10.0, 15.0, 13.0, 10.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-1.5239067077636719, -1.4816919565200806, -1.4394772052764893, -1.397262454032898, -1.3550477027893066, -1.3128328323364258, -1.2706180810928345, -1.2284033298492432, -1.1861885786056519, -1.1439738273620605, -1.1017590761184692, -1.059544324874878, -1.017329454421997, -0.9751147627830505, -0.9328999519348145, -0.8906852006912231, -0.8484704494476318, -0.8062556982040405, -0.7640409469604492, -0.7218261361122131, -0.6796113848686218, -0.6373966336250305, -0.5951818227767944, -0.5529670715332031, -0.5107523202896118, -0.4685375690460205, -0.4263227880001068, -0.3841080069541931, -0.3418932557106018, -0.2996785044670105, -0.2574637234210968, -0.2152489423751831, -0.17303407192230225, -0.13081930577754974, -0.08860453963279724, -0.04638977348804474, -0.004175007343292236, 0.038039758801460266, 0.08025452494621277, 0.12246930599212646, 0.16468405723571777, 0.20689882338047028, 0.24911358952522278, 0.2913283705711365, 0.3335431218147278, 0.3757578730583191, 0.4179726541042328, 0.4601874351501465, 0.5024021863937378, 0.5446169376373291, 0.5868316888809204, 0.6290464997291565, 0.6712612509727478, 0.7134760022163391, 0.7556908130645752, 0.7979055643081665, 0.8401203155517578, 0.8823350667953491, 0.9245498180389404, 0.9667646288871765, 1.008979320526123, 1.051194190979004, 1.0934089422225952, 1.1356236934661865, 1.1778384447097778]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 15.0, 12.0, 22.0, 14.0, 18.0, 17.0, 24.0, 38.0, 25.0, 29.0, 32.0, 31.0, 44.0, 37.0, 43.0, 28.0, 41.0, 32.0, 44.0, 34.0, 46.0, 40.0, 34.0, 33.0, 35.0, 27.0, 32.0, 27.0, 20.0, 15.0, 16.0, 9.0, 15.0, 12.0, 8.0, 7.0, 9.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8927128911018372, -0.8629211783409119, -0.8331294655799866, -0.8033376932144165, -0.7735459804534912, -0.7437542676925659, -0.7139625549316406, -0.6841708421707153, -0.65437912940979, -0.6245874166488647, -0.5947957038879395, -0.5650039911270142, -0.5352122187614441, -0.5054205060005188, -0.4756287932395935, -0.4458370804786682, -0.41604530811309814, -0.38625359535217285, -0.35646185278892517, -0.3266701400279999, -0.2968783974647522, -0.2670866847038269, -0.2372949719429016, -0.20750324428081512, -0.17771151661872864, -0.14791978895664215, -0.11812806874513626, -0.08833634853363037, -0.058544620871543884, -0.028752893209457397, 0.0010388195514678955, 0.030830547213554382, 0.060622334480285645, 0.09041406214237213, 0.12020578235387802, 0.1499975025653839, 0.1797892302274704, 0.20958095788955688, 0.23937267065048218, 0.26916438341140747, 0.29895612597465515, 0.32874783873558044, 0.3585395812988281, 0.3883312940597534, 0.4181230068206787, 0.4479147493839264, 0.4777064621448517, 0.5074982047080994, 0.5372899174690247, 0.56708163022995, 0.5968733429908752, 0.6266651153564453, 0.6564568281173706, 0.6862485408782959, 0.7160402536392212, 0.7458319664001465, 0.7756236791610718, 0.8054153919219971, 0.8352071046829224, 0.8649988174438477, 0.8947905898094177, 0.924582302570343, 0.9543740153312683, 0.9841657280921936, 1.0139575004577637]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 8.0, 6.0, 17.0, 36.0, 47.0, 64.0, 99.0, 135.0, 252.0, 363.0, 579.0, 888.0, 1426.0, 2285.0, 3651.0, 5875.0, 9740.0, 16518.0, 27680.0, 46405.0, 75989.0, 122123.0, 171544.0, 184211.0, 142336.0, 93330.0, 57356.0, 34168.0, 20107.0, 12079.0, 7463.0, 4430.0, 2690.0, 1632.0, 1083.0, 690.0, 426.0, 295.0, 154.0, 122.0, 75.0, 57.0, 37.0, 25.0, 16.0, 15.0, 5.0, 3.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.287109375, -0.2779083251953125, -0.268707275390625, -0.2595062255859375, -0.25030517578125, -0.2411041259765625, -0.231903076171875, -0.2227020263671875, -0.2135009765625, -0.2042999267578125, -0.195098876953125, -0.1858978271484375, -0.17669677734375, -0.1674957275390625, -0.158294677734375, -0.1490936279296875, -0.139892578125, -0.1306915283203125, -0.121490478515625, -0.1122894287109375, -0.10308837890625, -0.0938873291015625, -0.084686279296875, -0.0754852294921875, -0.0662841796875, -0.0570831298828125, -0.047882080078125, -0.0386810302734375, -0.02947998046875, -0.0202789306640625, -0.011077880859375, -0.0018768310546875, 0.00732421875, 0.0165252685546875, 0.025726318359375, 0.0349273681640625, 0.04412841796875, 0.0533294677734375, 0.062530517578125, 0.0717315673828125, 0.0809326171875, 0.0901336669921875, 0.099334716796875, 0.1085357666015625, 0.11773681640625, 0.1269378662109375, 0.136138916015625, 0.1453399658203125, 0.154541015625, 0.1637420654296875, 0.172943115234375, 0.1821441650390625, 0.19134521484375, 0.2005462646484375, 0.209747314453125, 0.2189483642578125, 0.2281494140625, 0.2373504638671875, 0.246551513671875, 0.2557525634765625, 0.26495361328125, 0.2741546630859375, 0.283355712890625, 0.2925567626953125, 0.3017578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 5.0, 10.0, 8.0, 10.0, 15.0, 17.0, 18.0, 29.0, 31.0, 34.0, 31.0, 39.0, 38.0, 55.0, 50.0, 34.0, 43.0, 34.0, 47.0, 49.0, 50.0, 48.0, 47.0, 50.0, 32.0, 38.0, 18.0, 24.0, 28.0, 17.0, 9.0, 5.0, 10.0, 11.0, 6.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.0746002197265625, -1.036895751953125, -0.9991912841796875, -0.96148681640625, -0.9237823486328125, -0.886077880859375, -0.8483734130859375, -0.8106689453125, -0.7729644775390625, -0.735260009765625, -0.6975555419921875, -0.65985107421875, -0.6221466064453125, -0.584442138671875, -0.5467376708984375, -0.509033203125, -0.4713287353515625, -0.433624267578125, -0.3959197998046875, -0.35821533203125, -0.3205108642578125, -0.282806396484375, -0.2451019287109375, -0.2073974609375, -0.1696929931640625, -0.131988525390625, -0.0942840576171875, -0.05657958984375, -0.0188751220703125, 0.018829345703125, 0.0565338134765625, 0.09423828125, 0.1319427490234375, 0.169647216796875, 0.2073516845703125, 0.24505615234375, 0.2827606201171875, 0.320465087890625, 0.3581695556640625, 0.3958740234375, 0.4335784912109375, 0.471282958984375, 0.5089874267578125, 0.54669189453125, 0.5843963623046875, 0.622100830078125, 0.6598052978515625, 0.697509765625, 0.7352142333984375, 0.772918701171875, 0.8106231689453125, 0.84832763671875, 0.8860321044921875, 0.923736572265625, 0.9614410400390625, 0.9991455078125, 1.0368499755859375, 1.074554443359375, 1.1122589111328125, 1.14996337890625, 1.1876678466796875, 1.225372314453125, 1.2630767822265625, 1.30078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 10.0, 6.0, 10.0, 19.0, 26.0, 31.0, 48.0, 78.0, 92.0, 183.0, 287.0, 428.0, 713.0, 1215.0, 2119.0, 3675.0, 6701.0, 12524.0, 24172.0, 47481.0, 92232.0, 167658.0, 238107.0, 202878.0, 118327.0, 62149.0, 31329.0, 16273.0, 8631.0, 4754.0, 2584.0, 1481.0, 870.0, 511.0, 345.0, 192.0, 136.0, 91.0, 63.0, 40.0, 21.0, 21.0, 16.0, 8.0, 11.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.39501953125, -0.3829383850097656, -0.37085723876953125, -0.3587760925292969, -0.3466949462890625, -0.3346138000488281, -0.32253265380859375, -0.3104515075683594, -0.298370361328125, -0.2862892150878906, -0.27420806884765625, -0.2621269226074219, -0.2500457763671875, -0.23796463012695312, -0.22588348388671875, -0.21380233764648438, -0.20172119140625, -0.18964004516601562, -0.17755889892578125, -0.16547775268554688, -0.1533966064453125, -0.14131546020507812, -0.12923431396484375, -0.11715316772460938, -0.105072021484375, -0.09299087524414062, -0.08090972900390625, -0.06882858276367188, -0.0567474365234375, -0.044666290283203125, -0.03258514404296875, -0.020503997802734375, -0.0084228515625, 0.003658294677734375, 0.01573944091796875, 0.027820587158203125, 0.0399017333984375, 0.051982879638671875, 0.06406402587890625, 0.07614517211914062, 0.088226318359375, 0.10030746459960938, 0.11238861083984375, 0.12446975708007812, 0.1365509033203125, 0.14863204956054688, 0.16071319580078125, 0.17279434204101562, 0.18487548828125, 0.19695663452148438, 0.20903778076171875, 0.22111892700195312, 0.2332000732421875, 0.24528121948242188, 0.25736236572265625, 0.2694435119628906, 0.281524658203125, 0.2936058044433594, 0.30568695068359375, 0.3177680969238281, 0.3298492431640625, 0.3419303894042969, 0.35401153564453125, 0.3660926818847656, 0.378173828125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 2.0, 6.0, 4.0, 6.0, 1.0, 10.0, 11.0, 15.0, 17.0, 23.0, 20.0, 11.0, 32.0, 27.0, 31.0, 29.0, 39.0, 31.0, 37.0, 23.0, 50.0, 35.0, 32.0, 39.0, 45.0, 44.0, 27.0, 36.0, 28.0, 33.0, 29.0, 37.0, 25.0, 18.0, 22.0, 16.0, 13.0, 13.0, 10.0, 12.0, 11.0, 16.0, 5.0, 4.0, 9.0, 1.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.5888671875, -0.5704879760742188, -0.5521087646484375, -0.5337295532226562, -0.515350341796875, -0.49697113037109375, -0.4785919189453125, -0.46021270751953125, -0.44183349609375, -0.42345428466796875, -0.4050750732421875, -0.38669586181640625, -0.368316650390625, -0.34993743896484375, -0.3315582275390625, -0.31317901611328125, -0.2947998046875, -0.27642059326171875, -0.2580413818359375, -0.23966217041015625, -0.221282958984375, -0.20290374755859375, -0.1845245361328125, -0.16614532470703125, -0.14776611328125, -0.12938690185546875, -0.1110076904296875, -0.09262847900390625, -0.074249267578125, -0.05587005615234375, -0.0374908447265625, -0.01911163330078125, -0.000732421875, 0.01764678955078125, 0.0360260009765625, 0.05440521240234375, 0.072784423828125, 0.09116363525390625, 0.1095428466796875, 0.12792205810546875, 0.14630126953125, 0.16468048095703125, 0.1830596923828125, 0.20143890380859375, 0.219818115234375, 0.23819732666015625, 0.2565765380859375, 0.27495574951171875, 0.2933349609375, 0.31171417236328125, 0.3300933837890625, 0.34847259521484375, 0.366851806640625, 0.38523101806640625, 0.4036102294921875, 0.42198944091796875, 0.44036865234375, 0.45874786376953125, 0.4771270751953125, 0.49550628662109375, 0.513885498046875, 0.5322647094726562, 0.5506439208984375, 0.5690231323242188, 0.58740234375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 16.0, 33.0, 24.0, 29.0, 84.0, 87.0, 135.0, 177.0, 268.0, 419.0, 613.0, 960.0, 1519.0, 2474.0, 4525.0, 8841.0, 21741.0, 72438.0, 375292.0, 430020.0, 83585.0, 23599.0, 9634.0, 4815.0, 2649.0, 1516.0, 1006.0, 651.0, 446.0, 278.0, 229.0, 142.0, 88.0, 57.0, 41.0, 30.0, 24.0, 14.0, 11.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28271484375, -0.2736091613769531, -0.26450347900390625, -0.2553977966308594, -0.2462921142578125, -0.23718643188476562, -0.22808074951171875, -0.21897506713867188, -0.209869384765625, -0.20076370239257812, -0.19165802001953125, -0.18255233764648438, -0.1734466552734375, -0.16434097290039062, -0.15523529052734375, -0.14612960815429688, -0.13702392578125, -0.12791824340820312, -0.11881256103515625, -0.10970687866210938, -0.1006011962890625, -0.09149551391601562, -0.08238983154296875, -0.07328414916992188, -0.064178466796875, -0.055072784423828125, -0.04596710205078125, -0.036861419677734375, -0.0277557373046875, -0.018650054931640625, -0.00954437255859375, -0.000438690185546875, 0.0086669921875, 0.017772674560546875, 0.02687835693359375, 0.035984039306640625, 0.0450897216796875, 0.054195404052734375, 0.06330108642578125, 0.07240676879882812, 0.081512451171875, 0.09061813354492188, 0.09972381591796875, 0.10882949829101562, 0.1179351806640625, 0.12704086303710938, 0.13614654541015625, 0.14525222778320312, 0.15435791015625, 0.16346359252929688, 0.17256927490234375, 0.18167495727539062, 0.1907806396484375, 0.19988632202148438, 0.20899200439453125, 0.21809768676757812, 0.227203369140625, 0.23630905151367188, 0.24541473388671875, 0.2545204162597656, 0.2636260986328125, 0.2727317810058594, 0.28183746337890625, 0.2909431457519531, 0.300048828125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 7.0, 3.0, 8.0, 16.0, 29.0, 65.0, 64.0, 88.0, 110.0, 125.0, 124.0, 115.0, 89.0, 52.0, 29.0, 26.0, 15.0, 10.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1655112504959106e-05, -2.0839273929595947e-05, -2.0023435354232788e-05, -1.920759677886963e-05, -1.839175820350647e-05, -1.757591962814331e-05, -1.676008105278015e-05, -1.5944242477416992e-05, -1.5128403902053833e-05, -1.4312565326690674e-05, -1.3496726751327515e-05, -1.2680888175964355e-05, -1.1865049600601196e-05, -1.1049211025238037e-05, -1.0233372449874878e-05, -9.417533874511719e-06, -8.60169529914856e-06, -7.7858567237854e-06, -6.970018148422241e-06, -6.154179573059082e-06, -5.338340997695923e-06, -4.522502422332764e-06, -3.7066638469696045e-06, -2.8908252716064453e-06, -2.074986696243286e-06, -1.259148120880127e-06, -4.4330954551696777e-07, 3.725290298461914e-07, 1.1883676052093506e-06, 2.0042061805725098e-06, 2.820044755935669e-06, 3.635883331298828e-06, 4.451721906661987e-06, 5.2675604820251465e-06, 6.083399057388306e-06, 6.899237632751465e-06, 7.715076208114624e-06, 8.530914783477783e-06, 9.346753358840942e-06, 1.0162591934204102e-05, 1.097843050956726e-05, 1.179426908493042e-05, 1.2610107660293579e-05, 1.3425946235656738e-05, 1.4241784811019897e-05, 1.5057623386383057e-05, 1.5873461961746216e-05, 1.6689300537109375e-05, 1.7505139112472534e-05, 1.8320977687835693e-05, 1.9136816263198853e-05, 1.9952654838562012e-05, 2.076849341392517e-05, 2.158433198928833e-05, 2.240017056465149e-05, 2.321600914001465e-05, 2.4031847715377808e-05, 2.4847686290740967e-05, 2.5663524866104126e-05, 2.6479363441467285e-05, 2.7295202016830444e-05, 2.8111040592193604e-05, 2.8926879167556763e-05, 2.9742717742919922e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 5.0, 6.0, 16.0, 15.0, 9.0, 28.0, 42.0, 49.0, 69.0, 102.0, 174.0, 244.0, 368.0, 621.0, 935.0, 1592.0, 2658.0, 4724.0, 9444.0, 22645.0, 73713.0, 302116.0, 442906.0, 124475.0, 34270.0, 12918.0, 6156.0, 3245.0, 1832.0, 1072.0, 689.0, 449.0, 282.0, 209.0, 130.0, 93.0, 61.0, 50.0, 28.0, 25.0, 14.0, 15.0, 13.0, 11.0, 6.0, 3.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.3310546875, -0.320770263671875, -0.31048583984375, -0.300201416015625, -0.2899169921875, -0.279632568359375, -0.26934814453125, -0.259063720703125, -0.248779296875, -0.238494873046875, -0.22821044921875, -0.217926025390625, -0.2076416015625, -0.197357177734375, -0.18707275390625, -0.176788330078125, -0.16650390625, -0.156219482421875, -0.14593505859375, -0.135650634765625, -0.1253662109375, -0.115081787109375, -0.10479736328125, -0.094512939453125, -0.084228515625, -0.073944091796875, -0.06365966796875, -0.053375244140625, -0.0430908203125, -0.032806396484375, -0.02252197265625, -0.012237548828125, -0.001953125, 0.008331298828125, 0.01861572265625, 0.028900146484375, 0.0391845703125, 0.049468994140625, 0.05975341796875, 0.070037841796875, 0.080322265625, 0.090606689453125, 0.10089111328125, 0.111175537109375, 0.1214599609375, 0.131744384765625, 0.14202880859375, 0.152313232421875, 0.16259765625, 0.172882080078125, 0.18316650390625, 0.193450927734375, 0.2037353515625, 0.214019775390625, 0.22430419921875, 0.234588623046875, 0.244873046875, 0.255157470703125, 0.26544189453125, 0.275726318359375, 0.2860107421875, 0.296295166015625, 0.30657958984375, 0.316864013671875, 0.3271484375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 8.0, 3.0, 3.0, 10.0, 4.0, 3.0, 7.0, 12.0, 10.0, 13.0, 18.0, 17.0, 21.0, 31.0, 44.0, 54.0, 74.0, 100.0, 93.0, 76.0, 80.0, 62.0, 42.0, 45.0, 26.0, 27.0, 19.0, 18.0, 14.0, 11.0, 7.0, 7.0, 7.0, 9.0, 3.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048370361328125, -0.04680013656616211, -0.04522991180419922, -0.04365968704223633, -0.04208946228027344, -0.04051923751831055, -0.038949012756347656, -0.037378787994384766, -0.035808563232421875, -0.034238338470458984, -0.032668113708496094, -0.031097888946533203, -0.029527664184570312, -0.027957439422607422, -0.02638721466064453, -0.02481698989868164, -0.02324676513671875, -0.02167654037475586, -0.02010631561279297, -0.018536090850830078, -0.016965866088867188, -0.015395641326904297, -0.013825416564941406, -0.012255191802978516, -0.010684967041015625, -0.009114742279052734, -0.007544517517089844, -0.005974292755126953, -0.0044040679931640625, -0.002833843231201172, -0.0012636184692382812, 0.0003066062927246094, 0.0018768310546875, 0.0034470558166503906, 0.005017280578613281, 0.006587505340576172, 0.008157730102539062, 0.009727954864501953, 0.011298179626464844, 0.012868404388427734, 0.014438629150390625, 0.016008853912353516, 0.017579078674316406, 0.019149303436279297, 0.020719528198242188, 0.022289752960205078, 0.02385997772216797, 0.02543020248413086, 0.02700042724609375, 0.02857065200805664, 0.03014087677001953, 0.03171110153198242, 0.03328132629394531, 0.0348515510559082, 0.036421775817871094, 0.037992000579833984, 0.039562225341796875, 0.041132450103759766, 0.042702674865722656, 0.04427289962768555, 0.04584312438964844, 0.04741334915161133, 0.04898357391357422, 0.05055379867553711, 0.0521240234375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 9.0, 13.0, 19.0, 19.0, 17.0, 22.0, 21.0, 40.0, 24.0, 44.0, 43.0, 57.0, 52.0, 66.0, 56.0, 51.0, 45.0, 36.0, 50.0, 37.0, 30.0, 37.0, 36.0, 26.0, 18.0, 17.0, 13.0, 15.0, 14.0, 16.0, 6.0, 11.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0], "bins": [-1.584175705909729, -1.5413509607315063, -1.4985262155532837, -1.455701470375061, -1.412876844406128, -1.3700520992279053, -1.3272273540496826, -1.28440260887146, -1.2415778636932373, -1.1987531185150146, -1.155928373336792, -1.1131036281585693, -1.0702788829803467, -1.0274542570114136, -0.9846295118331909, -0.9418047666549683, -0.8989800214767456, -0.856155276298523, -0.8133305311203003, -0.7705058455467224, -0.7276811003684998, -0.6848563551902771, -0.6420316696166992, -0.5992069244384766, -0.5563821792602539, -0.5135574340820312, -0.470732718706131, -0.4279080033302307, -0.38508325815200806, -0.3422585129737854, -0.29943379759788513, -0.25660908222198486, -0.21378445625305176, -0.1709597259759903, -0.12813499569892883, -0.08531026542186737, -0.04248553514480591, 0.0003391951322555542, 0.04316392540931702, 0.08598864078521729, 0.12881338596343994, 0.1716381162405014, 0.21446284651756287, 0.25728756189346313, 0.3001123070716858, 0.34293705224990845, 0.3857617676258087, 0.428586483001709, 0.47141122817993164, 0.5142359733581543, 0.557060718536377, 0.5998854041099548, 0.6427101492881775, 0.6855348944664001, 0.728359580039978, 0.7711843252182007, 0.8140090703964233, 0.856833815574646, 0.8996585607528687, 0.9424832463264465, 0.9853079915046692, 1.028132677078247, 1.0709574222564697, 1.1137821674346924, 1.156606912612915]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 18.0, 15.0, 15.0, 19.0, 20.0, 16.0, 30.0, 32.0, 25.0, 26.0, 39.0, 32.0, 42.0, 36.0, 43.0, 35.0, 38.0, 31.0, 44.0, 46.0, 34.0, 38.0, 38.0, 29.0, 32.0, 35.0, 30.0, 25.0, 16.0, 14.0, 14.0, 11.0, 18.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8862427473068237, -0.8564247488975525, -0.8266066908836365, -0.7967886924743652, -0.766970694065094, -0.7371526956558228, -0.7073346376419067, -0.6775166392326355, -0.6476986408233643, -0.617880642414093, -0.588062584400177, -0.5582445859909058, -0.5284265875816345, -0.4986085593700409, -0.46879053115844727, -0.438972532749176, -0.40915447473526, -0.3793364465236664, -0.34951844811439514, -0.3197004199028015, -0.2898824214935303, -0.26006439328193665, -0.23024636507034302, -0.20042835175991058, -0.17061033844947815, -0.14079232513904572, -0.11097430437803268, -0.08115628361701965, -0.05133827030658722, -0.021520256996154785, 0.008297771215438843, 0.03811578452587128, 0.06793379783630371, 0.09775181114673615, 0.12756982445716858, 0.1573878526687622, 0.18720586597919464, 0.21702387928962708, 0.2468419075012207, 0.27665990591049194, 0.30647793412208557, 0.3362959623336792, 0.36611396074295044, 0.39593198895454407, 0.4257500171661377, 0.45556801557540894, 0.48538604378700256, 0.5152040719985962, 0.5450220704078674, 0.5748400688171387, 0.6046581268310547, 0.6344761252403259, 0.6642941236495972, 0.6941121816635132, 0.7239301800727844, 0.7537481784820557, 0.7835662364959717, 0.8133842349052429, 0.8432022929191589, 0.8730202913284302, 0.9028382897377014, 0.9326562881469727, 0.9624743461608887, 0.9922923445701599, 1.0221103429794312]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 13.0, 18.0, 34.0, 43.0, 58.0, 99.0, 186.0, 260.0, 451.0, 641.0, 1063.0, 1744.0, 2757.0, 4522.0, 7418.0, 11858.0, 18801.0, 29105.0, 43605.0, 62628.0, 84486.0, 104622.0, 119193.0, 122436.0, 113746.0, 95058.0, 73044.0, 52177.0, 35877.0, 23411.0, 14931.0, 9292.0, 5736.0, 3542.0, 2141.0, 1317.0, 812.0, 582.0, 305.0, 192.0, 133.0, 86.0, 49.0, 22.0, 24.0, 21.0, 6.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.984375, -0.9538497924804688, -0.9233245849609375, -0.8927993774414062, -0.862274169921875, -0.8317489624023438, -0.8012237548828125, -0.7706985473632812, -0.74017333984375, -0.7096481323242188, -0.6791229248046875, -0.6485977172851562, -0.618072509765625, -0.5875473022460938, -0.5570220947265625, -0.5264968872070312, -0.4959716796875, -0.46544647216796875, -0.4349212646484375, -0.40439605712890625, -0.373870849609375, -0.34334564208984375, -0.3128204345703125, -0.28229522705078125, -0.25177001953125, -0.22124481201171875, -0.1907196044921875, -0.16019439697265625, -0.129669189453125, -0.09914398193359375, -0.0686187744140625, -0.03809356689453125, -0.007568359375, 0.02295684814453125, 0.0534820556640625, 0.08400726318359375, 0.114532470703125, 0.14505767822265625, 0.1755828857421875, 0.20610809326171875, 0.23663330078125, 0.26715850830078125, 0.2976837158203125, 0.32820892333984375, 0.358734130859375, 0.38925933837890625, 0.4197845458984375, 0.45030975341796875, 0.4808349609375, 0.5113601684570312, 0.5418853759765625, 0.5724105834960938, 0.602935791015625, 0.6334609985351562, 0.6639862060546875, 0.6945114135742188, 0.72503662109375, 0.7555618286132812, 0.7860870361328125, 0.8166122436523438, 0.847137451171875, 0.8776626586914062, 0.9081878662109375, 0.9387130737304688, 0.96923828125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 11.0, 10.0, 16.0, 15.0, 24.0, 25.0, 24.0, 18.0, 29.0, 29.0, 33.0, 36.0, 35.0, 46.0, 43.0, 40.0, 48.0, 40.0, 42.0, 32.0, 59.0, 37.0, 30.0, 39.0, 28.0, 30.0, 31.0, 22.0, 22.0, 20.0, 8.0, 21.0, 12.0, 7.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0275115966796875, -0.993499755859375, -0.9594879150390625, -0.92547607421875, -0.8914642333984375, -0.857452392578125, -0.8234405517578125, -0.7894287109375, -0.7554168701171875, -0.721405029296875, -0.6873931884765625, -0.65338134765625, -0.6193695068359375, -0.585357666015625, -0.5513458251953125, -0.517333984375, -0.4833221435546875, -0.449310302734375, -0.4152984619140625, -0.38128662109375, -0.3472747802734375, -0.313262939453125, -0.2792510986328125, -0.2452392578125, -0.2112274169921875, -0.177215576171875, -0.1432037353515625, -0.10919189453125, -0.0751800537109375, -0.041168212890625, -0.0071563720703125, 0.02685546875, 0.0608673095703125, 0.094879150390625, 0.1288909912109375, 0.16290283203125, 0.1969146728515625, 0.230926513671875, 0.2649383544921875, 0.2989501953125, 0.3329620361328125, 0.366973876953125, 0.4009857177734375, 0.43499755859375, 0.4690093994140625, 0.503021240234375, 0.5370330810546875, 0.571044921875, 0.6050567626953125, 0.639068603515625, 0.6730804443359375, 0.70709228515625, 0.7411041259765625, 0.775115966796875, 0.8091278076171875, 0.8431396484375, 0.8771514892578125, 0.911163330078125, 0.9451751708984375, 0.97918701171875, 1.0131988525390625, 1.047210693359375, 1.0812225341796875, 1.115234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 13.0, 25.0, 32.0, 48.0, 76.0, 93.0, 169.0, 258.0, 371.0, 583.0, 909.0, 1389.0, 2217.0, 3487.0, 5229.0, 7921.0, 11858.0, 17735.0, 25076.0, 35306.0, 48511.0, 62575.0, 77501.0, 91774.0, 99311.0, 101884.0, 97625.0, 86166.0, 72361.0, 57289.0, 42784.0, 31079.0, 22028.0, 15110.0, 10146.0, 6871.0, 4430.0, 2935.0, 1878.0, 1200.0, 805.0, 515.0, 330.0, 209.0, 163.0, 97.0, 74.0, 39.0, 26.0, 16.0, 4.0, 7.0, 9.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.83984375, -0.8138504028320312, -0.7878570556640625, -0.7618637084960938, -0.735870361328125, -0.7098770141601562, -0.6838836669921875, -0.6578903198242188, -0.63189697265625, -0.6059036254882812, -0.5799102783203125, -0.5539169311523438, -0.527923583984375, -0.5019302368164062, -0.4759368896484375, -0.44994354248046875, -0.4239501953125, -0.39795684814453125, -0.3719635009765625, -0.34597015380859375, -0.319976806640625, -0.29398345947265625, -0.2679901123046875, -0.24199676513671875, -0.21600341796875, -0.19001007080078125, -0.1640167236328125, -0.13802337646484375, -0.112030029296875, -0.08603668212890625, -0.0600433349609375, -0.03404998779296875, -0.008056640625, 0.01793670654296875, 0.0439300537109375, 0.06992340087890625, 0.095916748046875, 0.12191009521484375, 0.1479034423828125, 0.17389678955078125, 0.19989013671875, 0.22588348388671875, 0.2518768310546875, 0.27787017822265625, 0.303863525390625, 0.32985687255859375, 0.3558502197265625, 0.38184356689453125, 0.4078369140625, 0.43383026123046875, 0.4598236083984375, 0.48581695556640625, 0.511810302734375, 0.5378036499023438, 0.5637969970703125, 0.5897903442382812, 0.61578369140625, 0.6417770385742188, 0.6677703857421875, 0.6937637329101562, 0.719757080078125, 0.7457504272460938, 0.7717437744140625, 0.7977371215820312, 0.82373046875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 6.0, 3.0, 6.0, 6.0, 8.0, 3.0, 6.0, 11.0, 9.0, 11.0, 12.0, 17.0, 8.0, 18.0, 20.0, 24.0, 21.0, 18.0, 28.0, 24.0, 37.0, 41.0, 42.0, 35.0, 34.0, 35.0, 39.0, 45.0, 25.0, 37.0, 31.0, 17.0, 29.0, 31.0, 35.0, 16.0, 30.0, 22.0, 25.0, 18.0, 18.0, 11.0, 8.0, 11.0, 13.0, 5.0, 10.0, 12.0, 9.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.50830078125, -0.49228668212890625, -0.4762725830078125, -0.46025848388671875, -0.444244384765625, -0.42823028564453125, -0.4122161865234375, -0.39620208740234375, -0.38018798828125, -0.36417388916015625, -0.3481597900390625, -0.33214569091796875, -0.316131591796875, -0.30011749267578125, -0.2841033935546875, -0.26808929443359375, -0.2520751953125, -0.23606109619140625, -0.2200469970703125, -0.20403289794921875, -0.188018798828125, -0.17200469970703125, -0.1559906005859375, -0.13997650146484375, -0.12396240234375, -0.10794830322265625, -0.0919342041015625, -0.07592010498046875, -0.059906005859375, -0.04389190673828125, -0.0278778076171875, -0.01186370849609375, 0.004150390625, 0.02016448974609375, 0.0361785888671875, 0.05219268798828125, 0.068206787109375, 0.08422088623046875, 0.1002349853515625, 0.11624908447265625, 0.13226318359375, 0.14827728271484375, 0.1642913818359375, 0.18030548095703125, 0.196319580078125, 0.21233367919921875, 0.2283477783203125, 0.24436187744140625, 0.2603759765625, 0.27639007568359375, 0.2924041748046875, 0.30841827392578125, 0.324432373046875, 0.34044647216796875, 0.3564605712890625, 0.37247467041015625, 0.38848876953125, 0.40450286865234375, 0.4205169677734375, 0.43653106689453125, 0.452545166015625, 0.46855926513671875, 0.4845733642578125, 0.5005874633789062, 0.5166015625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 7.0, 8.0, 17.0, 7.0, 26.0, 25.0, 39.0, 47.0, 53.0, 87.0, 127.0, 155.0, 224.0, 259.0, 396.0, 487.0, 733.0, 993.0, 1545.0, 2065.0, 3362.0, 5792.0, 14319.0, 62424.0, 326381.0, 465670.0, 120042.0, 23139.0, 7778.0, 3985.0, 2439.0, 1718.0, 1154.0, 826.0, 591.0, 425.0, 306.0, 235.0, 167.0, 123.0, 91.0, 74.0, 55.0, 41.0, 30.0, 23.0, 21.0, 16.0, 14.0, 7.0, 3.0, 5.0, 3.0], "bins": [-2.533203125, -2.46319580078125, -2.3931884765625, -2.32318115234375, -2.253173828125, -2.18316650390625, -2.1131591796875, -2.04315185546875, -1.97314453125, -1.90313720703125, -1.8331298828125, -1.76312255859375, -1.693115234375, -1.62310791015625, -1.5531005859375, -1.48309326171875, -1.4130859375, -1.34307861328125, -1.2730712890625, -1.20306396484375, -1.133056640625, -1.06304931640625, -0.9930419921875, -0.92303466796875, -0.85302734375, -0.78302001953125, -0.7130126953125, -0.64300537109375, -0.572998046875, -0.50299072265625, -0.4329833984375, -0.36297607421875, -0.29296875, -0.22296142578125, -0.1529541015625, -0.08294677734375, -0.012939453125, 0.05706787109375, 0.1270751953125, 0.19708251953125, 0.26708984375, 0.33709716796875, 0.4071044921875, 0.47711181640625, 0.547119140625, 0.61712646484375, 0.6871337890625, 0.75714111328125, 0.8271484375, 0.89715576171875, 0.9671630859375, 1.03717041015625, 1.107177734375, 1.17718505859375, 1.2471923828125, 1.31719970703125, 1.38720703125, 1.45721435546875, 1.5272216796875, 1.59722900390625, 1.667236328125, 1.73724365234375, 1.8072509765625, 1.87725830078125, 1.947265625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 15.0, 28.0, 52.0, 81.0, 166.0, 194.0, 164.0, 116.0, 82.0, 34.0, 20.0, 11.0, 7.0, 6.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021147727966308594, -0.0002046283334493637, -0.00019777938723564148, -0.00019093044102191925, -0.00018408149480819702, -0.0001772325485944748, -0.00017038360238075256, -0.00016353465616703033, -0.0001566857099533081, -0.00014983676373958588, -0.00014298781752586365, -0.00013613887131214142, -0.0001292899250984192, -0.00012244097888469696, -0.00011559203267097473, -0.0001087430864572525, -0.00010189414024353027, -9.504519402980804e-05, -8.819624781608582e-05, -8.134730160236359e-05, -7.449835538864136e-05, -6.764940917491913e-05, -6.08004629611969e-05, -5.395151674747467e-05, -4.710257053375244e-05, -4.025362432003021e-05, -3.3404678106307983e-05, -2.6555731892585754e-05, -1.9706785678863525e-05, -1.2857839465141296e-05, -6.008893251419067e-06, 8.400529623031616e-07, 7.68899917602539e-06, 1.453794538974762e-05, 2.138689160346985e-05, 2.8235837817192078e-05, 3.508478403091431e-05, 4.1933730244636536e-05, 4.8782676458358765e-05, 5.5631622672080994e-05, 6.248056888580322e-05, 6.932951509952545e-05, 7.617846131324768e-05, 8.302740752696991e-05, 8.987635374069214e-05, 9.672529995441437e-05, 0.0001035742461681366, 0.00011042319238185883, 0.00011727213859558105, 0.00012412108480930328, 0.0001309700310230255, 0.00013781897723674774, 0.00014466792345046997, 0.0001515168696641922, 0.00015836581587791443, 0.00016521476209163666, 0.0001720637083053589, 0.00017891265451908112, 0.00018576160073280334, 0.00019261054694652557, 0.0001994594931602478, 0.00020630843937397003, 0.00021315738558769226, 0.0002200063318014145, 0.00022685527801513672]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 7.0, 9.0, 8.0, 8.0, 20.0, 22.0, 34.0, 45.0, 82.0, 109.0, 167.0, 227.0, 401.0, 532.0, 804.0, 1270.0, 2045.0, 3555.0, 8269.0, 31062.0, 166683.0, 480473.0, 274360.0, 54881.0, 12088.0, 4607.0, 2537.0, 1476.0, 958.0, 593.0, 424.0, 236.0, 181.0, 107.0, 79.0, 47.0, 43.0, 32.0, 26.0, 19.0, 8.0, 8.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.306640625, -2.241973876953125, -2.17730712890625, -2.112640380859375, -2.0479736328125, -1.983306884765625, -1.91864013671875, -1.853973388671875, -1.789306640625, -1.724639892578125, -1.65997314453125, -1.595306396484375, -1.5306396484375, -1.465972900390625, -1.40130615234375, -1.336639404296875, -1.27197265625, -1.207305908203125, -1.14263916015625, -1.077972412109375, -1.0133056640625, -0.948638916015625, -0.88397216796875, -0.819305419921875, -0.754638671875, -0.689971923828125, -0.62530517578125, -0.560638427734375, -0.4959716796875, -0.431304931640625, -0.36663818359375, -0.301971435546875, -0.2373046875, -0.172637939453125, -0.10797119140625, -0.043304443359375, 0.0213623046875, 0.086029052734375, 0.15069580078125, 0.215362548828125, 0.280029296875, 0.344696044921875, 0.40936279296875, 0.474029541015625, 0.5386962890625, 0.603363037109375, 0.66802978515625, 0.732696533203125, 0.79736328125, 0.862030029296875, 0.92669677734375, 0.991363525390625, 1.0560302734375, 1.120697021484375, 1.18536376953125, 1.250030517578125, 1.314697265625, 1.379364013671875, 1.44403076171875, 1.508697509765625, 1.5733642578125, 1.638031005859375, 1.70269775390625, 1.767364501953125, 1.83203125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 10.0, 7.0, 12.0, 16.0, 17.0, 26.0, 34.0, 42.0, 59.0, 56.0, 73.0, 74.0, 65.0, 84.0, 84.0, 82.0, 69.0, 46.0, 39.0, 21.0, 25.0, 14.0, 11.0, 9.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212646484375, -0.20475387573242188, -0.19686126708984375, -0.18896865844726562, -0.1810760498046875, -0.17318344116210938, -0.16529083251953125, -0.15739822387695312, -0.149505615234375, -0.14161300659179688, -0.13372039794921875, -0.12582778930664062, -0.1179351806640625, -0.11004257202148438, -0.10214996337890625, -0.09425735473632812, -0.08636474609375, -0.07847213745117188, -0.07057952880859375, -0.06268692016601562, -0.0547943115234375, -0.046901702880859375, -0.03900909423828125, -0.031116485595703125, -0.023223876953125, -0.015331268310546875, -0.00743865966796875, 0.000453948974609375, 0.0083465576171875, 0.016239166259765625, 0.02413177490234375, 0.032024383544921875, 0.0399169921875, 0.047809600830078125, 0.05570220947265625, 0.06359481811523438, 0.0714874267578125, 0.07938003540039062, 0.08727264404296875, 0.09516525268554688, 0.103057861328125, 0.11095046997070312, 0.11884307861328125, 0.12673568725585938, 0.1346282958984375, 0.14252090454101562, 0.15041351318359375, 0.15830612182617188, 0.16619873046875, 0.17409133911132812, 0.18198394775390625, 0.18987655639648438, 0.1977691650390625, 0.20566177368164062, 0.21355438232421875, 0.22144699096679688, 0.229339599609375, 0.23723220825195312, 0.24512481689453125, 0.2530174255371094, 0.2609100341796875, 0.2688026428222656, 0.27669525146484375, 0.2845878601074219, 0.29248046875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 8.0, 10.0, 12.0, 13.0, 14.0, 29.0, 28.0, 28.0, 33.0, 39.0, 41.0, 51.0, 48.0, 54.0, 55.0, 65.0, 56.0, 51.0, 36.0, 51.0, 37.0, 39.0, 32.0, 22.0, 26.0, 21.0, 23.0, 17.0, 10.0, 8.0, 3.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.5890384912490845, -1.5426957607269287, -1.496353030204773, -1.4500102996826172, -1.4036675691604614, -1.3573248386383057, -1.3109819889068604, -1.2646393775939941, -1.2182965278625488, -1.171953797340393, -1.1256110668182373, -1.0792683362960815, -1.0329256057739258, -0.98658287525177, -0.9402400851249695, -0.8938973546028137, -0.8475546836853027, -0.801211953163147, -0.7548692226409912, -0.7085264921188354, -0.6621837615966797, -0.6158410310745239, -0.5694982409477234, -0.5231555104255676, -0.47681277990341187, -0.4304700493812561, -0.38412731885910034, -0.3377845585346222, -0.29144182801246643, -0.24509909749031067, -0.19875633716583252, -0.15241360664367676, -0.10607099533081055, -0.05972825735807419, -0.01338551938533783, 0.032957226037979126, 0.07929995656013489, 0.12564268708229065, 0.1719854474067688, 0.21832817792892456, 0.2646709084510803, 0.3110136389732361, 0.35735636949539185, 0.40369912981987, 0.45004186034202576, 0.4963845908641815, 0.5427273511886597, 0.5890700817108154, 0.6354128122329712, 0.681755542755127, 0.7280982732772827, 0.7744410037994385, 0.8207837343215942, 0.86712646484375, 0.9134692549705505, 0.9598119854927063, 1.0061547756195068, 1.0524975061416626, 1.0988402366638184, 1.1451829671859741, 1.1915256977081299, 1.2378684282302856, 1.2842111587524414, 1.3305540084838867, 1.376896619796753]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 7.0, 10.0, 8.0, 18.0, 8.0, 20.0, 21.0, 15.0, 34.0, 37.0, 23.0, 34.0, 48.0, 26.0, 46.0, 38.0, 27.0, 58.0, 38.0, 42.0, 47.0, 46.0, 47.0, 28.0, 34.0, 40.0, 38.0, 18.0, 27.0, 20.0, 19.0, 15.0, 14.0, 10.0, 6.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.153900146484375, -1.1200770139694214, -1.0862538814544678, -1.0524308681488037, -1.01860773563385, -0.9847846031188965, -0.9509614706039429, -0.9171383380889893, -0.8833152651786804, -0.8494921326637268, -0.815669059753418, -0.7818459272384644, -0.7480227947235107, -0.7141997218132019, -0.6803765892982483, -0.6465535163879395, -0.6127303838729858, -0.5789072513580322, -0.5450841784477234, -0.5112610459327698, -0.47743794322013855, -0.4436148405075073, -0.4097917079925537, -0.3759686052799225, -0.34214550256729126, -0.30832239985466003, -0.2744992971420288, -0.2406761646270752, -0.20685306191444397, -0.17302995920181274, -0.13920684158802032, -0.1053837239742279, -0.07156062126159668, -0.03773751109838486, -0.003914400935173035, 0.029908709228038788, 0.06373181939125061, 0.09755492210388184, 0.13137803971767426, 0.16520115733146667, 0.1990242600440979, 0.23284736275672913, 0.26667046546936035, 0.30049359798431396, 0.3343167006969452, 0.3681398034095764, 0.40196293592453003, 0.43578603863716125, 0.4696091413497925, 0.5034322738647461, 0.5372553467750549, 0.5710784792900085, 0.6049015522003174, 0.638724684715271, 0.6725478172302246, 0.7063709497451782, 0.7401940226554871, 0.7740171551704407, 0.8078402280807495, 0.8416633605957031, 0.8754864931106567, 0.9093095660209656, 0.9431326985359192, 0.976955771446228, 1.0107789039611816]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 6.0, 12.0, 18.0, 34.0, 53.0, 88.0, 133.0, 229.0, 338.0, 530.0, 858.0, 1469.0, 2435.0, 4044.0, 6904.0, 11900.0, 20216.0, 35296.0, 61153.0, 104817.0, 176564.0, 285254.0, 423747.0, 563860.0, 633579.0, 591438.0, 462193.0, 318973.0, 200328.0, 120198.0, 69911.0, 40563.0, 23435.0, 13945.0, 7871.0, 4776.0, 2818.0, 1682.0, 1052.0, 608.0, 375.0, 231.0, 136.0, 88.0, 45.0, 27.0, 16.0, 14.0, 10.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.265625, -1.2279815673828125, -1.190338134765625, -1.1526947021484375, -1.11505126953125, -1.0774078369140625, -1.039764404296875, -1.0021209716796875, -0.9644775390625, -0.9268341064453125, -0.889190673828125, -0.8515472412109375, -0.81390380859375, -0.7762603759765625, -0.738616943359375, -0.7009735107421875, -0.663330078125, -0.6256866455078125, -0.588043212890625, -0.5503997802734375, -0.51275634765625, -0.4751129150390625, -0.437469482421875, -0.3998260498046875, -0.3621826171875, -0.3245391845703125, -0.286895751953125, -0.2492523193359375, -0.21160888671875, -0.1739654541015625, -0.136322021484375, -0.0986785888671875, -0.06103515625, -0.0233917236328125, 0.014251708984375, 0.0518951416015625, 0.08953857421875, 0.1271820068359375, 0.164825439453125, 0.2024688720703125, 0.2401123046875, 0.2777557373046875, 0.315399169921875, 0.3530426025390625, 0.39068603515625, 0.4283294677734375, 0.465972900390625, 0.5036163330078125, 0.541259765625, 0.5789031982421875, 0.616546630859375, 0.6541900634765625, 0.69183349609375, 0.7294769287109375, 0.767120361328125, 0.8047637939453125, 0.8424072265625, 0.8800506591796875, 0.917694091796875, 0.9553375244140625, 0.99298095703125, 1.0306243896484375, 1.068267822265625, 1.1059112548828125, 1.1435546875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 7.0, 5.0, 10.0, 15.0, 21.0, 19.0, 30.0, 28.0, 25.0, 26.0, 30.0, 28.0, 37.0, 45.0, 45.0, 44.0, 43.0, 47.0, 57.0, 51.0, 58.0, 36.0, 33.0, 30.0, 30.0, 23.0, 32.0, 25.0, 26.0, 13.0, 6.0, 17.0, 14.0, 8.0, 10.0, 6.0, 7.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.9404296875, -0.9123153686523438, -0.8842010498046875, -0.8560867309570312, -0.827972412109375, -0.7998580932617188, -0.7717437744140625, -0.7436294555664062, -0.71551513671875, -0.6874008178710938, -0.6592864990234375, -0.6311721801757812, -0.603057861328125, -0.5749435424804688, -0.5468292236328125, -0.5187149047851562, -0.4906005859375, -0.46248626708984375, -0.4343719482421875, -0.40625762939453125, -0.378143310546875, -0.35002899169921875, -0.3219146728515625, -0.29380035400390625, -0.26568603515625, -0.23757171630859375, -0.2094573974609375, -0.18134307861328125, -0.153228759765625, -0.12511444091796875, -0.0970001220703125, -0.06888580322265625, -0.040771484375, -0.01265716552734375, 0.0154571533203125, 0.04357147216796875, 0.071685791015625, 0.09980010986328125, 0.1279144287109375, 0.15602874755859375, 0.18414306640625, 0.21225738525390625, 0.2403717041015625, 0.26848602294921875, 0.296600341796875, 0.32471466064453125, 0.3528289794921875, 0.38094329833984375, 0.4090576171875, 0.43717193603515625, 0.4652862548828125, 0.49340057373046875, 0.521514892578125, 0.5496292114257812, 0.5777435302734375, 0.6058578491210938, 0.63397216796875, 0.6620864868164062, 0.6902008056640625, 0.7183151245117188, 0.746429443359375, 0.7745437622070312, 0.8026580810546875, 0.8307723999023438, 0.85888671875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 21.0, 27.0, 57.0, 73.0, 166.0, 238.0, 393.0, 785.0, 1107.0, 2026.0, 3309.0, 5889.0, 10196.0, 17635.0, 30827.0, 53391.0, 91300.0, 149651.0, 236105.0, 349679.0, 470769.0, 561428.0, 579443.0, 510425.0, 397337.0, 277121.0, 179294.0, 110597.0, 64992.0, 38232.0, 22053.0, 12648.0, 7146.0, 4113.0, 2403.0, 1389.0, 786.0, 492.0, 306.0, 164.0, 119.0, 69.0, 31.0, 21.0, 10.0, 10.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1825103759765625, -1.143341064453125, -1.1041717529296875, -1.06500244140625, -1.0258331298828125, -0.986663818359375, -0.9474945068359375, -0.9083251953125, -0.8691558837890625, -0.829986572265625, -0.7908172607421875, -0.75164794921875, -0.7124786376953125, -0.673309326171875, -0.6341400146484375, -0.594970703125, -0.5558013916015625, -0.516632080078125, -0.4774627685546875, -0.43829345703125, -0.3991241455078125, -0.359954833984375, -0.3207855224609375, -0.2816162109375, -0.2424468994140625, -0.203277587890625, -0.1641082763671875, -0.12493896484375, -0.0857696533203125, -0.046600341796875, -0.0074310302734375, 0.03173828125, 0.0709075927734375, 0.110076904296875, 0.1492462158203125, 0.18841552734375, 0.2275848388671875, 0.266754150390625, 0.3059234619140625, 0.3450927734375, 0.3842620849609375, 0.423431396484375, 0.4626007080078125, 0.50177001953125, 0.5409393310546875, 0.580108642578125, 0.6192779541015625, 0.658447265625, 0.6976165771484375, 0.736785888671875, 0.7759552001953125, 0.81512451171875, 0.8542938232421875, 0.893463134765625, 0.9326324462890625, 0.9718017578125, 1.0109710693359375, 1.050140380859375, 1.0893096923828125, 1.12847900390625, 1.1676483154296875, 1.206817626953125, 1.2459869384765625, 1.28515625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 10.0, 9.0, 17.0, 16.0, 21.0, 36.0, 44.0, 40.0, 53.0, 71.0, 92.0, 107.0, 91.0, 145.0, 128.0, 168.0, 178.0, 196.0, 188.0, 209.0, 218.0, 199.0, 219.0, 220.0, 196.0, 173.0, 160.0, 141.0, 143.0, 105.0, 82.0, 75.0, 77.0, 69.0, 31.0, 26.0, 20.0, 26.0, 17.0, 12.0, 11.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.400146484375, -0.3865547180175781, -0.37296295166015625, -0.3593711853027344, -0.3457794189453125, -0.3321876525878906, -0.31859588623046875, -0.3050041198730469, -0.291412353515625, -0.2778205871582031, -0.26422882080078125, -0.2506370544433594, -0.2370452880859375, -0.22345352172851562, -0.20986175537109375, -0.19626998901367188, -0.18267822265625, -0.16908645629882812, -0.15549468994140625, -0.14190292358398438, -0.1283111572265625, -0.11471939086914062, -0.10112762451171875, -0.08753585815429688, -0.073944091796875, -0.060352325439453125, -0.04676055908203125, -0.033168792724609375, -0.0195770263671875, -0.005985260009765625, 0.00760650634765625, 0.021198272705078125, 0.0347900390625, 0.048381805419921875, 0.06197357177734375, 0.07556533813476562, 0.0891571044921875, 0.10274887084960938, 0.11634063720703125, 0.12993240356445312, 0.143524169921875, 0.15711593627929688, 0.17070770263671875, 0.18429946899414062, 0.1978912353515625, 0.21148300170898438, 0.22507476806640625, 0.23866653442382812, 0.25225830078125, 0.2658500671386719, 0.27944183349609375, 0.2930335998535156, 0.3066253662109375, 0.3202171325683594, 0.33380889892578125, 0.3474006652832031, 0.360992431640625, 0.3745841979980469, 0.38817596435546875, 0.4017677307128906, 0.4153594970703125, 0.4289512634277344, 0.44254302978515625, 0.4561347961425781, 0.4697265625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 8.0, 3.0, 1.0, 8.0, 13.0, 13.0, 14.0, 21.0, 20.0, 29.0, 31.0, 34.0, 49.0, 51.0, 42.0, 44.0, 43.0, 55.0, 61.0, 64.0, 59.0, 60.0, 48.0, 42.0, 34.0, 24.0, 24.0, 23.0, 15.0, 12.0, 11.0, 10.0, 10.0, 8.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5419496297836304, -1.49064040184021, -1.4393311738967896, -1.3880219459533691, -1.3367127180099487, -1.2854034900665283, -1.234094262123108, -1.1827850341796875, -1.131475806236267, -1.0801665782928467, -1.0288573503494263, -0.9775481224060059, -0.9262388944625854, -0.874929666519165, -0.8236204385757446, -0.7723112106323242, -0.721001923084259, -0.6696926951408386, -0.6183834671974182, -0.5670742392539978, -0.5157650113105774, -0.4644557535648346, -0.4131465256214142, -0.3618372976779938, -0.31052806973457336, -0.25921884179115295, -0.20790961384773254, -0.15660037100315094, -0.10529114305973053, -0.053981900215148926, -0.0026726722717285156, 0.048636555671691895, 0.0999457836151123, 0.15125501155853271, 0.20256423950195312, 0.25387346744537354, 0.30518269538879395, 0.35649195313453674, 0.40780118107795715, 0.45911040902137756, 0.5104196071624756, 0.561728835105896, 0.6130380630493164, 0.6643472909927368, 0.7156565189361572, 0.7669657468795776, 0.818274974822998, 0.8695842027664185, 0.9208934903144836, 0.972202718257904, 1.0235120058059692, 1.0748212337493896, 1.12613046169281, 1.1774396896362305, 1.2287489175796509, 1.2800581455230713, 1.3313673734664917, 1.382676601409912, 1.4339858293533325, 1.485295057296753, 1.5366042852401733, 1.5879135131835938, 1.6392227411270142, 1.6905319690704346, 1.741841197013855]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 0.0, 10.0, 7.0, 9.0, 7.0, 13.0, 8.0, 16.0, 18.0, 18.0, 23.0, 32.0, 38.0, 37.0, 31.0, 34.0, 29.0, 39.0, 33.0, 41.0, 39.0, 38.0, 24.0, 37.0, 25.0, 48.0, 47.0, 40.0, 33.0, 36.0, 22.0, 22.0, 16.0, 19.0, 16.0, 22.0, 15.0, 12.0, 8.0, 4.0, 8.0, 6.0, 5.0, 2.0, 4.0, 0.0, 6.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.0659161806106567, -1.0348045825958252, -1.0036929845809937, -0.9725813865661621, -0.9414697885513306, -0.910358190536499, -0.8792465329170227, -0.8481349349021912, -0.8170233368873596, -0.7859117388725281, -0.7548001408576965, -0.723688542842865, -0.6925768852233887, -0.6614652872085571, -0.6303536891937256, -0.599242091178894, -0.5681304931640625, -0.537018895149231, -0.5059072971343994, -0.4747956693172455, -0.44368407130241394, -0.4125724732875824, -0.38146084547042847, -0.3503492474555969, -0.3192376494407654, -0.28812605142593384, -0.2570144534111023, -0.22590282559394836, -0.19479122757911682, -0.16367962956428528, -0.13256801664829254, -0.1014564037322998, -0.07034474611282349, -0.039233140647411346, -0.008121535181999207, 0.022990070283412933, 0.05410167574882507, 0.08521327376365662, 0.11632488667964935, 0.1474364995956421, 0.17854809761047363, 0.20965969562530518, 0.2407713085412979, 0.27188292145729065, 0.3029945194721222, 0.33410611748695374, 0.36521774530410767, 0.3963293433189392, 0.42744094133377075, 0.4585525393486023, 0.48966413736343384, 0.5207757353782654, 0.5518873929977417, 0.5829989910125732, 0.6141105890274048, 0.6452221870422363, 0.6763337850570679, 0.7074453830718994, 0.738556981086731, 0.7696685791015625, 0.800780177116394, 0.8318917751312256, 0.8630034327507019, 0.8941150307655334, 0.925226628780365]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 5.0, 10.0, 21.0, 20.0, 36.0, 48.0, 81.0, 101.0, 197.0, 289.0, 464.0, 776.0, 1383.0, 2312.0, 4198.0, 7676.0, 14496.0, 28443.0, 54446.0, 105623.0, 185868.0, 241308.0, 183822.0, 104303.0, 53288.0, 27486.0, 14362.0, 7641.0, 4094.0, 2366.0, 1313.0, 816.0, 455.0, 271.0, 176.0, 127.0, 64.0, 51.0, 27.0, 23.0, 19.0, 13.0, 8.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.404052734375, -0.3912200927734375, -0.378387451171875, -0.3655548095703125, -0.35272216796875, -0.3398895263671875, -0.327056884765625, -0.3142242431640625, -0.3013916015625, -0.2885589599609375, -0.275726318359375, -0.2628936767578125, -0.25006103515625, -0.2372283935546875, -0.224395751953125, -0.2115631103515625, -0.19873046875, -0.1858978271484375, -0.173065185546875, -0.1602325439453125, -0.14739990234375, -0.1345672607421875, -0.121734619140625, -0.1089019775390625, -0.0960693359375, -0.0832366943359375, -0.070404052734375, -0.0575714111328125, -0.04473876953125, -0.0319061279296875, -0.019073486328125, -0.0062408447265625, 0.006591796875, 0.0194244384765625, 0.032257080078125, 0.0450897216796875, 0.05792236328125, 0.0707550048828125, 0.083587646484375, 0.0964202880859375, 0.1092529296875, 0.1220855712890625, 0.134918212890625, 0.1477508544921875, 0.16058349609375, 0.1734161376953125, 0.186248779296875, 0.1990814208984375, 0.2119140625, 0.2247467041015625, 0.237579345703125, 0.2504119873046875, 0.26324462890625, 0.2760772705078125, 0.288909912109375, 0.3017425537109375, 0.3145751953125, 0.3274078369140625, 0.340240478515625, 0.3530731201171875, 0.36590576171875, 0.3787384033203125, 0.391571044921875, 0.4044036865234375, 0.417236328125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 10.0, 8.0, 24.0, 25.0, 19.0, 31.0, 25.0, 32.0, 52.0, 36.0, 36.0, 43.0, 41.0, 42.0, 46.0, 41.0, 43.0, 44.0, 43.0, 44.0, 42.0, 41.0, 36.0, 38.0, 21.0, 19.0, 18.0, 19.0, 25.0, 8.0, 9.0, 5.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.318359375, -1.277587890625, -1.23681640625, -1.196044921875, -1.1552734375, -1.114501953125, -1.07373046875, -1.032958984375, -0.9921875, -0.951416015625, -0.91064453125, -0.869873046875, -0.8291015625, -0.788330078125, -0.74755859375, -0.706787109375, -0.666015625, -0.625244140625, -0.58447265625, -0.543701171875, -0.5029296875, -0.462158203125, -0.42138671875, -0.380615234375, -0.33984375, -0.299072265625, -0.25830078125, -0.217529296875, -0.1767578125, -0.135986328125, -0.09521484375, -0.054443359375, -0.013671875, 0.027099609375, 0.06787109375, 0.108642578125, 0.1494140625, 0.190185546875, 0.23095703125, 0.271728515625, 0.3125, 0.353271484375, 0.39404296875, 0.434814453125, 0.4755859375, 0.516357421875, 0.55712890625, 0.597900390625, 0.638671875, 0.679443359375, 0.72021484375, 0.760986328125, 0.8017578125, 0.842529296875, 0.88330078125, 0.924072265625, 0.96484375, 1.005615234375, 1.04638671875, 1.087158203125, 1.1279296875, 1.168701171875, 1.20947265625, 1.250244140625, 1.291015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 12.0, 24.0, 25.0, 58.0, 77.0, 111.0, 167.0, 244.0, 331.0, 498.0, 861.0, 1489.0, 2551.0, 5101.0, 9958.0, 21089.0, 45580.0, 99574.0, 198390.0, 276317.0, 197932.0, 99271.0, 46143.0, 21146.0, 10069.0, 4889.0, 2702.0, 1481.0, 866.0, 529.0, 335.0, 214.0, 157.0, 94.0, 70.0, 51.0, 31.0, 31.0, 20.0, 14.0, 5.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.53369140625, -0.5190696716308594, -0.5044479370117188, -0.4898262023925781, -0.4752044677734375, -0.4605827331542969, -0.44596099853515625, -0.4313392639160156, -0.416717529296875, -0.4020957946777344, -0.38747406005859375, -0.3728523254394531, -0.3582305908203125, -0.3436088562011719, -0.32898712158203125, -0.3143653869628906, -0.29974365234375, -0.2851219177246094, -0.27050018310546875, -0.2558784484863281, -0.2412567138671875, -0.22663497924804688, -0.21201324462890625, -0.19739151000976562, -0.182769775390625, -0.16814804077148438, -0.15352630615234375, -0.13890457153320312, -0.1242828369140625, -0.10966110229492188, -0.09503936767578125, -0.08041763305664062, -0.0657958984375, -0.051174163818359375, -0.03655242919921875, -0.021930694580078125, -0.0073089599609375, 0.007312774658203125, 0.02193450927734375, 0.036556243896484375, 0.051177978515625, 0.06579971313476562, 0.08042144775390625, 0.09504318237304688, 0.1096649169921875, 0.12428665161132812, 0.13890838623046875, 0.15353012084960938, 0.16815185546875, 0.18277359008789062, 0.19739532470703125, 0.21201705932617188, 0.2266387939453125, 0.24126052856445312, 0.25588226318359375, 0.2705039978027344, 0.285125732421875, 0.2997474670410156, 0.31436920166015625, 0.3289909362792969, 0.3436126708984375, 0.3582344055175781, 0.37285614013671875, 0.3874778747558594, 0.402099609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 3.0, 7.0, 2.0, 9.0, 7.0, 13.0, 7.0, 20.0, 13.0, 31.0, 22.0, 28.0, 24.0, 21.0, 31.0, 22.0, 16.0, 33.0, 33.0, 33.0, 44.0, 38.0, 37.0, 46.0, 37.0, 39.0, 47.0, 31.0, 28.0, 27.0, 24.0, 25.0, 21.0, 26.0, 23.0, 18.0, 23.0, 12.0, 12.0, 14.0, 10.0, 10.0, 6.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.56787109375, -0.5485000610351562, -0.5291290283203125, -0.5097579956054688, -0.490386962890625, -0.47101593017578125, -0.4516448974609375, -0.43227386474609375, -0.41290283203125, -0.39353179931640625, -0.3741607666015625, -0.35478973388671875, -0.335418701171875, -0.31604766845703125, -0.2966766357421875, -0.27730560302734375, -0.2579345703125, -0.23856353759765625, -0.2191925048828125, -0.19982147216796875, -0.180450439453125, -0.16107940673828125, -0.1417083740234375, -0.12233734130859375, -0.10296630859375, -0.08359527587890625, -0.0642242431640625, -0.04485321044921875, -0.025482177734375, -0.00611114501953125, 0.0132598876953125, 0.03263092041015625, 0.052001953125, 0.07137298583984375, 0.0907440185546875, 0.11011505126953125, 0.129486083984375, 0.14885711669921875, 0.1682281494140625, 0.18759918212890625, 0.20697021484375, 0.22634124755859375, 0.2457122802734375, 0.26508331298828125, 0.284454345703125, 0.30382537841796875, 0.3231964111328125, 0.34256744384765625, 0.3619384765625, 0.38130950927734375, 0.4006805419921875, 0.42005157470703125, 0.439422607421875, 0.45879364013671875, 0.4781646728515625, 0.49753570556640625, 0.51690673828125, 0.5362777709960938, 0.5556488037109375, 0.5750198364257812, 0.594390869140625, 0.6137619018554688, 0.6331329345703125, 0.6525039672851562, 0.671875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 7.0, 2.0, 16.0, 14.0, 34.0, 35.0, 45.0, 63.0, 93.0, 155.0, 224.0, 306.0, 520.0, 867.0, 1549.0, 3290.0, 8701.0, 36064.0, 429811.0, 509021.0, 40619.0, 9380.0, 3567.0, 1655.0, 952.0, 524.0, 364.0, 206.0, 135.0, 108.0, 70.0, 43.0, 32.0, 21.0, 13.0, 10.0, 9.0, 11.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.59375, -0.5768013000488281, -0.5598526000976562, -0.5429039001464844, -0.5259552001953125, -0.5090065002441406, -0.49205780029296875, -0.4751091003417969, -0.458160400390625, -0.4412117004394531, -0.42426300048828125, -0.4073143005371094, -0.3903656005859375, -0.3734169006347656, -0.35646820068359375, -0.3395195007324219, -0.32257080078125, -0.3056221008300781, -0.28867340087890625, -0.2717247009277344, -0.2547760009765625, -0.23782730102539062, -0.22087860107421875, -0.20392990112304688, -0.186981201171875, -0.17003250122070312, -0.15308380126953125, -0.13613510131835938, -0.1191864013671875, -0.10223770141601562, -0.08528900146484375, -0.06834030151367188, -0.0513916015625, -0.034442901611328125, -0.01749420166015625, -0.000545501708984375, 0.0164031982421875, 0.033351898193359375, 0.05030059814453125, 0.06724929809570312, 0.084197998046875, 0.10114669799804688, 0.11809539794921875, 0.13504409790039062, 0.1519927978515625, 0.16894149780273438, 0.18589019775390625, 0.20283889770507812, 0.21978759765625, 0.23673629760742188, 0.25368499755859375, 0.2706336975097656, 0.2875823974609375, 0.3045310974121094, 0.32147979736328125, 0.3384284973144531, 0.355377197265625, 0.3723258972167969, 0.38927459716796875, 0.4062232971191406, 0.4231719970703125, 0.4401206970214844, 0.45706939697265625, 0.4740180969238281, 0.490966796875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 11.0, 12.0, 20.0, 54.0, 67.0, 94.0, 115.0, 132.0, 110.0, 125.0, 87.0, 68.0, 33.0, 26.0, 21.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7060508728027344e-05, -2.623721957206726e-05, -2.5413930416107178e-05, -2.4590641260147095e-05, -2.3767352104187012e-05, -2.294406294822693e-05, -2.2120773792266846e-05, -2.1297484636306763e-05, -2.047419548034668e-05, -1.9650906324386597e-05, -1.8827617168426514e-05, -1.800432801246643e-05, -1.7181038856506348e-05, -1.6357749700546265e-05, -1.553446054458618e-05, -1.4711171388626099e-05, -1.3887882232666016e-05, -1.3064593076705933e-05, -1.224130392074585e-05, -1.1418014764785767e-05, -1.0594725608825684e-05, -9.7714364528656e-06, -8.948147296905518e-06, -8.124858140945435e-06, -7.3015689849853516e-06, -6.4782798290252686e-06, -5.6549906730651855e-06, -4.8317015171051025e-06, -4.0084123611450195e-06, -3.1851232051849365e-06, -2.3618340492248535e-06, -1.5385448932647705e-06, -7.152557373046875e-07, 1.0803341865539551e-07, 9.313225746154785e-07, 1.7546117305755615e-06, 2.5779008865356445e-06, 3.4011900424957275e-06, 4.2244791984558105e-06, 5.0477683544158936e-06, 5.8710575103759766e-06, 6.6943466663360596e-06, 7.517635822296143e-06, 8.340924978256226e-06, 9.164214134216309e-06, 9.987503290176392e-06, 1.0810792446136475e-05, 1.1634081602096558e-05, 1.245737075805664e-05, 1.3280659914016724e-05, 1.4103949069976807e-05, 1.492723822593689e-05, 1.5750527381896973e-05, 1.6573816537857056e-05, 1.739710569381714e-05, 1.822039484977722e-05, 1.9043684005737305e-05, 1.9866973161697388e-05, 2.069026231765747e-05, 2.1513551473617554e-05, 2.2336840629577637e-05, 2.316012978553772e-05, 2.3983418941497803e-05, 2.4806708097457886e-05, 2.562999725341797e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 10.0, 7.0, 14.0, 26.0, 21.0, 38.0, 59.0, 56.0, 104.0, 129.0, 162.0, 249.0, 270.0, 353.0, 460.0, 659.0, 885.0, 1273.0, 1744.0, 2701.0, 4083.0, 7419.0, 15063.0, 36196.0, 98868.0, 284753.0, 360898.0, 139700.0, 48294.0, 19614.0, 9155.0, 5025.0, 3056.0, 1934.0, 1379.0, 998.0, 696.0, 548.0, 439.0, 302.0, 224.0, 178.0, 109.0, 118.0, 72.0, 68.0, 41.0, 34.0, 25.0, 19.0, 12.0, 7.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2734375, -0.2649345397949219, -0.25643157958984375, -0.24792861938476562, -0.2394256591796875, -0.23092269897460938, -0.22241973876953125, -0.21391677856445312, -0.205413818359375, -0.19691085815429688, -0.18840789794921875, -0.17990493774414062, -0.1714019775390625, -0.16289901733398438, -0.15439605712890625, -0.14589309692382812, -0.13739013671875, -0.12888717651367188, -0.12038421630859375, -0.11188125610351562, -0.1033782958984375, -0.09487533569335938, -0.08637237548828125, -0.07786941528320312, -0.069366455078125, -0.060863494873046875, -0.05236053466796875, -0.043857574462890625, -0.0353546142578125, -0.026851654052734375, -0.01834869384765625, -0.009845733642578125, -0.0013427734375, 0.007160186767578125, 0.01566314697265625, 0.024166107177734375, 0.0326690673828125, 0.041172027587890625, 0.04967498779296875, 0.058177947998046875, 0.066680908203125, 0.07518386840820312, 0.08368682861328125, 0.09218978881835938, 0.1006927490234375, 0.10919570922851562, 0.11769866943359375, 0.12620162963867188, 0.13470458984375, 0.14320755004882812, 0.15171051025390625, 0.16021347045898438, 0.1687164306640625, 0.17721939086914062, 0.18572235107421875, 0.19422531127929688, 0.202728271484375, 0.21123123168945312, 0.21973419189453125, 0.22823715209960938, 0.2367401123046875, 0.24524307250976562, 0.25374603271484375, 0.2622489929199219, 0.270751953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 12.0, 16.0, 25.0, 65.0, 80.0, 151.0, 188.0, 150.0, 119.0, 59.0, 40.0, 23.0, 15.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11114501953125, -0.10774517059326172, -0.10434532165527344, -0.10094547271728516, -0.09754562377929688, -0.0941457748413086, -0.09074592590332031, -0.08734607696533203, -0.08394622802734375, -0.08054637908935547, -0.07714653015136719, -0.0737466812133789, -0.07034683227539062, -0.06694698333740234, -0.06354713439941406, -0.06014728546142578, -0.0567474365234375, -0.05334758758544922, -0.04994773864746094, -0.046547889709472656, -0.043148040771484375, -0.039748191833496094, -0.03634834289550781, -0.03294849395751953, -0.02954864501953125, -0.02614879608154297, -0.022748947143554688, -0.019349098205566406, -0.015949249267578125, -0.012549400329589844, -0.009149551391601562, -0.005749702453613281, -0.002349853515625, 0.0010499954223632812, 0.0044498443603515625, 0.007849693298339844, 0.011249542236328125, 0.014649391174316406, 0.018049240112304688, 0.02144908905029297, 0.02484893798828125, 0.02824878692626953, 0.03164863586425781, 0.035048484802246094, 0.038448333740234375, 0.041848182678222656, 0.04524803161621094, 0.04864788055419922, 0.0520477294921875, 0.05544757843017578, 0.05884742736816406, 0.062247276306152344, 0.06564712524414062, 0.0690469741821289, 0.07244682312011719, 0.07584667205810547, 0.07924652099609375, 0.08264636993408203, 0.08604621887207031, 0.0894460678100586, 0.09284591674804688, 0.09624576568603516, 0.09964561462402344, 0.10304546356201172, 0.1064453125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 5.0, 3.0, 9.0, 10.0, 17.0, 13.0, 16.0, 27.0, 27.0, 23.0, 40.0, 51.0, 56.0, 40.0, 43.0, 40.0, 57.0, 57.0, 69.0, 62.0, 64.0, 47.0, 32.0, 33.0, 28.0, 18.0, 27.0, 16.0, 11.0, 12.0, 11.0, 8.0, 7.0, 3.0, 3.0, 6.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5451518297195435, -1.4936035871505737, -1.442055344581604, -1.3905071020126343, -1.3389588594436646, -1.2874106168746948, -1.2358622550964355, -1.1843140125274658, -1.132765769958496, -1.0812175273895264, -1.0296692848205566, -0.9781210422515869, -0.9265727996826172, -0.8750245571136475, -0.823476254940033, -0.7719280123710632, -0.7203798294067383, -0.6688315868377686, -0.6172833442687988, -0.5657351016998291, -0.5141868591308594, -0.46263858675956726, -0.41109031438827515, -0.3595420718193054, -0.3079938292503357, -0.25644558668136597, -0.20489732921123505, -0.15334907174110413, -0.1018008291721344, -0.05025258660316467, 0.0012956857681274414, 0.05284392833709717, 0.10439229011535645, 0.15594053268432617, 0.2074887901544571, 0.259037047624588, 0.31058529019355774, 0.36213353276252747, 0.4136818051338196, 0.4652300477027893, 0.516778290271759, 0.5683265328407288, 0.6198747754096985, 0.671423077583313, 0.7229713201522827, 0.7745195627212524, 0.8260678052902222, 0.8776160478591919, 0.9291642904281616, 0.9807125329971313, 1.032260775566101, 1.0838090181350708, 1.1353572607040405, 1.1869055032730103, 1.2384538650512695, 1.2900021076202393, 1.341550350189209, 1.3930985927581787, 1.4446468353271484, 1.4961950778961182, 1.547743320465088, 1.5992915630340576, 1.6508398056030273, 1.702388048171997, 1.7539362907409668]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 9.0, 5.0, 8.0, 8.0, 9.0, 10.0, 15.0, 23.0, 14.0, 26.0, 29.0, 34.0, 39.0, 35.0, 38.0, 22.0, 40.0, 37.0, 42.0, 35.0, 41.0, 28.0, 32.0, 28.0, 50.0, 43.0, 40.0, 39.0, 31.0, 30.0, 14.0, 25.0, 14.0, 17.0, 19.0, 15.0, 14.0, 5.0, 6.0, 10.0, 3.0, 3.0, 4.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.084733486175537, -1.0531185865402222, -1.0215036869049072, -0.9898887872695923, -0.9582739472389221, -0.9266590476036072, -0.8950441479682922, -0.8634292483329773, -0.8318144083023071, -0.8001995086669922, -0.7685846090316772, -0.7369697093963623, -0.7053548693656921, -0.6737399697303772, -0.6421250700950623, -0.6105101704597473, -0.5788952708244324, -0.5472803711891174, -0.5156654715538025, -0.48405060172080994, -0.4524357318878174, -0.42082083225250244, -0.3892059326171875, -0.35759103298187256, -0.32597616314888, -0.29436126351356506, -0.2627463936805725, -0.23113149404525757, -0.19951660931110382, -0.16790172457695007, -0.13628682494163513, -0.10467194020748138, -0.07305705547332764, -0.04144216701388359, -0.009827278554439545, 0.0217876136302948, 0.05340249836444855, 0.0850173830986023, 0.11663228273391724, 0.14824716746807098, 0.17986205220222473, 0.21147693693637848, 0.24309182167053223, 0.27470672130584717, 0.3063216209411621, 0.33793649077415466, 0.3695513904094696, 0.40116626024246216, 0.4327811598777771, 0.46439605951309204, 0.4960109293460846, 0.5276257991790771, 0.5592406988143921, 0.590855598449707, 0.622470498085022, 0.6540853977203369, 0.6857002973556519, 0.7173151969909668, 0.7489300966262817, 0.7805449962615967, 0.8121598362922668, 0.8437747359275818, 0.8753896355628967, 0.9070045351982117, 0.9386193752288818]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 6.0, 5.0, 12.0, 13.0, 12.0, 23.0, 36.0, 49.0, 92.0, 137.0, 210.0, 384.0, 712.0, 1241.0, 2273.0, 4014.0, 7296.0, 13048.0, 22807.0, 38352.0, 61084.0, 91232.0, 122152.0, 143329.0, 145623.0, 127589.0, 97427.0, 67908.0, 42830.0, 25478.0, 14627.0, 8248.0, 4399.0, 2518.0, 1425.0, 834.0, 477.0, 242.0, 149.0, 97.0, 50.0, 38.0, 25.0, 15.0, 15.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.015777587890625, -0.97686767578125, -0.937957763671875, -0.8990478515625, -0.860137939453125, -0.82122802734375, -0.782318115234375, -0.743408203125, -0.704498291015625, -0.66558837890625, -0.626678466796875, -0.5877685546875, -0.548858642578125, -0.50994873046875, -0.471038818359375, -0.43212890625, -0.393218994140625, -0.35430908203125, -0.315399169921875, -0.2764892578125, -0.237579345703125, -0.19866943359375, -0.159759521484375, -0.120849609375, -0.081939697265625, -0.04302978515625, -0.004119873046875, 0.0347900390625, 0.073699951171875, 0.11260986328125, 0.151519775390625, 0.1904296875, 0.229339599609375, 0.26824951171875, 0.307159423828125, 0.3460693359375, 0.384979248046875, 0.42388916015625, 0.462799072265625, 0.501708984375, 0.540618896484375, 0.57952880859375, 0.618438720703125, 0.6573486328125, 0.696258544921875, 0.73516845703125, 0.774078369140625, 0.81298828125, 0.851898193359375, 0.89080810546875, 0.929718017578125, 0.9686279296875, 1.007537841796875, 1.04644775390625, 1.085357666015625, 1.124267578125, 1.163177490234375, 1.20208740234375, 1.240997314453125, 1.2799072265625, 1.318817138671875, 1.35772705078125, 1.396636962890625, 1.435546875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 11.0, 3.0, 6.0, 10.0, 8.0, 9.0, 18.0, 15.0, 17.0, 14.0, 27.0, 23.0, 34.0, 29.0, 28.0, 26.0, 28.0, 35.0, 37.0, 33.0, 25.0, 34.0, 42.0, 36.0, 34.0, 34.0, 35.0, 40.0, 35.0, 22.0, 28.0, 32.0, 28.0, 21.0, 27.0, 15.0, 18.0, 13.0, 14.0, 11.0, 11.0, 7.0, 4.0, 8.0, 4.0, 10.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.99609375, -0.9644775390625, -0.932861328125, -0.9012451171875, -0.86962890625, -0.8380126953125, -0.806396484375, -0.7747802734375, -0.7431640625, -0.7115478515625, -0.679931640625, -0.6483154296875, -0.61669921875, -0.5850830078125, -0.553466796875, -0.5218505859375, -0.490234375, -0.4586181640625, -0.427001953125, -0.3953857421875, -0.36376953125, -0.3321533203125, -0.300537109375, -0.2689208984375, -0.2373046875, -0.2056884765625, -0.174072265625, -0.1424560546875, -0.11083984375, -0.0792236328125, -0.047607421875, -0.0159912109375, 0.015625, 0.0472412109375, 0.078857421875, 0.1104736328125, 0.14208984375, 0.1737060546875, 0.205322265625, 0.2369384765625, 0.2685546875, 0.3001708984375, 0.331787109375, 0.3634033203125, 0.39501953125, 0.4266357421875, 0.458251953125, 0.4898681640625, 0.521484375, 0.5531005859375, 0.584716796875, 0.6163330078125, 0.64794921875, 0.6795654296875, 0.711181640625, 0.7427978515625, 0.7744140625, 0.8060302734375, 0.837646484375, 0.8692626953125, 0.90087890625, 0.9324951171875, 0.964111328125, 0.9957275390625, 1.02734375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 15.0, 26.0, 34.0, 56.0, 75.0, 121.0, 226.0, 399.0, 700.0, 1088.0, 1722.0, 3012.0, 4984.0, 8379.0, 13891.0, 21694.0, 33191.0, 48950.0, 69343.0, 91114.0, 110539.0, 121366.0, 120343.0, 108176.0, 88922.0, 67483.0, 47664.0, 31834.0, 20388.0, 12991.0, 7889.0, 4780.0, 2863.0, 1694.0, 1065.0, 628.0, 358.0, 208.0, 124.0, 84.0, 46.0, 31.0, 21.0, 14.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0368804931640625, -1.004425048828125, -0.9719696044921875, -0.93951416015625, -0.9070587158203125, -0.874603271484375, -0.8421478271484375, -0.8096923828125, -0.7772369384765625, -0.744781494140625, -0.7123260498046875, -0.67987060546875, -0.6474151611328125, -0.614959716796875, -0.5825042724609375, -0.550048828125, -0.5175933837890625, -0.485137939453125, -0.4526824951171875, -0.42022705078125, -0.3877716064453125, -0.355316162109375, -0.3228607177734375, -0.2904052734375, -0.2579498291015625, -0.225494384765625, -0.1930389404296875, -0.16058349609375, -0.1281280517578125, -0.095672607421875, -0.0632171630859375, -0.03076171875, 0.0016937255859375, 0.034149169921875, 0.0666046142578125, 0.09906005859375, 0.1315155029296875, 0.163970947265625, 0.1964263916015625, 0.2288818359375, 0.2613372802734375, 0.293792724609375, 0.3262481689453125, 0.35870361328125, 0.3911590576171875, 0.423614501953125, 0.4560699462890625, 0.488525390625, 0.5209808349609375, 0.553436279296875, 0.5858917236328125, 0.61834716796875, 0.6508026123046875, 0.683258056640625, 0.7157135009765625, 0.7481689453125, 0.7806243896484375, 0.813079833984375, 0.8455352783203125, 0.87799072265625, 0.9104461669921875, 0.942901611328125, 0.9753570556640625, 1.0078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 10.0, 8.0, 6.0, 13.0, 16.0, 15.0, 15.0, 26.0, 22.0, 22.0, 28.0, 28.0, 39.0, 39.0, 32.0, 32.0, 38.0, 41.0, 40.0, 29.0, 44.0, 42.0, 56.0, 37.0, 22.0, 32.0, 32.0, 33.0, 31.0, 17.0, 22.0, 17.0, 21.0, 20.0, 15.0, 9.0, 8.0, 5.0, 5.0, 11.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.6943359375, -0.6731109619140625, -0.651885986328125, -0.6306610107421875, -0.60943603515625, -0.5882110595703125, -0.566986083984375, -0.5457611083984375, -0.5245361328125, -0.5033111572265625, -0.482086181640625, -0.4608612060546875, -0.43963623046875, -0.4184112548828125, -0.397186279296875, -0.3759613037109375, -0.354736328125, -0.3335113525390625, -0.312286376953125, -0.2910614013671875, -0.26983642578125, -0.2486114501953125, -0.227386474609375, -0.2061614990234375, -0.1849365234375, -0.1637115478515625, -0.142486572265625, -0.1212615966796875, -0.10003662109375, -0.0788116455078125, -0.057586669921875, -0.0363616943359375, -0.01513671875, 0.0060882568359375, 0.027313232421875, 0.0485382080078125, 0.06976318359375, 0.0909881591796875, 0.112213134765625, 0.1334381103515625, 0.1546630859375, 0.1758880615234375, 0.197113037109375, 0.2183380126953125, 0.23956298828125, 0.2607879638671875, 0.282012939453125, 0.3032379150390625, 0.324462890625, 0.3456878662109375, 0.366912841796875, 0.3881378173828125, 0.40936279296875, 0.4305877685546875, 0.451812744140625, 0.4730377197265625, 0.4942626953125, 0.5154876708984375, 0.536712646484375, 0.5579376220703125, 0.57916259765625, 0.6003875732421875, 0.621612548828125, 0.6428375244140625, 0.6640625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 10.0, 12.0, 11.0, 9.0, 20.0, 23.0, 46.0, 50.0, 88.0, 131.0, 161.0, 282.0, 387.0, 716.0, 940.0, 1534.0, 2416.0, 3875.0, 7295.0, 22962.0, 200420.0, 637312.0, 135941.0, 17513.0, 6396.0, 3667.0, 2365.0, 1340.0, 876.0, 574.0, 380.0, 252.0, 153.0, 110.0, 93.0, 56.0, 47.0, 20.0, 23.0, 13.0, 13.0, 7.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.880859375, -2.77947998046875, -2.6781005859375, -2.57672119140625, -2.475341796875, -2.37396240234375, -2.2725830078125, -2.17120361328125, -2.06982421875, -1.96844482421875, -1.8670654296875, -1.76568603515625, -1.664306640625, -1.56292724609375, -1.4615478515625, -1.36016845703125, -1.2587890625, -1.15740966796875, -1.0560302734375, -0.95465087890625, -0.853271484375, -0.75189208984375, -0.6505126953125, -0.54913330078125, -0.44775390625, -0.34637451171875, -0.2449951171875, -0.14361572265625, -0.042236328125, 0.05914306640625, 0.1605224609375, 0.26190185546875, 0.36328125, 0.46466064453125, 0.5660400390625, 0.66741943359375, 0.768798828125, 0.87017822265625, 0.9715576171875, 1.07293701171875, 1.17431640625, 1.27569580078125, 1.3770751953125, 1.47845458984375, 1.579833984375, 1.68121337890625, 1.7825927734375, 1.88397216796875, 1.9853515625, 2.08673095703125, 2.1881103515625, 2.28948974609375, 2.390869140625, 2.49224853515625, 2.5936279296875, 2.69500732421875, 2.79638671875, 2.89776611328125, 2.9991455078125, 3.10052490234375, 3.201904296875, 3.30328369140625, 3.4046630859375, 3.50604248046875, 3.607421875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 10.0, 27.0, 57.0, 98.0, 146.0, 205.0, 173.0, 135.0, 59.0, 35.0, 13.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002510547637939453, -0.0002442058175802231, -0.00023735687136650085, -0.00023050792515277863, -0.0002236589789390564, -0.00021681003272533417, -0.00020996108651161194, -0.0002031121402978897, -0.00019626319408416748, -0.00018941424787044525, -0.00018256530165672302, -0.0001757163554430008, -0.00016886740922927856, -0.00016201846301555634, -0.0001551695168018341, -0.00014832057058811188, -0.00014147162437438965, -0.00013462267816066742, -0.0001277737319469452, -0.00012092478573322296, -0.00011407583951950073, -0.0001072268933057785, -0.00010037794709205627, -9.352900087833405e-05, -8.668005466461182e-05, -7.983110845088959e-05, -7.298216223716736e-05, -6.613321602344513e-05, -5.92842698097229e-05, -5.243532359600067e-05, -4.558637738227844e-05, -3.873743116855621e-05, -3.1888484954833984e-05, -2.5039538741111755e-05, -1.8190592527389526e-05, -1.1341646313667297e-05, -4.492700099945068e-06, 2.3562461137771606e-06, 9.20519232749939e-06, 1.605413854122162e-05, 2.2903084754943848e-05, 2.9752030968666077e-05, 3.6600977182388306e-05, 4.3449923396110535e-05, 5.0298869609832764e-05, 5.714781582355499e-05, 6.399676203727722e-05, 7.084570825099945e-05, 7.769465446472168e-05, 8.454360067844391e-05, 9.139254689216614e-05, 9.824149310588837e-05, 0.0001050904393196106, 0.00011193938553333282, 0.00011878833174705505, 0.00012563727796077728, 0.0001324862241744995, 0.00013933517038822174, 0.00014618411660194397, 0.0001530330628156662, 0.00015988200902938843, 0.00016673095524311066, 0.00017357990145683289, 0.00018042884767055511, 0.00018727779388427734]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 12.0, 18.0, 18.0, 32.0, 38.0, 53.0, 65.0, 93.0, 137.0, 170.0, 295.0, 415.0, 596.0, 920.0, 1494.0, 2164.0, 3684.0, 7856.0, 29919.0, 198674.0, 553854.0, 199567.0, 30264.0, 7896.0, 3835.0, 2164.0, 1463.0, 918.0, 602.0, 404.0, 274.0, 185.0, 139.0, 95.0, 63.0, 55.0, 39.0, 23.0, 13.0, 10.0, 8.0, 6.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.76171875, -2.681671142578125, -2.60162353515625, -2.521575927734375, -2.4415283203125, -2.361480712890625, -2.28143310546875, -2.201385498046875, -2.121337890625, -2.041290283203125, -1.96124267578125, -1.881195068359375, -1.8011474609375, -1.721099853515625, -1.64105224609375, -1.561004638671875, -1.48095703125, -1.400909423828125, -1.32086181640625, -1.240814208984375, -1.1607666015625, -1.080718994140625, -1.00067138671875, -0.920623779296875, -0.840576171875, -0.760528564453125, -0.68048095703125, -0.600433349609375, -0.5203857421875, -0.440338134765625, -0.36029052734375, -0.280242919921875, -0.2001953125, -0.120147705078125, -0.04010009765625, 0.039947509765625, 0.1199951171875, 0.200042724609375, 0.28009033203125, 0.360137939453125, 0.440185546875, 0.520233154296875, 0.60028076171875, 0.680328369140625, 0.7603759765625, 0.840423583984375, 0.92047119140625, 1.000518798828125, 1.08056640625, 1.160614013671875, 1.24066162109375, 1.320709228515625, 1.4007568359375, 1.480804443359375, 1.56085205078125, 1.640899658203125, 1.720947265625, 1.800994873046875, 1.88104248046875, 1.961090087890625, 2.0411376953125, 2.121185302734375, 2.20123291015625, 2.281280517578125, 2.361328125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 11.0, 9.0, 10.0, 13.0, 28.0, 25.0, 44.0, 32.0, 60.0, 69.0, 74.0, 74.0, 81.0, 88.0, 66.0, 70.0, 57.0, 37.0, 42.0, 23.0, 21.0, 10.0, 7.0, 9.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.292724609375, -0.28343963623046875, -0.2741546630859375, -0.26486968994140625, -0.255584716796875, -0.24629974365234375, -0.2370147705078125, -0.22772979736328125, -0.21844482421875, -0.20915985107421875, -0.1998748779296875, -0.19058990478515625, -0.181304931640625, -0.17201995849609375, -0.1627349853515625, -0.15345001220703125, -0.1441650390625, -0.13488006591796875, -0.1255950927734375, -0.11631011962890625, -0.107025146484375, -0.09774017333984375, -0.0884552001953125, -0.07917022705078125, -0.06988525390625, -0.06060028076171875, -0.0513153076171875, -0.04203033447265625, -0.032745361328125, -0.02346038818359375, -0.0141754150390625, -0.00489044189453125, 0.00439453125, 0.01367950439453125, 0.0229644775390625, 0.03224945068359375, 0.041534423828125, 0.05081939697265625, 0.0601043701171875, 0.06938934326171875, 0.07867431640625, 0.08795928955078125, 0.0972442626953125, 0.10652923583984375, 0.115814208984375, 0.12509918212890625, 0.1343841552734375, 0.14366912841796875, 0.1529541015625, 0.16223907470703125, 0.1715240478515625, 0.18080902099609375, 0.190093994140625, 0.19937896728515625, 0.2086639404296875, 0.21794891357421875, 0.22723388671875, 0.23651885986328125, 0.2458038330078125, 0.25508880615234375, 0.264373779296875, 0.27365875244140625, 0.2829437255859375, 0.29222869873046875, 0.301513671875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 8.0, 7.0, 11.0, 10.0, 12.0, 16.0, 20.0, 31.0, 26.0, 29.0, 44.0, 40.0, 45.0, 46.0, 50.0, 49.0, 54.0, 76.0, 60.0, 41.0, 48.0, 51.0, 37.0, 35.0, 26.0, 20.0, 13.0, 12.0, 15.0, 12.0, 6.0, 8.0, 9.0, 6.0, 3.0, 3.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4523892402648926, -1.4023908376693726, -1.352392554283142, -1.302394151687622, -1.2523958683013916, -1.2023974657058716, -1.1523990631103516, -1.102400779724121, -1.0524024963378906, -1.0024040937423706, -0.9524058103561401, -0.9024074077606201, -0.8524091243743896, -0.8024107217788696, -0.7524123787879944, -0.7024140357971191, -0.6524156332015991, -0.6024172902107239, -0.5524189472198486, -0.5024205446243286, -0.45242223143577576, -0.4024238884449005, -0.3524255156517029, -0.30242717266082764, -0.2524288296699524, -0.20243048667907715, -0.1524321287870407, -0.10243377089500427, -0.05243542790412903, -0.002437084913253784, 0.04756128787994385, 0.09755963087081909, 0.1475580930709839, 0.19755643606185913, 0.24755479395389557, 0.297553151845932, 0.34755149483680725, 0.3975498378276825, 0.4475482106208801, 0.49754655361175537, 0.5475448966026306, 0.5975432395935059, 0.6475415825843811, 0.6975399255752563, 0.7475383281707764, 0.7975366115570068, 0.8475350141525269, 0.8975333571434021, 0.9475317001342773, 0.9975300431251526, 1.0475283861160278, 1.0975267887115479, 1.1475250720977783, 1.1975234746932983, 1.2475218772888184, 1.2975201606750488, 1.3475184440612793, 1.3975168466567993, 1.4475151300430298, 1.4975135326385498, 1.5475118160247803, 1.5975102186203003, 1.6475086212158203, 1.6975069046020508, 1.7475053071975708]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 10.0, 14.0, 14.0, 15.0, 12.0, 11.0, 27.0, 39.0, 29.0, 22.0, 31.0, 40.0, 30.0, 48.0, 40.0, 41.0, 37.0, 46.0, 35.0, 38.0, 40.0, 37.0, 41.0, 46.0, 31.0, 30.0, 30.0, 19.0, 18.0, 16.0, 11.0, 18.0, 13.0, 10.0, 9.0, 9.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9461370706558228, -0.9124075770378113, -0.8786780834197998, -0.8449485898017883, -0.8112190961837769, -0.7774896025657654, -0.7437601089477539, -0.7100306153297424, -0.676301121711731, -0.6425716280937195, -0.608842134475708, -0.5751126408576965, -0.5413831472396851, -0.5076536536216736, -0.4739241600036621, -0.44019466638565063, -0.40646517276763916, -0.3727356791496277, -0.3390061855316162, -0.30527669191360474, -0.27154719829559326, -0.2378177046775818, -0.2040882110595703, -0.17035871744155884, -0.13662922382354736, -0.10289973020553589, -0.06917023658752441, -0.03544074296951294, -0.0017112493515014648, 0.03201824426651001, 0.06574773788452148, 0.09947723150253296, 0.13320660591125488, 0.16693609952926636, 0.20066559314727783, 0.2343950867652893, 0.2681245803833008, 0.30185407400131226, 0.33558356761932373, 0.3693130612373352, 0.4030425548553467, 0.43677204847335815, 0.47050154209136963, 0.5042310357093811, 0.5379605293273926, 0.571690022945404, 0.6054195165634155, 0.639149010181427, 0.6728785037994385, 0.70660799741745, 0.7403374910354614, 0.7740669846534729, 0.8077964782714844, 0.8415259718894958, 0.8752554655075073, 0.9089849591255188, 0.9427144527435303, 0.9764439463615417, 1.0101734399795532, 1.04390287399292, 1.0776324272155762, 1.1113619804382324, 1.1450914144515991, 1.1788208484649658, 1.212550401687622]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 8.0, 10.0, 14.0, 20.0, 47.0, 74.0, 134.0, 214.0, 368.0, 632.0, 1061.0, 1799.0, 3203.0, 6021.0, 11090.0, 20479.0, 39249.0, 72928.0, 136052.0, 243458.0, 407757.0, 595266.0, 715323.0, 678755.0, 515434.0, 330522.0, 191268.0, 104274.0, 55907.0, 29351.0, 15477.0, 8022.0, 4434.0, 2479.0, 1335.0, 711.0, 462.0, 249.0, 154.0, 102.0, 50.0, 36.0, 21.0, 9.0, 7.0, 11.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.2174224853515625, -1.170196533203125, -1.1229705810546875, -1.07574462890625, -1.0285186767578125, -0.981292724609375, -0.9340667724609375, -0.8868408203125, -0.8396148681640625, -0.792388916015625, -0.7451629638671875, -0.69793701171875, -0.6507110595703125, -0.603485107421875, -0.5562591552734375, -0.509033203125, -0.4618072509765625, -0.414581298828125, -0.3673553466796875, -0.32012939453125, -0.2729034423828125, -0.225677490234375, -0.1784515380859375, -0.1312255859375, -0.0839996337890625, -0.036773681640625, 0.0104522705078125, 0.05767822265625, 0.1049041748046875, 0.152130126953125, 0.1993560791015625, 0.24658203125, 0.2938079833984375, 0.341033935546875, 0.3882598876953125, 0.43548583984375, 0.4827117919921875, 0.529937744140625, 0.5771636962890625, 0.6243896484375, 0.6716156005859375, 0.718841552734375, 0.7660675048828125, 0.81329345703125, 0.8605194091796875, 0.907745361328125, 0.9549713134765625, 1.002197265625, 1.0494232177734375, 1.096649169921875, 1.1438751220703125, 1.19110107421875, 1.2383270263671875, 1.285552978515625, 1.3327789306640625, 1.3800048828125, 1.4272308349609375, 1.474456787109375, 1.5216827392578125, 1.56890869140625, 1.6161346435546875, 1.663360595703125, 1.7105865478515625, 1.7578125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 7.0, 10.0, 16.0, 14.0, 18.0, 17.0, 29.0, 27.0, 28.0, 41.0, 35.0, 49.0, 53.0, 46.0, 53.0, 54.0, 63.0, 47.0, 58.0, 40.0, 52.0, 32.0, 32.0, 36.0, 23.0, 28.0, 15.0, 17.0, 10.0, 19.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9773101806640625, -0.941925048828125, -0.9065399169921875, -0.87115478515625, -0.8357696533203125, -0.800384521484375, -0.7649993896484375, -0.7296142578125, -0.6942291259765625, -0.658843994140625, -0.6234588623046875, -0.58807373046875, -0.5526885986328125, -0.517303466796875, -0.4819183349609375, -0.446533203125, -0.4111480712890625, -0.375762939453125, -0.3403778076171875, -0.30499267578125, -0.2696075439453125, -0.234222412109375, -0.1988372802734375, -0.1634521484375, -0.1280670166015625, -0.092681884765625, -0.0572967529296875, -0.02191162109375, 0.0134735107421875, 0.048858642578125, 0.0842437744140625, 0.11962890625, 0.1550140380859375, 0.190399169921875, 0.2257843017578125, 0.26116943359375, 0.2965545654296875, 0.331939697265625, 0.3673248291015625, 0.4027099609375, 0.4380950927734375, 0.473480224609375, 0.5088653564453125, 0.54425048828125, 0.5796356201171875, 0.615020751953125, 0.6504058837890625, 0.685791015625, 0.7211761474609375, 0.756561279296875, 0.7919464111328125, 0.82733154296875, 0.8627166748046875, 0.898101806640625, 0.9334869384765625, 0.9688720703125, 1.0042572021484375, 1.039642333984375, 1.0750274658203125, 1.11041259765625, 1.1457977294921875, 1.181182861328125, 1.2165679931640625, 1.251953125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 15.0, 23.0, 38.0, 61.0, 103.0, 157.0, 284.0, 415.0, 661.0, 1177.0, 1817.0, 2773.0, 4503.0, 7114.0, 11331.0, 18261.0, 28860.0, 45113.0, 70205.0, 107095.0, 160165.0, 228873.0, 312064.0, 395004.0, 460143.0, 484807.0, 459232.0, 394357.0, 311583.0, 228009.0, 160185.0, 107599.0, 70442.0, 45002.0, 28526.0, 17976.0, 11296.0, 7058.0, 4404.0, 2856.0, 1727.0, 1111.0, 717.0, 424.0, 251.0, 182.0, 110.0, 59.0, 37.0, 30.0, 21.0, 11.0, 4.0, 4.0, 7.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0959014892578125, -1.059967041015625, -1.0240325927734375, -0.98809814453125, -0.9521636962890625, -0.916229248046875, -0.8802947998046875, -0.8443603515625, -0.8084259033203125, -0.772491455078125, -0.7365570068359375, -0.70062255859375, -0.6646881103515625, -0.628753662109375, -0.5928192138671875, -0.556884765625, -0.5209503173828125, -0.485015869140625, -0.4490814208984375, -0.41314697265625, -0.3772125244140625, -0.341278076171875, -0.3053436279296875, -0.2694091796875, -0.2334747314453125, -0.197540283203125, -0.1616058349609375, -0.12567138671875, -0.0897369384765625, -0.053802490234375, -0.0178680419921875, 0.01806640625, 0.0540008544921875, 0.089935302734375, 0.1258697509765625, 0.16180419921875, 0.1977386474609375, 0.233673095703125, 0.2696075439453125, 0.3055419921875, 0.3414764404296875, 0.377410888671875, 0.4133453369140625, 0.44927978515625, 0.4852142333984375, 0.521148681640625, 0.5570831298828125, 0.593017578125, 0.6289520263671875, 0.664886474609375, 0.7008209228515625, 0.73675537109375, 0.7726898193359375, 0.808624267578125, 0.8445587158203125, 0.8804931640625, 0.9164276123046875, 0.952362060546875, 0.9882965087890625, 1.02423095703125, 1.0601654052734375, 1.096099853515625, 1.1320343017578125, 1.16796875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 5.0, 5.0, 15.0, 21.0, 19.0, 24.0, 41.0, 49.0, 56.0, 66.0, 72.0, 89.0, 86.0, 92.0, 140.0, 127.0, 155.0, 179.0, 191.0, 192.0, 222.0, 184.0, 216.0, 211.0, 202.0, 184.0, 167.0, 148.0, 143.0, 144.0, 97.0, 100.0, 61.0, 80.0, 69.0, 53.0, 36.0, 28.0, 25.0, 23.0, 9.0, 13.0, 6.0, 3.0, 10.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443115234375, -0.4287147521972656, -0.41431427001953125, -0.3999137878417969, -0.3855133056640625, -0.3711128234863281, -0.35671234130859375, -0.3423118591308594, -0.327911376953125, -0.3135108947753906, -0.29911041259765625, -0.2847099304199219, -0.2703094482421875, -0.2559089660644531, -0.24150848388671875, -0.22710800170898438, -0.21270751953125, -0.19830703735351562, -0.18390655517578125, -0.16950607299804688, -0.1551055908203125, -0.14070510864257812, -0.12630462646484375, -0.11190414428710938, -0.097503662109375, -0.08310317993164062, -0.06870269775390625, -0.054302215576171875, -0.0399017333984375, -0.025501251220703125, -0.01110076904296875, 0.003299713134765625, 0.0177001953125, 0.032100677490234375, 0.04650115966796875, 0.060901641845703125, 0.0753021240234375, 0.08970260620117188, 0.10410308837890625, 0.11850357055664062, 0.132904052734375, 0.14730453491210938, 0.16170501708984375, 0.17610549926757812, 0.1905059814453125, 0.20490646362304688, 0.21930694580078125, 0.23370742797851562, 0.24810791015625, 0.2625083923339844, 0.27690887451171875, 0.2913093566894531, 0.3057098388671875, 0.3201103210449219, 0.33451080322265625, 0.3489112854003906, 0.363311767578125, 0.3777122497558594, 0.39211273193359375, 0.4065132141113281, 0.4209136962890625, 0.4353141784667969, 0.44971466064453125, 0.4641151428222656, 0.478515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 7.0, 1.0, 3.0, 8.0, 9.0, 21.0, 4.0, 24.0, 27.0, 17.0, 29.0, 37.0, 31.0, 35.0, 49.0, 47.0, 49.0, 40.0, 48.0, 54.0, 40.0, 61.0, 48.0, 45.0, 51.0, 39.0, 34.0, 10.0, 22.0, 22.0, 11.0, 7.0, 11.0, 12.0, 9.0, 4.0, 2.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.58762526512146, -1.5393799543380737, -1.491134524345398, -1.4428892135620117, -1.394643783569336, -1.3463984727859497, -1.2981531620025635, -1.2499077320098877, -1.2016624212265015, -1.1534171104431152, -1.1051716804504395, -1.0569263696670532, -1.008681058883667, -0.9604356288909912, -0.912190318107605, -0.863944947719574, -0.815699577331543, -0.767454206943512, -0.719208836555481, -0.6709635257720947, -0.6227181553840637, -0.5744727849960327, -0.5262274742126465, -0.4779821038246155, -0.4297367334365845, -0.38149136304855347, -0.33324602246284485, -0.28500068187713623, -0.23675531148910522, -0.1885099560022354, -0.1402646005153656, -0.09201925992965698, -0.04377400875091553, 0.004471346735954285, 0.0527167022228241, 0.10096205770969391, 0.14920741319656372, 0.19745276868343353, 0.24569812417030334, 0.29394346475601196, 0.34218883514404297, 0.390434205532074, 0.4386795461177826, 0.4869248867034912, 0.5351702570915222, 0.5834156274795532, 0.6316609382629395, 0.6799063086509705, 0.7281516790390015, 0.7763970494270325, 0.8246424198150635, 0.8728877305984497, 0.9211331009864807, 0.9693784713745117, 1.017623782157898, 1.0658690929412842, 1.11411452293396, 1.1623598337173462, 1.210605263710022, 1.2588505744934082, 1.307096004486084, 1.3553413152694702, 1.4035866260528564, 1.4518320560455322, 1.5000773668289185]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 5.0, 8.0, 10.0, 14.0, 7.0, 19.0, 25.0, 15.0, 23.0, 26.0, 29.0, 31.0, 33.0, 30.0, 26.0, 41.0, 44.0, 38.0, 39.0, 40.0, 44.0, 33.0, 41.0, 34.0, 41.0, 33.0, 22.0, 33.0, 37.0, 34.0, 19.0, 18.0, 18.0, 15.0, 13.0, 7.0, 7.0, 13.0, 7.0, 3.0, 7.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9469460844993591, -0.91257643699646, -0.878206729888916, -0.8438370823860168, -0.8094674348831177, -0.7750977873802185, -0.7407281398773193, -0.7063584327697754, -0.6719887852668762, -0.637619137763977, -0.6032494306564331, -0.5688797831535339, -0.5345101356506348, -0.5001404881477356, -0.46577081084251404, -0.4314011335372925, -0.3970314860343933, -0.36266183853149414, -0.3282921612262726, -0.293922483921051, -0.25955283641815186, -0.2251831740140915, -0.19081351161003113, -0.15644384920597076, -0.1220741868019104, -0.08770452439785004, -0.05333486199378967, -0.01896519958972931, 0.015404462814331055, 0.04977412521839142, 0.08414378762245178, 0.11851345002651215, 0.15288305282592773, 0.1872527152299881, 0.22162237763404846, 0.25599205493927, 0.2903617024421692, 0.32473134994506836, 0.3591010272502899, 0.3934707045555115, 0.42784035205841064, 0.4622099995613098, 0.49657967686653137, 0.5309493541717529, 0.5653190016746521, 0.5996886491775513, 0.6340583562850952, 0.6684280037879944, 0.7027976512908936, 0.7371672987937927, 0.7715369462966919, 0.8059066534042358, 0.840276300907135, 0.8746459484100342, 0.9090156555175781, 0.9433853030204773, 0.9777549505233765, 1.0121246576309204, 1.0464942455291748, 1.0808639526367188, 1.1152336597442627, 1.149603247642517, 1.183972954750061, 1.2183425426483154, 1.2527122497558594]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 13.0, 17.0, 29.0, 58.0, 80.0, 132.0, 217.0, 323.0, 509.0, 782.0, 1239.0, 1847.0, 2890.0, 4691.0, 7261.0, 11411.0, 17941.0, 28141.0, 44028.0, 66459.0, 97515.0, 131501.0, 153763.0, 144211.0, 110781.0, 78027.0, 51626.0, 33684.0, 21337.0, 13813.0, 8786.0, 5674.0, 3549.0, 2228.0, 1407.0, 933.0, 575.0, 392.0, 260.0, 143.0, 96.0, 64.0, 41.0, 31.0, 17.0, 9.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22998046875, -0.22223663330078125, -0.2144927978515625, -0.20674896240234375, -0.199005126953125, -0.19126129150390625, -0.1835174560546875, -0.17577362060546875, -0.16802978515625, -0.16028594970703125, -0.1525421142578125, -0.14479827880859375, -0.137054443359375, -0.12931060791015625, -0.1215667724609375, -0.11382293701171875, -0.1060791015625, -0.09833526611328125, -0.0905914306640625, -0.08284759521484375, -0.075103759765625, -0.06735992431640625, -0.0596160888671875, -0.05187225341796875, -0.04412841796875, -0.03638458251953125, -0.0286407470703125, -0.02089691162109375, -0.013153076171875, -0.00540924072265625, 0.0023345947265625, 0.01007843017578125, 0.017822265625, 0.02556610107421875, 0.0333099365234375, 0.04105377197265625, 0.048797607421875, 0.05654144287109375, 0.0642852783203125, 0.07202911376953125, 0.07977294921875, 0.08751678466796875, 0.0952606201171875, 0.10300445556640625, 0.110748291015625, 0.11849212646484375, 0.1262359619140625, 0.13397979736328125, 0.1417236328125, 0.14946746826171875, 0.1572113037109375, 0.16495513916015625, 0.172698974609375, 0.18044281005859375, 0.1881866455078125, 0.19593048095703125, 0.20367431640625, 0.21141815185546875, 0.2191619873046875, 0.22690582275390625, 0.234649658203125, 0.24239349365234375, 0.2501373291015625, 0.25788116455078125, 0.265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 7.0, 4.0, 6.0, 3.0, 8.0, 10.0, 17.0, 16.0, 21.0, 29.0, 18.0, 30.0, 41.0, 39.0, 35.0, 35.0, 39.0, 43.0, 35.0, 40.0, 37.0, 54.0, 32.0, 39.0, 43.0, 32.0, 45.0, 27.0, 31.0, 37.0, 25.0, 23.0, 18.0, 12.0, 11.0, 12.0, 7.0, 9.0, 2.0, 6.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.2645416259765625, -1.225372314453125, -1.1862030029296875, -1.14703369140625, -1.1078643798828125, -1.068695068359375, -1.0295257568359375, -0.9903564453125, -0.9511871337890625, -0.912017822265625, -0.8728485107421875, -0.83367919921875, -0.7945098876953125, -0.755340576171875, -0.7161712646484375, -0.677001953125, -0.6378326416015625, -0.598663330078125, -0.5594940185546875, -0.52032470703125, -0.4811553955078125, -0.441986083984375, -0.4028167724609375, -0.3636474609375, -0.3244781494140625, -0.285308837890625, -0.2461395263671875, -0.20697021484375, -0.1678009033203125, -0.128631591796875, -0.0894622802734375, -0.05029296875, -0.0111236572265625, 0.028045654296875, 0.0672149658203125, 0.10638427734375, 0.1455535888671875, 0.184722900390625, 0.2238922119140625, 0.2630615234375, 0.3022308349609375, 0.341400146484375, 0.3805694580078125, 0.41973876953125, 0.4589080810546875, 0.498077392578125, 0.5372467041015625, 0.576416015625, 0.6155853271484375, 0.654754638671875, 0.6939239501953125, 0.73309326171875, 0.7722625732421875, 0.811431884765625, 0.8506011962890625, 0.8897705078125, 0.9289398193359375, 0.968109130859375, 1.0072784423828125, 1.04644775390625, 1.0856170654296875, 1.124786376953125, 1.1639556884765625, 1.203125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 4.0, 13.0, 17.0, 16.0, 32.0, 70.0, 63.0, 132.0, 169.0, 250.0, 485.0, 729.0, 1315.0, 2065.0, 3783.0, 6854.0, 12615.0, 24199.0, 45849.0, 87053.0, 153431.0, 218223.0, 203564.0, 132397.0, 72529.0, 38114.0, 20149.0, 10826.0, 5734.0, 3248.0, 1827.0, 1050.0, 654.0, 389.0, 238.0, 164.0, 95.0, 54.0, 45.0, 30.0, 21.0, 15.0, 11.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.346435546875, -0.3344306945800781, -0.32242584228515625, -0.3104209899902344, -0.2984161376953125, -0.2864112854003906, -0.27440643310546875, -0.2624015808105469, -0.250396728515625, -0.23839187622070312, -0.22638702392578125, -0.21438217163085938, -0.2023773193359375, -0.19037246704101562, -0.17836761474609375, -0.16636276245117188, -0.15435791015625, -0.14235305786132812, -0.13034820556640625, -0.11834335327148438, -0.1063385009765625, -0.09433364868164062, -0.08232879638671875, -0.07032394409179688, -0.058319091796875, -0.046314239501953125, -0.03430938720703125, -0.022304534912109375, -0.0102996826171875, 0.001705169677734375, 0.01371002197265625, 0.025714874267578125, 0.0377197265625, 0.049724578857421875, 0.06172943115234375, 0.07373428344726562, 0.0857391357421875, 0.09774398803710938, 0.10974884033203125, 0.12175369262695312, 0.133758544921875, 0.14576339721679688, 0.15776824951171875, 0.16977310180664062, 0.1817779541015625, 0.19378280639648438, 0.20578765869140625, 0.21779251098632812, 0.22979736328125, 0.24180221557617188, 0.25380706787109375, 0.2658119201660156, 0.2778167724609375, 0.2898216247558594, 0.30182647705078125, 0.3138313293457031, 0.325836181640625, 0.3378410339355469, 0.34984588623046875, 0.3618507385253906, 0.3738555908203125, 0.3858604431152344, 0.39786529541015625, 0.4098701477050781, 0.421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 15.0, 9.0, 12.0, 15.0, 18.0, 14.0, 20.0, 30.0, 21.0, 22.0, 25.0, 30.0, 25.0, 37.0, 48.0, 44.0, 34.0, 40.0, 42.0, 50.0, 34.0, 42.0, 43.0, 37.0, 32.0, 32.0, 43.0, 18.0, 36.0, 14.0, 14.0, 13.0, 11.0, 11.0, 8.0, 12.0, 9.0, 8.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.72607421875, -0.7030868530273438, -0.6800994873046875, -0.6571121215820312, -0.634124755859375, -0.6111373901367188, -0.5881500244140625, -0.5651626586914062, -0.54217529296875, -0.5191879272460938, -0.4962005615234375, -0.47321319580078125, -0.450225830078125, -0.42723846435546875, -0.4042510986328125, -0.38126373291015625, -0.3582763671875, -0.33528900146484375, -0.3123016357421875, -0.28931427001953125, -0.266326904296875, -0.24333953857421875, -0.2203521728515625, -0.19736480712890625, -0.17437744140625, -0.15139007568359375, -0.1284027099609375, -0.10541534423828125, -0.082427978515625, -0.05944061279296875, -0.0364532470703125, -0.01346588134765625, 0.009521484375, 0.03250885009765625, 0.0554962158203125, 0.07848358154296875, 0.101470947265625, 0.12445831298828125, 0.1474456787109375, 0.17043304443359375, 0.19342041015625, 0.21640777587890625, 0.2393951416015625, 0.26238250732421875, 0.285369873046875, 0.30835723876953125, 0.3313446044921875, 0.35433197021484375, 0.3773193359375, 0.40030670166015625, 0.4232940673828125, 0.44628143310546875, 0.469268798828125, 0.49225616455078125, 0.5152435302734375, 0.5382308959960938, 0.56121826171875, 0.5842056274414062, 0.6071929931640625, 0.6301803588867188, 0.653167724609375, 0.6761550903320312, 0.6991424560546875, 0.7221298217773438, 0.7451171875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 4.0, 8.0, 5.0, 9.0, 14.0, 32.0, 23.0, 46.0, 54.0, 102.0, 160.0, 184.0, 321.0, 511.0, 749.0, 1195.0, 1951.0, 3226.0, 5470.0, 10192.0, 20521.0, 47821.0, 132885.0, 374830.0, 283790.0, 92254.0, 35682.0, 16228.0, 8277.0, 4553.0, 2758.0, 1689.0, 1065.0, 693.0, 423.0, 242.0, 169.0, 99.0, 105.0, 70.0, 36.0, 26.0, 27.0, 15.0, 13.0, 8.0, 11.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.199462890625, -0.19373703002929688, -0.18801116943359375, -0.18228530883789062, -0.1765594482421875, -0.17083358764648438, -0.16510772705078125, -0.15938186645507812, -0.153656005859375, -0.14793014526367188, -0.14220428466796875, -0.13647842407226562, -0.1307525634765625, -0.12502670288085938, -0.11930084228515625, -0.11357498168945312, -0.10784912109375, -0.10212326049804688, -0.09639739990234375, -0.09067153930664062, -0.0849456787109375, -0.07921981811523438, -0.07349395751953125, -0.06776809692382812, -0.062042236328125, -0.056316375732421875, -0.05059051513671875, -0.044864654541015625, -0.0391387939453125, -0.033412933349609375, -0.02768707275390625, -0.021961212158203125, -0.0162353515625, -0.010509490966796875, -0.00478363037109375, 0.000942230224609375, 0.0066680908203125, 0.012393951416015625, 0.01811981201171875, 0.023845672607421875, 0.029571533203125, 0.035297393798828125, 0.04102325439453125, 0.046749114990234375, 0.0524749755859375, 0.058200836181640625, 0.06392669677734375, 0.06965255737304688, 0.07537841796875, 0.08110427856445312, 0.08683013916015625, 0.09255599975585938, 0.0982818603515625, 0.10400772094726562, 0.10973358154296875, 0.11545944213867188, 0.121185302734375, 0.12691116333007812, 0.13263702392578125, 0.13836288452148438, 0.1440887451171875, 0.14981460571289062, 0.15554046630859375, 0.16126632690429688, 0.1669921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 8.0, 12.0, 6.0, 12.0, 11.0, 6.0, 14.0, 20.0, 10.0, 15.0, 18.0, 15.0, 26.0, 30.0, 46.0, 36.0, 36.0, 37.0, 46.0, 37.0, 43.0, 44.0, 41.0, 32.0, 30.0, 40.0, 50.0, 46.0, 29.0, 26.0, 29.0, 27.0, 15.0, 21.0, 16.0, 15.0, 7.0, 15.0, 7.0, 5.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.445923984050751e-06, -7.202848792076111e-06, -6.959773600101471e-06, -6.716698408126831e-06, -6.473623216152191e-06, -6.230548024177551e-06, -5.987472832202911e-06, -5.7443976402282715e-06, -5.501322448253632e-06, -5.258247256278992e-06, -5.015172064304352e-06, -4.772096872329712e-06, -4.529021680355072e-06, -4.285946488380432e-06, -4.042871296405792e-06, -3.7997961044311523e-06, -3.5567209124565125e-06, -3.3136457204818726e-06, -3.0705705285072327e-06, -2.8274953365325928e-06, -2.584420144557953e-06, -2.341344952583313e-06, -2.098269760608673e-06, -1.8551945686340332e-06, -1.6121193766593933e-06, -1.3690441846847534e-06, -1.1259689927101135e-06, -8.828938007354736e-07, -6.398186087608337e-07, -3.9674341678619385e-07, -1.5366822481155396e-07, 8.940696716308594e-08, 3.3248215913772583e-07, 5.755573511123657e-07, 8.186325430870056e-07, 1.0617077350616455e-06, 1.3047829270362854e-06, 1.5478581190109253e-06, 1.7909333109855652e-06, 2.034008502960205e-06, 2.277083694934845e-06, 2.520158886909485e-06, 2.7632340788841248e-06, 3.0063092708587646e-06, 3.2493844628334045e-06, 3.4924596548080444e-06, 3.7355348467826843e-06, 3.978610038757324e-06, 4.221685230731964e-06, 4.464760422706604e-06, 4.707835614681244e-06, 4.950910806655884e-06, 5.193985998630524e-06, 5.4370611906051636e-06, 5.6801363825798035e-06, 5.923211574554443e-06, 6.166286766529083e-06, 6.409361958503723e-06, 6.652437150478363e-06, 6.895512342453003e-06, 7.138587534427643e-06, 7.381662726402283e-06, 7.624737918376923e-06, 7.867813110351562e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 12.0, 23.0, 30.0, 36.0, 62.0, 116.0, 164.0, 239.0, 424.0, 666.0, 1065.0, 1836.0, 3230.0, 5851.0, 11140.0, 22446.0, 46314.0, 101049.0, 209933.0, 286311.0, 186535.0, 88597.0, 40421.0, 19503.0, 10092.0, 5292.0, 2853.0, 1686.0, 985.0, 625.0, 366.0, 221.0, 153.0, 120.0, 59.0, 43.0, 16.0, 16.0, 7.0, 1.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.197998046875, -0.19256019592285156, -0.18712234497070312, -0.1816844940185547, -0.17624664306640625, -0.1708087921142578, -0.16537094116210938, -0.15993309020996094, -0.1544952392578125, -0.14905738830566406, -0.14361953735351562, -0.1381816864013672, -0.13274383544921875, -0.1273059844970703, -0.12186813354492188, -0.11643028259277344, -0.110992431640625, -0.10555458068847656, -0.10011672973632812, -0.09467887878417969, -0.08924102783203125, -0.08380317687988281, -0.07836532592773438, -0.07292747497558594, -0.0674896240234375, -0.06205177307128906, -0.056613922119140625, -0.05117607116699219, -0.04573822021484375, -0.04030036926269531, -0.034862518310546875, -0.029424667358398438, -0.02398681640625, -0.018548965454101562, -0.013111114501953125, -0.0076732635498046875, -0.00223541259765625, 0.0032024383544921875, 0.008640289306640625, 0.014078140258789062, 0.0195159912109375, 0.024953842163085938, 0.030391693115234375, 0.03582954406738281, 0.04126739501953125, 0.04670524597167969, 0.052143096923828125, 0.05758094787597656, 0.063018798828125, 0.06845664978027344, 0.07389450073242188, 0.07933235168457031, 0.08477020263671875, 0.09020805358886719, 0.09564590454101562, 0.10108375549316406, 0.1065216064453125, 0.11195945739746094, 0.11739730834960938, 0.12283515930175781, 0.12827301025390625, 0.1337108612060547, 0.13914871215820312, 0.14458656311035156, 0.1500244140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 7.0, 4.0, 8.0, 5.0, 11.0, 14.0, 20.0, 12.0, 13.0, 18.0, 36.0, 37.0, 40.0, 36.0, 49.0, 58.0, 58.0, 65.0, 49.0, 57.0, 44.0, 44.0, 40.0, 41.0, 34.0, 31.0, 25.0, 25.0, 19.0, 17.0, 10.0, 7.0, 9.0, 13.0, 6.0, 8.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.036956787109375, -0.0358738899230957, -0.034790992736816406, -0.03370809555053711, -0.03262519836425781, -0.031542301177978516, -0.03045940399169922, -0.029376506805419922, -0.028293609619140625, -0.027210712432861328, -0.02612781524658203, -0.025044918060302734, -0.023962020874023438, -0.02287912368774414, -0.021796226501464844, -0.020713329315185547, -0.01963043212890625, -0.018547534942626953, -0.017464637756347656, -0.01638174057006836, -0.015298843383789062, -0.014215946197509766, -0.013133049011230469, -0.012050151824951172, -0.010967254638671875, -0.009884357452392578, -0.008801460266113281, -0.007718563079833984, -0.0066356658935546875, -0.005552768707275391, -0.004469871520996094, -0.003386974334716797, -0.0023040771484375, -0.0012211799621582031, -0.00013828277587890625, 0.0009446144104003906, 0.0020275115966796875, 0.0031104087829589844, 0.004193305969238281, 0.005276203155517578, 0.006359100341796875, 0.007441997528076172, 0.008524894714355469, 0.009607791900634766, 0.010690689086914062, 0.01177358627319336, 0.012856483459472656, 0.013939380645751953, 0.01502227783203125, 0.016105175018310547, 0.017188072204589844, 0.01827096939086914, 0.019353866577148438, 0.020436763763427734, 0.02151966094970703, 0.022602558135986328, 0.023685455322265625, 0.024768352508544922, 0.02585124969482422, 0.026934146881103516, 0.028017044067382812, 0.02909994125366211, 0.030182838439941406, 0.0312657356262207, 0.0323486328125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 1.0, 1.0, 9.0, 8.0, 15.0, 14.0, 18.0, 26.0, 26.0, 23.0, 32.0, 25.0, 36.0, 49.0, 51.0, 45.0, 37.0, 51.0, 54.0, 48.0, 56.0, 47.0, 41.0, 46.0, 47.0, 32.0, 20.0, 21.0, 17.0, 16.0, 11.0, 9.0, 10.0, 11.0, 5.0, 3.0, 7.0, 3.0, 6.0, 5.0, 0.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.542368769645691, -1.4943792819976807, -1.44638991355896, -1.3984004259109497, -1.3504109382629395, -1.3024214506149292, -1.254431962966919, -1.2064425945281982, -1.158453106880188, -1.1104636192321777, -1.062474250793457, -1.0144847631454468, -0.9664952754974365, -0.9185057878494263, -0.8705163598060608, -0.8225269317626953, -0.7745374441146851, -0.7265479564666748, -0.6785585284233093, -0.6305691003799438, -0.5825796127319336, -0.5345901250839233, -0.48660069704055786, -0.43861123919487, -0.39062178134918213, -0.34263232350349426, -0.2946428656578064, -0.24665340781211853, -0.19866394996643066, -0.1506744921207428, -0.10268503427505493, -0.054695576429367065, -0.0067059993743896484, 0.04128345847129822, 0.08927291631698608, 0.13726237416267395, 0.18525183200836182, 0.23324128985404968, 0.28123074769973755, 0.3292202055454254, 0.3772096633911133, 0.42519912123680115, 0.473188579082489, 0.5211780071258545, 0.5691674947738647, 0.617156982421875, 0.6651464104652405, 0.713135838508606, 0.7611253261566162, 0.8091148138046265, 0.8571042418479919, 0.9050936698913574, 0.9530831575393677, 1.001072645187378, 1.0490620136260986, 1.0970515012741089, 1.1450409889221191, 1.1930304765701294, 1.2410199642181396, 1.2890093326568604, 1.3369988203048706, 1.3849883079528809, 1.4329776763916016, 1.4809671640396118, 1.528956651687622]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 10.0, 6.0, 7.0, 9.0, 8.0, 13.0, 8.0, 19.0, 25.0, 16.0, 24.0, 26.0, 27.0, 30.0, 31.0, 34.0, 26.0, 38.0, 40.0, 36.0, 50.0, 38.0, 41.0, 36.0, 34.0, 34.0, 42.0, 34.0, 27.0, 29.0, 35.0, 34.0, 25.0, 17.0, 18.0, 15.0, 13.0, 6.0, 8.0, 12.0, 7.0, 4.0, 7.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9426308274269104, -0.908301591873169, -0.8739722967147827, -0.8396430611610413, -0.8053138256072998, -0.7709845900535583, -0.7366553544998169, -0.7023260593414307, -0.6679968237876892, -0.6336675882339478, -0.5993382930755615, -0.5650090575218201, -0.5306798219680786, -0.49635058641433716, -0.4620213210582733, -0.4276920557022095, -0.393362820148468, -0.35903358459472656, -0.3247043192386627, -0.2903750538825989, -0.2560458183288574, -0.22171656787395477, -0.18738731741905212, -0.15305806696414948, -0.11872881650924683, -0.08439956605434418, -0.05007031559944153, -0.01574106514453888, 0.01858818531036377, 0.05291743576526642, 0.08724668622016907, 0.12157593667507172, 0.1559051275253296, 0.19023437798023224, 0.2245636284351349, 0.25889289379119873, 0.2932221293449402, 0.32755136489868164, 0.3618806302547455, 0.3962098956108093, 0.4305391311645508, 0.46486836671829224, 0.4991976320743561, 0.5335268974304199, 0.5678561329841614, 0.6021853685379028, 0.6365146636962891, 0.6708438992500305, 0.705173134803772, 0.7395023703575134, 0.7738316059112549, 0.8081609010696411, 0.8424901366233826, 0.876819372177124, 0.9111486673355103, 0.9454779028892517, 0.9798071384429932, 1.0141364336013794, 1.048465609550476, 1.0827949047088623, 1.117124080657959, 1.1514533758163452, 1.1857826709747314, 1.2201118469238281, 1.2544411420822144]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 18.0, 10.0, 23.0, 45.0, 56.0, 101.0, 196.0, 313.0, 462.0, 797.0, 1301.0, 2144.0, 3470.0, 5554.0, 9074.0, 14025.0, 21432.0, 31929.0, 46236.0, 62590.0, 81074.0, 98146.0, 109613.0, 112145.0, 106358.0, 92312.0, 74645.0, 56736.0, 40207.0, 27881.0, 18387.0, 11884.0, 7364.0, 4746.0, 2857.0, 1695.0, 1077.0, 691.0, 396.0, 217.0, 130.0, 94.0, 48.0, 28.0, 21.0, 16.0, 4.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.0693359375, -1.0381698608398438, -1.0070037841796875, -0.9758377075195312, -0.944671630859375, -0.9135055541992188, -0.8823394775390625, -0.8511734008789062, -0.82000732421875, -0.7888412475585938, -0.7576751708984375, -0.7265090942382812, -0.695343017578125, -0.6641769409179688, -0.6330108642578125, -0.6018447875976562, -0.5706787109375, -0.5395126342773438, -0.5083465576171875, -0.47718048095703125, -0.446014404296875, -0.41484832763671875, -0.3836822509765625, -0.35251617431640625, -0.32135009765625, -0.29018402099609375, -0.2590179443359375, -0.22785186767578125, -0.196685791015625, -0.16551971435546875, -0.1343536376953125, -0.10318756103515625, -0.072021484375, -0.04085540771484375, -0.0096893310546875, 0.02147674560546875, 0.052642822265625, 0.08380889892578125, 0.1149749755859375, 0.14614105224609375, 0.17730712890625, 0.20847320556640625, 0.2396392822265625, 0.27080535888671875, 0.301971435546875, 0.33313751220703125, 0.3643035888671875, 0.39546966552734375, 0.4266357421875, 0.45780181884765625, 0.4889678955078125, 0.5201339721679688, 0.551300048828125, 0.5824661254882812, 0.6136322021484375, 0.6447982788085938, 0.67596435546875, 0.7071304321289062, 0.7382965087890625, 0.7694625854492188, 0.800628662109375, 0.8317947387695312, 0.8629608154296875, 0.8941268920898438, 0.92529296875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 3.0, 9.0, 7.0, 13.0, 10.0, 19.0, 14.0, 21.0, 14.0, 16.0, 20.0, 20.0, 23.0, 25.0, 37.0, 24.0, 39.0, 31.0, 36.0, 32.0, 36.0, 47.0, 38.0, 40.0, 34.0, 45.0, 32.0, 35.0, 29.0, 18.0, 35.0, 30.0, 14.0, 26.0, 17.0, 14.0, 10.0, 19.0, 12.0, 5.0, 6.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.00390625, -0.969512939453125, -0.93511962890625, -0.900726318359375, -0.8663330078125, -0.831939697265625, -0.79754638671875, -0.763153076171875, -0.728759765625, -0.694366455078125, -0.65997314453125, -0.625579833984375, -0.5911865234375, -0.556793212890625, -0.52239990234375, -0.488006591796875, -0.45361328125, -0.419219970703125, -0.38482666015625, -0.350433349609375, -0.3160400390625, -0.281646728515625, -0.24725341796875, -0.212860107421875, -0.178466796875, -0.144073486328125, -0.10968017578125, -0.075286865234375, -0.0408935546875, -0.006500244140625, 0.02789306640625, 0.062286376953125, 0.0966796875, 0.131072998046875, 0.16546630859375, 0.199859619140625, 0.2342529296875, 0.268646240234375, 0.30303955078125, 0.337432861328125, 0.371826171875, 0.406219482421875, 0.44061279296875, 0.475006103515625, 0.5093994140625, 0.543792724609375, 0.57818603515625, 0.612579345703125, 0.64697265625, 0.681365966796875, 0.71575927734375, 0.750152587890625, 0.7845458984375, 0.818939208984375, 0.85333251953125, 0.887725830078125, 0.922119140625, 0.956512451171875, 0.99090576171875, 1.025299072265625, 1.0596923828125, 1.094085693359375, 1.12847900390625, 1.162872314453125, 1.197265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 0.0, 9.0, 4.0, 9.0, 13.0, 26.0, 39.0, 72.0, 82.0, 121.0, 177.0, 266.0, 477.0, 676.0, 978.0, 1503.0, 2389.0, 3548.0, 5526.0, 8398.0, 12473.0, 18010.0, 26113.0, 36334.0, 48920.0, 63210.0, 77698.0, 89308.0, 97870.0, 99361.0, 95435.0, 84868.0, 71558.0, 57634.0, 43627.0, 32365.0, 22577.0, 15850.0, 10575.0, 7127.0, 4665.0, 2954.0, 2017.0, 1277.0, 825.0, 554.0, 376.0, 219.0, 164.0, 90.0, 83.0, 33.0, 30.0, 20.0, 6.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0], "bins": [-0.88916015625, -0.86163330078125, -0.8341064453125, -0.80657958984375, -0.779052734375, -0.75152587890625, -0.7239990234375, -0.69647216796875, -0.6689453125, -0.64141845703125, -0.6138916015625, -0.58636474609375, -0.558837890625, -0.53131103515625, -0.5037841796875, -0.47625732421875, -0.44873046875, -0.42120361328125, -0.3936767578125, -0.36614990234375, -0.338623046875, -0.31109619140625, -0.2835693359375, -0.25604248046875, -0.228515625, -0.20098876953125, -0.1734619140625, -0.14593505859375, -0.118408203125, -0.09088134765625, -0.0633544921875, -0.03582763671875, -0.00830078125, 0.01922607421875, 0.0467529296875, 0.07427978515625, 0.101806640625, 0.12933349609375, 0.1568603515625, 0.18438720703125, 0.2119140625, 0.23944091796875, 0.2669677734375, 0.29449462890625, 0.322021484375, 0.34954833984375, 0.3770751953125, 0.40460205078125, 0.43212890625, 0.45965576171875, 0.4871826171875, 0.51470947265625, 0.542236328125, 0.56976318359375, 0.5972900390625, 0.62481689453125, 0.65234375, 0.67987060546875, 0.7073974609375, 0.73492431640625, 0.762451171875, 0.78997802734375, 0.8175048828125, 0.84503173828125, 0.87255859375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 5.0, 8.0, 9.0, 6.0, 10.0, 15.0, 18.0, 18.0, 26.0, 32.0, 27.0, 33.0, 34.0, 35.0, 38.0, 47.0, 41.0, 43.0, 39.0, 51.0, 46.0, 33.0, 35.0, 25.0, 42.0, 33.0, 27.0, 24.0, 31.0, 25.0, 22.0, 24.0, 21.0, 9.0, 8.0, 8.0, 12.0, 9.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7353515625, -0.7119598388671875, -0.688568115234375, -0.6651763916015625, -0.64178466796875, -0.6183929443359375, -0.595001220703125, -0.5716094970703125, -0.5482177734375, -0.5248260498046875, -0.501434326171875, -0.4780426025390625, -0.45465087890625, -0.4312591552734375, -0.407867431640625, -0.3844757080078125, -0.361083984375, -0.3376922607421875, -0.314300537109375, -0.2909088134765625, -0.26751708984375, -0.2441253662109375, -0.220733642578125, -0.1973419189453125, -0.1739501953125, -0.1505584716796875, -0.127166748046875, -0.1037750244140625, -0.08038330078125, -0.0569915771484375, -0.033599853515625, -0.0102081298828125, 0.01318359375, 0.0365753173828125, 0.059967041015625, 0.0833587646484375, 0.10675048828125, 0.1301422119140625, 0.153533935546875, 0.1769256591796875, 0.2003173828125, 0.2237091064453125, 0.247100830078125, 0.2704925537109375, 0.29388427734375, 0.3172760009765625, 0.340667724609375, 0.3640594482421875, 0.387451171875, 0.4108428955078125, 0.434234619140625, 0.4576263427734375, 0.48101806640625, 0.5044097900390625, 0.527801513671875, 0.5511932373046875, 0.5745849609375, 0.5979766845703125, 0.621368408203125, 0.6447601318359375, 0.66815185546875, 0.6915435791015625, 0.714935302734375, 0.7383270263671875, 0.76171875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 11.0, 26.0, 23.0, 34.0, 67.0, 91.0, 140.0, 204.0, 316.0, 442.0, 720.0, 1123.0, 1711.0, 2578.0, 4119.0, 6639.0, 10492.0, 16850.0, 27204.0, 43180.0, 67381.0, 97196.0, 128152.0, 145784.0, 140292.0, 115908.0, 84659.0, 56949.0, 36088.0, 22574.0, 13903.0, 8576.0, 5370.0, 3394.0, 2155.0, 1455.0, 917.0, 654.0, 435.0, 239.0, 160.0, 125.0, 72.0, 58.0, 33.0, 16.0, 18.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.65234375, -0.6318283081054688, -0.6113128662109375, -0.5907974243164062, -0.570281982421875, -0.5497665405273438, -0.5292510986328125, -0.5087356567382812, -0.48822021484375, -0.46770477294921875, -0.4471893310546875, -0.42667388916015625, -0.406158447265625, -0.38564300537109375, -0.3651275634765625, -0.34461212158203125, -0.3240966796875, -0.30358123779296875, -0.2830657958984375, -0.26255035400390625, -0.242034912109375, -0.22151947021484375, -0.2010040283203125, -0.18048858642578125, -0.15997314453125, -0.13945770263671875, -0.1189422607421875, -0.09842681884765625, -0.077911376953125, -0.05739593505859375, -0.0368804931640625, -0.01636505126953125, 0.004150390625, 0.02466583251953125, 0.0451812744140625, 0.06569671630859375, 0.086212158203125, 0.10672760009765625, 0.1272430419921875, 0.14775848388671875, 0.16827392578125, 0.18878936767578125, 0.2093048095703125, 0.22982025146484375, 0.250335693359375, 0.27085113525390625, 0.2913665771484375, 0.31188201904296875, 0.3323974609375, 0.35291290283203125, 0.3734283447265625, 0.39394378662109375, 0.414459228515625, 0.43497467041015625, 0.4554901123046875, 0.47600555419921875, 0.49652099609375, 0.5170364379882812, 0.5375518798828125, 0.5580673217773438, 0.578582763671875, 0.5990982055664062, 0.6196136474609375, 0.6401290893554688, 0.66064453125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 7.0, 9.0, 7.0, 11.0, 12.0, 17.0, 16.0, 21.0, 30.0, 35.0, 46.0, 53.0, 49.0, 44.0, 57.0, 58.0, 58.0, 58.0, 49.0, 57.0, 52.0, 35.0, 46.0, 29.0, 26.0, 18.0, 16.0, 14.0, 11.0, 15.0, 11.0, 4.0, 4.0, 4.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.069110870361328e-05, -6.841868162155151e-05, -6.614625453948975e-05, -6.387382745742798e-05, -6.160140037536621e-05, -5.932897329330444e-05, -5.7056546211242676e-05, -5.478411912918091e-05, -5.251169204711914e-05, -5.023926496505737e-05, -4.7966837882995605e-05, -4.569441080093384e-05, -4.342198371887207e-05, -4.11495566368103e-05, -3.8877129554748535e-05, -3.660470247268677e-05, -3.4332275390625e-05, -3.205984830856323e-05, -2.9787421226501465e-05, -2.7514994144439697e-05, -2.524256706237793e-05, -2.2970139980316162e-05, -2.0697712898254395e-05, -1.8425285816192627e-05, -1.615285873413086e-05, -1.3880431652069092e-05, -1.1608004570007324e-05, -9.335577487945557e-06, -7.063150405883789e-06, -4.7907233238220215e-06, -2.518296241760254e-06, -2.4586915969848633e-07, 2.0265579223632812e-06, 4.298985004425049e-06, 6.571412086486816e-06, 8.843839168548584e-06, 1.1116266250610352e-05, 1.3388693332672119e-05, 1.5661120414733887e-05, 1.7933547496795654e-05, 2.0205974578857422e-05, 2.247840166091919e-05, 2.4750828742980957e-05, 2.7023255825042725e-05, 2.9295682907104492e-05, 3.156810998916626e-05, 3.384053707122803e-05, 3.6112964153289795e-05, 3.838539123535156e-05, 4.065781831741333e-05, 4.29302453994751e-05, 4.5202672481536865e-05, 4.747509956359863e-05, 4.97475266456604e-05, 5.201995372772217e-05, 5.4292380809783936e-05, 5.65648078918457e-05, 5.883723497390747e-05, 6.110966205596924e-05, 6.3382089138031e-05, 6.565451622009277e-05, 6.792694330215454e-05, 7.019937038421631e-05, 7.247179746627808e-05, 7.474422454833984e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 3.0, 15.0, 19.0, 29.0, 46.0, 42.0, 90.0, 113.0, 141.0, 227.0, 312.0, 487.0, 711.0, 1077.0, 1674.0, 2668.0, 4250.0, 6433.0, 10284.0, 16137.0, 24976.0, 38845.0, 57677.0, 81109.0, 107378.0, 127329.0, 132846.0, 120742.0, 98360.0, 72531.0, 49906.0, 32907.0, 21387.0, 13490.0, 8662.0, 5562.0, 3464.0, 2240.0, 1455.0, 980.0, 598.0, 416.0, 283.0, 193.0, 122.0, 95.0, 65.0, 56.0, 35.0, 22.0, 21.0, 10.0, 10.0, 10.0, 4.0, 4.0, 2.0, 5.0], "bins": [-0.60009765625, -0.5815277099609375, -0.562957763671875, -0.5443878173828125, -0.52581787109375, -0.5072479248046875, -0.488677978515625, -0.4701080322265625, -0.4515380859375, -0.4329681396484375, -0.414398193359375, -0.3958282470703125, -0.37725830078125, -0.3586883544921875, -0.340118408203125, -0.3215484619140625, -0.302978515625, -0.2844085693359375, -0.265838623046875, -0.2472686767578125, -0.22869873046875, -0.2101287841796875, -0.191558837890625, -0.1729888916015625, -0.1544189453125, -0.1358489990234375, -0.117279052734375, -0.0987091064453125, -0.08013916015625, -0.0615692138671875, -0.042999267578125, -0.0244293212890625, -0.005859375, 0.0127105712890625, 0.031280517578125, 0.0498504638671875, 0.06842041015625, 0.0869903564453125, 0.105560302734375, 0.1241302490234375, 0.1427001953125, 0.1612701416015625, 0.179840087890625, 0.1984100341796875, 0.21697998046875, 0.2355499267578125, 0.254119873046875, 0.2726898193359375, 0.291259765625, 0.3098297119140625, 0.328399658203125, 0.3469696044921875, 0.36553955078125, 0.3841094970703125, 0.402679443359375, 0.4212493896484375, 0.4398193359375, 0.4583892822265625, 0.476959228515625, 0.4955291748046875, 0.51409912109375, 0.5326690673828125, 0.551239013671875, 0.5698089599609375, 0.58837890625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 8.0, 18.0, 18.0, 21.0, 19.0, 27.0, 23.0, 30.0, 37.0, 37.0, 47.0, 44.0, 58.0, 50.0, 42.0, 56.0, 39.0, 45.0, 51.0, 28.0, 35.0, 42.0, 40.0, 33.0, 28.0, 15.0, 19.0, 15.0, 13.0, 17.0, 12.0, 4.0, 5.0, 3.0, 1.0, 0.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2127685546875, -0.20659637451171875, -0.2004241943359375, -0.19425201416015625, -0.188079833984375, -0.18190765380859375, -0.1757354736328125, -0.16956329345703125, -0.16339111328125, -0.15721893310546875, -0.1510467529296875, -0.14487457275390625, -0.138702392578125, -0.13253021240234375, -0.1263580322265625, -0.12018585205078125, -0.114013671875, -0.10784149169921875, -0.1016693115234375, -0.09549713134765625, -0.089324951171875, -0.08315277099609375, -0.0769805908203125, -0.07080841064453125, -0.06463623046875, -0.05846405029296875, -0.0522918701171875, -0.04611968994140625, -0.039947509765625, -0.03377532958984375, -0.0276031494140625, -0.02143096923828125, -0.0152587890625, -0.00908660888671875, -0.0029144287109375, 0.00325775146484375, 0.009429931640625, 0.01560211181640625, 0.0217742919921875, 0.02794647216796875, 0.03411865234375, 0.04029083251953125, 0.0464630126953125, 0.05263519287109375, 0.058807373046875, 0.06497955322265625, 0.0711517333984375, 0.07732391357421875, 0.08349609375, 0.08966827392578125, 0.0958404541015625, 0.10201263427734375, 0.108184814453125, 0.11435699462890625, 0.1205291748046875, 0.12670135498046875, 0.13287353515625, 0.13904571533203125, 0.1452178955078125, 0.15139007568359375, 0.157562255859375, 0.16373443603515625, 0.1699066162109375, 0.17607879638671875, 0.1822509765625]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 4.0, 5.0, 10.0, 22.0, 28.0, 24.0, 28.0, 32.0, 47.0, 38.0, 48.0, 46.0, 44.0, 66.0, 51.0, 47.0, 59.0, 63.0, 50.0, 51.0, 39.0, 27.0, 36.0, 18.0, 14.0, 20.0, 11.0, 7.0, 13.0, 7.0, 9.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67812180519104, -1.6232253313064575, -1.568328857421875, -1.513432264328003, -1.4585357904434204, -1.403639316558838, -1.3487428426742554, -1.2938463687896729, -1.2389497756958008, -1.1840533018112183, -1.1291568279266357, -1.0742602348327637, -1.0193637609481812, -0.9644672870635986, -0.9095708131790161, -0.8546743392944336, -0.7997778654098511, -0.7448813915252686, -0.6899848580360413, -0.6350883841514587, -0.5801918506622314, -0.5252953767776489, -0.4703989028930664, -0.4155023992061615, -0.3606058955192566, -0.3057093918323517, -0.2508128881454468, -0.19591641426086426, -0.14101991057395935, -0.08612340688705444, -0.031226933002471924, 0.023669570684432983, 0.07856607437133789, 0.1334625780582428, 0.1883590668439865, 0.24325555562973022, 0.29815205931663513, 0.35304856300354004, 0.40794503688812256, 0.46284154057502747, 0.5177380442619324, 0.5726345181465149, 0.6275310516357422, 0.6824275255203247, 0.7373239994049072, 0.7922205328941345, 0.847117006778717, 0.9020135402679443, 0.9569100141525269, 1.0118064880371094, 1.066702961921692, 1.1215994358062744, 1.1764960289001465, 1.231392502784729, 1.2862889766693115, 1.341185450553894, 1.3960819244384766, 1.450978398323059, 1.5058748722076416, 1.5607714653015137, 1.6156679391860962, 1.6705644130706787, 1.7254608869552612, 1.7803573608398438, 1.8352539539337158]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 13.0, 9.0, 8.0, 8.0, 19.0, 20.0, 25.0, 13.0, 19.0, 25.0, 33.0, 29.0, 29.0, 41.0, 40.0, 35.0, 44.0, 31.0, 44.0, 44.0, 41.0, 44.0, 41.0, 37.0, 31.0, 44.0, 33.0, 25.0, 40.0, 22.0, 26.0, 19.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1000877618789673, -1.062829852104187, -1.0255720615386963, -0.988314151763916, -0.9510563015937805, -0.913798451423645, -0.8765405416488647, -0.8392826914787292, -0.8020248413085938, -0.7647669911384583, -0.7275091409683228, -0.6902512311935425, -0.652993381023407, -0.6157355308532715, -0.5784776210784912, -0.5412197709083557, -0.5039619207382202, -0.4667040705680847, -0.42944619059562683, -0.39218831062316895, -0.35493046045303345, -0.31767261028289795, -0.28041473031044006, -0.24315685033798218, -0.20589900016784668, -0.16864113509655, -0.1313832700252533, -0.0941254049539566, -0.05686753988265991, -0.01960967481136322, 0.01764819025993347, 0.05490607023239136, 0.0921638011932373, 0.129421666264534, 0.1666795313358307, 0.20393739640712738, 0.24119526147842407, 0.27845311164855957, 0.31571099162101746, 0.35296887159347534, 0.39022672176361084, 0.42748457193374634, 0.4647424519062042, 0.5020003318786621, 0.5392581820487976, 0.5765160322189331, 0.6137739419937134, 0.6510317921638489, 0.6882896423339844, 0.7255474925041199, 0.7628053426742554, 0.8000632524490356, 0.8373211026191711, 0.8745789527893066, 0.9118368625640869, 0.9490947127342224, 0.9863525629043579, 1.0236104726791382, 1.060868263244629, 1.0981261730194092, 1.1353840827941895, 1.1726418733596802, 1.2098997831344604, 1.2471575736999512, 1.2844154834747314]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 5.0, 13.0, 14.0, 29.0, 27.0, 59.0, 82.0, 137.0, 238.0, 369.0, 606.0, 1014.0, 1689.0, 2746.0, 4712.0, 7934.0, 13483.0, 23605.0, 40828.0, 69666.0, 118268.0, 195329.0, 304290.0, 438709.0, 559336.0, 611423.0, 561969.0, 443387.0, 306077.0, 197396.0, 120363.0, 71279.0, 41336.0, 24236.0, 13786.0, 8127.0, 4683.0, 2835.0, 1607.0, 979.0, 621.0, 346.0, 234.0, 141.0, 97.0, 76.0, 37.0, 18.0, 17.0, 16.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1665802001953125, -1.124176025390625, -1.0817718505859375, -1.03936767578125, -0.9969635009765625, -0.954559326171875, -0.9121551513671875, -0.8697509765625, -0.8273468017578125, -0.784942626953125, -0.7425384521484375, -0.70013427734375, -0.6577301025390625, -0.615325927734375, -0.5729217529296875, -0.530517578125, -0.4881134033203125, -0.445709228515625, -0.4033050537109375, -0.36090087890625, -0.3184967041015625, -0.276092529296875, -0.2336883544921875, -0.1912841796875, -0.1488800048828125, -0.106475830078125, -0.0640716552734375, -0.02166748046875, 0.0207366943359375, 0.063140869140625, 0.1055450439453125, 0.14794921875, 0.1903533935546875, 0.232757568359375, 0.2751617431640625, 0.31756591796875, 0.3599700927734375, 0.402374267578125, 0.4447784423828125, 0.4871826171875, 0.5295867919921875, 0.571990966796875, 0.6143951416015625, 0.65679931640625, 0.6992034912109375, 0.741607666015625, 0.7840118408203125, 0.826416015625, 0.8688201904296875, 0.911224365234375, 0.9536285400390625, 0.99603271484375, 1.0384368896484375, 1.080841064453125, 1.1232452392578125, 1.1656494140625, 1.2080535888671875, 1.250457763671875, 1.2928619384765625, 1.33526611328125, 1.3776702880859375, 1.420074462890625, 1.4624786376953125, 1.5048828125]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 6.0, 3.0, 6.0, 5.0, 15.0, 11.0, 7.0, 11.0, 12.0, 10.0, 17.0, 20.0, 25.0, 16.0, 25.0, 26.0, 22.0, 30.0, 37.0, 35.0, 34.0, 41.0, 30.0, 39.0, 36.0, 40.0, 40.0, 32.0, 42.0, 40.0, 38.0, 29.0, 31.0, 32.0, 26.0, 19.0, 24.0, 14.0, 11.0, 13.0, 14.0, 12.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.833984375, -0.8059539794921875, -0.777923583984375, -0.7498931884765625, -0.72186279296875, -0.6938323974609375, -0.665802001953125, -0.6377716064453125, -0.6097412109375, -0.5817108154296875, -0.553680419921875, -0.5256500244140625, -0.49761962890625, -0.4695892333984375, -0.441558837890625, -0.4135284423828125, -0.385498046875, -0.3574676513671875, -0.329437255859375, -0.3014068603515625, -0.27337646484375, -0.2453460693359375, -0.217315673828125, -0.1892852783203125, -0.1612548828125, -0.1332244873046875, -0.105194091796875, -0.0771636962890625, -0.04913330078125, -0.0211029052734375, 0.006927490234375, 0.0349578857421875, 0.06298828125, 0.0910186767578125, 0.119049072265625, 0.1470794677734375, 0.17510986328125, 0.2031402587890625, 0.231170654296875, 0.2592010498046875, 0.2872314453125, 0.3152618408203125, 0.343292236328125, 0.3713226318359375, 0.39935302734375, 0.4273834228515625, 0.455413818359375, 0.4834442138671875, 0.511474609375, 0.5395050048828125, 0.567535400390625, 0.5955657958984375, 0.62359619140625, 0.6516265869140625, 0.679656982421875, 0.7076873779296875, 0.7357177734375, 0.7637481689453125, 0.791778564453125, 0.8198089599609375, 0.84783935546875, 0.8758697509765625, 0.903900146484375, 0.9319305419921875, 0.9599609375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 3.0, 9.0, 13.0, 14.0, 22.0, 28.0, 48.0, 107.0, 162.0, 224.0, 382.0, 589.0, 933.0, 1483.0, 2336.0, 3826.0, 6323.0, 10166.0, 16238.0, 26151.0, 41231.0, 65015.0, 100398.0, 149506.0, 216368.0, 296933.0, 380937.0, 449834.0, 482505.0, 464970.0, 409577.0, 326725.0, 244496.0, 173521.0, 116501.0, 75851.0, 49122.0, 30594.0, 19613.0, 11908.0, 7454.0, 4564.0, 2829.0, 1779.0, 1123.0, 702.0, 443.0, 246.0, 170.0, 119.0, 77.0, 40.0, 32.0, 24.0, 17.0, 5.0, 6.0, 3.0, 1.0, 1.0], "bins": [-1.263671875, -1.225006103515625, -1.18634033203125, -1.147674560546875, -1.1090087890625, -1.070343017578125, -1.03167724609375, -0.993011474609375, -0.954345703125, -0.915679931640625, -0.87701416015625, -0.838348388671875, -0.7996826171875, -0.761016845703125, -0.72235107421875, -0.683685302734375, -0.64501953125, -0.606353759765625, -0.56768798828125, -0.529022216796875, -0.4903564453125, -0.451690673828125, -0.41302490234375, -0.374359130859375, -0.335693359375, -0.297027587890625, -0.25836181640625, -0.219696044921875, -0.1810302734375, -0.142364501953125, -0.10369873046875, -0.065032958984375, -0.0263671875, 0.012298583984375, 0.05096435546875, 0.089630126953125, 0.1282958984375, 0.166961669921875, 0.20562744140625, 0.244293212890625, 0.282958984375, 0.321624755859375, 0.36029052734375, 0.398956298828125, 0.4376220703125, 0.476287841796875, 0.51495361328125, 0.553619384765625, 0.59228515625, 0.630950927734375, 0.66961669921875, 0.708282470703125, 0.7469482421875, 0.785614013671875, 0.82427978515625, 0.862945556640625, 0.901611328125, 0.940277099609375, 0.97894287109375, 1.017608642578125, 1.0562744140625, 1.094940185546875, 1.13360595703125, 1.172271728515625, 1.2109375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 5.0, 9.0, 7.0, 12.0, 15.0, 10.0, 16.0, 27.0, 26.0, 39.0, 36.0, 45.0, 64.0, 79.0, 91.0, 106.0, 135.0, 119.0, 128.0, 166.0, 171.0, 160.0, 187.0, 192.0, 185.0, 195.0, 188.0, 213.0, 169.0, 189.0, 167.0, 148.0, 126.0, 105.0, 91.0, 82.0, 72.0, 68.0, 40.0, 35.0, 32.0, 25.0, 17.0, 18.0, 20.0, 11.0, 4.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.50634765625, -0.4912910461425781, -0.47623443603515625, -0.4611778259277344, -0.4461212158203125, -0.4310646057128906, -0.41600799560546875, -0.4009513854980469, -0.385894775390625, -0.3708381652832031, -0.35578155517578125, -0.3407249450683594, -0.3256683349609375, -0.3106117248535156, -0.29555511474609375, -0.2804985046386719, -0.26544189453125, -0.2503852844238281, -0.23532867431640625, -0.22027206420898438, -0.2052154541015625, -0.19015884399414062, -0.17510223388671875, -0.16004562377929688, -0.144989013671875, -0.12993240356445312, -0.11487579345703125, -0.09981918334960938, -0.0847625732421875, -0.06970596313476562, -0.05464935302734375, -0.039592742919921875, -0.0245361328125, -0.009479522705078125, 0.00557708740234375, 0.020633697509765625, 0.0356903076171875, 0.050746917724609375, 0.06580352783203125, 0.08086013793945312, 0.095916748046875, 0.11097335815429688, 0.12602996826171875, 0.14108657836914062, 0.1561431884765625, 0.17119979858398438, 0.18625640869140625, 0.20131301879882812, 0.21636962890625, 0.23142623901367188, 0.24648284912109375, 0.2615394592285156, 0.2765960693359375, 0.2916526794433594, 0.30670928955078125, 0.3217658996582031, 0.336822509765625, 0.3518791198730469, 0.36693572998046875, 0.3819923400878906, 0.3970489501953125, 0.4121055603027344, 0.42716217041015625, 0.4422187805175781, 0.457275390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 7.0, 5.0, 18.0, 17.0, 16.0, 16.0, 23.0, 26.0, 44.0, 34.0, 49.0, 50.0, 45.0, 51.0, 60.0, 58.0, 46.0, 55.0, 57.0, 40.0, 46.0, 46.0, 31.0, 22.0, 35.0, 25.0, 19.0, 8.0, 10.0, 9.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8614811897277832, -1.8005732297897339, -1.7396652698516846, -1.6787573099136353, -1.617849349975586, -1.5569415092468262, -1.4960334300994873, -1.4351255893707275, -1.3742176294326782, -1.313309669494629, -1.2524017095565796, -1.1914937496185303, -1.130585789680481, -1.0696778297424316, -1.0087699890136719, -0.9478620290756226, -0.8869540095329285, -0.8260460495948792, -0.7651380896568298, -0.7042301893234253, -0.643322229385376, -0.5824142694473267, -0.5215063095092773, -0.4605983793735504, -0.3996904194355011, -0.3387824594974518, -0.27787452936172485, -0.21696656942367554, -0.15605862438678741, -0.09515067934989929, -0.034242719411849976, 0.026665210723876953, 0.08757317066192627, 0.1484811156988144, 0.20938906073570251, 0.27029702067375183, 0.33120495080947876, 0.3921129107475281, 0.4530208706855774, 0.5139287710189819, 0.5748367309570312, 0.6357446908950806, 0.6966526508331299, 0.7575606107711792, 0.8184685111045837, 0.8793764710426331, 0.9402844309806824, 1.001192331314087, 1.0621004104614258, 1.123008370399475, 1.1839163303375244, 1.2448242902755737, 1.305732250213623, 1.3666400909423828, 1.4275481700897217, 1.4884560108184814, 1.5493639707565308, 1.61027193069458, 1.6711798906326294, 1.7320878505706787, 1.792995810508728, 1.8539037704467773, 1.914811611175537, 1.9757195711135864, 2.0366275310516357]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 11.0, 9.0, 7.0, 10.0, 12.0, 13.0, 19.0, 27.0, 17.0, 26.0, 37.0, 43.0, 49.0, 52.0, 42.0, 40.0, 48.0, 55.0, 45.0, 52.0, 41.0, 47.0, 39.0, 44.0, 46.0, 25.0, 23.0, 27.0, 16.0, 24.0, 17.0, 8.0, 7.0, 6.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4232420921325684, -1.3767975568771362, -1.3303531408309937, -1.2839086055755615, -1.237464189529419, -1.1910196542739868, -1.1445751190185547, -1.098130702972412, -1.0516862869262695, -1.0052417516708374, -0.9587973356246948, -0.9123528003692627, -0.8659083843231201, -0.819463849067688, -0.7730193734169006, -0.7265748977661133, -0.6801303625106812, -0.6336858868598938, -0.5872414112091064, -0.5407968759536743, -0.49435243010520935, -0.447907954454422, -0.40146344900131226, -0.3550189733505249, -0.30857449769973755, -0.2621300220489502, -0.21568553149700165, -0.1692410409450531, -0.12279656529426575, -0.0763520896434784, -0.029907584190368652, 0.0165368914604187, 0.06298136711120605, 0.109425850212574, 0.15587033331394196, 0.2023148238658905, 0.24875929951667786, 0.2952037751674652, 0.34164828062057495, 0.3880927562713623, 0.43453723192214966, 0.480981707572937, 0.5274261832237244, 0.5738706588745117, 0.6203151941299438, 0.6667596101760864, 0.7132041454315186, 0.7596486210823059, 0.8060930967330933, 0.8525375723838806, 0.898982048034668, 0.9454265832901001, 0.9918709993362427, 1.0383155345916748, 1.0847599506378174, 1.1312044858932495, 1.1776490211486816, 1.2240935564041138, 1.2705379724502563, 1.3169825077056885, 1.363426923751831, 1.4098714590072632, 1.4563159942626953, 1.502760410308838, 1.5492048263549805]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 11.0, 12.0, 19.0, 29.0, 50.0, 48.0, 107.0, 147.0, 221.0, 325.0, 534.0, 786.0, 1106.0, 1828.0, 3008.0, 4740.0, 7689.0, 12914.0, 21252.0, 35628.0, 58930.0, 94956.0, 143121.0, 179111.0, 166344.0, 120305.0, 76739.0, 46917.0, 27907.0, 16792.0, 10252.0, 6125.0, 3879.0, 2443.0, 1487.0, 926.0, 641.0, 441.0, 263.0, 177.0, 102.0, 81.0, 55.0, 31.0, 19.0, 21.0, 11.0, 2.0, 8.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.35888671875, -0.3479347229003906, -0.33698272705078125, -0.3260307312011719, -0.3150787353515625, -0.3041267395019531, -0.29317474365234375, -0.2822227478027344, -0.271270751953125, -0.2603187561035156, -0.24936676025390625, -0.23841476440429688, -0.2274627685546875, -0.21651077270507812, -0.20555877685546875, -0.19460678100585938, -0.18365478515625, -0.17270278930664062, -0.16175079345703125, -0.15079879760742188, -0.1398468017578125, -0.12889480590820312, -0.11794281005859375, -0.10699081420898438, -0.096038818359375, -0.08508682250976562, -0.07413482666015625, -0.06318283081054688, -0.0522308349609375, -0.041278839111328125, -0.03032684326171875, -0.019374847412109375, -0.0084228515625, 0.002529144287109375, 0.01348114013671875, 0.024433135986328125, 0.0353851318359375, 0.046337127685546875, 0.05728912353515625, 0.06824111938476562, 0.079193115234375, 0.09014511108398438, 0.10109710693359375, 0.11204910278320312, 0.1230010986328125, 0.13395309448242188, 0.14490509033203125, 0.15585708618164062, 0.16680908203125, 0.17776107788085938, 0.18871307373046875, 0.19966506958007812, 0.2106170654296875, 0.22156906127929688, 0.23252105712890625, 0.24347305297851562, 0.254425048828125, 0.2653770446777344, 0.27632904052734375, 0.2872810363769531, 0.2982330322265625, 0.3091850280761719, 0.32013702392578125, 0.3310890197753906, 0.342041015625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 6.0, 4.0, 10.0, 9.0, 12.0, 13.0, 14.0, 15.0, 33.0, 17.0, 29.0, 49.0, 27.0, 40.0, 44.0, 51.0, 38.0, 33.0, 51.0, 46.0, 45.0, 47.0, 44.0, 52.0, 43.0, 42.0, 35.0, 27.0, 23.0, 16.0, 15.0, 17.0, 11.0, 7.0, 10.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4326171875, -1.384765625, -1.3369140625, -1.2890625, -1.2412109375, -1.193359375, -1.1455078125, -1.09765625, -1.0498046875, -1.001953125, -0.9541015625, -0.90625, -0.8583984375, -0.810546875, -0.7626953125, -0.71484375, -0.6669921875, -0.619140625, -0.5712890625, -0.5234375, -0.4755859375, -0.427734375, -0.3798828125, -0.33203125, -0.2841796875, -0.236328125, -0.1884765625, -0.140625, -0.0927734375, -0.044921875, 0.0029296875, 0.05078125, 0.0986328125, 0.146484375, 0.1943359375, 0.2421875, 0.2900390625, 0.337890625, 0.3857421875, 0.43359375, 0.4814453125, 0.529296875, 0.5771484375, 0.625, 0.6728515625, 0.720703125, 0.7685546875, 0.81640625, 0.8642578125, 0.912109375, 0.9599609375, 1.0078125, 1.0556640625, 1.103515625, 1.1513671875, 1.19921875, 1.2470703125, 1.294921875, 1.3427734375, 1.390625, 1.4384765625, 1.486328125, 1.5341796875, 1.58203125, 1.6298828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 12.0, 8.0, 7.0, 12.0, 13.0, 19.0, 25.0, 48.0, 63.0, 100.0, 141.0, 213.0, 288.0, 442.0, 691.0, 1057.0, 1655.0, 2696.0, 4574.0, 8210.0, 14611.0, 27187.0, 50959.0, 95104.0, 166356.0, 227233.0, 192001.0, 115673.0, 63178.0, 33557.0, 18064.0, 9982.0, 5562.0, 3213.0, 2044.0, 1256.0, 772.0, 470.0, 340.0, 213.0, 144.0, 103.0, 66.0, 62.0, 44.0, 18.0, 19.0, 14.0, 12.0, 9.0, 6.0, 6.0, 1.0, 3.0, 1.0, 4.0, 1.0], "bins": [-0.45361328125, -0.439727783203125, -0.42584228515625, -0.411956787109375, -0.3980712890625, -0.384185791015625, -0.37030029296875, -0.356414794921875, -0.342529296875, -0.328643798828125, -0.31475830078125, -0.300872802734375, -0.2869873046875, -0.273101806640625, -0.25921630859375, -0.245330810546875, -0.2314453125, -0.217559814453125, -0.20367431640625, -0.189788818359375, -0.1759033203125, -0.162017822265625, -0.14813232421875, -0.134246826171875, -0.120361328125, -0.106475830078125, -0.09259033203125, -0.078704833984375, -0.0648193359375, -0.050933837890625, -0.03704833984375, -0.023162841796875, -0.00927734375, 0.004608154296875, 0.01849365234375, 0.032379150390625, 0.0462646484375, 0.060150146484375, 0.07403564453125, 0.087921142578125, 0.101806640625, 0.115692138671875, 0.12957763671875, 0.143463134765625, 0.1573486328125, 0.171234130859375, 0.18511962890625, 0.199005126953125, 0.212890625, 0.226776123046875, 0.24066162109375, 0.254547119140625, 0.2684326171875, 0.282318115234375, 0.29620361328125, 0.310089111328125, 0.323974609375, 0.337860107421875, 0.35174560546875, 0.365631103515625, 0.3795166015625, 0.393402099609375, 0.40728759765625, 0.421173095703125, 0.43505859375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 6.0, 11.0, 7.0, 8.0, 8.0, 18.0, 25.0, 29.0, 26.0, 26.0, 29.0, 33.0, 32.0, 40.0, 38.0, 35.0, 37.0, 50.0, 53.0, 40.0, 53.0, 28.0, 35.0, 29.0, 38.0, 34.0, 29.0, 26.0, 19.0, 29.0, 19.0, 26.0, 13.0, 11.0, 9.0, 11.0, 4.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84814453125, -0.8212203979492188, -0.7942962646484375, -0.7673721313476562, -0.740447998046875, -0.7135238647460938, -0.6865997314453125, -0.6596755981445312, -0.63275146484375, -0.6058273315429688, -0.5789031982421875, -0.5519790649414062, -0.525054931640625, -0.49813079833984375, -0.4712066650390625, -0.44428253173828125, -0.4173583984375, -0.39043426513671875, -0.3635101318359375, -0.33658599853515625, -0.309661865234375, -0.28273773193359375, -0.2558135986328125, -0.22888946533203125, -0.20196533203125, -0.17504119873046875, -0.1481170654296875, -0.12119293212890625, -0.094268798828125, -0.06734466552734375, -0.0404205322265625, -0.01349639892578125, 0.013427734375, 0.04035186767578125, 0.0672760009765625, 0.09420013427734375, 0.121124267578125, 0.14804840087890625, 0.1749725341796875, 0.20189666748046875, 0.22882080078125, 0.25574493408203125, 0.2826690673828125, 0.30959320068359375, 0.336517333984375, 0.36344146728515625, 0.3903656005859375, 0.41728973388671875, 0.4442138671875, 0.47113800048828125, 0.4980621337890625, 0.5249862670898438, 0.551910400390625, 0.5788345336914062, 0.6057586669921875, 0.6326828002929688, 0.65960693359375, 0.6865310668945312, 0.7134552001953125, 0.7403793334960938, 0.767303466796875, 0.7942276000976562, 0.8211517333984375, 0.8480758666992188, 0.875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 10.0, 11.0, 13.0, 21.0, 18.0, 24.0, 37.0, 43.0, 63.0, 79.0, 85.0, 175.0, 235.0, 393.0, 629.0, 959.0, 1778.0, 3458.0, 7204.0, 18633.0, 66772.0, 420814.0, 425475.0, 67459.0, 18764.0, 7329.0, 3400.0, 1820.0, 1036.0, 588.0, 393.0, 236.0, 185.0, 97.0, 80.0, 62.0, 34.0, 28.0, 24.0, 18.0, 20.0, 10.0, 9.0, 7.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36279296875, -0.3502845764160156, -0.33777618408203125, -0.3252677917480469, -0.3127593994140625, -0.3002510070800781, -0.28774261474609375, -0.2752342224121094, -0.262725830078125, -0.2502174377441406, -0.23770904541015625, -0.22520065307617188, -0.2126922607421875, -0.20018386840820312, -0.18767547607421875, -0.17516708374023438, -0.16265869140625, -0.15015029907226562, -0.13764190673828125, -0.12513351440429688, -0.1126251220703125, -0.10011672973632812, -0.08760833740234375, -0.07509994506835938, -0.062591552734375, -0.050083160400390625, -0.03757476806640625, -0.025066375732421875, -0.0125579833984375, -4.9591064453125e-05, 0.01245880126953125, 0.024967193603515625, 0.0374755859375, 0.049983978271484375, 0.06249237060546875, 0.07500076293945312, 0.0875091552734375, 0.10001754760742188, 0.11252593994140625, 0.12503433227539062, 0.137542724609375, 0.15005111694335938, 0.16255950927734375, 0.17506790161132812, 0.1875762939453125, 0.20008468627929688, 0.21259307861328125, 0.22510147094726562, 0.23760986328125, 0.2501182556152344, 0.26262664794921875, 0.2751350402832031, 0.2876434326171875, 0.3001518249511719, 0.31266021728515625, 0.3251686096191406, 0.337677001953125, 0.3501853942871094, 0.36269378662109375, 0.3752021789550781, 0.3877105712890625, 0.4002189636230469, 0.41272735595703125, 0.4252357482910156, 0.437744140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 12.0, 14.0, 15.0, 18.0, 22.0, 41.0, 39.0, 47.0, 44.0, 61.0, 72.0, 62.0, 76.0, 60.0, 67.0, 48.0, 63.0, 47.0, 38.0, 33.0, 19.0, 24.0, 18.0, 17.0, 13.0, 5.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5914440155029297e-05, -1.5463680028915405e-05, -1.5012919902801514e-05, -1.4562159776687622e-05, -1.411139965057373e-05, -1.3660639524459839e-05, -1.3209879398345947e-05, -1.2759119272232056e-05, -1.2308359146118164e-05, -1.1857599020004272e-05, -1.1406838893890381e-05, -1.095607876777649e-05, -1.0505318641662598e-05, -1.0054558515548706e-05, -9.603798389434814e-06, -9.153038263320923e-06, -8.702278137207031e-06, -8.25151801109314e-06, -7.800757884979248e-06, -7.3499977588653564e-06, -6.899237632751465e-06, -6.448477506637573e-06, -5.997717380523682e-06, -5.54695725440979e-06, -5.0961971282958984e-06, -4.645437002182007e-06, -4.194676876068115e-06, -3.7439167499542236e-06, -3.293156623840332e-06, -2.8423964977264404e-06, -2.391636371612549e-06, -1.9408762454986572e-06, -1.4901161193847656e-06, -1.039355993270874e-06, -5.885958671569824e-07, -1.3783574104309082e-07, 3.129243850708008e-07, 7.636845111846924e-07, 1.214444637298584e-06, 1.6652047634124756e-06, 2.115964889526367e-06, 2.566725015640259e-06, 3.0174851417541504e-06, 3.468245267868042e-06, 3.919005393981934e-06, 4.369765520095825e-06, 4.820525646209717e-06, 5.271285772323608e-06, 5.7220458984375e-06, 6.172806024551392e-06, 6.623566150665283e-06, 7.074326276779175e-06, 7.525086402893066e-06, 7.975846529006958e-06, 8.42660665512085e-06, 8.877366781234741e-06, 9.328126907348633e-06, 9.778887033462524e-06, 1.0229647159576416e-05, 1.0680407285690308e-05, 1.11311674118042e-05, 1.158192753791809e-05, 1.2032687664031982e-05, 1.2483447790145874e-05, 1.2934207916259766e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 14.0, 10.0, 24.0, 30.0, 29.0, 39.0, 42.0, 60.0, 89.0, 146.0, 195.0, 269.0, 371.0, 540.0, 776.0, 1207.0, 1838.0, 2898.0, 4977.0, 8937.0, 17829.0, 40222.0, 100456.0, 249803.0, 332979.0, 164280.0, 63700.0, 26940.0, 12380.0, 6590.0, 3778.0, 2273.0, 1515.0, 1034.0, 663.0, 449.0, 341.0, 241.0, 177.0, 114.0, 95.0, 60.0, 43.0, 29.0, 18.0, 16.0, 9.0, 5.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28271484375, -0.2736701965332031, -0.26462554931640625, -0.2555809020996094, -0.2465362548828125, -0.23749160766601562, -0.22844696044921875, -0.21940231323242188, -0.210357666015625, -0.20131301879882812, -0.19226837158203125, -0.18322372436523438, -0.1741790771484375, -0.16513442993164062, -0.15608978271484375, -0.14704513549804688, -0.13800048828125, -0.12895584106445312, -0.11991119384765625, -0.11086654663085938, -0.1018218994140625, -0.09277725219726562, -0.08373260498046875, -0.07468795776367188, -0.065643310546875, -0.056598663330078125, -0.04755401611328125, -0.038509368896484375, -0.0294647216796875, -0.020420074462890625, -0.01137542724609375, -0.002330780029296875, 0.0067138671875, 0.015758514404296875, 0.02480316162109375, 0.033847808837890625, 0.0428924560546875, 0.051937103271484375, 0.06098175048828125, 0.07002639770507812, 0.079071044921875, 0.08811569213867188, 0.09716033935546875, 0.10620498657226562, 0.1152496337890625, 0.12429428100585938, 0.13333892822265625, 0.14238357543945312, 0.15142822265625, 0.16047286987304688, 0.16951751708984375, 0.17856216430664062, 0.1876068115234375, 0.19665145874023438, 0.20569610595703125, 0.21474075317382812, 0.223785400390625, 0.23283004760742188, 0.24187469482421875, 0.2509193420410156, 0.2599639892578125, 0.2690086364746094, 0.27805328369140625, 0.2870979309082031, 0.296142578125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 6.0, 10.0, 14.0, 24.0, 33.0, 49.0, 69.0, 109.0, 129.0, 151.0, 145.0, 98.0, 52.0, 37.0, 18.0, 12.0, 7.0, 4.0, 9.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08376884460449219, -0.08056259155273438, -0.07735633850097656, -0.07415008544921875, -0.07094383239746094, -0.06773757934570312, -0.06453132629394531, -0.0613250732421875, -0.05811882019042969, -0.054912567138671875, -0.05170631408691406, -0.04850006103515625, -0.04529380798339844, -0.042087554931640625, -0.03888130187988281, -0.035675048828125, -0.03246879577636719, -0.029262542724609375, -0.026056289672851562, -0.02285003662109375, -0.019643783569335938, -0.016437530517578125, -0.013231277465820312, -0.0100250244140625, -0.0068187713623046875, -0.003612518310546875, -0.0004062652587890625, 0.00279998779296875, 0.0060062408447265625, 0.009212493896484375, 0.012418746948242188, 0.015625, 0.018831253051757812, 0.022037506103515625, 0.025243759155273438, 0.02845001220703125, 0.03165626525878906, 0.034862518310546875, 0.03806877136230469, 0.0412750244140625, 0.04448127746582031, 0.047687530517578125, 0.05089378356933594, 0.05410003662109375, 0.05730628967285156, 0.060512542724609375, 0.06371879577636719, 0.066925048828125, 0.07013130187988281, 0.07333755493164062, 0.07654380798339844, 0.07975006103515625, 0.08295631408691406, 0.08616256713867188, 0.08936882019042969, 0.0925750732421875, 0.09578132629394531, 0.09898757934570312, 0.10219383239746094, 0.10540008544921875, 0.10860633850097656, 0.11181259155273438, 0.11501884460449219, 0.11822509765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 0.0, 1.0, 9.0, 3.0, 12.0, 12.0, 19.0, 14.0, 21.0, 27.0, 29.0, 42.0, 43.0, 47.0, 41.0, 52.0, 60.0, 60.0, 50.0, 56.0, 53.0, 54.0, 41.0, 49.0, 42.0, 23.0, 34.0, 24.0, 17.0, 16.0, 13.0, 8.0, 6.0, 8.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9357694387435913, -1.8736472129821777, -1.8115248680114746, -1.7494025230407715, -1.687280297279358, -1.6251580715179443, -1.5630357265472412, -1.500913381576538, -1.4387911558151245, -1.376668930053711, -1.3145465850830078, -1.2524242401123047, -1.1903020143508911, -1.1281797885894775, -1.0660574436187744, -1.0039350986480713, -0.9418128728866577, -0.8796905875205994, -0.817568302154541, -0.7554460167884827, -0.6933237314224243, -0.631201446056366, -0.5690791606903076, -0.5069568753242493, -0.4448345899581909, -0.38271230459213257, -0.3205900192260742, -0.25846773386001587, -0.19634544849395752, -0.13422316312789917, -0.07210087776184082, -0.00997859239578247, 0.05214381217956543, 0.11426609754562378, 0.17638838291168213, 0.23851066827774048, 0.30063295364379883, 0.3627552390098572, 0.4248775243759155, 0.4869998097419739, 0.5491220951080322, 0.6112443804740906, 0.6733666658401489, 0.7354889512062073, 0.7976112365722656, 0.859733521938324, 0.9218558073043823, 0.9839780926704407, 1.046100378036499, 1.1082227230072021, 1.1703449487686157, 1.2324671745300293, 1.2945895195007324, 1.3567118644714355, 1.4188340902328491, 1.4809563159942627, 1.5430786609649658, 1.605201005935669, 1.6673232316970825, 1.729445457458496, 1.7915678024291992, 1.8536901473999023, 1.915812373161316, 1.9779345989227295, 2.0400569438934326]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 9.0, 13.0, 5.0, 9.0, 9.0, 13.0, 12.0, 18.0, 29.0, 18.0, 27.0, 41.0, 40.0, 51.0, 52.0, 37.0, 46.0, 52.0, 50.0, 46.0, 47.0, 45.0, 48.0, 35.0, 46.0, 46.0, 25.0, 21.0, 31.0, 14.0, 19.0, 16.0, 10.0, 6.0, 6.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4187204837799072, -1.3720732927322388, -1.3254261016845703, -1.2787789106369019, -1.2321317195892334, -1.1854846477508545, -1.1388373374938965, -1.0921902656555176, -1.0455430746078491, -0.9988958835601807, -0.9522486925125122, -0.9056015014648438, -0.8589543700218201, -0.8123071789741516, -0.7656599879264832, -0.7190128564834595, -0.6723656058311462, -0.6257184147834778, -0.5790712237358093, -0.5324240922927856, -0.4857769012451172, -0.43912971019744873, -0.3924825191497803, -0.3458353579044342, -0.29918816685676575, -0.2525409758090973, -0.20589381456375122, -0.15924662351608276, -0.1125994473695755, -0.06595227122306824, -0.01930508017539978, 0.02734208106994629, 0.07398927211761475, 0.12063644826412201, 0.16728362441062927, 0.21393081545829773, 0.2605779767036438, 0.30722516775131226, 0.3538723587989807, 0.4005195200443268, 0.44716671109199524, 0.4938139021396637, 0.5404610633850098, 0.5871082544326782, 0.6337554454803467, 0.6804026365280151, 0.7270498275756836, 0.7736969590187073, 0.8203441500663757, 0.8669913411140442, 0.9136385321617126, 0.9602856636047363, 1.0069328546524048, 1.0535800457000732, 1.1002272367477417, 1.1468744277954102, 1.1935216188430786, 1.240168809890747, 1.2868160009384155, 1.333463191986084, 1.3801103830337524, 1.426757574081421, 1.4734046459197998, 1.5200518369674683, 1.5666990280151367]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 15.0, 21.0, 29.0, 59.0, 93.0, 115.0, 215.0, 357.0, 556.0, 914.0, 1436.0, 2456.0, 3962.0, 6272.0, 9967.0, 15798.0, 23710.0, 35374.0, 50109.0, 67737.0, 86839.0, 102476.0, 112177.0, 112537.0, 103339.0, 87901.0, 69103.0, 51012.0, 36121.0, 24443.0, 16034.0, 10233.0, 6615.0, 4023.0, 2534.0, 1472.0, 913.0, 580.0, 382.0, 253.0, 143.0, 83.0, 54.0, 30.0, 26.0, 7.0, 16.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.033203125, -0.999908447265625, -0.96661376953125, -0.933319091796875, -0.9000244140625, -0.866729736328125, -0.83343505859375, -0.800140380859375, -0.766845703125, -0.733551025390625, -0.70025634765625, -0.666961669921875, -0.6336669921875, -0.600372314453125, -0.56707763671875, -0.533782958984375, -0.50048828125, -0.467193603515625, -0.43389892578125, -0.400604248046875, -0.3673095703125, -0.334014892578125, -0.30072021484375, -0.267425537109375, -0.234130859375, -0.200836181640625, -0.16754150390625, -0.134246826171875, -0.1009521484375, -0.067657470703125, -0.03436279296875, -0.001068115234375, 0.0322265625, 0.065521240234375, 0.09881591796875, 0.132110595703125, 0.1654052734375, 0.198699951171875, 0.23199462890625, 0.265289306640625, 0.298583984375, 0.331878662109375, 0.36517333984375, 0.398468017578125, 0.4317626953125, 0.465057373046875, 0.49835205078125, 0.531646728515625, 0.56494140625, 0.598236083984375, 0.63153076171875, 0.664825439453125, 0.6981201171875, 0.731414794921875, 0.76470947265625, 0.798004150390625, 0.831298828125, 0.864593505859375, 0.89788818359375, 0.931182861328125, 0.9644775390625, 0.997772216796875, 1.03106689453125, 1.064361572265625, 1.09765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 9.0, 9.0, 25.0, 8.0, 13.0, 27.0, 31.0, 25.0, 28.0, 30.0, 48.0, 50.0, 44.0, 47.0, 55.0, 59.0, 42.0, 49.0, 54.0, 43.0, 54.0, 38.0, 31.0, 30.0, 31.0, 19.0, 16.0, 20.0, 20.0, 8.0, 8.0, 4.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7255859375, -1.6743927001953125, -1.623199462890625, -1.5720062255859375, -1.52081298828125, -1.4696197509765625, -1.418426513671875, -1.3672332763671875, -1.3160400390625, -1.2648468017578125, -1.213653564453125, -1.1624603271484375, -1.11126708984375, -1.0600738525390625, -1.008880615234375, -0.9576873779296875, -0.906494140625, -0.8553009033203125, -0.804107666015625, -0.7529144287109375, -0.70172119140625, -0.6505279541015625, -0.599334716796875, -0.5481414794921875, -0.4969482421875, -0.4457550048828125, -0.394561767578125, -0.3433685302734375, -0.29217529296875, -0.2409820556640625, -0.189788818359375, -0.1385955810546875, -0.08740234375, -0.0362091064453125, 0.014984130859375, 0.0661773681640625, 0.11737060546875, 0.1685638427734375, 0.219757080078125, 0.2709503173828125, 0.3221435546875, 0.3733367919921875, 0.424530029296875, 0.4757232666015625, 0.52691650390625, 0.5781097412109375, 0.629302978515625, 0.6804962158203125, 0.731689453125, 0.7828826904296875, 0.834075927734375, 0.8852691650390625, 0.93646240234375, 0.9876556396484375, 1.038848876953125, 1.0900421142578125, 1.1412353515625, 1.1924285888671875, 1.243621826171875, 1.2948150634765625, 1.34600830078125, 1.3972015380859375, 1.448394775390625, 1.4995880126953125, 1.55078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 14.0, 17.0, 24.0, 37.0, 47.0, 80.0, 149.0, 207.0, 298.0, 477.0, 771.0, 1205.0, 1883.0, 2874.0, 4354.0, 6469.0, 9581.0, 14008.0, 20079.0, 28277.0, 38270.0, 49942.0, 63771.0, 76515.0, 86947.0, 94432.0, 95371.0, 91425.0, 82589.0, 70116.0, 56284.0, 44099.0, 33042.0, 23600.0, 16956.0, 11675.0, 7698.0, 5212.0, 3450.0, 2238.0, 1459.0, 972.0, 607.0, 346.0, 238.0, 160.0, 110.0, 68.0, 41.0, 24.0, 27.0, 14.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8673171997070312, -0.8386383056640625, -0.8099594116210938, -0.781280517578125, -0.7526016235351562, -0.7239227294921875, -0.6952438354492188, -0.66656494140625, -0.6378860473632812, -0.6092071533203125, -0.5805282592773438, -0.551849365234375, -0.5231704711914062, -0.4944915771484375, -0.46581268310546875, -0.4371337890625, -0.40845489501953125, -0.3797760009765625, -0.35109710693359375, -0.322418212890625, -0.29373931884765625, -0.2650604248046875, -0.23638153076171875, -0.20770263671875, -0.17902374267578125, -0.1503448486328125, -0.12166595458984375, -0.092987060546875, -0.06430816650390625, -0.0356292724609375, -0.00695037841796875, 0.021728515625, 0.05040740966796875, 0.0790863037109375, 0.10776519775390625, 0.136444091796875, 0.16512298583984375, 0.1938018798828125, 0.22248077392578125, 0.25115966796875, 0.27983856201171875, 0.3085174560546875, 0.33719635009765625, 0.365875244140625, 0.39455413818359375, 0.4232330322265625, 0.45191192626953125, 0.4805908203125, 0.5092697143554688, 0.5379486083984375, 0.5666275024414062, 0.595306396484375, 0.6239852905273438, 0.6526641845703125, 0.6813430786132812, 0.71002197265625, 0.7387008666992188, 0.7673797607421875, 0.7960586547851562, 0.824737548828125, 0.8534164428710938, 0.8820953369140625, 0.9107742309570312, 0.939453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 13.0, 5.0, 14.0, 15.0, 11.0, 19.0, 19.0, 22.0, 21.0, 22.0, 34.0, 38.0, 25.0, 30.0, 36.0, 39.0, 37.0, 39.0, 28.0, 30.0, 40.0, 36.0, 29.0, 42.0, 38.0, 32.0, 33.0, 30.0, 26.0, 26.0, 26.0, 16.0, 20.0, 9.0, 19.0, 15.0, 10.0, 8.0, 7.0, 5.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.8330078125, -0.8095779418945312, -0.7861480712890625, -0.7627182006835938, -0.739288330078125, -0.7158584594726562, -0.6924285888671875, -0.6689987182617188, -0.64556884765625, -0.6221389770507812, -0.5987091064453125, -0.5752792358398438, -0.551849365234375, -0.5284194946289062, -0.5049896240234375, -0.48155975341796875, -0.4581298828125, -0.43470001220703125, -0.4112701416015625, -0.38784027099609375, -0.364410400390625, -0.34098052978515625, -0.3175506591796875, -0.29412078857421875, -0.27069091796875, -0.24726104736328125, -0.2238311767578125, -0.20040130615234375, -0.176971435546875, -0.15354156494140625, -0.1301116943359375, -0.10668182373046875, -0.083251953125, -0.05982208251953125, -0.0363922119140625, -0.01296234130859375, 0.010467529296875, 0.03389739990234375, 0.0573272705078125, 0.08075714111328125, 0.10418701171875, 0.12761688232421875, 0.1510467529296875, 0.17447662353515625, 0.197906494140625, 0.22133636474609375, 0.2447662353515625, 0.26819610595703125, 0.2916259765625, 0.31505584716796875, 0.3384857177734375, 0.36191558837890625, 0.385345458984375, 0.40877532958984375, 0.4322052001953125, 0.45563507080078125, 0.47906494140625, 0.5024948120117188, 0.5259246826171875, 0.5493545532226562, 0.572784423828125, 0.5962142944335938, 0.6196441650390625, 0.6430740356445312, 0.66650390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 5.0, 8.0, 14.0, 13.0, 27.0, 30.0, 53.0, 72.0, 89.0, 119.0, 186.0, 221.0, 362.0, 500.0, 748.0, 1130.0, 1782.0, 2819.0, 5074.0, 9421.0, 18078.0, 34812.0, 65433.0, 114540.0, 168930.0, 195492.0, 170623.0, 115426.0, 65912.0, 35101.0, 18451.0, 9577.0, 5133.0, 2947.0, 1789.0, 1155.0, 753.0, 505.0, 362.0, 243.0, 165.0, 114.0, 116.0, 55.0, 62.0, 33.0, 22.0, 17.0, 8.0, 5.0, 11.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.9111328125, -0.8822174072265625, -0.853302001953125, -0.8243865966796875, -0.79547119140625, -0.7665557861328125, -0.737640380859375, -0.7087249755859375, -0.6798095703125, -0.6508941650390625, -0.621978759765625, -0.5930633544921875, -0.56414794921875, -0.5352325439453125, -0.506317138671875, -0.4774017333984375, -0.448486328125, -0.4195709228515625, -0.390655517578125, -0.3617401123046875, -0.33282470703125, -0.3039093017578125, -0.274993896484375, -0.2460784912109375, -0.2171630859375, -0.1882476806640625, -0.159332275390625, -0.1304168701171875, -0.10150146484375, -0.0725860595703125, -0.043670654296875, -0.0147552490234375, 0.01416015625, 0.0430755615234375, 0.071990966796875, 0.1009063720703125, 0.12982177734375, 0.1587371826171875, 0.187652587890625, 0.2165679931640625, 0.2454833984375, 0.2743988037109375, 0.303314208984375, 0.3322296142578125, 0.36114501953125, 0.3900604248046875, 0.418975830078125, 0.4478912353515625, 0.476806640625, 0.5057220458984375, 0.534637451171875, 0.5635528564453125, 0.59246826171875, 0.6213836669921875, 0.650299072265625, 0.6792144775390625, 0.7081298828125, 0.7370452880859375, 0.765960693359375, 0.7948760986328125, 0.82379150390625, 0.8527069091796875, 0.881622314453125, 0.9105377197265625, 0.939453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 7.0, 15.0, 32.0, 34.0, 52.0, 69.0, 104.0, 114.0, 99.0, 115.0, 98.0, 70.0, 53.0, 46.0, 29.0, 16.0, 12.0, 8.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010120868682861328, -9.655021131038666e-05, -9.189173579216003e-05, -8.723326027393341e-05, -8.257478475570679e-05, -7.791630923748016e-05, -7.325783371925354e-05, -6.859935820102692e-05, -6.394088268280029e-05, -5.928240716457367e-05, -5.4623931646347046e-05, -4.996545612812042e-05, -4.53069806098938e-05, -4.0648505091667175e-05, -3.599002957344055e-05, -3.133155405521393e-05, -2.6673078536987305e-05, -2.201460301876068e-05, -1.7356127500534058e-05, -1.2697651982307434e-05, -8.03917646408081e-06, -3.380700945854187e-06, 1.2777745723724365e-06, 5.93625009059906e-06, 1.0594725608825684e-05, 1.5253201127052307e-05, 1.991167664527893e-05, 2.4570152163505554e-05, 2.9228627681732178e-05, 3.38871031999588e-05, 3.8545578718185425e-05, 4.320405423641205e-05, 4.786252975463867e-05, 5.2521005272865295e-05, 5.717948079109192e-05, 6.183795630931854e-05, 6.649643182754517e-05, 7.115490734577179e-05, 7.581338286399841e-05, 8.047185838222504e-05, 8.513033390045166e-05, 8.978880941867828e-05, 9.444728493690491e-05, 9.910576045513153e-05, 0.00010376423597335815, 0.00010842271149158478, 0.0001130811870098114, 0.00011773966252803802, 0.00012239813804626465, 0.00012705661356449127, 0.0001317150890827179, 0.00013637356460094452, 0.00014103204011917114, 0.00014569051563739777, 0.0001503489911556244, 0.000155007466673851, 0.00015966594219207764, 0.00016432441771030426, 0.00016898289322853088, 0.0001736413687467575, 0.00017829984426498413, 0.00018295831978321075, 0.00018761679530143738, 0.000192275270819664, 0.00019693374633789062]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 8.0, 5.0, 7.0, 17.0, 10.0, 26.0, 35.0, 40.0, 62.0, 87.0, 135.0, 178.0, 259.0, 351.0, 536.0, 766.0, 1161.0, 1730.0, 2595.0, 4006.0, 6300.0, 10164.0, 17278.0, 28996.0, 49312.0, 79210.0, 115121.0, 147790.0, 158166.0, 139796.0, 105500.0, 69976.0, 42988.0, 25683.0, 14877.0, 9033.0, 5630.0, 3598.0, 2328.0, 1536.0, 975.0, 685.0, 483.0, 327.0, 240.0, 169.0, 111.0, 83.0, 58.0, 35.0, 36.0, 24.0, 13.0, 7.0, 11.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.73828125, -0.7147445678710938, -0.6912078857421875, -0.6676712036132812, -0.644134521484375, -0.6205978393554688, -0.5970611572265625, -0.5735244750976562, -0.54998779296875, -0.5264511108398438, -0.5029144287109375, -0.47937774658203125, -0.455841064453125, -0.43230438232421875, -0.4087677001953125, -0.38523101806640625, -0.3616943359375, -0.33815765380859375, -0.3146209716796875, -0.29108428955078125, -0.267547607421875, -0.24401092529296875, -0.2204742431640625, -0.19693756103515625, -0.17340087890625, -0.14986419677734375, -0.1263275146484375, -0.10279083251953125, -0.079254150390625, -0.05571746826171875, -0.0321807861328125, -0.00864410400390625, 0.014892578125, 0.03842926025390625, 0.0619659423828125, 0.08550262451171875, 0.109039306640625, 0.13257598876953125, 0.1561126708984375, 0.17964935302734375, 0.20318603515625, 0.22672271728515625, 0.2502593994140625, 0.27379608154296875, 0.297332763671875, 0.32086944580078125, 0.3444061279296875, 0.36794281005859375, 0.3914794921875, 0.41501617431640625, 0.4385528564453125, 0.46208953857421875, 0.485626220703125, 0.5091629028320312, 0.5326995849609375, 0.5562362670898438, 0.57977294921875, 0.6033096313476562, 0.6268463134765625, 0.6503829956054688, 0.673919677734375, 0.6974563598632812, 0.7209930419921875, 0.7445297241210938, 0.76806640625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 2.0, 8.0, 12.0, 6.0, 11.0, 25.0, 22.0, 31.0, 34.0, 34.0, 39.0, 50.0, 43.0, 52.0, 66.0, 65.0, 69.0, 64.0, 56.0, 43.0, 44.0, 43.0, 27.0, 25.0, 29.0, 20.0, 8.0, 6.0, 12.0, 17.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.234619140625, -0.22672653198242188, -0.21883392333984375, -0.21094131469726562, -0.2030487060546875, -0.19515609741210938, -0.18726348876953125, -0.17937088012695312, -0.171478271484375, -0.16358566284179688, -0.15569305419921875, -0.14780044555664062, -0.1399078369140625, -0.13201522827148438, -0.12412261962890625, -0.11623001098632812, -0.10833740234375, -0.10044479370117188, -0.09255218505859375, -0.08465957641601562, -0.0767669677734375, -0.06887435913085938, -0.06098175048828125, -0.053089141845703125, -0.045196533203125, -0.037303924560546875, -0.02941131591796875, -0.021518707275390625, -0.0136260986328125, -0.005733489990234375, 0.00215911865234375, 0.010051727294921875, 0.0179443359375, 0.025836944580078125, 0.03372955322265625, 0.041622161865234375, 0.0495147705078125, 0.057407379150390625, 0.06529998779296875, 0.07319259643554688, 0.081085205078125, 0.08897781372070312, 0.09687042236328125, 0.10476303100585938, 0.1126556396484375, 0.12054824829101562, 0.12844085693359375, 0.13633346557617188, 0.14422607421875, 0.15211868286132812, 0.16001129150390625, 0.16790390014648438, 0.1757965087890625, 0.18368911743164062, 0.19158172607421875, 0.19947433471679688, 0.207366943359375, 0.21525955200195312, 0.22315216064453125, 0.23104476928710938, 0.2389373779296875, 0.24682998657226562, 0.25472259521484375, 0.2626152038574219, 0.2705078125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 11.0, 10.0, 14.0, 4.0, 14.0, 14.0, 15.0, 23.0, 26.0, 42.0, 51.0, 41.0, 34.0, 42.0, 54.0, 45.0, 47.0, 48.0, 51.0, 48.0, 40.0, 40.0, 44.0, 42.0, 32.0, 33.0, 23.0, 21.0, 16.0, 10.0, 15.0, 8.0, 9.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6329678297042847, -1.5764333009719849, -1.519898772239685, -1.4633642435073853, -1.4068297147750854, -1.3502951860427856, -1.2937607765197754, -1.2372262477874756, -1.1806917190551758, -1.124157190322876, -1.0676226615905762, -1.0110881328582764, -0.9545536041259766, -0.8980190753936768, -0.8414846062660217, -0.7849500775337219, -0.7284154891967773, -0.6718809604644775, -0.6153464317321777, -0.5588119029998779, -0.5022773742675781, -0.4457428753376007, -0.3892083764076233, -0.3326738476753235, -0.2761393189430237, -0.21960479021072388, -0.16307027637958527, -0.10653576254844666, -0.05000123381614685, 0.006533294916152954, 0.06306779384613037, 0.11960232257843018, 0.17613673210144043, 0.23267126083374023, 0.28920578956604004, 0.34574028849601746, 0.40227481722831726, 0.45880934596061707, 0.5153438448905945, 0.5718783736228943, 0.6284129023551941, 0.6849474310874939, 0.7414819598197937, 0.7980164289474487, 0.8545509576797485, 0.9110854864120483, 0.9676200151443481, 1.024154543876648, 1.0806890726089478, 1.1372236013412476, 1.1937581300735474, 1.2502926588058472, 1.306827187538147, 1.3633617162704468, 1.419896125793457, 1.4764306545257568, 1.5329651832580566, 1.5894997119903564, 1.6460342407226562, 1.702568769454956, 1.7591032981872559, 1.8156378269195557, 1.8721723556518555, 1.9287068843841553, 1.985241413116455]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 16.0, 6.0, 16.0, 16.0, 18.0, 22.0, 23.0, 22.0, 32.0, 30.0, 46.0, 34.0, 39.0, 52.0, 40.0, 35.0, 49.0, 42.0, 42.0, 46.0, 38.0, 35.0, 38.0, 32.0, 35.0, 30.0, 28.0, 21.0, 19.0, 17.0, 14.0, 15.0, 5.0, 6.0, 12.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3978337049484253, -1.353912115097046, -1.309990406036377, -1.2660688161849976, -1.2221472263336182, -1.1782256364822388, -1.1343040466308594, -1.0903823375701904, -1.046460747718811, -1.0025391578674316, -0.9586175084114075, -0.9146958589553833, -0.8707742691040039, -0.8268526792526245, -0.7829310297966003, -0.7390093803405762, -0.6950877904891968, -0.6511662006378174, -0.6072445511817932, -0.563322901725769, -0.5194013118743896, -0.47547969222068787, -0.4315580725669861, -0.3876364529132843, -0.3437148332595825, -0.29979321360588074, -0.25587159395217896, -0.21194997429847717, -0.1680283546447754, -0.12410673499107361, -0.08018511533737183, -0.036263495683670044, 0.007658123970031738, 0.05157974362373352, 0.0955013632774353, 0.13942298293113708, 0.18334460258483887, 0.22726622223854065, 0.27118784189224243, 0.3151094615459442, 0.359031081199646, 0.4029527008533478, 0.44687432050704956, 0.49079594016075134, 0.5347175598144531, 0.5786391496658325, 0.6225607991218567, 0.6664824485778809, 0.7104040384292603, 0.7543256282806396, 0.7982472777366638, 0.842168927192688, 0.8860905170440674, 0.9300121068954468, 0.973933756351471, 1.0178554058074951, 1.0617769956588745, 1.105698585510254, 1.1496202945709229, 1.1935418844223022, 1.2374634742736816, 1.281385064125061, 1.3253066539764404, 1.3692283630371094, 1.4131499528884888]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 6.0, 13.0, 25.0, 33.0, 57.0, 92.0, 168.0, 263.0, 480.0, 773.0, 1243.0, 2205.0, 3993.0, 7227.0, 12803.0, 23414.0, 42565.0, 76368.0, 134845.0, 227770.0, 360197.0, 510090.0, 622073.0, 637597.0, 540215.0, 391226.0, 252904.0, 151390.0, 86177.0, 48244.0, 26735.0, 14644.0, 8074.0, 4462.0, 2513.0, 1424.0, 809.0, 477.0, 285.0, 168.0, 93.0, 50.0, 41.0, 21.0, 16.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.4785308837890625, -1.427764892578125, -1.3769989013671875, -1.32623291015625, -1.2754669189453125, -1.224700927734375, -1.1739349365234375, -1.1231689453125, -1.0724029541015625, -1.021636962890625, -0.9708709716796875, -0.92010498046875, -0.8693389892578125, -0.818572998046875, -0.7678070068359375, -0.717041015625, -0.6662750244140625, -0.615509033203125, -0.5647430419921875, -0.51397705078125, -0.4632110595703125, -0.412445068359375, -0.3616790771484375, -0.3109130859375, -0.2601470947265625, -0.209381103515625, -0.1586151123046875, -0.10784912109375, -0.0570831298828125, -0.006317138671875, 0.0444488525390625, 0.09521484375, 0.1459808349609375, 0.196746826171875, 0.2475128173828125, 0.29827880859375, 0.3490447998046875, 0.399810791015625, 0.4505767822265625, 0.5013427734375, 0.5521087646484375, 0.602874755859375, 0.6536407470703125, 0.70440673828125, 0.7551727294921875, 0.805938720703125, 0.8567047119140625, 0.907470703125, 0.9582366943359375, 1.009002685546875, 1.0597686767578125, 1.11053466796875, 1.1613006591796875, 1.212066650390625, 1.2628326416015625, 1.3135986328125, 1.3643646240234375, 1.415130615234375, 1.4658966064453125, 1.51666259765625, 1.5674285888671875, 1.618194580078125, 1.6689605712890625, 1.7197265625]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 4.0, 8.0, 13.0, 13.0, 15.0, 18.0, 29.0, 25.0, 27.0, 19.0, 30.0, 26.0, 43.0, 40.0, 52.0, 27.0, 33.0, 51.0, 43.0, 37.0, 45.0, 37.0, 31.0, 34.0, 41.0, 40.0, 34.0, 31.0, 27.0, 13.0, 22.0, 14.0, 19.0, 11.0, 10.0, 4.0, 11.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1787109375, -1.1434173583984375, -1.108123779296875, -1.0728302001953125, -1.03753662109375, -1.0022430419921875, -0.966949462890625, -0.9316558837890625, -0.8963623046875, -0.8610687255859375, -0.825775146484375, -0.7904815673828125, -0.75518798828125, -0.7198944091796875, -0.684600830078125, -0.6493072509765625, -0.614013671875, -0.5787200927734375, -0.543426513671875, -0.5081329345703125, -0.47283935546875, -0.4375457763671875, -0.402252197265625, -0.3669586181640625, -0.3316650390625, -0.2963714599609375, -0.261077880859375, -0.2257843017578125, -0.19049072265625, -0.1551971435546875, -0.119903564453125, -0.0846099853515625, -0.04931640625, -0.0140228271484375, 0.021270751953125, 0.0565643310546875, 0.09185791015625, 0.1271514892578125, 0.162445068359375, 0.1977386474609375, 0.2330322265625, 0.2683258056640625, 0.303619384765625, 0.3389129638671875, 0.37420654296875, 0.4095001220703125, 0.444793701171875, 0.4800872802734375, 0.515380859375, 0.5506744384765625, 0.585968017578125, 0.6212615966796875, 0.65655517578125, 0.6918487548828125, 0.727142333984375, 0.7624359130859375, 0.7977294921875, 0.8330230712890625, 0.868316650390625, 0.9036102294921875, 0.93890380859375, 0.9741973876953125, 1.009490966796875, 1.0447845458984375, 1.080078125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 18.0, 18.0, 42.0, 58.0, 88.0, 126.0, 195.0, 327.0, 564.0, 890.0, 1364.0, 2316.0, 3681.0, 5795.0, 9585.0, 15446.0, 25553.0, 40369.0, 63993.0, 98149.0, 146268.0, 212878.0, 290699.0, 372180.0, 438707.0, 474247.0, 462564.0, 411738.0, 337848.0, 254038.0, 181491.0, 123446.0, 81500.0, 52030.0, 32834.0, 20388.0, 12460.0, 7816.0, 4756.0, 2940.0, 1811.0, 1181.0, 682.0, 464.0, 255.0, 188.0, 111.0, 65.0, 49.0, 28.0, 17.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.388671875, -1.344970703125, -1.30126953125, -1.257568359375, -1.2138671875, -1.170166015625, -1.12646484375, -1.082763671875, -1.0390625, -0.995361328125, -0.95166015625, -0.907958984375, -0.8642578125, -0.820556640625, -0.77685546875, -0.733154296875, -0.689453125, -0.645751953125, -0.60205078125, -0.558349609375, -0.5146484375, -0.470947265625, -0.42724609375, -0.383544921875, -0.33984375, -0.296142578125, -0.25244140625, -0.208740234375, -0.1650390625, -0.121337890625, -0.07763671875, -0.033935546875, 0.009765625, 0.053466796875, 0.09716796875, 0.140869140625, 0.1845703125, 0.228271484375, 0.27197265625, 0.315673828125, 0.359375, 0.403076171875, 0.44677734375, 0.490478515625, 0.5341796875, 0.577880859375, 0.62158203125, 0.665283203125, 0.708984375, 0.752685546875, 0.79638671875, 0.840087890625, 0.8837890625, 0.927490234375, 0.97119140625, 1.014892578125, 1.05859375, 1.102294921875, 1.14599609375, 1.189697265625, 1.2333984375, 1.277099609375, 1.32080078125, 1.364501953125, 1.408203125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 7.0, 14.0, 16.0, 19.0, 20.0, 32.0, 30.0, 31.0, 39.0, 49.0, 58.0, 71.0, 74.0, 109.0, 119.0, 122.0, 127.0, 154.0, 171.0, 174.0, 193.0, 206.0, 210.0, 168.0, 207.0, 190.0, 159.0, 157.0, 140.0, 148.0, 126.0, 119.0, 113.0, 82.0, 79.0, 68.0, 42.0, 45.0, 45.0, 30.0, 27.0, 20.0, 15.0, 11.0, 9.0, 10.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.54931640625, -0.5322036743164062, -0.5150909423828125, -0.49797821044921875, -0.480865478515625, -0.46375274658203125, -0.4466400146484375, -0.42952728271484375, -0.41241455078125, -0.39530181884765625, -0.3781890869140625, -0.36107635498046875, -0.343963623046875, -0.32685089111328125, -0.3097381591796875, -0.29262542724609375, -0.2755126953125, -0.25839996337890625, -0.2412872314453125, -0.22417449951171875, -0.207061767578125, -0.18994903564453125, -0.1728363037109375, -0.15572357177734375, -0.13861083984375, -0.12149810791015625, -0.1043853759765625, -0.08727264404296875, -0.070159912109375, -0.05304718017578125, -0.0359344482421875, -0.01882171630859375, -0.001708984375, 0.01540374755859375, 0.0325164794921875, 0.04962921142578125, 0.066741943359375, 0.08385467529296875, 0.1009674072265625, 0.11808013916015625, 0.13519287109375, 0.15230560302734375, 0.1694183349609375, 0.18653106689453125, 0.203643798828125, 0.22075653076171875, 0.2378692626953125, 0.25498199462890625, 0.2720947265625, 0.28920745849609375, 0.3063201904296875, 0.32343292236328125, 0.340545654296875, 0.35765838623046875, 0.3747711181640625, 0.39188385009765625, 0.40899658203125, 0.42610931396484375, 0.4432220458984375, 0.46033477783203125, 0.477447509765625, 0.49456024169921875, 0.5116729736328125, 0.5287857055664062, 0.5458984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 4.0, 4.0, 7.0, 14.0, 15.0, 9.0, 17.0, 16.0, 26.0, 27.0, 28.0, 41.0, 41.0, 48.0, 55.0, 64.0, 52.0, 57.0, 49.0, 62.0, 42.0, 48.0, 49.0, 30.0, 28.0, 28.0, 23.0, 22.0, 24.0, 12.0, 17.0, 11.0, 9.0, 10.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.348088264465332, -2.280186176300049, -2.2122840881347656, -2.1443819999694824, -2.0764801502227783, -2.008578062057495, -1.940675973892212, -1.8727738857269287, -1.8048717975616455, -1.7369697093963623, -1.6690677404403687, -1.6011656522750854, -1.5332635641098022, -1.4653615951538086, -1.3974595069885254, -1.3295574188232422, -1.2616554498672485, -1.1937533617019653, -1.1258513927459717, -1.0579493045806885, -0.9900472164154053, -0.9221451878547668, -0.8542431592941284, -0.7863410711288452, -0.7184390425682068, -0.6505370140075684, -0.5826349258422852, -0.5147328972816467, -0.4468308389186859, -0.3789287805557251, -0.31102675199508667, -0.24312469363212585, -0.17522263526916504, -0.10732058435678482, -0.0394185334444046, 0.02848351001739502, 0.09638556838035583, 0.16428762674331665, 0.23218965530395508, 0.3000917136669159, 0.3679937720298767, 0.4358958303928375, 0.5037978887557983, 0.5716999173164368, 0.6396019458770752, 0.7075040340423584, 0.7754060626029968, 0.8433080911636353, 0.9112101793289185, 0.9791122078895569, 1.0470142364501953, 1.1149163246154785, 1.1828184127807617, 1.250720500946045, 1.3186224699020386, 1.3865245580673218, 1.4544265270233154, 1.5223286151885986, 1.5902305841445923, 1.6581326723098755, 1.7260347604751587, 1.7939367294311523, 1.8618388175964355, 1.9297409057617188, 1.997642993927002]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 4.0, 12.0, 9.0, 12.0, 18.0, 15.0, 23.0, 14.0, 24.0, 18.0, 29.0, 36.0, 47.0, 40.0, 33.0, 39.0, 46.0, 42.0, 39.0, 41.0, 51.0, 44.0, 42.0, 49.0, 30.0, 27.0, 26.0, 26.0, 31.0, 19.0, 19.0, 16.0, 17.0, 11.0, 12.0, 8.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.7488301992416382, -1.7021123170852661, -1.6553945541381836, -1.6086766719818115, -1.561958909034729, -1.515241026878357, -1.4685232639312744, -1.4218053817749023, -1.3750876188278198, -1.3283697366714478, -1.2816519737243652, -1.2349340915679932, -1.1882163286209106, -1.1414984464645386, -1.094780683517456, -1.048062801361084, -1.001344919204712, -0.9546270966529846, -0.9079092741012573, -0.86119145154953, -0.8144736289978027, -0.7677558064460754, -0.7210379838943481, -0.6743201017379761, -0.6276023387908936, -0.5808845162391663, -0.534166693687439, -0.48744887113571167, -0.4407310485839844, -0.3940132260322571, -0.3472953736782074, -0.3005775511264801, -0.2538597583770752, -0.2071419358253479, -0.1604241132736206, -0.11370627582073212, -0.06698845326900482, -0.020270630717277527, 0.026447206735610962, 0.07316502928733826, 0.11988285183906555, 0.16660067439079285, 0.21331849694252014, 0.2600363492965698, 0.3067541718482971, 0.3534719944000244, 0.4001898169517517, 0.446907639503479, 0.4936254620552063, 0.5403432846069336, 0.5870611071586609, 0.6337789297103882, 0.6804967522621155, 0.7272145748138428, 0.7739324569702148, 0.8206502199172974, 0.8673681020736694, 0.9140859246253967, 0.960803747177124, 1.007521629333496, 1.0542393922805786, 1.1009572744369507, 1.1476750373840332, 1.1943929195404053, 1.2411106824874878]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 12.0, 11.0, 23.0, 20.0, 47.0, 77.0, 111.0, 146.0, 239.0, 363.0, 558.0, 883.0, 1192.0, 2080.0, 3223.0, 4981.0, 8184.0, 13213.0, 21773.0, 36158.0, 58197.0, 92153.0, 137461.0, 174055.0, 164789.0, 121882.0, 78916.0, 49423.0, 30329.0, 18173.0, 11106.0, 6880.0, 4364.0, 2661.0, 1746.0, 1066.0, 699.0, 425.0, 289.0, 197.0, 147.0, 114.0, 68.0, 41.0, 25.0, 22.0, 12.0, 11.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.343505859375, -0.3323631286621094, -0.32122039794921875, -0.3100776672363281, -0.2989349365234375, -0.2877922058105469, -0.27664947509765625, -0.2655067443847656, -0.254364013671875, -0.24322128295898438, -0.23207855224609375, -0.22093582153320312, -0.2097930908203125, -0.19865036010742188, -0.18750762939453125, -0.17636489868164062, -0.16522216796875, -0.15407943725585938, -0.14293670654296875, -0.13179397583007812, -0.1206512451171875, -0.10950851440429688, -0.09836578369140625, -0.08722305297851562, -0.076080322265625, -0.06493759155273438, -0.05379486083984375, -0.042652130126953125, -0.0315093994140625, -0.020366668701171875, -0.00922393798828125, 0.001918792724609375, 0.0130615234375, 0.024204254150390625, 0.03534698486328125, 0.046489715576171875, 0.0576324462890625, 0.06877517700195312, 0.07991790771484375, 0.09106063842773438, 0.102203369140625, 0.11334609985351562, 0.12448883056640625, 0.13563156127929688, 0.1467742919921875, 0.15791702270507812, 0.16905975341796875, 0.18020248413085938, 0.19134521484375, 0.20248794555664062, 0.21363067626953125, 0.22477340698242188, 0.2359161376953125, 0.24705886840820312, 0.25820159912109375, 0.2693443298339844, 0.280487060546875, 0.2916297912597656, 0.30277252197265625, 0.3139152526855469, 0.3250579833984375, 0.3362007141113281, 0.34734344482421875, 0.3584861755371094, 0.36962890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 8.0, 12.0, 12.0, 21.0, 19.0, 21.0, 30.0, 28.0, 34.0, 27.0, 26.0, 35.0, 42.0, 40.0, 52.0, 40.0, 38.0, 34.0, 51.0, 34.0, 43.0, 51.0, 43.0, 37.0, 28.0, 16.0, 30.0, 23.0, 16.0, 27.0, 10.0, 12.0, 12.0, 7.0, 6.0, 8.0, 1.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.8447265625, -1.7933349609375, -1.741943359375, -1.6905517578125, -1.63916015625, -1.5877685546875, -1.536376953125, -1.4849853515625, -1.43359375, -1.3822021484375, -1.330810546875, -1.2794189453125, -1.22802734375, -1.1766357421875, -1.125244140625, -1.0738525390625, -1.0224609375, -0.9710693359375, -0.919677734375, -0.8682861328125, -0.81689453125, -0.7655029296875, -0.714111328125, -0.6627197265625, -0.611328125, -0.5599365234375, -0.508544921875, -0.4571533203125, -0.40576171875, -0.3543701171875, -0.302978515625, -0.2515869140625, -0.2001953125, -0.1488037109375, -0.097412109375, -0.0460205078125, 0.00537109375, 0.0567626953125, 0.108154296875, 0.1595458984375, 0.2109375, 0.2623291015625, 0.313720703125, 0.3651123046875, 0.41650390625, 0.4678955078125, 0.519287109375, 0.5706787109375, 0.6220703125, 0.6734619140625, 0.724853515625, 0.7762451171875, 0.82763671875, 0.8790283203125, 0.930419921875, 0.9818115234375, 1.033203125, 1.0845947265625, 1.135986328125, 1.1873779296875, 1.23876953125, 1.2901611328125, 1.341552734375, 1.3929443359375, 1.4443359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 11.0, 9.0, 20.0, 31.0, 26.0, 39.0, 78.0, 102.0, 152.0, 248.0, 371.0, 628.0, 1072.0, 1912.0, 3275.0, 5853.0, 11076.0, 20867.0, 40352.0, 77504.0, 140286.0, 212390.0, 215760.0, 146346.0, 80335.0, 42153.0, 21871.0, 11529.0, 6166.0, 3297.0, 1877.0, 1071.0, 650.0, 395.0, 272.0, 172.0, 89.0, 75.0, 47.0, 47.0, 23.0, 10.0, 18.0, 11.0, 9.0, 9.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49560546875, -0.4806022644042969, -0.46559906005859375, -0.4505958557128906, -0.4355926513671875, -0.4205894470214844, -0.40558624267578125, -0.3905830383300781, -0.375579833984375, -0.3605766296386719, -0.34557342529296875, -0.3305702209472656, -0.3155670166015625, -0.3005638122558594, -0.28556060791015625, -0.2705574035644531, -0.25555419921875, -0.24055099487304688, -0.22554779052734375, -0.21054458618164062, -0.1955413818359375, -0.18053817749023438, -0.16553497314453125, -0.15053176879882812, -0.135528564453125, -0.12052536010742188, -0.10552215576171875, -0.09051895141601562, -0.0755157470703125, -0.060512542724609375, -0.04550933837890625, -0.030506134033203125, -0.0155029296875, -0.000499725341796875, 0.01450347900390625, 0.029506683349609375, 0.0445098876953125, 0.059513092041015625, 0.07451629638671875, 0.08951950073242188, 0.104522705078125, 0.11952590942382812, 0.13452911376953125, 0.14953231811523438, 0.1645355224609375, 0.17953872680664062, 0.19454193115234375, 0.20954513549804688, 0.22454833984375, 0.23955154418945312, 0.25455474853515625, 0.2695579528808594, 0.2845611572265625, 0.2995643615722656, 0.31456756591796875, 0.3295707702636719, 0.344573974609375, 0.3595771789550781, 0.37458038330078125, 0.3895835876464844, 0.4045867919921875, 0.4195899963378906, 0.43459320068359375, 0.4495964050292969, 0.464599609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 9.0, 3.0, 15.0, 12.0, 10.0, 17.0, 16.0, 23.0, 12.0, 32.0, 34.0, 40.0, 34.0, 51.0, 44.0, 53.0, 38.0, 37.0, 48.0, 40.0, 50.0, 42.0, 34.0, 39.0, 35.0, 36.0, 32.0, 29.0, 26.0, 22.0, 17.0, 21.0, 11.0, 8.0, 4.0, 3.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9091796875, -0.8769073486328125, -0.844635009765625, -0.8123626708984375, -0.78009033203125, -0.7478179931640625, -0.715545654296875, -0.6832733154296875, -0.6510009765625, -0.6187286376953125, -0.586456298828125, -0.5541839599609375, -0.52191162109375, -0.4896392822265625, -0.457366943359375, -0.4250946044921875, -0.392822265625, -0.3605499267578125, -0.328277587890625, -0.2960052490234375, -0.26373291015625, -0.2314605712890625, -0.199188232421875, -0.1669158935546875, -0.1346435546875, -0.1023712158203125, -0.070098876953125, -0.0378265380859375, -0.00555419921875, 0.0267181396484375, 0.058990478515625, 0.0912628173828125, 0.12353515625, 0.1558074951171875, 0.188079833984375, 0.2203521728515625, 0.25262451171875, 0.2848968505859375, 0.317169189453125, 0.3494415283203125, 0.3817138671875, 0.4139862060546875, 0.446258544921875, 0.4785308837890625, 0.51080322265625, 0.5430755615234375, 0.575347900390625, 0.6076202392578125, 0.639892578125, 0.6721649169921875, 0.704437255859375, 0.7367095947265625, 0.76898193359375, 0.8012542724609375, 0.833526611328125, 0.8657989501953125, 0.8980712890625, 0.9303436279296875, 0.962615966796875, 0.9948883056640625, 1.02716064453125, 1.0594329833984375, 1.091705322265625, 1.1239776611328125, 1.15625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 4.0, 9.0, 6.0, 17.0, 19.0, 29.0, 34.0, 51.0, 65.0, 86.0, 133.0, 175.0, 242.0, 401.0, 768.0, 1356.0, 2700.0, 6069.0, 16988.0, 70262.0, 511066.0, 363189.0, 50721.0, 13666.0, 5096.0, 2273.0, 1161.0, 669.0, 425.0, 267.0, 157.0, 124.0, 79.0, 57.0, 33.0, 30.0, 23.0, 18.0, 17.0, 14.0, 9.0, 9.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.47998046875, -0.4662284851074219, -0.45247650146484375, -0.4387245178222656, -0.4249725341796875, -0.4112205505371094, -0.39746856689453125, -0.3837165832519531, -0.369964599609375, -0.3562126159667969, -0.34246063232421875, -0.3287086486816406, -0.3149566650390625, -0.3012046813964844, -0.28745269775390625, -0.2737007141113281, -0.25994873046875, -0.24619674682617188, -0.23244476318359375, -0.21869277954101562, -0.2049407958984375, -0.19118881225585938, -0.17743682861328125, -0.16368484497070312, -0.149932861328125, -0.13618087768554688, -0.12242889404296875, -0.10867691040039062, -0.0949249267578125, -0.08117294311523438, -0.06742095947265625, -0.053668975830078125, -0.0399169921875, -0.026165008544921875, -0.01241302490234375, 0.001338958740234375, 0.0150909423828125, 0.028842926025390625, 0.04259490966796875, 0.056346893310546875, 0.070098876953125, 0.08385086059570312, 0.09760284423828125, 0.11135482788085938, 0.1251068115234375, 0.13885879516601562, 0.15261077880859375, 0.16636276245117188, 0.18011474609375, 0.19386672973632812, 0.20761871337890625, 0.22137069702148438, 0.2351226806640625, 0.24887466430664062, 0.26262664794921875, 0.2763786315917969, 0.290130615234375, 0.3038825988769531, 0.31763458251953125, 0.3313865661621094, 0.3451385498046875, 0.3588905334472656, 0.37264251708984375, 0.3863945007324219, 0.400146484375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 7.0, 20.0, 21.0, 21.0, 43.0, 45.0, 60.0, 68.0, 90.0, 97.0, 97.0, 79.0, 96.0, 56.0, 61.0, 38.0, 34.0, 21.0, 8.0, 13.0, 5.0, 2.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9729137420654297e-05, -1.907162368297577e-05, -1.841410994529724e-05, -1.7756596207618713e-05, -1.7099082469940186e-05, -1.6441568732261658e-05, -1.578405499458313e-05, -1.5126541256904602e-05, -1.4469027519226074e-05, -1.3811513781547546e-05, -1.3154000043869019e-05, -1.249648630619049e-05, -1.1838972568511963e-05, -1.1181458830833435e-05, -1.0523945093154907e-05, -9.86643135547638e-06, -9.208917617797852e-06, -8.551403880119324e-06, -7.893890142440796e-06, -7.236376404762268e-06, -6.57886266708374e-06, -5.921348929405212e-06, -5.2638351917266846e-06, -4.606321454048157e-06, -3.948807716369629e-06, -3.291293978691101e-06, -2.6337802410125732e-06, -1.9762665033340454e-06, -1.3187527656555176e-06, -6.612390279769897e-07, -3.725290298461914e-09, 6.537884473800659e-07, 1.3113021850585938e-06, 1.9688159227371216e-06, 2.6263296604156494e-06, 3.2838433980941772e-06, 3.941357135772705e-06, 4.598870873451233e-06, 5.256384611129761e-06, 5.9138983488082886e-06, 6.571412086486816e-06, 7.228925824165344e-06, 7.886439561843872e-06, 8.5439532995224e-06, 9.201467037200928e-06, 9.858980774879456e-06, 1.0516494512557983e-05, 1.1174008250236511e-05, 1.1831521987915039e-05, 1.2489035725593567e-05, 1.3146549463272095e-05, 1.3804063200950623e-05, 1.446157693862915e-05, 1.5119090676307678e-05, 1.5776604413986206e-05, 1.6434118151664734e-05, 1.7091631889343262e-05, 1.774914562702179e-05, 1.8406659364700317e-05, 1.9064173102378845e-05, 1.9721686840057373e-05, 2.03792005777359e-05, 2.103671431541443e-05, 2.1694228053092957e-05, 2.2351741790771484e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 9.0, 19.0, 19.0, 34.0, 47.0, 37.0, 83.0, 87.0, 142.0, 181.0, 217.0, 326.0, 407.0, 591.0, 808.0, 1166.0, 1744.0, 3056.0, 6147.0, 14618.0, 44795.0, 169416.0, 469661.0, 238226.0, 60446.0, 18656.0, 7510.0, 3536.0, 2064.0, 1343.0, 893.0, 569.0, 415.0, 330.0, 246.0, 163.0, 148.0, 97.0, 81.0, 60.0, 39.0, 23.0, 28.0, 16.0, 17.0, 8.0, 6.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.372314453125, -0.35930633544921875, -0.3462982177734375, -0.33329010009765625, -0.320281982421875, -0.30727386474609375, -0.2942657470703125, -0.28125762939453125, -0.26824951171875, -0.25524139404296875, -0.2422332763671875, -0.22922515869140625, -0.216217041015625, -0.20320892333984375, -0.1902008056640625, -0.17719268798828125, -0.1641845703125, -0.15117645263671875, -0.1381683349609375, -0.12516021728515625, -0.112152099609375, -0.09914398193359375, -0.0861358642578125, -0.07312774658203125, -0.06011962890625, -0.04711151123046875, -0.0341033935546875, -0.02109527587890625, -0.008087158203125, 0.00492095947265625, 0.0179290771484375, 0.03093719482421875, 0.0439453125, 0.05695343017578125, 0.0699615478515625, 0.08296966552734375, 0.095977783203125, 0.10898590087890625, 0.1219940185546875, 0.13500213623046875, 0.14801025390625, 0.16101837158203125, 0.1740264892578125, 0.18703460693359375, 0.200042724609375, 0.21305084228515625, 0.2260589599609375, 0.23906707763671875, 0.2520751953125, 0.26508331298828125, 0.2780914306640625, 0.29109954833984375, 0.304107666015625, 0.31711578369140625, 0.3301239013671875, 0.34313201904296875, 0.35614013671875, 0.36914825439453125, 0.3821563720703125, 0.39516448974609375, 0.408172607421875, 0.42118072509765625, 0.4341888427734375, 0.44719696044921875, 0.460205078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 10.0, 4.0, 10.0, 17.0, 22.0, 34.0, 32.0, 49.0, 59.0, 91.0, 123.0, 127.0, 113.0, 66.0, 53.0, 51.0, 26.0, 22.0, 16.0, 15.0, 9.0, 3.0, 7.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07037353515625, -0.06778240203857422, -0.06519126892089844, -0.06260013580322266, -0.060009002685546875, -0.057417869567871094, -0.05482673645019531, -0.05223560333251953, -0.04964447021484375, -0.04705333709716797, -0.04446220397949219, -0.041871070861816406, -0.039279937744140625, -0.036688804626464844, -0.03409767150878906, -0.03150653839111328, -0.0289154052734375, -0.02632427215576172, -0.023733139038085938, -0.021142005920410156, -0.018550872802734375, -0.015959739685058594, -0.013368606567382812, -0.010777473449707031, -0.00818634033203125, -0.005595207214355469, -0.0030040740966796875, -0.00041294097900390625, 0.002178192138671875, 0.004769325256347656, 0.0073604583740234375, 0.009951591491699219, 0.012542724609375, 0.015133857727050781, 0.017724990844726562, 0.020316123962402344, 0.022907257080078125, 0.025498390197753906, 0.028089523315429688, 0.03068065643310547, 0.03327178955078125, 0.03586292266845703, 0.03845405578613281, 0.041045188903808594, 0.043636322021484375, 0.046227455139160156, 0.04881858825683594, 0.05140972137451172, 0.0540008544921875, 0.05659198760986328, 0.05918312072753906, 0.061774253845214844, 0.06436538696289062, 0.0669565200805664, 0.06954765319824219, 0.07213878631591797, 0.07472991943359375, 0.07732105255126953, 0.07991218566894531, 0.0825033187866211, 0.08509445190429688, 0.08768558502197266, 0.09027671813964844, 0.09286785125732422, 0.095458984375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 8.0, 8.0, 12.0, 18.0, 11.0, 19.0, 15.0, 33.0, 24.0, 36.0, 47.0, 32.0, 59.0, 61.0, 55.0, 60.0, 58.0, 49.0, 56.0, 40.0, 53.0, 39.0, 26.0, 28.0, 24.0, 22.0, 28.0, 12.0, 12.0, 16.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4011058807373047, -2.3326547145843506, -2.2642035484313965, -2.1957523822784424, -2.1273012161254883, -2.058850049972534, -1.9903987646102905, -1.9219475984573364, -1.8534964323043823, -1.7850452661514282, -1.7165940999984741, -1.64814293384552, -1.5796916484832764, -1.5112404823303223, -1.4427893161773682, -1.374338150024414, -1.30588698387146, -1.2374358177185059, -1.1689846515655518, -1.1005334854125977, -1.0320823192596436, -0.9636310935020447, -0.8951798677444458, -0.8267287015914917, -0.7582775354385376, -0.6898263692855835, -0.6213752031326294, -0.5529239773750305, -0.4844728112220764, -0.4160216450691223, -0.3475704491138458, -0.27911925315856934, -0.21066796779632568, -0.1422167867422104, -0.07376560568809509, -0.005314424633979797, 0.0631367564201355, 0.1315879225730896, 0.2000391185283661, 0.2684903144836426, 0.3369414806365967, 0.4053926467895508, 0.47384384274482727, 0.5422950387001038, 0.6107462048530579, 0.679197371006012, 0.7476485967636108, 0.8160997629165649, 0.884550929069519, 0.9530020952224731, 1.0214532613754272, 1.0899044275283813, 1.158355712890625, 1.226806879043579, 1.2952580451965332, 1.3637092113494873, 1.4321603775024414, 1.5006115436553955, 1.5690627098083496, 1.6375138759613037, 1.7059650421142578, 1.774416208267212, 1.8428674936294556, 1.9113186597824097, 1.9797698259353638]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 8.0, 5.0, 10.0, 10.0, 11.0, 23.0, 15.0, 22.0, 15.0, 22.0, 19.0, 31.0, 35.0, 46.0, 43.0, 30.0, 41.0, 52.0, 41.0, 38.0, 51.0, 41.0, 44.0, 44.0, 47.0, 27.0, 26.0, 29.0, 31.0, 25.0, 17.0, 20.0, 18.0, 12.0, 14.0, 11.0, 6.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.7654094696044922, -1.7181633710861206, -1.6709171533584595, -1.623671054840088, -1.5764248371124268, -1.5291787385940552, -1.4819326400756836, -1.4346864223480225, -1.3874403238296509, -1.3401942253112793, -1.2929480075836182, -1.2457019090652466, -1.198455810546875, -1.1512095928192139, -1.1039634943008423, -1.0567173957824707, -1.0094711780548096, -0.9622250199317932, -0.9149788618087769, -0.8677327632904053, -0.8204866051673889, -0.7732404470443726, -0.725994348526001, -0.6787481904029846, -0.6315020322799683, -0.5842558741569519, -0.5370097160339355, -0.48976361751556396, -0.4425174593925476, -0.39527130126953125, -0.3480251729488373, -0.3007790446281433, -0.25353288650512695, -0.2062867432832718, -0.15904060006141663, -0.11179445683956146, -0.0645483136177063, -0.017302170395851135, 0.02994397282600403, 0.077190101146698, 0.12443625926971436, 0.17168240249156952, 0.21892854571342468, 0.26617467403411865, 0.313420832157135, 0.36066699028015137, 0.40791311860084534, 0.4551592469215393, 0.5024054050445557, 0.549651563167572, 0.5968977212905884, 0.64414381980896, 0.6913899779319763, 0.7386361360549927, 0.7858822345733643, 0.8331283926963806, 0.880374550819397, 0.9276207089424133, 0.9748668670654297, 1.0221129655838013, 1.0693590641021729, 1.116605281829834, 1.1638513803482056, 1.2110974788665771, 1.2583436965942383]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 8.0, 15.0, 14.0, 25.0, 55.0, 81.0, 128.0, 197.0, 338.0, 544.0, 797.0, 1232.0, 1752.0, 2857.0, 4235.0, 6360.0, 9471.0, 13672.0, 19373.0, 27283.0, 36458.0, 47943.0, 60727.0, 72949.0, 84306.0, 91300.0, 93304.0, 90939.0, 83174.0, 71981.0, 59448.0, 46977.0, 35271.0, 26278.0, 18658.0, 13315.0, 9156.0, 6069.0, 4165.0, 2670.0, 1849.0, 1127.0, 762.0, 437.0, 297.0, 231.0, 133.0, 78.0, 47.0, 33.0, 19.0, 11.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89794921875, -0.8684616088867188, -0.8389739990234375, -0.8094863891601562, -0.779998779296875, -0.7505111694335938, -0.7210235595703125, -0.6915359497070312, -0.66204833984375, -0.6325607299804688, -0.6030731201171875, -0.5735855102539062, -0.544097900390625, -0.5146102905273438, -0.4851226806640625, -0.45563507080078125, -0.4261474609375, -0.39665985107421875, -0.3671722412109375, -0.33768463134765625, -0.308197021484375, -0.27870941162109375, -0.2492218017578125, -0.21973419189453125, -0.19024658203125, -0.16075897216796875, -0.1312713623046875, -0.10178375244140625, -0.072296142578125, -0.04280853271484375, -0.0133209228515625, 0.01616668701171875, 0.045654296875, 0.07514190673828125, 0.1046295166015625, 0.13411712646484375, 0.163604736328125, 0.19309234619140625, 0.2225799560546875, 0.25206756591796875, 0.28155517578125, 0.31104278564453125, 0.3405303955078125, 0.37001800537109375, 0.399505615234375, 0.42899322509765625, 0.4584808349609375, 0.48796844482421875, 0.5174560546875, 0.5469436645507812, 0.5764312744140625, 0.6059188842773438, 0.635406494140625, 0.6648941040039062, 0.6943817138671875, 0.7238693237304688, 0.75335693359375, 0.7828445434570312, 0.8123321533203125, 0.8418197631835938, 0.871307373046875, 0.9007949829101562, 0.9302825927734375, 0.9597702026367188, 0.9892578125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 9.0, 10.0, 6.0, 6.0, 5.0, 15.0, 15.0, 20.0, 16.0, 21.0, 26.0, 43.0, 33.0, 31.0, 40.0, 37.0, 50.0, 41.0, 45.0, 42.0, 37.0, 36.0, 48.0, 45.0, 41.0, 46.0, 32.0, 26.0, 29.0, 22.0, 16.0, 32.0, 9.0, 19.0, 12.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.822265625, -1.7723846435546875, -1.722503662109375, -1.6726226806640625, -1.62274169921875, -1.5728607177734375, -1.522979736328125, -1.4730987548828125, -1.4232177734375, -1.3733367919921875, -1.323455810546875, -1.2735748291015625, -1.22369384765625, -1.1738128662109375, -1.123931884765625, -1.0740509033203125, -1.024169921875, -0.9742889404296875, -0.924407958984375, -0.8745269775390625, -0.82464599609375, -0.7747650146484375, -0.724884033203125, -0.6750030517578125, -0.6251220703125, -0.5752410888671875, -0.525360107421875, -0.4754791259765625, -0.42559814453125, -0.3757171630859375, -0.325836181640625, -0.2759552001953125, -0.22607421875, -0.1761932373046875, -0.126312255859375, -0.0764312744140625, -0.02655029296875, 0.0233306884765625, 0.073211669921875, 0.1230926513671875, 0.1729736328125, 0.2228546142578125, 0.272735595703125, 0.3226165771484375, 0.37249755859375, 0.4223785400390625, 0.472259521484375, 0.5221405029296875, 0.572021484375, 0.6219024658203125, 0.671783447265625, 0.7216644287109375, 0.77154541015625, 0.8214263916015625, 0.871307373046875, 0.9211883544921875, 0.9710693359375, 1.0209503173828125, 1.070831298828125, 1.1207122802734375, 1.17059326171875, 1.2204742431640625, 1.270355224609375, 1.3202362060546875, 1.3701171875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 2.0, 5.0, 10.0, 29.0, 34.0, 61.0, 110.0, 157.0, 240.0, 434.0, 709.0, 1150.0, 1840.0, 3092.0, 4683.0, 7584.0, 11518.0, 17911.0, 26462.0, 37853.0, 52354.0, 68496.0, 84795.0, 98785.0, 105512.0, 105893.0, 98562.0, 84539.0, 68253.0, 52906.0, 38203.0, 26530.0, 17758.0, 11975.0, 7527.0, 4816.0, 3004.0, 1841.0, 1144.0, 702.0, 449.0, 256.0, 144.0, 82.0, 57.0, 32.0, 23.0, 24.0, 7.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9619140625, -0.9275665283203125, -0.893218994140625, -0.8588714599609375, -0.82452392578125, -0.7901763916015625, -0.755828857421875, -0.7214813232421875, -0.6871337890625, -0.6527862548828125, -0.618438720703125, -0.5840911865234375, -0.54974365234375, -0.5153961181640625, -0.481048583984375, -0.4467010498046875, -0.412353515625, -0.3780059814453125, -0.343658447265625, -0.3093109130859375, -0.27496337890625, -0.2406158447265625, -0.206268310546875, -0.1719207763671875, -0.1375732421875, -0.1032257080078125, -0.068878173828125, -0.0345306396484375, -0.00018310546875, 0.0341644287109375, 0.068511962890625, 0.1028594970703125, 0.13720703125, 0.1715545654296875, 0.205902099609375, 0.2402496337890625, 0.27459716796875, 0.3089447021484375, 0.343292236328125, 0.3776397705078125, 0.4119873046875, 0.4463348388671875, 0.480682373046875, 0.5150299072265625, 0.54937744140625, 0.5837249755859375, 0.618072509765625, 0.6524200439453125, 0.686767578125, 0.7211151123046875, 0.755462646484375, 0.7898101806640625, 0.82415771484375, 0.8585052490234375, 0.892852783203125, 0.9272003173828125, 0.9615478515625, 0.9958953857421875, 1.030242919921875, 1.0645904541015625, 1.09893798828125, 1.1332855224609375, 1.167633056640625, 1.2019805908203125, 1.236328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 8.0, 13.0, 11.0, 23.0, 25.0, 24.0, 21.0, 35.0, 26.0, 33.0, 36.0, 44.0, 45.0, 40.0, 41.0, 44.0, 53.0, 36.0, 49.0, 40.0, 42.0, 31.0, 28.0, 26.0, 30.0, 31.0, 24.0, 22.0, 18.0, 16.0, 13.0, 11.0, 9.0, 7.0, 5.0, 1.0, 8.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94677734375, -0.9163818359375, -0.885986328125, -0.8555908203125, -0.8251953125, -0.7947998046875, -0.764404296875, -0.7340087890625, -0.70361328125, -0.6732177734375, -0.642822265625, -0.6124267578125, -0.58203125, -0.5516357421875, -0.521240234375, -0.4908447265625, -0.46044921875, -0.4300537109375, -0.399658203125, -0.3692626953125, -0.3388671875, -0.3084716796875, -0.278076171875, -0.2476806640625, -0.21728515625, -0.1868896484375, -0.156494140625, -0.1260986328125, -0.095703125, -0.0653076171875, -0.034912109375, -0.0045166015625, 0.02587890625, 0.0562744140625, 0.086669921875, 0.1170654296875, 0.1474609375, 0.1778564453125, 0.208251953125, 0.2386474609375, 0.26904296875, 0.2994384765625, 0.329833984375, 0.3602294921875, 0.390625, 0.4210205078125, 0.451416015625, 0.4818115234375, 0.51220703125, 0.5426025390625, 0.572998046875, 0.6033935546875, 0.6337890625, 0.6641845703125, 0.694580078125, 0.7249755859375, 0.75537109375, 0.7857666015625, 0.816162109375, 0.8465576171875, 0.876953125, 0.9073486328125, 0.937744140625, 0.9681396484375, 0.99853515625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 7.0, 13.0, 20.0, 28.0, 53.0, 79.0, 105.0, 174.0, 261.0, 406.0, 630.0, 997.0, 1690.0, 2523.0, 4260.0, 6978.0, 11316.0, 17798.0, 28071.0, 42237.0, 61801.0, 84552.0, 106911.0, 122931.0, 126065.0, 115297.0, 96278.0, 72106.0, 51564.0, 34392.0, 22055.0, 14036.0, 8641.0, 5505.0, 3283.0, 1967.0, 1261.0, 832.0, 511.0, 333.0, 210.0, 130.0, 85.0, 53.0, 46.0, 24.0, 17.0, 6.0, 4.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.654296875, -0.634613037109375, -0.61492919921875, -0.595245361328125, -0.5755615234375, -0.555877685546875, -0.53619384765625, -0.516510009765625, -0.496826171875, -0.477142333984375, -0.45745849609375, -0.437774658203125, -0.4180908203125, -0.398406982421875, -0.37872314453125, -0.359039306640625, -0.33935546875, -0.319671630859375, -0.29998779296875, -0.280303955078125, -0.2606201171875, -0.240936279296875, -0.22125244140625, -0.201568603515625, -0.181884765625, -0.162200927734375, -0.14251708984375, -0.122833251953125, -0.1031494140625, -0.083465576171875, -0.06378173828125, -0.044097900390625, -0.0244140625, -0.004730224609375, 0.01495361328125, 0.034637451171875, 0.0543212890625, 0.074005126953125, 0.09368896484375, 0.113372802734375, 0.133056640625, 0.152740478515625, 0.17242431640625, 0.192108154296875, 0.2117919921875, 0.231475830078125, 0.25115966796875, 0.270843505859375, 0.29052734375, 0.310211181640625, 0.32989501953125, 0.349578857421875, 0.3692626953125, 0.388946533203125, 0.40863037109375, 0.428314208984375, 0.447998046875, 0.467681884765625, 0.48736572265625, 0.507049560546875, 0.5267333984375, 0.546417236328125, 0.56610107421875, 0.585784912109375, 0.60546875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 5.0, 2.0, 9.0, 2.0, 10.0, 11.0, 16.0, 7.0, 16.0, 16.0, 21.0, 24.0, 36.0, 43.0, 44.0, 47.0, 47.0, 43.0, 38.0, 31.0, 49.0, 54.0, 54.0, 47.0, 47.0, 45.0, 33.0, 37.0, 34.0, 20.0, 22.0, 21.0, 16.0, 18.0, 10.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.736682891845703e-05, -7.528718560934067e-05, -7.32075423002243e-05, -7.112789899110794e-05, -6.904825568199158e-05, -6.696861237287521e-05, -6.488896906375885e-05, -6.280932575464249e-05, -6.072968244552612e-05, -5.865003913640976e-05, -5.6570395827293396e-05, -5.449075251817703e-05, -5.241110920906067e-05, -5.0331465899944305e-05, -4.825182259082794e-05, -4.617217928171158e-05, -4.4092535972595215e-05, -4.201289266347885e-05, -3.993324935436249e-05, -3.7853606045246124e-05, -3.577396273612976e-05, -3.36943194270134e-05, -3.1614676117897034e-05, -2.953503280878067e-05, -2.7455389499664307e-05, -2.5375746190547943e-05, -2.329610288143158e-05, -2.1216459572315216e-05, -1.9136816263198853e-05, -1.705717295408249e-05, -1.4977529644966125e-05, -1.2897886335849762e-05, -1.0818243026733398e-05, -8.738599717617035e-06, -6.658956408500671e-06, -4.579313099384308e-06, -2.4996697902679443e-06, -4.200264811515808e-07, 1.6596168279647827e-06, 3.7392601370811462e-06, 5.81890344619751e-06, 7.898546755313873e-06, 9.978190064430237e-06, 1.20578333735466e-05, 1.4137476682662964e-05, 1.6217119991779327e-05, 1.829676330089569e-05, 2.0376406610012054e-05, 2.2456049919128418e-05, 2.453569322824478e-05, 2.6615336537361145e-05, 2.869497984647751e-05, 3.077462315559387e-05, 3.2854266464710236e-05, 3.49339097738266e-05, 3.701355308294296e-05, 3.9093196392059326e-05, 4.117283970117569e-05, 4.325248301029205e-05, 4.533212631940842e-05, 4.741176962852478e-05, 4.9491412937641144e-05, 5.157105624675751e-05, 5.365069955587387e-05, 5.5730342864990234e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 7.0, 17.0, 30.0, 34.0, 49.0, 73.0, 124.0, 189.0, 261.0, 408.0, 609.0, 955.0, 1427.0, 2153.0, 3295.0, 4967.0, 7789.0, 11594.0, 17740.0, 25976.0, 37427.0, 52088.0, 69389.0, 87052.0, 102017.0, 110650.0, 109008.0, 99364.0, 83872.0, 65065.0, 49103.0, 34702.0, 24081.0, 16095.0, 10594.0, 7042.0, 4707.0, 2985.0, 1938.0, 1269.0, 880.0, 544.0, 339.0, 236.0, 130.0, 91.0, 70.0, 41.0, 22.0, 20.0, 16.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.57080078125, -0.5529022216796875, -0.535003662109375, -0.5171051025390625, -0.49920654296875, -0.4813079833984375, -0.463409423828125, -0.4455108642578125, -0.4276123046875, -0.4097137451171875, -0.391815185546875, -0.3739166259765625, -0.35601806640625, -0.3381195068359375, -0.320220947265625, -0.3023223876953125, -0.284423828125, -0.2665252685546875, -0.248626708984375, -0.2307281494140625, -0.21282958984375, -0.1949310302734375, -0.177032470703125, -0.1591339111328125, -0.1412353515625, -0.1233367919921875, -0.105438232421875, -0.0875396728515625, -0.06964111328125, -0.0517425537109375, -0.033843994140625, -0.0159454345703125, 0.001953125, 0.0198516845703125, 0.037750244140625, 0.0556488037109375, 0.07354736328125, 0.0914459228515625, 0.109344482421875, 0.1272430419921875, 0.1451416015625, 0.1630401611328125, 0.180938720703125, 0.1988372802734375, 0.21673583984375, 0.2346343994140625, 0.252532958984375, 0.2704315185546875, 0.288330078125, 0.3062286376953125, 0.324127197265625, 0.3420257568359375, 0.35992431640625, 0.3778228759765625, 0.395721435546875, 0.4136199951171875, 0.4315185546875, 0.4494171142578125, 0.467315673828125, 0.4852142333984375, 0.50311279296875, 0.5210113525390625, 0.538909912109375, 0.5568084716796875, 0.57470703125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 10.0, 10.0, 19.0, 16.0, 18.0, 22.0, 29.0, 20.0, 31.0, 34.0, 35.0, 39.0, 40.0, 50.0, 38.0, 51.0, 52.0, 52.0, 55.0, 34.0, 49.0, 38.0, 42.0, 39.0, 38.0, 28.0, 21.0, 20.0, 8.0, 10.0, 5.0, 8.0, 3.0, 3.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.1801280975341797, -0.17263412475585938, -0.16514015197753906, -0.15764617919921875, -0.15015220642089844, -0.14265823364257812, -0.1351642608642578, -0.1276702880859375, -0.12017631530761719, -0.11268234252929688, -0.10518836975097656, -0.09769439697265625, -0.09020042419433594, -0.08270645141601562, -0.07521247863769531, -0.067718505859375, -0.06022453308105469, -0.052730560302734375, -0.04523658752441406, -0.03774261474609375, -0.030248641967773438, -0.022754669189453125, -0.015260696411132812, -0.0077667236328125, -0.0002727508544921875, 0.007221221923828125, 0.014715194702148438, 0.02220916748046875, 0.029703140258789062, 0.037197113037109375, 0.04469108581542969, 0.05218505859375, 0.05967903137207031, 0.06717300415039062, 0.07466697692871094, 0.08216094970703125, 0.08965492248535156, 0.09714889526367188, 0.10464286804199219, 0.1121368408203125, 0.11963081359863281, 0.12712478637695312, 0.13461875915527344, 0.14211273193359375, 0.14960670471191406, 0.15710067749023438, 0.1645946502685547, 0.172088623046875, 0.1795825958251953, 0.18707656860351562, 0.19457054138183594, 0.20206451416015625, 0.20955848693847656, 0.21705245971679688, 0.2245464324951172, 0.2320404052734375, 0.2395343780517578, 0.24702835083007812, 0.25452232360839844, 0.26201629638671875, 0.26951026916503906, 0.2770042419433594, 0.2844982147216797, 0.2919921875]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 18.0, 17.0, 27.0, 16.0, 23.0, 25.0, 41.0, 26.0, 50.0, 58.0, 47.0, 53.0, 62.0, 71.0, 58.0, 40.0, 45.0, 51.0, 34.0, 36.0, 31.0, 28.0, 23.0, 20.0, 24.0, 18.0, 12.0, 10.0, 5.0, 3.0, 5.0, 0.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052737236022949, -1.9824645519256592, -1.9121919870376587, -1.8419193029403687, -1.7716466188430786, -1.7013740539550781, -1.631101369857788, -1.560828685760498, -1.490556001663208, -1.420283317565918, -1.3500107526779175, -1.2797380685806274, -1.2094653844833374, -1.139192819595337, -1.0689201354980469, -0.9986474514007568, -0.9283748865127563, -0.8581022620201111, -0.787829577922821, -0.7175569534301758, -0.6472842693328857, -0.5770116448402405, -0.5067390203475952, -0.43646636605262756, -0.3661937117576599, -0.29592105746269226, -0.2256484180688858, -0.15537577867507935, -0.0851031243801117, -0.014830470085144043, 0.05544215440750122, 0.12571480870246887, 0.19598746299743652, 0.2662601172924042, 0.3365327715873718, 0.4068053960800171, 0.47707805037498474, 0.5473507046699524, 0.6176233291625977, 0.6878960132598877, 0.758168637752533, 0.8284412622451782, 0.8987139463424683, 0.9689865708351135, 1.0392591953277588, 1.1095318794250488, 1.1798045635223389, 1.2500771284103394, 1.3203498125076294, 1.3906224966049194, 1.46089506149292, 1.53116774559021, 1.6014404296875, 1.67171311378479, 1.7419856786727905, 1.8122583627700806, 1.882530927658081, 1.952803611755371, 2.023076295852661, 2.093348979949951, 2.163621425628662, 2.233894109725952, 2.304166793823242, 2.3744394779205322, 2.4447121620178223]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 11.0, 10.0, 8.0, 7.0, 18.0, 9.0, 21.0, 15.0, 27.0, 24.0, 26.0, 31.0, 35.0, 28.0, 39.0, 49.0, 44.0, 54.0, 34.0, 40.0, 41.0, 37.0, 48.0, 31.0, 43.0, 36.0, 32.0, 33.0, 25.0, 25.0, 21.0, 19.0, 11.0, 16.0, 7.0, 10.0, 10.0, 7.0, 5.0, 2.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6441646814346313, -1.5958521366119385, -1.547539472579956, -1.4992269277572632, -1.4509143829345703, -1.4026018381118774, -1.3542892932891846, -1.3059766292572021, -1.2576640844345093, -1.2093515396118164, -1.161038875579834, -1.1127263307571411, -1.0644137859344482, -1.0161012411117554, -0.9677886366844177, -0.9194760322570801, -0.8711634874343872, -0.8228509426116943, -0.7745383381843567, -0.726225733757019, -0.6779131889343262, -0.6296006441116333, -0.5812880396842957, -0.532975435256958, -0.48466289043426514, -0.4363503158092499, -0.3880377411842346, -0.33972516655921936, -0.2914125919342041, -0.24310001730918884, -0.19478744268417358, -0.14647486805915833, -0.09816241264343262, -0.04984983801841736, -0.0015372633934020996, 0.04677531123161316, 0.09508788585662842, 0.14340046048164368, 0.19171303510665894, 0.2400256097316742, 0.28833818435668945, 0.3366507589817047, 0.38496333360671997, 0.43327590823173523, 0.4815884828567505, 0.5299010276794434, 0.578213632106781, 0.6265262365341187, 0.6748387813568115, 0.7231513261795044, 0.771463930606842, 0.8197765350341797, 0.8680890798568726, 0.9164016246795654, 0.9647142291069031, 1.0130268335342407, 1.0613393783569336, 1.1096519231796265, 1.1579644680023193, 1.2062771320343018, 1.2545896768569946, 1.3029022216796875, 1.35121488571167, 1.3995274305343628, 1.4478399753570557]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 16.0, 31.0, 52.0, 80.0, 104.0, 179.0, 311.0, 472.0, 780.0, 1244.0, 2147.0, 3646.0, 6049.0, 10341.0, 17374.0, 29901.0, 51538.0, 86344.0, 140587.0, 222680.0, 327754.0, 445322.0, 538683.0, 567637.0, 519751.0, 415012.0, 299586.0, 199195.0, 124863.0, 75576.0, 44861.0, 26159.0, 15083.0, 8728.0, 5065.0, 2967.0, 1662.0, 995.0, 599.0, 335.0, 211.0, 132.0, 92.0, 46.0, 30.0, 17.0, 17.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6513671875, -1.6003570556640625, -1.549346923828125, -1.4983367919921875, -1.44732666015625, -1.3963165283203125, -1.345306396484375, -1.2942962646484375, -1.2432861328125, -1.1922760009765625, -1.141265869140625, -1.0902557373046875, -1.03924560546875, -0.9882354736328125, -0.937225341796875, -0.8862152099609375, -0.835205078125, -0.7841949462890625, -0.733184814453125, -0.6821746826171875, -0.63116455078125, -0.5801544189453125, -0.529144287109375, -0.4781341552734375, -0.4271240234375, -0.3761138916015625, -0.325103759765625, -0.2740936279296875, -0.22308349609375, -0.1720733642578125, -0.121063232421875, -0.0700531005859375, -0.01904296875, 0.0319671630859375, 0.082977294921875, 0.1339874267578125, 0.18499755859375, 0.2360076904296875, 0.287017822265625, 0.3380279541015625, 0.3890380859375, 0.4400482177734375, 0.491058349609375, 0.5420684814453125, 0.59307861328125, 0.6440887451171875, 0.695098876953125, 0.7461090087890625, 0.797119140625, 0.8481292724609375, 0.899139404296875, 0.9501495361328125, 1.00115966796875, 1.0521697998046875, 1.103179931640625, 1.1541900634765625, 1.2052001953125, 1.2562103271484375, 1.307220458984375, 1.3582305908203125, 1.40924072265625, 1.4602508544921875, 1.511260986328125, 1.5622711181640625, 1.61328125]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 9.0, 11.0, 9.0, 11.0, 6.0, 15.0, 13.0, 16.0, 15.0, 27.0, 22.0, 28.0, 35.0, 32.0, 37.0, 40.0, 41.0, 39.0, 31.0, 37.0, 44.0, 42.0, 40.0, 37.0, 38.0, 35.0, 44.0, 25.0, 24.0, 23.0, 26.0, 25.0, 13.0, 12.0, 17.0, 18.0, 14.0, 5.0, 7.0, 5.0, 4.0, 8.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3056640625, -1.2673187255859375, -1.228973388671875, -1.1906280517578125, -1.15228271484375, -1.1139373779296875, -1.075592041015625, -1.0372467041015625, -0.9989013671875, -0.9605560302734375, -0.922210693359375, -0.8838653564453125, -0.84552001953125, -0.8071746826171875, -0.768829345703125, -0.7304840087890625, -0.692138671875, -0.6537933349609375, -0.615447998046875, -0.5771026611328125, -0.53875732421875, -0.5004119873046875, -0.462066650390625, -0.4237213134765625, -0.3853759765625, -0.3470306396484375, -0.308685302734375, -0.2703399658203125, -0.23199462890625, -0.1936492919921875, -0.155303955078125, -0.1169586181640625, -0.07861328125, -0.0402679443359375, -0.001922607421875, 0.0364227294921875, 0.07476806640625, 0.1131134033203125, 0.151458740234375, 0.1898040771484375, 0.2281494140625, 0.2664947509765625, 0.304840087890625, 0.3431854248046875, 0.38153076171875, 0.4198760986328125, 0.458221435546875, 0.4965667724609375, 0.534912109375, 0.5732574462890625, 0.611602783203125, 0.6499481201171875, 0.68829345703125, 0.7266387939453125, 0.764984130859375, 0.8033294677734375, 0.8416748046875, 0.8800201416015625, 0.918365478515625, 0.9567108154296875, 0.99505615234375, 1.0334014892578125, 1.071746826171875, 1.1100921630859375, 1.1484375]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 17.0, 29.0, 42.0, 73.0, 120.0, 215.0, 351.0, 556.0, 932.0, 1594.0, 2777.0, 4568.0, 8097.0, 13402.0, 22683.0, 38392.0, 62227.0, 100217.0, 154234.0, 226711.0, 314267.0, 402179.0, 472768.0, 500720.0, 478665.0, 410040.0, 321211.0, 232322.0, 158581.0, 103429.0, 64824.0, 39677.0, 24078.0, 14092.0, 8348.0, 4799.0, 2918.0, 1680.0, 1009.0, 549.0, 338.0, 224.0, 133.0, 85.0, 49.0, 17.0, 13.0, 13.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6858062744140625, -1.632354736328125, -1.5789031982421875, -1.52545166015625, -1.4720001220703125, -1.418548583984375, -1.3650970458984375, -1.3116455078125, -1.2581939697265625, -1.204742431640625, -1.1512908935546875, -1.09783935546875, -1.0443878173828125, -0.990936279296875, -0.9374847412109375, -0.884033203125, -0.8305816650390625, -0.777130126953125, -0.7236785888671875, -0.67022705078125, -0.6167755126953125, -0.563323974609375, -0.5098724365234375, -0.4564208984375, -0.4029693603515625, -0.349517822265625, -0.2960662841796875, -0.24261474609375, -0.1891632080078125, -0.135711669921875, -0.0822601318359375, -0.02880859375, 0.0246429443359375, 0.078094482421875, 0.1315460205078125, 0.18499755859375, 0.2384490966796875, 0.291900634765625, 0.3453521728515625, 0.3988037109375, 0.4522552490234375, 0.505706787109375, 0.5591583251953125, 0.61260986328125, 0.6660614013671875, 0.719512939453125, 0.7729644775390625, 0.826416015625, 0.8798675537109375, 0.933319091796875, 0.9867706298828125, 1.04022216796875, 1.0936737060546875, 1.147125244140625, 1.2005767822265625, 1.2540283203125, 1.3074798583984375, 1.360931396484375, 1.4143829345703125, 1.46783447265625, 1.5212860107421875, 1.574737548828125, 1.6281890869140625, 1.681640625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 12.0, 10.0, 6.0, 27.0, 34.0, 30.0, 34.0, 60.0, 67.0, 84.0, 118.0, 136.0, 149.0, 142.0, 168.0, 206.0, 203.0, 215.0, 216.0, 240.0, 238.0, 212.0, 217.0, 170.0, 155.0, 151.0, 142.0, 147.0, 105.0, 80.0, 63.0, 57.0, 44.0, 42.0, 29.0, 12.0, 17.0, 5.0, 4.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7265853881835938, -0.7026824951171875, -0.6787796020507812, -0.654876708984375, -0.6309738159179688, -0.6070709228515625, -0.5831680297851562, -0.55926513671875, -0.5353622436523438, -0.5114593505859375, -0.48755645751953125, -0.463653564453125, -0.43975067138671875, -0.4158477783203125, -0.39194488525390625, -0.3680419921875, -0.34413909912109375, -0.3202362060546875, -0.29633331298828125, -0.272430419921875, -0.24852752685546875, -0.2246246337890625, -0.20072174072265625, -0.17681884765625, -0.15291595458984375, -0.1290130615234375, -0.10511016845703125, -0.081207275390625, -0.05730438232421875, -0.0334014892578125, -0.00949859619140625, 0.014404296875, 0.03830718994140625, 0.0622100830078125, 0.08611297607421875, 0.110015869140625, 0.13391876220703125, 0.1578216552734375, 0.18172454833984375, 0.20562744140625, 0.22953033447265625, 0.2534332275390625, 0.27733612060546875, 0.301239013671875, 0.32514190673828125, 0.3490447998046875, 0.37294769287109375, 0.3968505859375, 0.42075347900390625, 0.4446563720703125, 0.46855926513671875, 0.492462158203125, 0.5163650512695312, 0.5402679443359375, 0.5641708374023438, 0.58807373046875, 0.6119766235351562, 0.6358795166015625, 0.6597824096679688, 0.683685302734375, 0.7075881958007812, 0.7314910888671875, 0.7553939819335938, 0.779296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 13.0, 17.0, 9.0, 28.0, 33.0, 22.0, 31.0, 34.0, 48.0, 62.0, 64.0, 61.0, 71.0, 49.0, 55.0, 50.0, 66.0, 49.0, 39.0, 40.0, 28.0, 27.0, 23.0, 13.0, 15.0, 13.0, 10.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.804446220397949, -2.719447135925293, -2.6344478130340576, -2.5494487285614014, -2.464449644088745, -2.3794503211975098, -2.2944512367248535, -2.2094521522521973, -2.124453067779541, -2.0394539833068848, -1.954454779624939, -1.8694555759429932, -1.784456491470337, -1.6994572877883911, -1.6144580841064453, -1.529458999633789, -1.4444596767425537, -1.359460473060608, -1.2744613885879517, -1.1894621849060059, -1.1044631004333496, -1.0194638967514038, -0.934464693069458, -0.849465548992157, -0.764466404914856, -0.6794672608375549, -0.5944681167602539, -0.5094689130783081, -0.4244697690010071, -0.33947062492370605, -0.25447142124176025, -0.16947227716445923, -0.0844733715057373, 0.0005257874727249146, 0.08552494645118713, 0.17052412033081055, 0.2555232644081116, 0.3405224084854126, 0.4255216121673584, 0.5105207562446594, 0.5955199003219604, 0.6805190443992615, 0.7655181884765625, 0.8505173921585083, 0.9355165362358093, 1.0205156803131104, 1.1055148839950562, 1.190514087677002, 1.2755131721496582, 1.360512375831604, 1.4455114603042603, 1.530510663986206, 1.6155097484588623, 1.700508952140808, 1.785508155822754, 1.8705072402954102, 1.955506443977356, 2.0405056476593018, 2.125504732131958, 2.2105040550231934, 2.2955031394958496, 2.380502223968506, 2.465501308441162, 2.5505006313323975, 2.6354997158050537]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 12.0, 9.0, 10.0, 15.0, 18.0, 14.0, 23.0, 21.0, 30.0, 21.0, 36.0, 36.0, 27.0, 31.0, 42.0, 49.0, 43.0, 33.0, 42.0, 44.0, 42.0, 34.0, 46.0, 35.0, 35.0, 28.0, 24.0, 29.0, 25.0, 21.0, 18.0, 19.0, 14.0, 6.0, 8.0, 8.0, 3.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.6612660884857178, -1.6119011640548706, -1.5625362396240234, -1.5131713151931763, -1.463806390762329, -1.414441466331482, -1.3650765419006348, -1.3157117366790771, -1.2663466930389404, -1.2169817686080933, -1.167616844177246, -1.118251919746399, -1.0688869953155518, -1.0195220708847046, -0.9701572060585022, -0.920792281627655, -0.8714274168014526, -0.8220624923706055, -0.7726975679397583, -0.7233326435089111, -0.673967719078064, -0.6246027946472168, -0.5752379298210144, -0.5258730053901672, -0.47650808095932007, -0.4271431565284729, -0.37777823209762573, -0.32841333746910095, -0.2790484130382538, -0.22968348860740662, -0.18031859397888184, -0.13095366954803467, -0.08158862590789795, -0.03222370892763138, 0.017141208052635193, 0.06650611758232117, 0.11587104201316833, 0.1652359664440155, 0.21460086107254028, 0.26396578550338745, 0.3133307099342346, 0.3626956343650818, 0.41206055879592896, 0.46142545342445374, 0.5107903480529785, 0.5601552724838257, 0.6095201969146729, 0.65888512134552, 0.7082500457763672, 0.7576149702072144, 0.8069798946380615, 0.8563448190689087, 0.9057097434997559, 0.955074667930603, 1.0044395923614502, 1.0538043975830078, 1.1031694412231445, 1.1525343656539917, 1.2018992900848389, 1.251264214515686, 1.3006291389465332, 1.3499940633773804, 1.3993589878082275, 1.4487237930297852, 1.4980887174606323]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 14.0, 12.0, 23.0, 38.0, 53.0, 72.0, 121.0, 181.0, 308.0, 468.0, 734.0, 1318.0, 2311.0, 4126.0, 7945.0, 15267.0, 29808.0, 56438.0, 105028.0, 179337.0, 231757.0, 182776.0, 108068.0, 57877.0, 30468.0, 15650.0, 8120.0, 4429.0, 2416.0, 1325.0, 769.0, 482.0, 291.0, 173.0, 97.0, 68.0, 58.0, 43.0, 17.0, 19.0, 15.0, 10.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5322265625, -0.5141983032226562, -0.4961700439453125, -0.47814178466796875, -0.460113525390625, -0.44208526611328125, -0.4240570068359375, -0.40602874755859375, -0.38800048828125, -0.36997222900390625, -0.3519439697265625, -0.33391571044921875, -0.315887451171875, -0.29785919189453125, -0.2798309326171875, -0.26180267333984375, -0.2437744140625, -0.22574615478515625, -0.2077178955078125, -0.18968963623046875, -0.171661376953125, -0.15363311767578125, -0.1356048583984375, -0.11757659912109375, -0.09954833984375, -0.08152008056640625, -0.0634918212890625, -0.04546356201171875, -0.027435302734375, -0.00940704345703125, 0.0086212158203125, 0.02664947509765625, 0.044677734375, 0.06270599365234375, 0.0807342529296875, 0.09876251220703125, 0.116790771484375, 0.13481903076171875, 0.1528472900390625, 0.17087554931640625, 0.18890380859375, 0.20693206787109375, 0.2249603271484375, 0.24298858642578125, 0.261016845703125, 0.27904510498046875, 0.2970733642578125, 0.31510162353515625, 0.3331298828125, 0.35115814208984375, 0.3691864013671875, 0.38721466064453125, 0.405242919921875, 0.42327117919921875, 0.4412994384765625, 0.45932769775390625, 0.47735595703125, 0.49538421630859375, 0.5134124755859375, 0.5314407348632812, 0.549468994140625, 0.5674972534179688, 0.5855255126953125, 0.6035537719726562, 0.62158203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 7.0, 8.0, 9.0, 9.0, 20.0, 15.0, 19.0, 23.0, 22.0, 34.0, 30.0, 34.0, 26.0, 32.0, 35.0, 37.0, 37.0, 40.0, 47.0, 39.0, 45.0, 38.0, 40.0, 30.0, 33.0, 33.0, 29.0, 26.0, 20.0, 30.0, 14.0, 19.0, 26.0, 14.0, 5.0, 12.0, 10.0, 7.0, 12.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.587890625, -1.536163330078125, -1.48443603515625, -1.432708740234375, -1.3809814453125, -1.329254150390625, -1.27752685546875, -1.225799560546875, -1.174072265625, -1.122344970703125, -1.07061767578125, -1.018890380859375, -0.9671630859375, -0.915435791015625, -0.86370849609375, -0.811981201171875, -0.76025390625, -0.708526611328125, -0.65679931640625, -0.605072021484375, -0.5533447265625, -0.501617431640625, -0.44989013671875, -0.398162841796875, -0.346435546875, -0.294708251953125, -0.24298095703125, -0.191253662109375, -0.1395263671875, -0.087799072265625, -0.03607177734375, 0.015655517578125, 0.0673828125, 0.119110107421875, 0.17083740234375, 0.222564697265625, 0.2742919921875, 0.326019287109375, 0.37774658203125, 0.429473876953125, 0.481201171875, 0.532928466796875, 0.58465576171875, 0.636383056640625, 0.6881103515625, 0.739837646484375, 0.79156494140625, 0.843292236328125, 0.89501953125, 0.946746826171875, 0.99847412109375, 1.050201416015625, 1.1019287109375, 1.153656005859375, 1.20538330078125, 1.257110595703125, 1.308837890625, 1.360565185546875, 1.41229248046875, 1.464019775390625, 1.5157470703125, 1.567474365234375, 1.61920166015625, 1.670928955078125, 1.72265625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 9.0, 11.0, 11.0, 25.0, 28.0, 34.0, 53.0, 74.0, 120.0, 184.0, 246.0, 363.0, 602.0, 935.0, 1483.0, 2676.0, 4663.0, 9102.0, 17957.0, 36978.0, 79615.0, 163223.0, 261603.0, 228074.0, 124296.0, 58646.0, 27684.0, 13572.0, 6828.0, 3792.0, 2123.0, 1329.0, 766.0, 462.0, 319.0, 200.0, 126.0, 87.0, 61.0, 55.0, 46.0, 34.0, 18.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.619140625, -0.5990371704101562, -0.5789337158203125, -0.5588302612304688, -0.538726806640625, -0.5186233520507812, -0.4985198974609375, -0.47841644287109375, -0.45831298828125, -0.43820953369140625, -0.4181060791015625, -0.39800262451171875, -0.377899169921875, -0.35779571533203125, -0.3376922607421875, -0.31758880615234375, -0.2974853515625, -0.27738189697265625, -0.2572784423828125, -0.23717498779296875, -0.217071533203125, -0.19696807861328125, -0.1768646240234375, -0.15676116943359375, -0.13665771484375, -0.11655426025390625, -0.0964508056640625, -0.07634735107421875, -0.056243896484375, -0.03614044189453125, -0.0160369873046875, 0.00406646728515625, 0.024169921875, 0.04427337646484375, 0.0643768310546875, 0.08448028564453125, 0.104583740234375, 0.12468719482421875, 0.1447906494140625, 0.16489410400390625, 0.18499755859375, 0.20510101318359375, 0.2252044677734375, 0.24530792236328125, 0.265411376953125, 0.28551483154296875, 0.3056182861328125, 0.32572174072265625, 0.3458251953125, 0.36592864990234375, 0.3860321044921875, 0.40613555908203125, 0.426239013671875, 0.44634246826171875, 0.4664459228515625, 0.48654937744140625, 0.50665283203125, 0.5267562866210938, 0.5468597412109375, 0.5669631958007812, 0.587066650390625, 0.6071701049804688, 0.6272735595703125, 0.6473770141601562, 0.66748046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 0.0, 0.0, 5.0, 6.0, 2.0, 4.0, 5.0, 2.0, 11.0, 8.0, 16.0, 14.0, 15.0, 22.0, 28.0, 22.0, 23.0, 30.0, 28.0, 35.0, 35.0, 62.0, 38.0, 39.0, 52.0, 42.0, 52.0, 42.0, 41.0, 39.0, 41.0, 34.0, 24.0, 33.0, 23.0, 21.0, 23.0, 14.0, 19.0, 16.0, 7.0, 14.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -0.99884033203125, -0.9635009765625, -0.92816162109375, -0.892822265625, -0.85748291015625, -0.8221435546875, -0.78680419921875, -0.75146484375, -0.71612548828125, -0.6807861328125, -0.64544677734375, -0.610107421875, -0.57476806640625, -0.5394287109375, -0.50408935546875, -0.46875, -0.43341064453125, -0.3980712890625, -0.36273193359375, -0.327392578125, -0.29205322265625, -0.2567138671875, -0.22137451171875, -0.18603515625, -0.15069580078125, -0.1153564453125, -0.08001708984375, -0.044677734375, -0.00933837890625, 0.0260009765625, 0.06134033203125, 0.0966796875, 0.13201904296875, 0.1673583984375, 0.20269775390625, 0.238037109375, 0.27337646484375, 0.3087158203125, 0.34405517578125, 0.37939453125, 0.41473388671875, 0.4500732421875, 0.48541259765625, 0.520751953125, 0.55609130859375, 0.5914306640625, 0.62677001953125, 0.662109375, 0.69744873046875, 0.7327880859375, 0.76812744140625, 0.803466796875, 0.83880615234375, 0.8741455078125, 0.90948486328125, 0.94482421875, 0.98016357421875, 1.0155029296875, 1.05084228515625, 1.086181640625, 1.12152099609375, 1.1568603515625, 1.19219970703125, 1.2275390625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 7.0, 7.0, 7.0, 6.0, 6.0, 13.0, 16.0, 19.0, 22.0, 49.0, 57.0, 61.0, 68.0, 98.0, 142.0, 179.0, 253.0, 331.0, 470.0, 718.0, 1055.0, 1608.0, 2597.0, 4691.0, 8932.0, 19480.0, 54137.0, 201674.0, 482523.0, 181015.0, 49612.0, 18402.0, 8207.0, 4572.0, 2545.0, 1480.0, 1001.0, 698.0, 479.0, 363.0, 221.0, 176.0, 157.0, 118.0, 77.0, 53.0, 48.0, 22.0, 27.0, 17.0, 14.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.33349609375, -0.32254791259765625, -0.3115997314453125, -0.30065155029296875, -0.289703369140625, -0.27875518798828125, -0.2678070068359375, -0.25685882568359375, -0.24591064453125, -0.23496246337890625, -0.2240142822265625, -0.21306610107421875, -0.202117919921875, -0.19116973876953125, -0.1802215576171875, -0.16927337646484375, -0.1583251953125, -0.14737701416015625, -0.1364288330078125, -0.12548065185546875, -0.114532470703125, -0.10358428955078125, -0.0926361083984375, -0.08168792724609375, -0.07073974609375, -0.05979156494140625, -0.0488433837890625, -0.03789520263671875, -0.026947021484375, -0.01599884033203125, -0.0050506591796875, 0.00589752197265625, 0.016845703125, 0.02779388427734375, 0.0387420654296875, 0.04969024658203125, 0.060638427734375, 0.07158660888671875, 0.0825347900390625, 0.09348297119140625, 0.10443115234375, 0.11537933349609375, 0.1263275146484375, 0.13727569580078125, 0.148223876953125, 0.15917205810546875, 0.1701202392578125, 0.18106842041015625, 0.1920166015625, 0.20296478271484375, 0.2139129638671875, 0.22486114501953125, 0.235809326171875, 0.24675750732421875, 0.2577056884765625, 0.26865386962890625, 0.27960205078125, 0.29055023193359375, 0.3014984130859375, 0.31244659423828125, 0.323394775390625, 0.33434295654296875, 0.3452911376953125, 0.35623931884765625, 0.3671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 10.0, 6.0, 9.0, 11.0, 9.0, 14.0, 14.0, 15.0, 35.0, 35.0, 32.0, 35.0, 42.0, 36.0, 56.0, 34.0, 48.0, 43.0, 43.0, 57.0, 41.0, 41.0, 35.0, 42.0, 40.0, 37.0, 23.0, 23.0, 15.0, 21.0, 14.0, 11.0, 9.0, 10.0, 13.0, 7.0, 6.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.049041748046875e-05, -1.0143034160137177e-05, -9.795650839805603e-06, -9.44826751947403e-06, -9.100884199142456e-06, -8.753500878810883e-06, -8.406117558479309e-06, -8.058734238147736e-06, -7.711350917816162e-06, -7.363967597484589e-06, -7.016584277153015e-06, -6.669200956821442e-06, -6.321817636489868e-06, -5.974434316158295e-06, -5.627050995826721e-06, -5.279667675495148e-06, -4.932284355163574e-06, -4.584901034832001e-06, -4.237517714500427e-06, -3.890134394168854e-06, -3.5427510738372803e-06, -3.1953677535057068e-06, -2.8479844331741333e-06, -2.50060111284256e-06, -2.1532177925109863e-06, -1.8058344721794128e-06, -1.4584511518478394e-06, -1.1110678315162659e-06, -7.636845111846924e-07, -4.163011908531189e-07, -6.891787052154541e-08, 2.784654498100281e-07, 6.258487701416016e-07, 9.73232090473175e-07, 1.3206154108047485e-06, 1.667998731136322e-06, 2.0153820514678955e-06, 2.362765371799469e-06, 2.7101486921310425e-06, 3.057532012462616e-06, 3.4049153327941895e-06, 3.752298653125763e-06, 4.0996819734573364e-06, 4.44706529378891e-06, 4.794448614120483e-06, 5.141831934452057e-06, 5.48921525478363e-06, 5.836598575115204e-06, 6.183981895446777e-06, 6.531365215778351e-06, 6.878748536109924e-06, 7.226131856441498e-06, 7.573515176773071e-06, 7.920898497104645e-06, 8.268281817436218e-06, 8.615665137767792e-06, 8.963048458099365e-06, 9.310431778430939e-06, 9.657815098762512e-06, 1.0005198419094086e-05, 1.035258173942566e-05, 1.0699965059757233e-05, 1.1047348380088806e-05, 1.139473170042038e-05, 1.1742115020751953e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 13.0, 16.0, 27.0, 18.0, 42.0, 53.0, 85.0, 121.0, 199.0, 227.0, 386.0, 571.0, 860.0, 1284.0, 2241.0, 4135.0, 8937.0, 22001.0, 67106.0, 226908.0, 433895.0, 188161.0, 55375.0, 18818.0, 7780.0, 3694.0, 1961.0, 1204.0, 713.0, 552.0, 357.0, 253.0, 169.0, 126.0, 68.0, 61.0, 48.0, 24.0, 17.0, 11.0, 10.0, 10.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.5, -0.48503875732421875, -0.4700775146484375, -0.45511627197265625, -0.440155029296875, -0.42519378662109375, -0.4102325439453125, -0.39527130126953125, -0.38031005859375, -0.36534881591796875, -0.3503875732421875, -0.33542633056640625, -0.320465087890625, -0.30550384521484375, -0.2905426025390625, -0.27558135986328125, -0.2606201171875, -0.24565887451171875, -0.2306976318359375, -0.21573638916015625, -0.200775146484375, -0.18581390380859375, -0.1708526611328125, -0.15589141845703125, -0.14093017578125, -0.12596893310546875, -0.1110076904296875, -0.09604644775390625, -0.081085205078125, -0.06612396240234375, -0.0511627197265625, -0.03620147705078125, -0.021240234375, -0.00627899169921875, 0.0086822509765625, 0.02364349365234375, 0.038604736328125, 0.05356597900390625, 0.0685272216796875, 0.08348846435546875, 0.09844970703125, 0.11341094970703125, 0.1283721923828125, 0.14333343505859375, 0.158294677734375, 0.17325592041015625, 0.1882171630859375, 0.20317840576171875, 0.2181396484375, 0.23310089111328125, 0.2480621337890625, 0.26302337646484375, 0.277984619140625, 0.29294586181640625, 0.3079071044921875, 0.32286834716796875, 0.33782958984375, 0.35279083251953125, 0.3677520751953125, 0.38271331787109375, 0.397674560546875, 0.41263580322265625, 0.4275970458984375, 0.44255828857421875, 0.45751953125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 6.0, 6.0, 13.0, 7.0, 19.0, 29.0, 37.0, 70.0, 85.0, 147.0, 130.0, 124.0, 95.0, 69.0, 41.0, 33.0, 21.0, 17.0, 21.0, 4.0, 3.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1312255859375, -0.12743854522705078, -0.12365150451660156, -0.11986446380615234, -0.11607742309570312, -0.1122903823852539, -0.10850334167480469, -0.10471630096435547, -0.10092926025390625, -0.09714221954345703, -0.09335517883300781, -0.0895681381225586, -0.08578109741210938, -0.08199405670166016, -0.07820701599121094, -0.07441997528076172, -0.0706329345703125, -0.06684589385986328, -0.06305885314941406, -0.059271812438964844, -0.055484771728515625, -0.051697731018066406, -0.04791069030761719, -0.04412364959716797, -0.04033660888671875, -0.03654956817626953, -0.03276252746582031, -0.028975486755371094, -0.025188446044921875, -0.021401405334472656, -0.017614364624023438, -0.013827323913574219, -0.010040283203125, -0.006253242492675781, -0.0024662017822265625, 0.0013208389282226562, 0.005107879638671875, 0.008894920349121094, 0.012681961059570312, 0.01646900177001953, 0.02025604248046875, 0.02404308319091797, 0.027830123901367188, 0.031617164611816406, 0.035404205322265625, 0.039191246032714844, 0.04297828674316406, 0.04676532745361328, 0.0505523681640625, 0.05433940887451172, 0.05812644958496094, 0.061913490295410156, 0.06570053100585938, 0.0694875717163086, 0.07327461242675781, 0.07706165313720703, 0.08084869384765625, 0.08463573455810547, 0.08842277526855469, 0.0922098159790039, 0.09599685668945312, 0.09978389739990234, 0.10357093811035156, 0.10735797882080078, 0.11114501953125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 5.0, 16.0, 15.0, 15.0, 26.0, 32.0, 17.0, 39.0, 36.0, 53.0, 71.0, 64.0, 69.0, 63.0, 46.0, 53.0, 58.0, 55.0, 50.0, 39.0, 35.0, 33.0, 21.0, 21.0, 11.0, 13.0, 13.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8028035163879395, -2.7170827388763428, -2.631361961364746, -2.5456411838531494, -2.4599204063415527, -2.374199628829956, -2.2884788513183594, -2.202758312225342, -2.117037296295166, -2.0313165187835693, -1.9455957412719727, -1.859874963760376, -1.7741541862487793, -1.6884334087371826, -1.6027127504348755, -1.5169919729232788, -1.4312713146209717, -1.345550537109375, -1.2598297595977783, -1.1741089820861816, -1.088388204574585, -1.0026674270629883, -0.9169467687606812, -0.8312259912490845, -0.7455052137374878, -0.6597844362258911, -0.5740636587142944, -0.48834294080734253, -0.40262216329574585, -0.31690138578414917, -0.23118066787719727, -0.14545989036560059, -0.059739112854003906, 0.02598164975643158, 0.11170241236686707, 0.19742316007614136, 0.28314393758773804, 0.3688647150993347, 0.4545854330062866, 0.5403062105178833, 0.62602698802948, 0.7117477655410767, 0.7974685430526733, 0.8831892609596252, 0.9689100384712219, 1.0546307563781738, 1.1403515338897705, 1.2260723114013672, 1.3117930889129639, 1.3975138664245605, 1.4832346439361572, 1.568955421447754, 1.6546761989593506, 1.7403969764709473, 1.8261176347732544, 1.911838412284851, 1.9975591897964478, 2.083279848098755, 2.1690006256103516, 2.2547214031219482, 2.340442180633545, 2.4261629581451416, 2.5118837356567383, 2.597604513168335, 2.6833252906799316]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 7.0, 14.0, 8.0, 13.0, 13.0, 15.0, 18.0, 21.0, 23.0, 23.0, 28.0, 29.0, 42.0, 27.0, 33.0, 39.0, 48.0, 47.0, 29.0, 47.0, 48.0, 28.0, 41.0, 49.0, 36.0, 32.0, 34.0, 17.0, 34.0, 21.0, 20.0, 21.0, 19.0, 10.0, 8.0, 9.0, 6.0, 4.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.6686097383499146, -1.6190205812454224, -1.5694313049316406, -1.5198421478271484, -1.4702529907226562, -1.4206637144088745, -1.3710745573043823, -1.3214852809906006, -1.2718961238861084, -1.2223069667816162, -1.1727176904678345, -1.1231285333633423, -1.0735392570495605, -1.0239500999450684, -0.9743609428405762, -0.9247717261314392, -0.8751825094223022, -0.8255932927131653, -0.7760040760040283, -0.7264149188995361, -0.6768257021903992, -0.6272364854812622, -0.57764732837677, -0.5280581116676331, -0.4784688949584961, -0.42887967824935913, -0.37929049134254456, -0.32970130443573, -0.280112087726593, -0.23052288591861725, -0.18093368411064148, -0.1313444972038269, -0.08175528049468994, -0.03216607868671417, 0.017423123121261597, 0.06701232492923737, 0.11660152673721313, 0.1661907285451889, 0.21577993035316467, 0.26536911725997925, 0.3149583339691162, 0.3645475506782532, 0.41413673758506775, 0.4637259244918823, 0.5133151412010193, 0.5629043579101562, 0.6124935150146484, 0.6620827317237854, 0.7116719484329224, 0.7612611651420593, 0.8108503818511963, 0.8604395389556885, 0.9100287556648254, 0.9596179723739624, 1.0092071294784546, 1.0587964057922363, 1.1083855628967285, 1.1579747200012207, 1.2075639963150024, 1.2571531534194946, 1.3067424297332764, 1.3563315868377686, 1.4059207439422607, 1.455509901046753, 1.5050991773605347]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 16.0, 25.0, 37.0, 70.0, 107.0, 142.0, 226.0, 396.0, 625.0, 1031.0, 1565.0, 2541.0, 3896.0, 6096.0, 9060.0, 13846.0, 20351.0, 29148.0, 39452.0, 52889.0, 66788.0, 80266.0, 91485.0, 98529.0, 98322.0, 92410.0, 82139.0, 68646.0, 54180.0, 40819.0, 29955.0, 21244.0, 14587.0, 9797.0, 6427.0, 4045.0, 2712.0, 1763.0, 1078.0, 691.0, 433.0, 243.0, 172.0, 116.0, 77.0, 39.0, 25.0, 22.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0188446044921875, -0.984954833984375, -0.9510650634765625, -0.91717529296875, -0.8832855224609375, -0.849395751953125, -0.8155059814453125, -0.7816162109375, -0.7477264404296875, -0.713836669921875, -0.6799468994140625, -0.64605712890625, -0.6121673583984375, -0.578277587890625, -0.5443878173828125, -0.510498046875, -0.4766082763671875, -0.442718505859375, -0.4088287353515625, -0.37493896484375, -0.3410491943359375, -0.307159423828125, -0.2732696533203125, -0.2393798828125, -0.2054901123046875, -0.171600341796875, -0.1377105712890625, -0.10382080078125, -0.0699310302734375, -0.036041259765625, -0.0021514892578125, 0.03173828125, 0.0656280517578125, 0.099517822265625, 0.1334075927734375, 0.16729736328125, 0.2011871337890625, 0.235076904296875, 0.2689666748046875, 0.3028564453125, 0.3367462158203125, 0.370635986328125, 0.4045257568359375, 0.43841552734375, 0.4723052978515625, 0.506195068359375, 0.5400848388671875, 0.573974609375, 0.6078643798828125, 0.641754150390625, 0.6756439208984375, 0.70953369140625, 0.7434234619140625, 0.777313232421875, 0.8112030029296875, 0.8450927734375, 0.8789825439453125, 0.912872314453125, 0.9467620849609375, 0.98065185546875, 1.0145416259765625, 1.048431396484375, 1.0823211669921875, 1.1162109375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 5.0, 7.0, 7.0, 9.0, 8.0, 10.0, 10.0, 14.0, 20.0, 23.0, 19.0, 22.0, 31.0, 34.0, 27.0, 40.0, 48.0, 38.0, 50.0, 43.0, 44.0, 55.0, 43.0, 44.0, 37.0, 42.0, 32.0, 31.0, 28.0, 34.0, 24.0, 24.0, 14.0, 15.0, 19.0, 17.0, 9.0, 5.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.9345703125, -1.8772125244140625, -1.819854736328125, -1.7624969482421875, -1.70513916015625, -1.6477813720703125, -1.590423583984375, -1.5330657958984375, -1.4757080078125, -1.4183502197265625, -1.360992431640625, -1.3036346435546875, -1.24627685546875, -1.1889190673828125, -1.131561279296875, -1.0742034912109375, -1.016845703125, -0.9594879150390625, -0.902130126953125, -0.8447723388671875, -0.78741455078125, -0.7300567626953125, -0.672698974609375, -0.6153411865234375, -0.5579833984375, -0.5006256103515625, -0.443267822265625, -0.3859100341796875, -0.32855224609375, -0.2711944580078125, -0.213836669921875, -0.1564788818359375, -0.09912109375, -0.0417633056640625, 0.015594482421875, 0.0729522705078125, 0.13031005859375, 0.1876678466796875, 0.245025634765625, 0.3023834228515625, 0.3597412109375, 0.4170989990234375, 0.474456787109375, 0.5318145751953125, 0.58917236328125, 0.6465301513671875, 0.703887939453125, 0.7612457275390625, 0.818603515625, 0.8759613037109375, 0.933319091796875, 0.9906768798828125, 1.04803466796875, 1.1053924560546875, 1.162750244140625, 1.2201080322265625, 1.2774658203125, 1.3348236083984375, 1.392181396484375, 1.4495391845703125, 1.50689697265625, 1.5642547607421875, 1.621612548828125, 1.6789703369140625, 1.736328125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 10.0, 26.0, 31.0, 64.0, 89.0, 140.0, 188.0, 310.0, 489.0, 766.0, 1134.0, 1903.0, 2869.0, 4493.0, 6856.0, 10342.0, 15388.0, 22428.0, 31941.0, 43266.0, 57743.0, 72693.0, 86664.0, 96855.0, 101445.0, 98873.0, 90408.0, 76969.0, 63033.0, 48504.0, 35833.0, 24916.0, 17667.0, 11958.0, 7671.0, 5072.0, 3315.0, 2268.0, 1367.0, 953.0, 630.0, 353.0, 239.0, 149.0, 86.0, 54.0, 32.0, 21.0, 20.0, 9.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0], "bins": [-1.1435546875, -1.108551025390625, -1.07354736328125, -1.038543701171875, -1.0035400390625, -0.968536376953125, -0.93353271484375, -0.898529052734375, -0.863525390625, -0.828521728515625, -0.79351806640625, -0.758514404296875, -0.7235107421875, -0.688507080078125, -0.65350341796875, -0.618499755859375, -0.58349609375, -0.548492431640625, -0.51348876953125, -0.478485107421875, -0.4434814453125, -0.408477783203125, -0.37347412109375, -0.338470458984375, -0.303466796875, -0.268463134765625, -0.23345947265625, -0.198455810546875, -0.1634521484375, -0.128448486328125, -0.09344482421875, -0.058441162109375, -0.0234375, 0.011566162109375, 0.04656982421875, 0.081573486328125, 0.1165771484375, 0.151580810546875, 0.18658447265625, 0.221588134765625, 0.256591796875, 0.291595458984375, 0.32659912109375, 0.361602783203125, 0.3966064453125, 0.431610107421875, 0.46661376953125, 0.501617431640625, 0.53662109375, 0.571624755859375, 0.60662841796875, 0.641632080078125, 0.6766357421875, 0.711639404296875, 0.74664306640625, 0.781646728515625, 0.816650390625, 0.851654052734375, 0.88665771484375, 0.921661376953125, 0.9566650390625, 0.991668701171875, 1.02667236328125, 1.061676025390625, 1.0966796875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 9.0, 15.0, 15.0, 14.0, 25.0, 24.0, 29.0, 30.0, 20.0, 26.0, 40.0, 48.0, 33.0, 40.0, 36.0, 39.0, 45.0, 58.0, 36.0, 41.0, 45.0, 37.0, 49.0, 46.0, 31.0, 30.0, 19.0, 20.0, 28.0, 13.0, 13.0, 9.0, 8.0, 6.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1130523681640625, -1.076690673828125, -1.0403289794921875, -1.00396728515625, -0.9676055908203125, -0.931243896484375, -0.8948822021484375, -0.8585205078125, -0.8221588134765625, -0.785797119140625, -0.7494354248046875, -0.71307373046875, -0.6767120361328125, -0.640350341796875, -0.6039886474609375, -0.567626953125, -0.5312652587890625, -0.494903564453125, -0.4585418701171875, -0.42218017578125, -0.3858184814453125, -0.349456787109375, -0.3130950927734375, -0.2767333984375, -0.2403717041015625, -0.204010009765625, -0.1676483154296875, -0.13128662109375, -0.0949249267578125, -0.058563232421875, -0.0222015380859375, 0.01416015625, 0.0505218505859375, 0.086883544921875, 0.1232452392578125, 0.15960693359375, 0.1959686279296875, 0.232330322265625, 0.2686920166015625, 0.3050537109375, 0.3414154052734375, 0.377777099609375, 0.4141387939453125, 0.45050048828125, 0.4868621826171875, 0.523223876953125, 0.5595855712890625, 0.595947265625, 0.6323089599609375, 0.668670654296875, 0.7050323486328125, 0.74139404296875, 0.7777557373046875, 0.814117431640625, 0.8504791259765625, 0.8868408203125, 0.9232025146484375, 0.959564208984375, 0.9959259033203125, 1.03228759765625, 1.0686492919921875, 1.105010986328125, 1.1413726806640625, 1.177734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 9.0, 9.0, 26.0, 14.0, 18.0, 29.0, 40.0, 55.0, 84.0, 155.0, 195.0, 365.0, 556.0, 951.0, 1644.0, 3090.0, 5693.0, 10394.0, 19512.0, 35968.0, 64015.0, 104060.0, 149177.0, 175861.0, 165834.0, 126548.0, 80438.0, 47252.0, 25694.0, 14114.0, 7355.0, 3912.0, 2306.0, 1224.0, 716.0, 423.0, 240.0, 181.0, 126.0, 75.0, 52.0, 35.0, 35.0, 16.0, 11.0, 10.0, 9.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.91845703125, -0.8895111083984375, -0.860565185546875, -0.8316192626953125, -0.80267333984375, -0.7737274169921875, -0.744781494140625, -0.7158355712890625, -0.6868896484375, -0.6579437255859375, -0.628997802734375, -0.6000518798828125, -0.57110595703125, -0.5421600341796875, -0.513214111328125, -0.4842681884765625, -0.455322265625, -0.4263763427734375, -0.397430419921875, -0.3684844970703125, -0.33953857421875, -0.3105926513671875, -0.281646728515625, -0.2527008056640625, -0.2237548828125, -0.1948089599609375, -0.165863037109375, -0.1369171142578125, -0.10797119140625, -0.0790252685546875, -0.050079345703125, -0.0211334228515625, 0.0078125, 0.0367584228515625, 0.065704345703125, 0.0946502685546875, 0.12359619140625, 0.1525421142578125, 0.181488037109375, 0.2104339599609375, 0.2393798828125, 0.2683258056640625, 0.297271728515625, 0.3262176513671875, 0.35516357421875, 0.3841094970703125, 0.413055419921875, 0.4420013427734375, 0.470947265625, 0.4998931884765625, 0.528839111328125, 0.5577850341796875, 0.58673095703125, 0.6156768798828125, 0.644622802734375, 0.6735687255859375, 0.7025146484375, 0.7314605712890625, 0.760406494140625, 0.7893524169921875, 0.81829833984375, 0.8472442626953125, 0.876190185546875, 0.9051361083984375, 0.93408203125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 9.0, 4.0, 5.0, 3.0, 12.0, 16.0, 13.0, 24.0, 30.0, 39.0, 30.0, 42.0, 49.0, 52.0, 62.0, 66.0, 63.0, 75.0, 50.0, 67.0, 58.0, 51.0, 35.0, 39.0, 26.0, 20.0, 17.0, 15.0, 7.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.512901306152344e-05, -9.219907224178314e-05, -8.926913142204285e-05, -8.633919060230255e-05, -8.340924978256226e-05, -8.047930896282196e-05, -7.754936814308167e-05, -7.461942732334137e-05, -7.168948650360107e-05, -6.875954568386078e-05, -6.582960486412048e-05, -6.289966404438019e-05, -5.996972322463989e-05, -5.70397824048996e-05, -5.41098415851593e-05, -5.1179900765419006e-05, -4.824995994567871e-05, -4.5320019125938416e-05, -4.239007830619812e-05, -3.9460137486457825e-05, -3.653019666671753e-05, -3.3600255846977234e-05, -3.067031502723694e-05, -2.7740374207496643e-05, -2.4810433387756348e-05, -2.1880492568016052e-05, -1.8950551748275757e-05, -1.602061092853546e-05, -1.3090670108795166e-05, -1.016072928905487e-05, -7.230788469314575e-06, -4.30084764957428e-06, -1.3709068298339844e-06, 1.559033989906311e-06, 4.4889748096466064e-06, 7.418915629386902e-06, 1.0348856449127197e-05, 1.3278797268867493e-05, 1.6208738088607788e-05, 1.9138678908348083e-05, 2.206861972808838e-05, 2.4998560547828674e-05, 2.792850136756897e-05, 3.0858442187309265e-05, 3.378838300704956e-05, 3.6718323826789856e-05, 3.964826464653015e-05, 4.257820546627045e-05, 4.550814628601074e-05, 4.843808710575104e-05, 5.136802792549133e-05, 5.429796874523163e-05, 5.7227909564971924e-05, 6.015785038471222e-05, 6.308779120445251e-05, 6.601773202419281e-05, 6.89476728439331e-05, 7.18776136636734e-05, 7.48075544834137e-05, 7.773749530315399e-05, 8.066743612289429e-05, 8.359737694263458e-05, 8.652731776237488e-05, 8.945725858211517e-05, 9.238719940185547e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 5.0, 14.0, 18.0, 34.0, 54.0, 56.0, 102.0, 127.0, 160.0, 267.0, 471.0, 735.0, 1167.0, 2161.0, 3877.0, 7541.0, 14839.0, 29396.0, 56962.0, 103039.0, 159489.0, 196257.0, 182200.0, 129725.0, 76541.0, 40230.0, 20638.0, 10244.0, 5273.0, 2858.0, 1562.0, 887.0, 555.0, 350.0, 223.0, 157.0, 118.0, 71.0, 52.0, 35.0, 22.0, 15.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1484375, -1.1143951416015625, -1.080352783203125, -1.0463104248046875, -1.01226806640625, -0.9782257080078125, -0.944183349609375, -0.9101409912109375, -0.8760986328125, -0.8420562744140625, -0.808013916015625, -0.7739715576171875, -0.73992919921875, -0.7058868408203125, -0.671844482421875, -0.6378021240234375, -0.603759765625, -0.5697174072265625, -0.535675048828125, -0.5016326904296875, -0.46759033203125, -0.4335479736328125, -0.399505615234375, -0.3654632568359375, -0.3314208984375, -0.2973785400390625, -0.263336181640625, -0.2292938232421875, -0.19525146484375, -0.1612091064453125, -0.127166748046875, -0.0931243896484375, -0.05908203125, -0.0250396728515625, 0.009002685546875, 0.0430450439453125, 0.07708740234375, 0.1111297607421875, 0.145172119140625, 0.1792144775390625, 0.2132568359375, 0.2472991943359375, 0.281341552734375, 0.3153839111328125, 0.34942626953125, 0.3834686279296875, 0.417510986328125, 0.4515533447265625, 0.485595703125, 0.5196380615234375, 0.553680419921875, 0.5877227783203125, 0.62176513671875, 0.6558074951171875, 0.689849853515625, 0.7238922119140625, 0.7579345703125, 0.7919769287109375, 0.826019287109375, 0.8600616455078125, 0.89410400390625, 0.9281463623046875, 0.962188720703125, 0.9962310791015625, 1.0302734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 11.0, 14.0, 15.0, 23.0, 31.0, 32.0, 42.0, 44.0, 64.0, 61.0, 85.0, 73.0, 75.0, 72.0, 47.0, 50.0, 39.0, 57.0, 35.0, 25.0, 20.0, 19.0, 19.0, 9.0, 5.0, 10.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.344482421875, -0.3343162536621094, -0.32415008544921875, -0.3139839172363281, -0.3038177490234375, -0.2936515808105469, -0.28348541259765625, -0.2733192443847656, -0.263153076171875, -0.2529869079589844, -0.24282073974609375, -0.23265457153320312, -0.2224884033203125, -0.21232223510742188, -0.20215606689453125, -0.19198989868164062, -0.18182373046875, -0.17165756225585938, -0.16149139404296875, -0.15132522583007812, -0.1411590576171875, -0.13099288940429688, -0.12082672119140625, -0.11066055297851562, -0.100494384765625, -0.09032821655273438, -0.08016204833984375, -0.06999588012695312, -0.0598297119140625, -0.049663543701171875, -0.03949737548828125, -0.029331207275390625, -0.0191650390625, -0.008998870849609375, 0.00116729736328125, 0.011333465576171875, 0.0214996337890625, 0.031665802001953125, 0.04183197021484375, 0.051998138427734375, 0.062164306640625, 0.07233047485351562, 0.08249664306640625, 0.09266281127929688, 0.1028289794921875, 0.11299514770507812, 0.12316131591796875, 0.13332748413085938, 0.14349365234375, 0.15365982055664062, 0.16382598876953125, 0.17399215698242188, 0.1841583251953125, 0.19432449340820312, 0.20449066162109375, 0.21465682983398438, 0.224822998046875, 0.23498916625976562, 0.24515533447265625, 0.2553215026855469, 0.2654876708984375, 0.2756538391113281, 0.28582000732421875, 0.2959861755371094, 0.30615234375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 9.0, 10.0, 6.0, 4.0, 27.0, 21.0, 21.0, 22.0, 32.0, 40.0, 40.0, 51.0, 54.0, 64.0, 65.0, 55.0, 51.0, 53.0, 50.0, 61.0, 34.0, 46.0, 37.0, 36.0, 23.0, 19.0, 19.0, 13.0, 9.0, 10.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6378824710845947, -2.55696964263916, -2.4760570526123047, -2.39514422416687, -2.3142313957214355, -2.233318567276001, -2.1524057388305664, -2.071493148803711, -1.9905803203582764, -1.9096674919128418, -1.8287547826766968, -1.7478420734405518, -1.6669292449951172, -1.5860164165496826, -1.5051037073135376, -1.4241909980773926, -1.343278169631958, -1.2623653411865234, -1.1814526319503784, -1.1005399227142334, -1.0196270942687988, -0.938714325428009, -0.8578015565872192, -0.7768887877464294, -0.6959760189056396, -0.6150632500648499, -0.5341504812240601, -0.45323771238327026, -0.37232494354248047, -0.2914121747016907, -0.21049940586090088, -0.12958663702011108, -0.04867410659790039, 0.032238662242889404, 0.1131514310836792, 0.194064199924469, 0.2749769687652588, 0.3558897376060486, 0.4368025064468384, 0.5177152752876282, 0.598628044128418, 0.6795408129692078, 0.7604535818099976, 0.8413663506507874, 0.9222791194915771, 1.0031919479370117, 1.0841046571731567, 1.1650173664093018, 1.2459301948547363, 1.326843023300171, 1.407755732536316, 1.488668441772461, 1.5695812702178955, 1.65049409866333, 1.731406807899475, 1.8123195171356201, 1.8932323455810547, 1.9741451740264893, 2.055058002471924, 2.1359705924987793, 2.216883420944214, 2.2977962493896484, 2.378708839416504, 2.4596216678619385, 2.540534496307373]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 3.0, 9.0, 12.0, 15.0, 6.0, 17.0, 16.0, 8.0, 24.0, 22.0, 28.0, 30.0, 26.0, 32.0, 40.0, 32.0, 43.0, 37.0, 35.0, 43.0, 46.0, 31.0, 46.0, 38.0, 22.0, 40.0, 34.0, 42.0, 29.0, 30.0, 29.0, 23.0, 25.0, 15.0, 12.0, 9.0, 7.0, 8.0, 7.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7800862789154053, -1.7279075384140015, -1.6757287979125977, -1.6235501766204834, -1.5713714361190796, -1.5191926956176758, -1.4670140743255615, -1.4148353338241577, -1.362656593322754, -1.31047785282135, -1.2582991123199463, -1.206120491027832, -1.1539417505264282, -1.1017630100250244, -1.0495843887329102, -0.9974056482315063, -0.9452269077301025, -0.8930481672286987, -0.8408694863319397, -0.7886908054351807, -0.7365120649337769, -0.684333324432373, -0.632154643535614, -0.579975962638855, -0.5277972221374512, -0.47561851143836975, -0.42343980073928833, -0.3712610900402069, -0.3190823793411255, -0.26690366864204407, -0.21472495794296265, -0.16254624724388123, -0.11036765575408936, -0.058188945055007935, -0.006010234355926514, 0.04616847634315491, 0.09834718704223633, 0.15052589774131775, 0.20270460844039917, 0.2548833191394806, 0.307062029838562, 0.35924074053764343, 0.41141945123672485, 0.4635981619358063, 0.5157768726348877, 0.5679556131362915, 0.6201342940330505, 0.6723129749298096, 0.7244917154312134, 0.7766704559326172, 0.8288491368293762, 0.8810278177261353, 0.9332065582275391, 0.9853852987289429, 1.0375640392303467, 1.089742660522461, 1.1419214010238647, 1.1941001415252686, 1.2462787628173828, 1.2984575033187866, 1.3506362438201904, 1.4028149843215942, 1.454993724822998, 1.5071723461151123, 1.5593510866165161]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 5.0, 9.0, 18.0, 27.0, 35.0, 54.0, 83.0, 121.0, 187.0, 340.0, 522.0, 886.0, 1481.0, 2412.0, 4237.0, 7285.0, 12654.0, 21566.0, 36922.0, 62354.0, 104771.0, 166104.0, 252475.0, 357782.0, 462754.0, 534085.0, 543572.0, 487063.0, 385959.0, 277514.0, 184558.0, 116806.0, 70856.0, 41709.0, 24144.0, 13981.0, 7839.0, 4576.0, 2691.0, 1488.0, 938.0, 586.0, 295.0, 212.0, 128.0, 87.0, 43.0, 35.0, 13.0, 10.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8046875, -1.7467193603515625, -1.688751220703125, -1.6307830810546875, -1.57281494140625, -1.5148468017578125, -1.456878662109375, -1.3989105224609375, -1.3409423828125, -1.2829742431640625, -1.225006103515625, -1.1670379638671875, -1.10906982421875, -1.0511016845703125, -0.993133544921875, -0.9351654052734375, -0.877197265625, -0.8192291259765625, -0.761260986328125, -0.7032928466796875, -0.64532470703125, -0.5873565673828125, -0.529388427734375, -0.4714202880859375, -0.4134521484375, -0.3554840087890625, -0.297515869140625, -0.2395477294921875, -0.18157958984375, -0.1236114501953125, -0.065643310546875, -0.0076751708984375, 0.05029296875, 0.1082611083984375, 0.166229248046875, 0.2241973876953125, 0.28216552734375, 0.3401336669921875, 0.398101806640625, 0.4560699462890625, 0.5140380859375, 0.5720062255859375, 0.629974365234375, 0.6879425048828125, 0.74591064453125, 0.8038787841796875, 0.861846923828125, 0.9198150634765625, 0.977783203125, 1.0357513427734375, 1.093719482421875, 1.1516876220703125, 1.20965576171875, 1.2676239013671875, 1.325592041015625, 1.3835601806640625, 1.4415283203125, 1.4994964599609375, 1.557464599609375, 1.6154327392578125, 1.67340087890625, 1.7313690185546875, 1.789337158203125, 1.8473052978515625, 1.9052734375]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 3.0, 3.0, 5.0, 10.0, 11.0, 12.0, 12.0, 9.0, 17.0, 14.0, 12.0, 16.0, 20.0, 26.0, 27.0, 40.0, 33.0, 30.0, 39.0, 42.0, 31.0, 44.0, 48.0, 40.0, 35.0, 36.0, 47.0, 34.0, 32.0, 30.0, 34.0, 35.0, 29.0, 21.0, 26.0, 18.0, 10.0, 13.0, 10.0, 8.0, 5.0, 2.0, 4.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0], "bins": [-1.611328125, -1.5662841796875, -1.521240234375, -1.4761962890625, -1.43115234375, -1.3861083984375, -1.341064453125, -1.2960205078125, -1.2509765625, -1.2059326171875, -1.160888671875, -1.1158447265625, -1.07080078125, -1.0257568359375, -0.980712890625, -0.9356689453125, -0.890625, -0.8455810546875, -0.800537109375, -0.7554931640625, -0.71044921875, -0.6654052734375, -0.620361328125, -0.5753173828125, -0.5302734375, -0.4852294921875, -0.440185546875, -0.3951416015625, -0.35009765625, -0.3050537109375, -0.260009765625, -0.2149658203125, -0.169921875, -0.1248779296875, -0.079833984375, -0.0347900390625, 0.01025390625, 0.0552978515625, 0.100341796875, 0.1453857421875, 0.1904296875, 0.2354736328125, 0.280517578125, 0.3255615234375, 0.37060546875, 0.4156494140625, 0.460693359375, 0.5057373046875, 0.55078125, 0.5958251953125, 0.640869140625, 0.6859130859375, 0.73095703125, 0.7760009765625, 0.821044921875, 0.8660888671875, 0.9111328125, 0.9561767578125, 1.001220703125, 1.0462646484375, 1.09130859375, 1.1363525390625, 1.181396484375, 1.2264404296875, 1.271484375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 4.0, 6.0, 8.0, 13.0, 15.0, 37.0, 48.0, 85.0, 127.0, 245.0, 460.0, 784.0, 1379.0, 2343.0, 4176.0, 7597.0, 13104.0, 22841.0, 39031.0, 65387.0, 106857.0, 166479.0, 247792.0, 340674.0, 431886.0, 497237.0, 511027.0, 474096.0, 395133.0, 300736.0, 211483.0, 138844.0, 87820.0, 53205.0, 31266.0, 18204.0, 10393.0, 5901.0, 3267.0, 1893.0, 1020.0, 568.0, 372.0, 186.0, 103.0, 66.0, 39.0, 19.0, 10.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.890533447265625, -1.82598876953125, -1.761444091796875, -1.6968994140625, -1.632354736328125, -1.56781005859375, -1.503265380859375, -1.438720703125, -1.374176025390625, -1.30963134765625, -1.245086669921875, -1.1805419921875, -1.115997314453125, -1.05145263671875, -0.986907958984375, -0.92236328125, -0.857818603515625, -0.79327392578125, -0.728729248046875, -0.6641845703125, -0.599639892578125, -0.53509521484375, -0.470550537109375, -0.406005859375, -0.341461181640625, -0.27691650390625, -0.212371826171875, -0.1478271484375, -0.083282470703125, -0.01873779296875, 0.045806884765625, 0.1103515625, 0.174896240234375, 0.23944091796875, 0.303985595703125, 0.3685302734375, 0.433074951171875, 0.49761962890625, 0.562164306640625, 0.626708984375, 0.691253662109375, 0.75579833984375, 0.820343017578125, 0.8848876953125, 0.949432373046875, 1.01397705078125, 1.078521728515625, 1.14306640625, 1.207611083984375, 1.27215576171875, 1.336700439453125, 1.4012451171875, 1.465789794921875, 1.53033447265625, 1.594879150390625, 1.659423828125, 1.723968505859375, 1.78851318359375, 1.853057861328125, 1.9176025390625, 1.982147216796875, 2.04669189453125, 2.111236572265625, 2.17578125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 3.0, 5.0, 9.0, 10.0, 9.0, 12.0, 24.0, 16.0, 20.0, 33.0, 40.0, 54.0, 63.0, 68.0, 90.0, 95.0, 98.0, 117.0, 140.0, 147.0, 162.0, 183.0, 193.0, 188.0, 219.0, 235.0, 223.0, 207.0, 172.0, 175.0, 147.0, 146.0, 110.0, 122.0, 111.0, 78.0, 80.0, 60.0, 51.0, 39.0, 21.0, 25.0, 28.0, 10.0, 12.0, 10.0, 8.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.83203125, -0.8075332641601562, -0.7830352783203125, -0.7585372924804688, -0.734039306640625, -0.7095413208007812, -0.6850433349609375, -0.6605453491210938, -0.63604736328125, -0.6115493774414062, -0.5870513916015625, -0.5625534057617188, -0.538055419921875, -0.5135574340820312, -0.4890594482421875, -0.46456146240234375, -0.4400634765625, -0.41556549072265625, -0.3910675048828125, -0.36656951904296875, -0.342071533203125, -0.31757354736328125, -0.2930755615234375, -0.26857757568359375, -0.24407958984375, -0.21958160400390625, -0.1950836181640625, -0.17058563232421875, -0.146087646484375, -0.12158966064453125, -0.0970916748046875, -0.07259368896484375, -0.048095703125, -0.02359771728515625, 0.0009002685546875, 0.02539825439453125, 0.049896240234375, 0.07439422607421875, 0.0988922119140625, 0.12339019775390625, 0.14788818359375, 0.17238616943359375, 0.1968841552734375, 0.22138214111328125, 0.245880126953125, 0.27037811279296875, 0.2948760986328125, 0.31937408447265625, 0.3438720703125, 0.36837005615234375, 0.3928680419921875, 0.41736602783203125, 0.441864013671875, 0.46636199951171875, 0.4908599853515625, 0.5153579711914062, 0.53985595703125, 0.5643539428710938, 0.5888519287109375, 0.6133499145507812, 0.637847900390625, 0.6623458862304688, 0.6868438720703125, 0.7113418579101562, 0.73583984375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 7.0, 7.0, 4.0, 13.0, 13.0, 21.0, 14.0, 28.0, 33.0, 40.0, 54.0, 44.0, 39.0, 58.0, 60.0, 70.0, 74.0, 50.0, 57.0, 55.0, 43.0, 45.0, 42.0, 34.0, 22.0, 22.0, 12.0, 17.0, 6.0, 8.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2938148975372314, -3.1929543018341064, -3.0920934677124023, -2.9912328720092773, -2.8903722763061523, -2.7895114421844482, -2.6886508464813232, -2.587790012359619, -2.486929416656494, -2.386068820953369, -2.285207986831665, -2.18434739112854, -2.083486557006836, -1.982625961303711, -1.881765365600586, -1.7809046506881714, -1.6800439357757568, -1.5791832208633423, -1.4783225059509277, -1.3774619102478027, -1.2766011953353882, -1.1757404804229736, -1.0748798847198486, -0.9740191698074341, -0.8731584548950195, -0.772297739982605, -0.6714370846748352, -0.5705764293670654, -0.4697157144546509, -0.36885499954223633, -0.26799434423446655, -0.16713368892669678, -0.06627321243286133, 0.034587472677230835, 0.135448157787323, 0.23630884289741516, 0.3371695280075073, 0.4380302429199219, 0.5388908982276917, 0.6397515535354614, 0.740612268447876, 0.8414729833602905, 0.9423336386680603, 1.04319429397583, 1.1440550088882446, 1.2449157238006592, 1.3457763195037842, 1.4466370344161987, 1.5474977493286133, 1.6483584642410278, 1.7492191791534424, 1.8500797748565674, 1.950940489768982, 2.0518012046813965, 2.1526618003845215, 2.2535223960876465, 2.3543832302093506, 2.4552438259124756, 2.5561046600341797, 2.6569652557373047, 2.7578258514404297, 2.858686685562134, 2.959547281265259, 3.060408115386963, 3.161268711090088]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 12.0, 4.0, 6.0, 9.0, 13.0, 13.0, 23.0, 17.0, 14.0, 13.0, 28.0, 24.0, 20.0, 27.0, 28.0, 34.0, 43.0, 36.0, 44.0, 32.0, 45.0, 36.0, 46.0, 39.0, 36.0, 37.0, 32.0, 23.0, 38.0, 35.0, 33.0, 29.0, 21.0, 22.0, 11.0, 15.0, 17.0, 8.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.8168824911117554, -1.7598389387130737, -1.7027955055236816, -1.645751953125, -1.5887084007263184, -1.5316649675369263, -1.4746214151382446, -1.4175779819488525, -1.360534429550171, -1.3034908771514893, -1.2464474439620972, -1.1894038915634155, -1.1323603391647339, -1.0753169059753418, -1.0182733535766602, -0.9612298607826233, -0.9041863083839417, -0.8471428155899048, -0.7900992631912231, -0.7330557703971863, -0.6760122776031494, -0.6189687252044678, -0.5619252324104309, -0.504881739616394, -0.4478382170200348, -0.39079469442367554, -0.33375120162963867, -0.2767076790332794, -0.21966417133808136, -0.1626206636428833, -0.10557714104652405, -0.04853364825248718, 0.00850987434387207, 0.06555338203907013, 0.12259689718484879, 0.17964041233062744, 0.2366839200258255, 0.29372742772102356, 0.3507709503173828, 0.4078144431114197, 0.46485796570777893, 0.5219014883041382, 0.578944981098175, 0.6359884738922119, 0.6930320262908936, 0.7500755190849304, 0.8071190118789673, 0.8641625642776489, 0.9212060570716858, 0.9782495498657227, 1.0352931022644043, 1.092336654663086, 1.149380087852478, 1.2064236402511597, 1.2634670734405518, 1.3205106258392334, 1.377554178237915, 1.4345977306365967, 1.4916411638259888, 1.5486847162246704, 1.605728268623352, 1.6627717018127441, 1.7198152542114258, 1.7768588066101074, 1.8339022397994995]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 12.0, 23.0, 24.0, 46.0, 58.0, 106.0, 145.0, 224.0, 279.0, 439.0, 660.0, 1019.0, 1419.0, 2146.0, 3322.0, 4931.0, 7488.0, 11555.0, 17962.0, 28246.0, 42907.0, 65004.0, 94734.0, 128331.0, 149902.0, 141480.0, 112387.0, 80042.0, 53264.0, 34856.0, 22861.0, 14528.0, 9563.0, 6222.0, 4150.0, 2714.0, 1820.0, 1166.0, 818.0, 557.0, 362.0, 244.0, 181.0, 119.0, 71.0, 55.0, 47.0, 21.0, 14.0, 8.0, 7.0, 3.0, 1.0, 5.0], "bins": [-0.473388671875, -0.45977020263671875, -0.4461517333984375, -0.43253326416015625, -0.418914794921875, -0.40529632568359375, -0.3916778564453125, -0.37805938720703125, -0.36444091796875, -0.35082244873046875, -0.3372039794921875, -0.32358551025390625, -0.309967041015625, -0.29634857177734375, -0.2827301025390625, -0.26911163330078125, -0.2554931640625, -0.24187469482421875, -0.2282562255859375, -0.21463775634765625, -0.201019287109375, -0.18740081787109375, -0.1737823486328125, -0.16016387939453125, -0.14654541015625, -0.13292694091796875, -0.1193084716796875, -0.10569000244140625, -0.092071533203125, -0.07845306396484375, -0.0648345947265625, -0.05121612548828125, -0.03759765625, -0.02397918701171875, -0.0103607177734375, 0.00325775146484375, 0.016876220703125, 0.03049468994140625, 0.0441131591796875, 0.05773162841796875, 0.07135009765625, 0.08496856689453125, 0.0985870361328125, 0.11220550537109375, 0.125823974609375, 0.13944244384765625, 0.1530609130859375, 0.16667938232421875, 0.1802978515625, 0.19391632080078125, 0.2075347900390625, 0.22115325927734375, 0.234771728515625, 0.24839019775390625, 0.2620086669921875, 0.27562713623046875, 0.28924560546875, 0.30286407470703125, 0.3164825439453125, 0.33010101318359375, 0.343719482421875, 0.35733795166015625, 0.3709564208984375, 0.38457489013671875, 0.398193359375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 14.0, 13.0, 19.0, 17.0, 22.0, 18.0, 16.0, 21.0, 19.0, 27.0, 19.0, 29.0, 33.0, 41.0, 32.0, 43.0, 44.0, 52.0, 45.0, 28.0, 50.0, 42.0, 41.0, 26.0, 40.0, 28.0, 34.0, 30.0, 26.0, 19.0, 12.0, 10.0, 18.0, 14.0, 2.0, 7.0, 4.0, 5.0, 8.0, 6.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9150390625, -1.8527374267578125, -1.790435791015625, -1.7281341552734375, -1.66583251953125, -1.6035308837890625, -1.541229248046875, -1.4789276123046875, -1.4166259765625, -1.3543243408203125, -1.292022705078125, -1.2297210693359375, -1.16741943359375, -1.1051177978515625, -1.042816162109375, -0.9805145263671875, -0.918212890625, -0.8559112548828125, -0.793609619140625, -0.7313079833984375, -0.66900634765625, -0.6067047119140625, -0.544403076171875, -0.4821014404296875, -0.4197998046875, -0.3574981689453125, -0.295196533203125, -0.2328948974609375, -0.17059326171875, -0.1082916259765625, -0.045989990234375, 0.0163116455078125, 0.07861328125, 0.1409149169921875, 0.203216552734375, 0.2655181884765625, 0.32781982421875, 0.3901214599609375, 0.452423095703125, 0.5147247314453125, 0.5770263671875, 0.6393280029296875, 0.701629638671875, 0.7639312744140625, 0.82623291015625, 0.8885345458984375, 0.950836181640625, 1.0131378173828125, 1.075439453125, 1.1377410888671875, 1.200042724609375, 1.2623443603515625, 1.32464599609375, 1.3869476318359375, 1.449249267578125, 1.5115509033203125, 1.5738525390625, 1.6361541748046875, 1.698455810546875, 1.7607574462890625, 1.82305908203125, 1.8853607177734375, 1.947662353515625, 2.0099639892578125, 2.072265625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 12.0, 10.0, 19.0, 26.0, 35.0, 45.0, 76.0, 117.0, 174.0, 238.0, 412.0, 608.0, 1016.0, 1660.0, 2632.0, 4724.0, 8713.0, 16049.0, 30628.0, 59733.0, 114975.0, 198380.0, 239234.0, 171293.0, 93696.0, 48393.0, 25064.0, 13174.0, 7166.0, 3990.0, 2397.0, 1403.0, 875.0, 563.0, 345.0, 227.0, 139.0, 105.0, 60.0, 52.0, 26.0, 26.0, 13.0, 9.0, 9.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0], "bins": [-0.669921875, -0.6492080688476562, -0.6284942626953125, -0.6077804565429688, -0.587066650390625, -0.5663528442382812, -0.5456390380859375, -0.5249252319335938, -0.50421142578125, -0.48349761962890625, -0.4627838134765625, -0.44207000732421875, -0.421356201171875, -0.40064239501953125, -0.3799285888671875, -0.35921478271484375, -0.3385009765625, -0.31778717041015625, -0.2970733642578125, -0.27635955810546875, -0.255645751953125, -0.23493194580078125, -0.2142181396484375, -0.19350433349609375, -0.17279052734375, -0.15207672119140625, -0.1313629150390625, -0.11064910888671875, -0.089935302734375, -0.06922149658203125, -0.0485076904296875, -0.02779388427734375, -0.007080078125, 0.01363372802734375, 0.0343475341796875, 0.05506134033203125, 0.075775146484375, 0.09648895263671875, 0.1172027587890625, 0.13791656494140625, 0.15863037109375, 0.17934417724609375, 0.2000579833984375, 0.22077178955078125, 0.241485595703125, 0.26219940185546875, 0.2829132080078125, 0.30362701416015625, 0.3243408203125, 0.34505462646484375, 0.3657684326171875, 0.38648223876953125, 0.407196044921875, 0.42790985107421875, 0.4486236572265625, 0.46933746337890625, 0.49005126953125, 0.5107650756835938, 0.5314788818359375, 0.5521926879882812, 0.572906494140625, 0.5936203002929688, 0.6143341064453125, 0.6350479125976562, 0.65576171875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 10.0, 9.0, 7.0, 11.0, 9.0, 15.0, 14.0, 27.0, 26.0, 25.0, 31.0, 31.0, 43.0, 32.0, 32.0, 38.0, 51.0, 60.0, 45.0, 40.0, 37.0, 34.0, 56.0, 36.0, 31.0, 28.0, 50.0, 21.0, 33.0, 23.0, 14.0, 12.0, 13.0, 18.0, 12.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943359375, -1.1537017822265625, -1.113067626953125, -1.0724334716796875, -1.03179931640625, -0.9911651611328125, -0.950531005859375, -0.9098968505859375, -0.8692626953125, -0.8286285400390625, -0.787994384765625, -0.7473602294921875, -0.70672607421875, -0.6660919189453125, -0.625457763671875, -0.5848236083984375, -0.544189453125, -0.5035552978515625, -0.462921142578125, -0.4222869873046875, -0.38165283203125, -0.3410186767578125, -0.300384521484375, -0.2597503662109375, -0.2191162109375, -0.1784820556640625, -0.137847900390625, -0.0972137451171875, -0.05657958984375, -0.0159454345703125, 0.024688720703125, 0.0653228759765625, 0.10595703125, 0.1465911865234375, 0.187225341796875, 0.2278594970703125, 0.26849365234375, 0.3091278076171875, 0.349761962890625, 0.3903961181640625, 0.4310302734375, 0.4716644287109375, 0.512298583984375, 0.5529327392578125, 0.59356689453125, 0.6342010498046875, 0.674835205078125, 0.7154693603515625, 0.756103515625, 0.7967376708984375, 0.837371826171875, 0.8780059814453125, 0.91864013671875, 0.9592742919921875, 0.999908447265625, 1.0405426025390625, 1.0811767578125, 1.1218109130859375, 1.162445068359375, 1.2030792236328125, 1.24371337890625, 1.2843475341796875, 1.324981689453125, 1.3656158447265625, 1.40625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 14.0, 7.0, 28.0, 31.0, 29.0, 44.0, 53.0, 65.0, 86.0, 141.0, 183.0, 244.0, 351.0, 505.0, 727.0, 1222.0, 1885.0, 3160.0, 5712.0, 11583.0, 27475.0, 88541.0, 393989.0, 375300.0, 84834.0, 26569.0, 11473.0, 5771.0, 3045.0, 1827.0, 1134.0, 736.0, 498.0, 344.0, 238.0, 162.0, 130.0, 118.0, 88.0, 63.0, 39.0, 30.0, 18.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4084968566894531, -0.39389801025390625, -0.3792991638183594, -0.3647003173828125, -0.3501014709472656, -0.33550262451171875, -0.3209037780761719, -0.306304931640625, -0.2917060852050781, -0.27710723876953125, -0.2625083923339844, -0.2479095458984375, -0.23331069946289062, -0.21871185302734375, -0.20411300659179688, -0.18951416015625, -0.17491531372070312, -0.16031646728515625, -0.14571762084960938, -0.1311187744140625, -0.11651992797851562, -0.10192108154296875, -0.08732223510742188, -0.072723388671875, -0.058124542236328125, -0.04352569580078125, -0.028926849365234375, -0.0143280029296875, 0.000270843505859375, 0.01486968994140625, 0.029468536376953125, 0.0440673828125, 0.058666229248046875, 0.07326507568359375, 0.08786392211914062, 0.1024627685546875, 0.11706161499023438, 0.13166046142578125, 0.14625930786132812, 0.160858154296875, 0.17545700073242188, 0.19005584716796875, 0.20465469360351562, 0.2192535400390625, 0.23385238647460938, 0.24845123291015625, 0.2630500793457031, 0.27764892578125, 0.2922477722167969, 0.30684661865234375, 0.3214454650878906, 0.3360443115234375, 0.3506431579589844, 0.36524200439453125, 0.3798408508300781, 0.394439697265625, 0.4090385437011719, 0.42363739013671875, 0.4382362365722656, 0.4528350830078125, 0.4674339294433594, 0.48203277587890625, 0.4966316223144531, 0.51123046875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 6.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 5.0, 4.0, 5.0, 7.0, 9.0, 12.0, 16.0, 12.0, 27.0, 15.0, 44.0, 45.0, 35.0, 40.0, 53.0, 57.0, 57.0, 62.0, 59.0, 51.0, 50.0, 36.0, 44.0, 36.0, 37.0, 22.0, 25.0, 23.0, 13.0, 20.0, 9.0, 7.0, 5.0, 9.0, 16.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3768672943115234e-05, -1.328345388174057e-05, -1.2798234820365906e-05, -1.2313015758991241e-05, -1.1827796697616577e-05, -1.1342577636241913e-05, -1.0857358574867249e-05, -1.0372139513492584e-05, -9.88692045211792e-06, -9.401701390743256e-06, -8.916482329368591e-06, -8.431263267993927e-06, -7.946044206619263e-06, -7.460825145244598e-06, -6.975606083869934e-06, -6.49038702249527e-06, -6.0051679611206055e-06, -5.519948899745941e-06, -5.034729838371277e-06, -4.5495107769966125e-06, -4.064291715621948e-06, -3.579072654247284e-06, -3.0938535928726196e-06, -2.6086345314979553e-06, -2.123415470123291e-06, -1.6381964087486267e-06, -1.1529773473739624e-06, -6.677582859992981e-07, -1.825392246246338e-07, 3.026798367500305e-07, 7.878988981246948e-07, 1.2731179594993591e-06, 1.7583370208740234e-06, 2.2435560822486877e-06, 2.728775143623352e-06, 3.2139942049980164e-06, 3.6992132663726807e-06, 4.184432327747345e-06, 4.669651389122009e-06, 5.154870450496674e-06, 5.640089511871338e-06, 6.125308573246002e-06, 6.6105276346206665e-06, 7.095746695995331e-06, 7.580965757369995e-06, 8.06618481874466e-06, 8.551403880119324e-06, 9.036622941493988e-06, 9.521842002868652e-06, 1.0007061064243317e-05, 1.0492280125617981e-05, 1.0977499186992645e-05, 1.146271824836731e-05, 1.1947937309741974e-05, 1.2433156371116638e-05, 1.2918375432491302e-05, 1.3403594493865967e-05, 1.3888813555240631e-05, 1.4374032616615295e-05, 1.485925167798996e-05, 1.5344470739364624e-05, 1.582968980073929e-05, 1.6314908862113953e-05, 1.6800127923488617e-05, 1.728534698486328e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 13.0, 19.0, 18.0, 40.0, 34.0, 47.0, 96.0, 113.0, 158.0, 223.0, 314.0, 446.0, 686.0, 974.0, 1476.0, 2254.0, 3524.0, 5962.0, 10912.0, 23249.0, 58464.0, 172586.0, 384852.0, 238732.0, 80543.0, 30208.0, 13690.0, 7018.0, 4096.0, 2522.0, 1621.0, 1121.0, 772.0, 552.0, 369.0, 269.0, 181.0, 131.0, 95.0, 59.0, 37.0, 24.0, 15.0, 19.0, 7.0, 3.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5106124877929688, -0.4933929443359375, -0.47617340087890625, -0.458953857421875, -0.44173431396484375, -0.4245147705078125, -0.40729522705078125, -0.39007568359375, -0.37285614013671875, -0.3556365966796875, -0.33841705322265625, -0.321197509765625, -0.30397796630859375, -0.2867584228515625, -0.26953887939453125, -0.2523193359375, -0.23509979248046875, -0.2178802490234375, -0.20066070556640625, -0.183441162109375, -0.16622161865234375, -0.1490020751953125, -0.13178253173828125, -0.11456298828125, -0.09734344482421875, -0.0801239013671875, -0.06290435791015625, -0.045684814453125, -0.02846527099609375, -0.0112457275390625, 0.00597381591796875, 0.023193359375, 0.04041290283203125, 0.0576324462890625, 0.07485198974609375, 0.092071533203125, 0.10929107666015625, 0.1265106201171875, 0.14373016357421875, 0.16094970703125, 0.17816925048828125, 0.1953887939453125, 0.21260833740234375, 0.229827880859375, 0.24704742431640625, 0.2642669677734375, 0.28148651123046875, 0.2987060546875, 0.31592559814453125, 0.3331451416015625, 0.35036468505859375, 0.367584228515625, 0.38480377197265625, 0.4020233154296875, 0.41924285888671875, 0.43646240234375, 0.45368194580078125, 0.4709014892578125, 0.48812103271484375, 0.505340576171875, 0.5225601196289062, 0.5397796630859375, 0.5569992065429688, 0.57421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 10.0, 16.0, 11.0, 19.0, 23.0, 31.0, 40.0, 44.0, 71.0, 73.0, 73.0, 90.0, 70.0, 86.0, 59.0, 45.0, 40.0, 23.0, 27.0, 18.0, 22.0, 8.0, 9.0, 9.0, 14.0, 3.0, 3.0, 4.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.11407470703125, -0.11100006103515625, -0.1079254150390625, -0.10485076904296875, -0.101776123046875, -0.09870147705078125, -0.0956268310546875, -0.09255218505859375, -0.0894775390625, -0.08640289306640625, -0.0833282470703125, -0.08025360107421875, -0.077178955078125, -0.07410430908203125, -0.0710296630859375, -0.06795501708984375, -0.06488037109375, -0.06180572509765625, -0.0587310791015625, -0.05565643310546875, -0.052581787109375, -0.04950714111328125, -0.0464324951171875, -0.04335784912109375, -0.040283203125, -0.03720855712890625, -0.0341339111328125, -0.03105926513671875, -0.027984619140625, -0.02490997314453125, -0.0218353271484375, -0.01876068115234375, -0.01568603515625, -0.01261138916015625, -0.0095367431640625, -0.00646209716796875, -0.003387451171875, -0.00031280517578125, 0.0027618408203125, 0.00583648681640625, 0.0089111328125, 0.01198577880859375, 0.0150604248046875, 0.01813507080078125, 0.021209716796875, 0.02428436279296875, 0.0273590087890625, 0.03043365478515625, 0.03350830078125, 0.03658294677734375, 0.0396575927734375, 0.04273223876953125, 0.045806884765625, 0.04888153076171875, 0.0519561767578125, 0.05503082275390625, 0.05810546875, 0.06118011474609375, 0.0642547607421875, 0.06732940673828125, 0.070404052734375, 0.07347869873046875, 0.0765533447265625, 0.07962799072265625, 0.08270263671875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 6.0, 5.0, 6.0, 8.0, 10.0, 16.0, 17.0, 15.0, 29.0, 36.0, 37.0, 45.0, 46.0, 47.0, 52.0, 63.0, 68.0, 78.0, 50.0, 57.0, 51.0, 43.0, 48.0, 36.0, 35.0, 28.0, 20.0, 18.0, 10.0, 10.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2994351387023926, -3.1985461711883545, -3.0976574420928955, -2.9967684745788574, -2.8958797454833984, -2.7949907779693604, -2.6941020488739014, -2.5932130813598633, -2.4923243522644043, -2.391435384750366, -2.2905466556549072, -2.189657688140869, -2.08876895904541, -1.987879991531372, -1.886991262435913, -1.786102294921875, -1.6852134466171265, -1.584324598312378, -1.4834357500076294, -1.3825469017028809, -1.2816580533981323, -1.1807692050933838, -1.0798802375793457, -0.9789914488792419, -0.8781026005744934, -0.7772137522697449, -0.6763249039649963, -0.575435996055603, -0.4745471775531769, -0.37365829944610596, -0.2727694511413574, -0.1718806028366089, -0.07099175453186035, 0.02989710122346878, 0.1307859569787979, 0.23167482018470764, 0.3325636684894562, 0.4334525465965271, 0.5343413949012756, 0.6352302432060242, 0.7361190915107727, 0.8370079398155212, 0.9378967881202698, 1.038785696029663, 1.1396745443344116, 1.2405633926391602, 1.3414522409439087, 1.4423410892486572, 1.5432299375534058, 1.6441187858581543, 1.7450076341629028, 1.8458964824676514, 1.9467853307724, 2.0476741790771484, 2.1485631465911865, 2.2494518756866455, 2.3503408432006836, 2.4512298107147217, 2.5521185398101807, 2.6530075073242188, 2.7538962364196777, 2.854785203933716, 2.955673933029175, 3.056562900543213, 3.157451629638672]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 4.0, 7.0, 10.0, 10.0, 18.0, 18.0, 21.0, 13.0, 16.0, 35.0, 17.0, 23.0, 29.0, 31.0, 37.0, 37.0, 41.0, 34.0, 41.0, 45.0, 40.0, 40.0, 39.0, 34.0, 42.0, 29.0, 26.0, 39.0, 36.0, 27.0, 24.0, 20.0, 17.0, 16.0, 15.0, 15.0, 6.0, 6.0, 9.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7987110614776611, -1.7415999174118042, -1.6844886541366577, -1.6273775100708008, -1.5702662467956543, -1.5131551027297974, -1.4560439586639404, -1.398932695388794, -1.3418214321136475, -1.2847102880477905, -1.227599024772644, -1.170487880706787, -1.1133766174316406, -1.0562654733657837, -0.999154269695282, -0.9420430660247803, -0.8849319219589233, -0.8278207182884216, -0.7707095146179199, -0.713598370552063, -0.6564871072769165, -0.5993759632110596, -0.5422647595405579, -0.48515355587005615, -0.42804235219955444, -0.37093114852905273, -0.313819944858551, -0.2567087709903717, -0.19959756731987, -0.1424863636493683, -0.08537518978118896, -0.028263986110687256, 0.028847098350524902, 0.08595829457044601, 0.14306949079036713, 0.20018067955970764, 0.25729188323020935, 0.31440308690071106, 0.3715142607688904, 0.4286254644393921, 0.4857366681098938, 0.5428478717803955, 0.5999590754508972, 0.6570702791213989, 0.7141814231872559, 0.7712926864624023, 0.8284038305282593, 0.885515034198761, 0.9426262378692627, 0.9997374415397644, 1.0568486452102661, 1.113959789276123, 1.1710710525512695, 1.2281821966171265, 1.2852933406829834, 1.3424046039581299, 1.3995158672332764, 1.4566270112991333, 1.5137382745742798, 1.5708494186401367, 1.6279606819152832, 1.6850718259811401, 1.742182970046997, 1.7992942333221436, 1.8564053773880005]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 12.0, 11.0, 15.0, 33.0, 44.0, 73.0, 122.0, 205.0, 321.0, 533.0, 811.0, 1353.0, 2180.0, 3316.0, 5119.0, 7668.0, 11589.0, 16934.0, 24338.0, 34025.0, 45224.0, 58397.0, 72075.0, 83815.0, 92661.0, 96235.0, 94346.0, 87113.0, 76141.0, 62501.0, 49458.0, 37534.0, 27068.0, 18914.0, 13310.0, 8831.0, 5919.0, 3782.0, 2428.0, 1487.0, 963.0, 614.0, 393.0, 233.0, 172.0, 97.0, 64.0, 32.0, 26.0, 10.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.107421875, -1.0713043212890625, -1.035186767578125, -0.9990692138671875, -0.96295166015625, -0.9268341064453125, -0.890716552734375, -0.8545989990234375, -0.8184814453125, -0.7823638916015625, -0.746246337890625, -0.7101287841796875, -0.67401123046875, -0.6378936767578125, -0.601776123046875, -0.5656585693359375, -0.529541015625, -0.4934234619140625, -0.457305908203125, -0.4211883544921875, -0.38507080078125, -0.3489532470703125, -0.312835693359375, -0.2767181396484375, -0.2406005859375, -0.2044830322265625, -0.168365478515625, -0.1322479248046875, -0.09613037109375, -0.0600128173828125, -0.023895263671875, 0.0122222900390625, 0.04833984375, 0.0844573974609375, 0.120574951171875, 0.1566925048828125, 0.19281005859375, 0.2289276123046875, 0.265045166015625, 0.3011627197265625, 0.3372802734375, 0.3733978271484375, 0.409515380859375, 0.4456329345703125, 0.48175048828125, 0.5178680419921875, 0.553985595703125, 0.5901031494140625, 0.626220703125, 0.6623382568359375, 0.698455810546875, 0.7345733642578125, 0.77069091796875, 0.8068084716796875, 0.842926025390625, 0.8790435791015625, 0.9151611328125, 0.9512786865234375, 0.987396240234375, 1.0235137939453125, 1.05963134765625, 1.0957489013671875, 1.131866455078125, 1.1679840087890625, 1.2041015625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 4.0, 7.0, 15.0, 20.0, 14.0, 21.0, 19.0, 14.0, 30.0, 24.0, 32.0, 19.0, 38.0, 39.0, 38.0, 41.0, 38.0, 45.0, 49.0, 42.0, 47.0, 36.0, 43.0, 34.0, 31.0, 40.0, 32.0, 22.0, 19.0, 23.0, 15.0, 12.0, 19.0, 17.0, 10.0, 11.0, 5.0, 5.0, 4.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8564453125, -1.7926788330078125, -1.728912353515625, -1.6651458740234375, -1.60137939453125, -1.5376129150390625, -1.473846435546875, -1.4100799560546875, -1.3463134765625, -1.2825469970703125, -1.218780517578125, -1.1550140380859375, -1.09124755859375, -1.0274810791015625, -0.963714599609375, -0.8999481201171875, -0.836181640625, -0.7724151611328125, -0.708648681640625, -0.6448822021484375, -0.58111572265625, -0.5173492431640625, -0.453582763671875, -0.3898162841796875, -0.3260498046875, -0.2622833251953125, -0.198516845703125, -0.1347503662109375, -0.07098388671875, -0.0072174072265625, 0.056549072265625, 0.1203155517578125, 0.18408203125, 0.2478485107421875, 0.311614990234375, 0.3753814697265625, 0.43914794921875, 0.5029144287109375, 0.566680908203125, 0.6304473876953125, 0.6942138671875, 0.7579803466796875, 0.821746826171875, 0.8855133056640625, 0.94927978515625, 1.0130462646484375, 1.076812744140625, 1.1405792236328125, 1.204345703125, 1.2681121826171875, 1.331878662109375, 1.3956451416015625, 1.45941162109375, 1.5231781005859375, 1.586944580078125, 1.6507110595703125, 1.7144775390625, 1.7782440185546875, 1.842010498046875, 1.9057769775390625, 1.96954345703125, 2.0333099365234375, 2.097076416015625, 2.1608428955078125, 2.224609375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 15.0, 21.0, 33.0, 60.0, 73.0, 135.0, 171.0, 295.0, 467.0, 771.0, 1237.0, 1877.0, 2916.0, 4384.0, 6577.0, 10310.0, 14945.0, 21212.0, 30042.0, 40877.0, 53925.0, 67250.0, 80181.0, 90402.0, 95305.0, 95868.0, 90125.0, 79853.0, 67319.0, 53853.0, 41463.0, 30134.0, 21714.0, 15144.0, 10312.0, 6724.0, 4518.0, 2883.0, 1893.0, 1218.0, 728.0, 460.0, 314.0, 203.0, 144.0, 80.0, 35.0, 37.0, 29.0, 10.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0953369140625, -1.058837890625, -1.0223388671875, -0.98583984375, -0.9493408203125, -0.912841796875, -0.8763427734375, -0.83984375, -0.8033447265625, -0.766845703125, -0.7303466796875, -0.69384765625, -0.6573486328125, -0.620849609375, -0.5843505859375, -0.5478515625, -0.5113525390625, -0.474853515625, -0.4383544921875, -0.40185546875, -0.3653564453125, -0.328857421875, -0.2923583984375, -0.255859375, -0.2193603515625, -0.182861328125, -0.1463623046875, -0.10986328125, -0.0733642578125, -0.036865234375, -0.0003662109375, 0.0361328125, 0.0726318359375, 0.109130859375, 0.1456298828125, 0.18212890625, 0.2186279296875, 0.255126953125, 0.2916259765625, 0.328125, 0.3646240234375, 0.401123046875, 0.4376220703125, 0.47412109375, 0.5106201171875, 0.547119140625, 0.5836181640625, 0.6201171875, 0.6566162109375, 0.693115234375, 0.7296142578125, 0.76611328125, 0.8026123046875, 0.839111328125, 0.8756103515625, 0.912109375, 0.9486083984375, 0.985107421875, 1.0216064453125, 1.05810546875, 1.0946044921875, 1.131103515625, 1.1676025390625, 1.2041015625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 14.0, 14.0, 17.0, 17.0, 20.0, 23.0, 16.0, 32.0, 27.0, 33.0, 44.0, 26.0, 59.0, 38.0, 42.0, 43.0, 43.0, 44.0, 42.0, 38.0, 44.0, 40.0, 40.0, 26.0, 27.0, 21.0, 34.0, 18.0, 16.0, 16.0, 15.0, 9.0, 9.0, 5.0, 2.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3603515625, -1.3197479248046875, -1.279144287109375, -1.2385406494140625, -1.19793701171875, -1.1573333740234375, -1.116729736328125, -1.0761260986328125, -1.0355224609375, -0.9949188232421875, -0.954315185546875, -0.9137115478515625, -0.87310791015625, -0.8325042724609375, -0.791900634765625, -0.7512969970703125, -0.710693359375, -0.6700897216796875, -0.629486083984375, -0.5888824462890625, -0.54827880859375, -0.5076751708984375, -0.467071533203125, -0.4264678955078125, -0.3858642578125, -0.3452606201171875, -0.304656982421875, -0.2640533447265625, -0.22344970703125, -0.1828460693359375, -0.142242431640625, -0.1016387939453125, -0.06103515625, -0.0204315185546875, 0.020172119140625, 0.0607757568359375, 0.10137939453125, 0.1419830322265625, 0.182586669921875, 0.2231903076171875, 0.2637939453125, 0.3043975830078125, 0.345001220703125, 0.3856048583984375, 0.42620849609375, 0.4668121337890625, 0.507415771484375, 0.5480194091796875, 0.588623046875, 0.6292266845703125, 0.669830322265625, 0.7104339599609375, 0.75103759765625, 0.7916412353515625, 0.832244873046875, 0.8728485107421875, 0.9134521484375, 0.9540557861328125, 0.994659423828125, 1.0352630615234375, 1.07586669921875, 1.1164703369140625, 1.157073974609375, 1.1976776123046875, 1.23828125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 14.0, 19.0, 32.0, 61.0, 77.0, 131.0, 188.0, 313.0, 555.0, 697.0, 1216.0, 1949.0, 2962.0, 4571.0, 7234.0, 11177.0, 17053.0, 25180.0, 37040.0, 51644.0, 68870.0, 85769.0, 101227.0, 109306.0, 109602.0, 100557.0, 85509.0, 67554.0, 50302.0, 35657.0, 24786.0, 16555.0, 11197.0, 7003.0, 4657.0, 2830.0, 1828.0, 1165.0, 746.0, 481.0, 308.0, 197.0, 124.0, 76.0, 59.0, 28.0, 19.0, 10.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5908203125, -0.57110595703125, -0.5513916015625, -0.53167724609375, -0.511962890625, -0.49224853515625, -0.4725341796875, -0.45281982421875, -0.43310546875, -0.41339111328125, -0.3936767578125, -0.37396240234375, -0.354248046875, -0.33453369140625, -0.3148193359375, -0.29510498046875, -0.275390625, -0.25567626953125, -0.2359619140625, -0.21624755859375, -0.196533203125, -0.17681884765625, -0.1571044921875, -0.13739013671875, -0.11767578125, -0.09796142578125, -0.0782470703125, -0.05853271484375, -0.038818359375, -0.01910400390625, 0.0006103515625, 0.02032470703125, 0.0400390625, 0.05975341796875, 0.0794677734375, 0.09918212890625, 0.118896484375, 0.13861083984375, 0.1583251953125, 0.17803955078125, 0.19775390625, 0.21746826171875, 0.2371826171875, 0.25689697265625, 0.276611328125, 0.29632568359375, 0.3160400390625, 0.33575439453125, 0.35546875, 0.37518310546875, 0.3948974609375, 0.41461181640625, 0.434326171875, 0.45404052734375, 0.4737548828125, 0.49346923828125, 0.51318359375, 0.53289794921875, 0.5526123046875, 0.57232666015625, 0.592041015625, 0.61175537109375, 0.6314697265625, 0.65118408203125, 0.6708984375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 5.0, 16.0, 9.0, 19.0, 24.0, 21.0, 31.0, 32.0, 34.0, 43.0, 43.0, 37.0, 52.0, 66.0, 58.0, 51.0, 47.0, 58.0, 44.0, 42.0, 43.0, 35.0, 38.0, 24.0, 21.0, 20.0, 18.0, 11.0, 10.0, 11.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.399652481079102e-05, -9.12155956029892e-05, -8.843466639518738e-05, -8.565373718738556e-05, -8.287280797958374e-05, -8.009187877178192e-05, -7.73109495639801e-05, -7.453002035617828e-05, -7.174909114837646e-05, -6.896816194057465e-05, -6.618723273277283e-05, -6.340630352497101e-05, -6.062537431716919e-05, -5.784444510936737e-05, -5.506351590156555e-05, -5.228258669376373e-05, -4.9501657485961914e-05, -4.6720728278160095e-05, -4.3939799070358276e-05, -4.115886986255646e-05, -3.837794065475464e-05, -3.559701144695282e-05, -3.2816082239151e-05, -3.0035153031349182e-05, -2.7254223823547363e-05, -2.4473294615745544e-05, -2.1692365407943726e-05, -1.8911436200141907e-05, -1.6130506992340088e-05, -1.3349577784538269e-05, -1.056864857673645e-05, -7.787719368934631e-06, -5.0067901611328125e-06, -2.2258609533309937e-06, 5.550682544708252e-07, 3.335997462272644e-06, 6.116926670074463e-06, 8.897855877876282e-06, 1.16787850856781e-05, 1.445971429347992e-05, 1.7240643501281738e-05, 2.0021572709083557e-05, 2.2802501916885376e-05, 2.5583431124687195e-05, 2.8364360332489014e-05, 3.114528954029083e-05, 3.392621874809265e-05, 3.670714795589447e-05, 3.948807716369629e-05, 4.226900637149811e-05, 4.504993557929993e-05, 4.7830864787101746e-05, 5.0611793994903564e-05, 5.339272320270538e-05, 5.61736524105072e-05, 5.895458161830902e-05, 6.173551082611084e-05, 6.451644003391266e-05, 6.729736924171448e-05, 7.00782984495163e-05, 7.285922765731812e-05, 7.564015686511993e-05, 7.842108607292175e-05, 8.120201528072357e-05, 8.398294448852539e-05]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 5.0, 7.0, 15.0, 24.0, 34.0, 70.0, 86.0, 129.0, 211.0, 299.0, 504.0, 748.0, 1220.0, 1941.0, 3099.0, 4886.0, 7731.0, 11867.0, 18267.0, 27525.0, 40138.0, 56625.0, 75412.0, 94927.0, 109401.0, 115207.0, 111321.0, 97903.0, 79672.0, 60504.0, 43184.0, 29808.0, 19820.0, 12948.0, 8397.0, 5274.0, 3350.0, 2224.0, 1393.0, 888.0, 555.0, 367.0, 214.0, 122.0, 88.0, 45.0, 41.0, 23.0, 19.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6162109375, -0.59466552734375, -0.5731201171875, -0.55157470703125, -0.530029296875, -0.50848388671875, -0.4869384765625, -0.46539306640625, -0.44384765625, -0.42230224609375, -0.4007568359375, -0.37921142578125, -0.357666015625, -0.33612060546875, -0.3145751953125, -0.29302978515625, -0.271484375, -0.24993896484375, -0.2283935546875, -0.20684814453125, -0.185302734375, -0.16375732421875, -0.1422119140625, -0.12066650390625, -0.09912109375, -0.07757568359375, -0.0560302734375, -0.03448486328125, -0.012939453125, 0.00860595703125, 0.0301513671875, 0.05169677734375, 0.0732421875, 0.09478759765625, 0.1163330078125, 0.13787841796875, 0.159423828125, 0.18096923828125, 0.2025146484375, 0.22406005859375, 0.24560546875, 0.26715087890625, 0.2886962890625, 0.31024169921875, 0.331787109375, 0.35333251953125, 0.3748779296875, 0.39642333984375, 0.41796875, 0.43951416015625, 0.4610595703125, 0.48260498046875, 0.504150390625, 0.52569580078125, 0.5472412109375, 0.56878662109375, 0.59033203125, 0.61187744140625, 0.6334228515625, 0.65496826171875, 0.676513671875, 0.69805908203125, 0.7196044921875, 0.74114990234375, 0.7626953125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 9.0, 3.0, 7.0, 6.0, 11.0, 14.0, 11.0, 17.0, 17.0, 20.0, 29.0, 31.0, 41.0, 42.0, 31.0, 46.0, 41.0, 57.0, 38.0, 51.0, 53.0, 54.0, 38.0, 30.0, 35.0, 36.0, 32.0, 31.0, 24.0, 23.0, 19.0, 27.0, 14.0, 14.0, 11.0, 9.0, 4.0, 7.0, 5.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2149658203125, -0.20800018310546875, -0.2010345458984375, -0.19406890869140625, -0.187103271484375, -0.18013763427734375, -0.1731719970703125, -0.16620635986328125, -0.15924072265625, -0.15227508544921875, -0.1453094482421875, -0.13834381103515625, -0.131378173828125, -0.12441253662109375, -0.1174468994140625, -0.11048126220703125, -0.103515625, -0.09654998779296875, -0.0895843505859375, -0.08261871337890625, -0.075653076171875, -0.06868743896484375, -0.0617218017578125, -0.05475616455078125, -0.04779052734375, -0.04082489013671875, -0.0338592529296875, -0.02689361572265625, -0.019927978515625, -0.01296234130859375, -0.0059967041015625, 0.00096893310546875, 0.0079345703125, 0.01490020751953125, 0.0218658447265625, 0.02883148193359375, 0.035797119140625, 0.04276275634765625, 0.0497283935546875, 0.05669403076171875, 0.06365966796875, 0.07062530517578125, 0.0775909423828125, 0.08455657958984375, 0.091522216796875, 0.09848785400390625, 0.1054534912109375, 0.11241912841796875, 0.119384765625, 0.12635040283203125, 0.1333160400390625, 0.14028167724609375, 0.147247314453125, 0.15421295166015625, 0.1611785888671875, 0.16814422607421875, 0.17510986328125, 0.18207550048828125, 0.1890411376953125, 0.19600677490234375, 0.202972412109375, 0.20993804931640625, 0.2169036865234375, 0.22386932373046875, 0.2308349609375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 4.0, 7.0, 6.0, 5.0, 14.0, 16.0, 14.0, 17.0, 24.0, 28.0, 29.0, 51.0, 41.0, 52.0, 48.0, 78.0, 62.0, 54.0, 57.0, 50.0, 53.0, 43.0, 48.0, 37.0, 43.0, 25.0, 23.0, 13.0, 21.0, 13.0, 15.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.274965286254883, -3.179086208343506, -3.083207130432129, -2.987328052520752, -2.891448974609375, -2.795569896697998, -2.699690818786621, -2.603811740875244, -2.507932662963867, -2.4120535850524902, -2.3161745071411133, -2.2202954292297363, -2.1244163513183594, -2.0285372734069824, -1.932658076286316, -1.836778998374939, -1.7408998012542725, -1.6450207233428955, -1.5491416454315186, -1.4532625675201416, -1.3573834896087646, -1.2615044116973877, -1.1656252145767212, -1.0697461366653442, -0.9738670587539673, -0.8779879808425903, -0.7821089029312134, -0.6862297654151917, -0.5903506875038147, -0.49447160959243774, -0.398592472076416, -0.30271339416503906, -0.2068345546722412, -0.11095546185970306, -0.015076369047164917, 0.08080273866653442, 0.17668181657791138, 0.27256089448928833, 0.36844003200531006, 0.464319109916687, 0.560198187828064, 0.6560772657394409, 0.7519563436508179, 0.8478354811668396, 0.9437145590782166, 1.0395936965942383, 1.1354727745056152, 1.2313518524169922, 1.3272309303283691, 1.423110008239746, 1.518989086151123, 1.6148681640625, 1.710747241973877, 1.806626319885254, 1.9025055170059204, 1.9983845949172974, 2.0942635536193848, 2.1901426315307617, 2.2860217094421387, 2.3819007873535156, 2.4777798652648926, 2.5736589431762695, 2.6695380210876465, 2.7654170989990234, 2.8612964153289795]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 4.0, 5.0, 5.0, 0.0, 8.0, 11.0, 7.0, 16.0, 7.0, 14.0, 12.0, 28.0, 19.0, 25.0, 27.0, 28.0, 32.0, 26.0, 32.0, 35.0, 42.0, 38.0, 34.0, 36.0, 49.0, 29.0, 36.0, 43.0, 41.0, 34.0, 34.0, 31.0, 35.0, 31.0, 28.0, 22.0, 16.0, 15.0, 12.0, 10.0, 7.0, 11.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.041332721710205, -1.9815632104873657, -1.921793818473816, -1.8620243072509766, -1.8022549152374268, -1.7424854040145874, -1.682715892791748, -1.6229465007781982, -1.5631769895553589, -1.5034074783325195, -1.4436380863189697, -1.3838685750961304, -1.324099063873291, -1.2643296718597412, -1.2045601606369019, -1.1447906494140625, -1.0850212574005127, -1.0252517461776733, -0.9654823541641235, -0.9057128429412842, -0.8459433913230896, -0.786173939704895, -0.7264044284820557, -0.6666349768638611, -0.6068655252456665, -0.5470960736274719, -0.48732659220695496, -0.427557110786438, -0.3677876591682434, -0.30801820755004883, -0.24824872612953186, -0.1884792447090149, -0.12870991230010986, -0.06894044578075409, -0.009170979261398315, 0.05059848725795746, 0.11036795377731323, 0.1701374053955078, 0.22990688681602478, 0.28967636823654175, 0.34944581985473633, 0.4092152714729309, 0.4689847528934479, 0.5287542343139648, 0.5885236859321594, 0.648293137550354, 0.7080626487731934, 0.7678321003913879, 0.8276015520095825, 0.8873710036277771, 0.9471404552459717, 1.006909966468811, 1.0666794776916504, 1.1264488697052002, 1.1862183809280396, 1.245987892150879, 1.3057572841644287, 1.365526795387268, 1.4252961874008179, 1.4850656986236572, 1.544835090637207, 1.6046046018600464, 1.6643741130828857, 1.7241435050964355, 1.783913016319275]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 9.0, 17.0, 17.0, 25.0, 35.0, 63.0, 113.0, 176.0, 273.0, 428.0, 660.0, 1147.0, 1776.0, 2867.0, 4608.0, 7447.0, 12084.0, 19588.0, 31849.0, 50790.0, 79422.0, 121833.0, 179768.0, 252160.0, 335220.0, 414206.0, 465715.0, 478873.0, 443079.0, 374101.0, 291771.0, 212306.0, 146118.0, 97448.0, 62956.0, 40249.0, 24850.0, 15443.0, 9426.0, 5844.0, 3558.0, 2225.0, 1409.0, 835.0, 548.0, 340.0, 230.0, 139.0, 96.0, 62.0, 30.0, 24.0, 17.0, 8.0, 2.0, 2.0, 1.0], "bins": [-2.076171875, -2.015533447265625, -1.95489501953125, -1.894256591796875, -1.8336181640625, -1.772979736328125, -1.71234130859375, -1.651702880859375, -1.591064453125, -1.530426025390625, -1.46978759765625, -1.409149169921875, -1.3485107421875, -1.287872314453125, -1.22723388671875, -1.166595458984375, -1.10595703125, -1.045318603515625, -0.98468017578125, -0.924041748046875, -0.8634033203125, -0.802764892578125, -0.74212646484375, -0.681488037109375, -0.620849609375, -0.560211181640625, -0.49957275390625, -0.438934326171875, -0.3782958984375, -0.317657470703125, -0.25701904296875, -0.196380615234375, -0.1357421875, -0.075103759765625, -0.01446533203125, 0.046173095703125, 0.1068115234375, 0.167449951171875, 0.22808837890625, 0.288726806640625, 0.349365234375, 0.410003662109375, 0.47064208984375, 0.531280517578125, 0.5919189453125, 0.652557373046875, 0.71319580078125, 0.773834228515625, 0.83447265625, 0.895111083984375, 0.95574951171875, 1.016387939453125, 1.0770263671875, 1.137664794921875, 1.19830322265625, 1.258941650390625, 1.319580078125, 1.380218505859375, 1.44085693359375, 1.501495361328125, 1.5621337890625, 1.622772216796875, 1.68341064453125, 1.744049072265625, 1.8046875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 8.0, 11.0, 12.0, 16.0, 17.0, 18.0, 25.0, 12.0, 25.0, 41.0, 23.0, 24.0, 31.0, 39.0, 53.0, 31.0, 47.0, 40.0, 43.0, 41.0, 45.0, 36.0, 35.0, 29.0, 41.0, 33.0, 27.0, 25.0, 21.0, 28.0, 28.0, 15.0, 10.0, 16.0, 10.0, 5.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0, -1.9428863525390625, -1.885772705078125, -1.8286590576171875, -1.77154541015625, -1.7144317626953125, -1.657318115234375, -1.6002044677734375, -1.5430908203125, -1.4859771728515625, -1.428863525390625, -1.3717498779296875, -1.31463623046875, -1.2575225830078125, -1.200408935546875, -1.1432952880859375, -1.086181640625, -1.0290679931640625, -0.971954345703125, -0.9148406982421875, -0.85772705078125, -0.8006134033203125, -0.743499755859375, -0.6863861083984375, -0.6292724609375, -0.5721588134765625, -0.515045166015625, -0.4579315185546875, -0.40081787109375, -0.3437042236328125, -0.286590576171875, -0.2294769287109375, -0.17236328125, -0.1152496337890625, -0.058135986328125, -0.0010223388671875, 0.05609130859375, 0.1132049560546875, 0.170318603515625, 0.2274322509765625, 0.2845458984375, 0.3416595458984375, 0.398773193359375, 0.4558868408203125, 0.51300048828125, 0.5701141357421875, 0.627227783203125, 0.6843414306640625, 0.741455078125, 0.7985687255859375, 0.855682373046875, 0.9127960205078125, 0.96990966796875, 1.0270233154296875, 1.084136962890625, 1.1412506103515625, 1.1983642578125, 1.2554779052734375, 1.312591552734375, 1.3697052001953125, 1.42681884765625, 1.4839324951171875, 1.541046142578125, 1.5981597900390625, 1.6552734375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [5.0, 6.0, 7.0, 13.0, 23.0, 25.0, 53.0, 66.0, 131.0, 243.0, 362.0, 605.0, 910.0, 1679.0, 2669.0, 4494.0, 7434.0, 12098.0, 19061.0, 31376.0, 49142.0, 75290.0, 113694.0, 164516.0, 227795.0, 299132.0, 368460.0, 422066.0, 445540.0, 434341.0, 388886.0, 322999.0, 250898.0, 183483.0, 128823.0, 86431.0, 56921.0, 36118.0, 22885.0, 13929.0, 8472.0, 5158.0, 3149.0, 1984.0, 1168.0, 644.0, 447.0, 231.0, 168.0, 106.0, 58.0, 41.0, 23.0, 18.0, 7.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.9755859375, -1.9066619873046875, -1.837738037109375, -1.7688140869140625, -1.69989013671875, -1.6309661865234375, -1.562042236328125, -1.4931182861328125, -1.4241943359375, -1.3552703857421875, -1.286346435546875, -1.2174224853515625, -1.14849853515625, -1.0795745849609375, -1.010650634765625, -0.9417266845703125, -0.872802734375, -0.8038787841796875, -0.734954833984375, -0.6660308837890625, -0.59710693359375, -0.5281829833984375, -0.459259033203125, -0.3903350830078125, -0.3214111328125, -0.2524871826171875, -0.183563232421875, -0.1146392822265625, -0.04571533203125, 0.0232086181640625, 0.092132568359375, 0.1610565185546875, 0.22998046875, 0.2989044189453125, 0.367828369140625, 0.4367523193359375, 0.50567626953125, 0.5746002197265625, 0.643524169921875, 0.7124481201171875, 0.7813720703125, 0.8502960205078125, 0.919219970703125, 0.9881439208984375, 1.05706787109375, 1.1259918212890625, 1.194915771484375, 1.2638397216796875, 1.332763671875, 1.4016876220703125, 1.470611572265625, 1.5395355224609375, 1.60845947265625, 1.6773834228515625, 1.746307373046875, 1.8152313232421875, 1.8841552734375, 1.9530792236328125, 2.022003173828125, 2.0909271240234375, 2.15985107421875, 2.2287750244140625, 2.297698974609375, 2.3666229248046875, 2.435546875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 3.0, 8.0, 7.0, 12.0, 17.0, 16.0, 24.0, 29.0, 37.0, 38.0, 56.0, 64.0, 80.0, 90.0, 107.0, 155.0, 161.0, 179.0, 207.0, 213.0, 211.0, 219.0, 251.0, 214.0, 212.0, 178.0, 201.0, 193.0, 167.0, 140.0, 129.0, 105.0, 65.0, 68.0, 40.0, 37.0, 38.0, 26.0, 14.0, 17.0, 10.0, 11.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.197265625, -1.16339111328125, -1.1295166015625, -1.09564208984375, -1.061767578125, -1.02789306640625, -0.9940185546875, -0.96014404296875, -0.92626953125, -0.89239501953125, -0.8585205078125, -0.82464599609375, -0.790771484375, -0.75689697265625, -0.7230224609375, -0.68914794921875, -0.6552734375, -0.62139892578125, -0.5875244140625, -0.55364990234375, -0.519775390625, -0.48590087890625, -0.4520263671875, -0.41815185546875, -0.38427734375, -0.35040283203125, -0.3165283203125, -0.28265380859375, -0.248779296875, -0.21490478515625, -0.1810302734375, -0.14715576171875, -0.11328125, -0.07940673828125, -0.0455322265625, -0.01165771484375, 0.022216796875, 0.05609130859375, 0.0899658203125, 0.12384033203125, 0.15771484375, 0.19158935546875, 0.2254638671875, 0.25933837890625, 0.293212890625, 0.32708740234375, 0.3609619140625, 0.39483642578125, 0.4287109375, 0.46258544921875, 0.4964599609375, 0.53033447265625, 0.564208984375, 0.59808349609375, 0.6319580078125, 0.66583251953125, 0.69970703125, 0.73358154296875, 0.7674560546875, 0.80133056640625, 0.835205078125, 0.86907958984375, 0.9029541015625, 0.93682861328125, 0.970703125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 12.0, 12.0, 9.0, 16.0, 18.0, 23.0, 17.0, 18.0, 34.0, 30.0, 27.0, 36.0, 52.0, 61.0, 46.0, 39.0, 48.0, 54.0, 46.0, 45.0, 55.0, 43.0, 36.0, 37.0, 35.0, 25.0, 18.0, 22.0, 18.0, 11.0, 10.0, 11.0, 7.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.551114559173584, -3.4483602046966553, -3.3456058502197266, -3.242851495742798, -3.140097141265869, -3.0373425483703613, -2.9345881938934326, -2.831833839416504, -2.729079484939575, -2.6263251304626465, -2.5235707759857178, -2.420816421508789, -2.3180618286132812, -2.2153077125549316, -2.112553119659424, -2.009798765182495, -1.9070444107055664, -1.8042900562286377, -1.701535701751709, -1.5987812280654907, -1.496026873588562, -1.3932725191116333, -1.290518045425415, -1.1877636909484863, -1.0850093364715576, -0.9822549819946289, -0.8795005679130554, -0.7767461538314819, -0.6739917993545532, -0.5712374448776245, -0.468483030796051, -0.36572861671447754, -0.26297426223754883, -0.16021987795829773, -0.05746549367904663, 0.04528889060020447, 0.14804327487945557, 0.2507976293563843, 0.35355204343795776, 0.45630645751953125, 0.55906081199646, 0.6618151664733887, 0.7645695805549622, 0.8673239946365356, 0.9700783491134644, 1.072832703590393, 1.1755871772766113, 1.27834153175354, 1.3810958862304688, 1.4838502407073975, 1.5866045951843262, 1.6893590688705444, 1.7921134233474731, 1.8948677778244019, 1.9976222515106201, 2.100376605987549, 2.2031309604644775, 2.3058853149414062, 2.408639669418335, 2.5113940238952637, 2.6141486167907715, 2.716902732849121, 2.819657325744629, 2.9224116802215576, 3.0251660346984863]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 13.0, 9.0, 14.0, 18.0, 25.0, 16.0, 21.0, 27.0, 22.0, 29.0, 23.0, 33.0, 31.0, 36.0, 45.0, 43.0, 35.0, 45.0, 33.0, 56.0, 37.0, 30.0, 45.0, 37.0, 31.0, 30.0, 31.0, 18.0, 23.0, 22.0, 15.0, 17.0, 12.0, 21.0, 9.0, 5.0, 5.0, 7.0, 6.0, 3.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2918717861175537, -2.2207958698272705, -2.149719715118408, -2.078643798828125, -2.007567882537842, -1.936491847038269, -1.8654158115386963, -1.794339895248413, -1.7232638597488403, -1.6521878242492676, -1.5811119079589844, -1.5100358724594116, -1.4389598369598389, -1.3678839206695557, -1.296807885169983, -1.2257318496704102, -1.154655933380127, -1.0835798978805542, -1.012503981590271, -0.9414279460906982, -0.8703519701957703, -0.7992759943008423, -0.7281999588012695, -0.6571239829063416, -0.5860480070114136, -0.5149720311164856, -0.44389602541923523, -0.37282001972198486, -0.3017440438270569, -0.2306680679321289, -0.15959206223487854, -0.08851605653762817, -0.017440319061279297, 0.053635671734809875, 0.12471166253089905, 0.19578765332698822, 0.2668636441230774, 0.33793962001800537, 0.40901562571525574, 0.4800916314125061, 0.5511676073074341, 0.6222435832023621, 0.69331955909729, 0.7643955945968628, 0.8354715704917908, 0.9065475463867188, 0.9776235818862915, 1.0486996173858643, 1.1197755336761475, 1.1908515691757202, 1.2619274854660034, 1.3330035209655762, 1.4040794372558594, 1.4751554727554321, 1.5462315082550049, 1.617307424545288, 1.6883834600448608, 1.7594594955444336, 1.8305354118347168, 1.9016114473342896, 1.9726874828338623, 2.0437633991241455, 2.1148393154144287, 2.185915470123291, 2.256991386413574]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 8.0, 12.0, 16.0, 18.0, 46.0, 68.0, 113.0, 166.0, 259.0, 476.0, 764.0, 1189.0, 2090.0, 3248.0, 5497.0, 9269.0, 15074.0, 25590.0, 41840.0, 68155.0, 105195.0, 150384.0, 176266.0, 152980.0, 108877.0, 70472.0, 43816.0, 26700.0, 16060.0, 9500.0, 5573.0, 3500.0, 2055.0, 1265.0, 785.0, 473.0, 300.0, 158.0, 94.0, 79.0, 42.0, 27.0, 10.0, 17.0, 7.0, 11.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.5694046020507812, -0.5494537353515625, -0.5295028686523438, -0.509552001953125, -0.48960113525390625, -0.4696502685546875, -0.44969940185546875, -0.42974853515625, -0.40979766845703125, -0.3898468017578125, -0.36989593505859375, -0.349945068359375, -0.32999420166015625, -0.3100433349609375, -0.29009246826171875, -0.2701416015625, -0.25019073486328125, -0.2302398681640625, -0.21028900146484375, -0.190338134765625, -0.17038726806640625, -0.1504364013671875, -0.13048553466796875, -0.11053466796875, -0.09058380126953125, -0.0706329345703125, -0.05068206787109375, -0.030731201171875, -0.01078033447265625, 0.0091705322265625, 0.02912139892578125, 0.049072265625, 0.06902313232421875, 0.0889739990234375, 0.10892486572265625, 0.128875732421875, 0.14882659912109375, 0.1687774658203125, 0.18872833251953125, 0.20867919921875, 0.22863006591796875, 0.2485809326171875, 0.26853179931640625, 0.288482666015625, 0.30843353271484375, 0.3283843994140625, 0.34833526611328125, 0.3682861328125, 0.38823699951171875, 0.4081878662109375, 0.42813873291015625, 0.448089599609375, 0.46804046630859375, 0.4879913330078125, 0.5079421997070312, 0.52789306640625, 0.5478439331054688, 0.5677947998046875, 0.5877456665039062, 0.607696533203125, 0.6276473999023438, 0.6475982666015625, 0.6675491333007812, 0.6875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 10.0, 16.0, 12.0, 21.0, 18.0, 13.0, 14.0, 31.0, 22.0, 33.0, 27.0, 31.0, 24.0, 35.0, 32.0, 38.0, 38.0, 40.0, 37.0, 41.0, 33.0, 28.0, 39.0, 25.0, 32.0, 32.0, 28.0, 27.0, 18.0, 22.0, 32.0, 23.0, 24.0, 14.0, 10.0, 12.0, 8.0, 9.0, 5.0, 8.0, 9.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-2.263671875, -2.193115234375, -2.12255859375, -2.052001953125, -1.9814453125, -1.910888671875, -1.84033203125, -1.769775390625, -1.69921875, -1.628662109375, -1.55810546875, -1.487548828125, -1.4169921875, -1.346435546875, -1.27587890625, -1.205322265625, -1.134765625, -1.064208984375, -0.99365234375, -0.923095703125, -0.8525390625, -0.781982421875, -0.71142578125, -0.640869140625, -0.5703125, -0.499755859375, -0.42919921875, -0.358642578125, -0.2880859375, -0.217529296875, -0.14697265625, -0.076416015625, -0.005859375, 0.064697265625, 0.13525390625, 0.205810546875, 0.2763671875, 0.346923828125, 0.41748046875, 0.488037109375, 0.55859375, 0.629150390625, 0.69970703125, 0.770263671875, 0.8408203125, 0.911376953125, 0.98193359375, 1.052490234375, 1.123046875, 1.193603515625, 1.26416015625, 1.334716796875, 1.4052734375, 1.475830078125, 1.54638671875, 1.616943359375, 1.6875, 1.758056640625, 1.82861328125, 1.899169921875, 1.9697265625, 2.040283203125, 2.11083984375, 2.181396484375, 2.251953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 12.0, 13.0, 22.0, 28.0, 32.0, 43.0, 98.0, 127.0, 193.0, 317.0, 504.0, 742.0, 1140.0, 1819.0, 3116.0, 4966.0, 8508.0, 14459.0, 25566.0, 46035.0, 82897.0, 142215.0, 204576.0, 198779.0, 134398.0, 77006.0, 42954.0, 23990.0, 13607.0, 7939.0, 4697.0, 2896.0, 1741.0, 1103.0, 678.0, 459.0, 293.0, 180.0, 123.0, 76.0, 63.0, 34.0, 37.0, 19.0, 15.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.75146484375, -0.7286529541015625, -0.705841064453125, -0.6830291748046875, -0.66021728515625, -0.6374053955078125, -0.614593505859375, -0.5917816162109375, -0.5689697265625, -0.5461578369140625, -0.523345947265625, -0.5005340576171875, -0.47772216796875, -0.4549102783203125, -0.432098388671875, -0.4092864990234375, -0.386474609375, -0.3636627197265625, -0.340850830078125, -0.3180389404296875, -0.29522705078125, -0.2724151611328125, -0.249603271484375, -0.2267913818359375, -0.2039794921875, -0.1811676025390625, -0.158355712890625, -0.1355438232421875, -0.11273193359375, -0.0899200439453125, -0.067108154296875, -0.0442962646484375, -0.021484375, 0.0013275146484375, 0.024139404296875, 0.0469512939453125, 0.06976318359375, 0.0925750732421875, 0.115386962890625, 0.1381988525390625, 0.1610107421875, 0.1838226318359375, 0.206634521484375, 0.2294464111328125, 0.25225830078125, 0.2750701904296875, 0.297882080078125, 0.3206939697265625, 0.343505859375, 0.3663177490234375, 0.389129638671875, 0.4119415283203125, 0.43475341796875, 0.4575653076171875, 0.480377197265625, 0.5031890869140625, 0.5260009765625, 0.5488128662109375, 0.571624755859375, 0.5944366455078125, 0.61724853515625, 0.6400604248046875, 0.662872314453125, 0.6856842041015625, 0.70849609375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 5.0, 10.0, 8.0, 12.0, 16.0, 22.0, 21.0, 13.0, 30.0, 25.0, 33.0, 21.0, 19.0, 26.0, 26.0, 37.0, 31.0, 33.0, 37.0, 42.0, 26.0, 36.0, 21.0, 41.0, 37.0, 40.0, 35.0, 38.0, 30.0, 32.0, 25.0, 17.0, 18.0, 20.0, 15.0, 15.0, 12.0, 8.0, 11.0, 11.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.267578125, -1.2251129150390625, -1.182647705078125, -1.1401824951171875, -1.09771728515625, -1.0552520751953125, -1.012786865234375, -0.9703216552734375, -0.9278564453125, -0.8853912353515625, -0.842926025390625, -0.8004608154296875, -0.75799560546875, -0.7155303955078125, -0.673065185546875, -0.6305999755859375, -0.588134765625, -0.5456695556640625, -0.503204345703125, -0.4607391357421875, -0.41827392578125, -0.3758087158203125, -0.333343505859375, -0.2908782958984375, -0.2484130859375, -0.2059478759765625, -0.163482666015625, -0.1210174560546875, -0.07855224609375, -0.0360870361328125, 0.006378173828125, 0.0488433837890625, 0.09130859375, 0.1337738037109375, 0.176239013671875, 0.2187042236328125, 0.26116943359375, 0.3036346435546875, 0.346099853515625, 0.3885650634765625, 0.4310302734375, 0.4734954833984375, 0.515960693359375, 0.5584259033203125, 0.60089111328125, 0.6433563232421875, 0.685821533203125, 0.7282867431640625, 0.770751953125, 0.8132171630859375, 0.855682373046875, 0.8981475830078125, 0.94061279296875, 0.9830780029296875, 1.025543212890625, 1.0680084228515625, 1.1104736328125, 1.1529388427734375, 1.195404052734375, 1.2378692626953125, 1.28033447265625, 1.3227996826171875, 1.365264892578125, 1.4077301025390625, 1.4501953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 9.0, 14.0, 24.0, 21.0, 33.0, 46.0, 57.0, 95.0, 125.0, 195.0, 272.0, 426.0, 648.0, 985.0, 1684.0, 2921.0, 5313.0, 10752.0, 24373.0, 73210.0, 327167.0, 440721.0, 101124.0, 30718.0, 12651.0, 6329.0, 3391.0, 1953.0, 1110.0, 659.0, 499.0, 304.0, 218.0, 152.0, 96.0, 61.0, 47.0, 40.0, 28.0, 16.0, 19.0, 16.0, 5.0, 9.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5685272216796875, -0.549652099609375, -0.5307769775390625, -0.51190185546875, -0.4930267333984375, -0.474151611328125, -0.4552764892578125, -0.4364013671875, -0.4175262451171875, -0.398651123046875, -0.3797760009765625, -0.36090087890625, -0.3420257568359375, -0.323150634765625, -0.3042755126953125, -0.285400390625, -0.2665252685546875, -0.247650146484375, -0.2287750244140625, -0.20989990234375, -0.1910247802734375, -0.172149658203125, -0.1532745361328125, -0.1343994140625, -0.1155242919921875, -0.096649169921875, -0.0777740478515625, -0.05889892578125, -0.0400238037109375, -0.021148681640625, -0.0022735595703125, 0.0166015625, 0.0354766845703125, 0.054351806640625, 0.0732269287109375, 0.09210205078125, 0.1109771728515625, 0.129852294921875, 0.1487274169921875, 0.1676025390625, 0.1864776611328125, 0.205352783203125, 0.2242279052734375, 0.24310302734375, 0.2619781494140625, 0.280853271484375, 0.2997283935546875, 0.318603515625, 0.3374786376953125, 0.356353759765625, 0.3752288818359375, 0.39410400390625, 0.4129791259765625, 0.431854248046875, 0.4507293701171875, 0.4696044921875, 0.4884796142578125, 0.507354736328125, 0.5262298583984375, 0.54510498046875, 0.5639801025390625, 0.582855224609375, 0.6017303466796875, 0.62060546875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 10.0, 11.0, 20.0, 14.0, 19.0, 32.0, 34.0, 47.0, 43.0, 50.0, 54.0, 69.0, 72.0, 66.0, 67.0, 67.0, 56.0, 56.0, 41.0, 37.0, 27.0, 24.0, 18.0, 13.0, 10.0, 4.0, 8.0, 8.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.800060272216797e-05, -1.7286278307437897e-05, -1.6571953892707825e-05, -1.5857629477977753e-05, -1.514330506324768e-05, -1.4428980648517609e-05, -1.3714656233787537e-05, -1.3000331819057465e-05, -1.2286007404327393e-05, -1.157168298959732e-05, -1.0857358574867249e-05, -1.0143034160137177e-05, -9.428709745407104e-06, -8.714385330677032e-06, -8.00006091594696e-06, -7.2857365012168884e-06, -6.571412086486816e-06, -5.857087671756744e-06, -5.142763257026672e-06, -4.4284388422966e-06, -3.7141144275665283e-06, -2.9997900128364563e-06, -2.2854655981063843e-06, -1.5711411833763123e-06, -8.568167686462402e-07, -1.424923539161682e-07, 5.718320608139038e-07, 1.2861564755439758e-06, 2.000480890274048e-06, 2.71480530500412e-06, 3.429129719734192e-06, 4.143454134464264e-06, 4.857778549194336e-06, 5.572102963924408e-06, 6.28642737865448e-06, 7.000751793384552e-06, 7.715076208114624e-06, 8.429400622844696e-06, 9.143725037574768e-06, 9.85804945230484e-06, 1.0572373867034912e-05, 1.1286698281764984e-05, 1.2001022696495056e-05, 1.2715347111225128e-05, 1.34296715259552e-05, 1.4143995940685272e-05, 1.4858320355415344e-05, 1.5572644770145416e-05, 1.6286969184875488e-05, 1.700129359960556e-05, 1.7715618014335632e-05, 1.8429942429065704e-05, 1.9144266843795776e-05, 1.985859125852585e-05, 2.057291567325592e-05, 2.1287240087985992e-05, 2.2001564502716064e-05, 2.2715888917446136e-05, 2.343021333217621e-05, 2.414453774690628e-05, 2.4858862161636353e-05, 2.5573186576366425e-05, 2.6287510991096497e-05, 2.700183540582657e-05, 2.771615982055664e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 7.0, 9.0, 18.0, 28.0, 55.0, 53.0, 79.0, 120.0, 173.0, 246.0, 332.0, 539.0, 810.0, 1210.0, 1789.0, 2973.0, 5186.0, 8758.0, 16601.0, 34334.0, 81535.0, 206398.0, 341909.0, 196609.0, 77668.0, 33355.0, 15950.0, 8483.0, 4859.0, 3007.0, 1874.0, 1177.0, 754.0, 537.0, 358.0, 219.0, 168.0, 106.0, 72.0, 57.0, 48.0, 26.0, 17.0, 12.0, 6.0, 13.0, 3.0, 1.0, 5.0, 2.0, 1.0], "bins": [-0.73046875, -0.7098770141601562, -0.6892852783203125, -0.6686935424804688, -0.648101806640625, -0.6275100708007812, -0.6069183349609375, -0.5863265991210938, -0.56573486328125, -0.5451431274414062, -0.5245513916015625, -0.5039596557617188, -0.483367919921875, -0.46277618408203125, -0.4421844482421875, -0.42159271240234375, -0.4010009765625, -0.38040924072265625, -0.3598175048828125, -0.33922576904296875, -0.318634033203125, -0.29804229736328125, -0.2774505615234375, -0.25685882568359375, -0.23626708984375, -0.21567535400390625, -0.1950836181640625, -0.17449188232421875, -0.153900146484375, -0.13330841064453125, -0.1127166748046875, -0.09212493896484375, -0.071533203125, -0.05094146728515625, -0.0303497314453125, -0.00975799560546875, 0.010833740234375, 0.03142547607421875, 0.0520172119140625, 0.07260894775390625, 0.09320068359375, 0.11379241943359375, 0.1343841552734375, 0.15497589111328125, 0.175567626953125, 0.19615936279296875, 0.2167510986328125, 0.23734283447265625, 0.2579345703125, 0.27852630615234375, 0.2991180419921875, 0.31970977783203125, 0.340301513671875, 0.36089324951171875, 0.3814849853515625, 0.40207672119140625, 0.42266845703125, 0.44326019287109375, 0.4638519287109375, 0.48444366455078125, 0.505035400390625, 0.5256271362304688, 0.5462188720703125, 0.5668106079101562, 0.58740234375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 4.0, 8.0, 6.0, 10.0, 12.0, 17.0, 13.0, 17.0, 34.0, 39.0, 71.0, 65.0, 88.0, 110.0, 108.0, 99.0, 68.0, 54.0, 23.0, 25.0, 23.0, 22.0, 15.0, 15.0, 10.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1546630859375, -0.14951324462890625, -0.1443634033203125, -0.13921356201171875, -0.134063720703125, -0.12891387939453125, -0.1237640380859375, -0.11861419677734375, -0.11346435546875, -0.10831451416015625, -0.1031646728515625, -0.09801483154296875, -0.092864990234375, -0.08771514892578125, -0.0825653076171875, -0.07741546630859375, -0.072265625, -0.06711578369140625, -0.0619659423828125, -0.05681610107421875, -0.051666259765625, -0.04651641845703125, -0.0413665771484375, -0.03621673583984375, -0.03106689453125, -0.02591705322265625, -0.0207672119140625, -0.01561737060546875, -0.010467529296875, -0.00531768798828125, -0.0001678466796875, 0.00498199462890625, 0.0101318359375, 0.01528167724609375, 0.0204315185546875, 0.02558135986328125, 0.030731201171875, 0.03588104248046875, 0.0410308837890625, 0.04618072509765625, 0.05133056640625, 0.05648040771484375, 0.0616302490234375, 0.06678009033203125, 0.071929931640625, 0.07707977294921875, 0.0822296142578125, 0.08737945556640625, 0.092529296875, 0.09767913818359375, 0.1028289794921875, 0.10797882080078125, 0.113128662109375, 0.11827850341796875, 0.1234283447265625, 0.12857818603515625, 0.13372802734375, 0.13887786865234375, 0.1440277099609375, 0.14917755126953125, 0.154327392578125, 0.15947723388671875, 0.1646270751953125, 0.16977691650390625, 0.1749267578125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 0.0, 6.0, 4.0, 8.0, 11.0, 15.0, 17.0, 20.0, 17.0, 14.0, 30.0, 26.0, 34.0, 31.0, 35.0, 52.0, 56.0, 44.0, 46.0, 52.0, 46.0, 49.0, 51.0, 46.0, 45.0, 38.0, 36.0, 33.0, 16.0, 31.0, 16.0, 16.0, 11.0, 14.0, 8.0, 7.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.535590648651123, -3.4327683448791504, -3.3299460411071777, -3.227123737335205, -3.1243014335632324, -3.0214791297912598, -2.918656826019287, -2.8158345222473145, -2.713012218475342, -2.610189914703369, -2.5073676109313965, -2.404545307159424, -2.301723003387451, -2.1989006996154785, -2.096078395843506, -1.9932562112808228, -1.8904340267181396, -1.787611722946167, -1.6847894191741943, -1.5819671154022217, -1.479144811630249, -1.3763225078582764, -1.2735003232955933, -1.1706780195236206, -1.067855715751648, -0.9650334119796753, -0.8622111082077026, -0.7593888640403748, -0.6565665602684021, -0.5537442564964294, -0.45092201232910156, -0.3480997085571289, -0.24527764320373535, -0.1424553543329239, -0.03963306546211243, 0.06318920850753784, 0.1660115122795105, 0.26883381605148315, 0.37165606021881104, 0.4744783639907837, 0.5773006677627563, 0.680122971534729, 0.7829452753067017, 0.8857675194740295, 0.9885898232460022, 1.09141206741333, 1.1942343711853027, 1.2970566749572754, 1.399878978729248, 1.5027012825012207, 1.6055235862731934, 1.708345890045166, 1.8111681938171387, 1.9139904975891113, 2.016812801361084, 2.1196351051330566, 2.2224574089050293, 2.325279712677002, 2.4281020164489746, 2.5309243202209473, 2.63374662399292, 2.7365689277648926, 2.8393912315368652, 2.942213535308838, 3.0450356006622314]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 11.0, 14.0, 13.0, 20.0, 21.0, 17.0, 21.0, 27.0, 16.0, 35.0, 21.0, 36.0, 26.0, 38.0, 46.0, 46.0, 31.0, 47.0, 35.0, 48.0, 41.0, 34.0, 39.0, 42.0, 32.0, 27.0, 26.0, 24.0, 20.0, 23.0, 13.0, 20.0, 10.0, 17.0, 12.0, 8.0, 4.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2628321647644043, -2.1919450759887695, -2.1210579872131348, -2.0501708984375, -1.9792838096618652, -1.9083967208862305, -1.8375095129013062, -1.7666224241256714, -1.6957353353500366, -1.6248482465744019, -1.553961157798767, -1.4830740690231323, -1.412186861038208, -1.3412997722625732, -1.2704126834869385, -1.1995255947113037, -1.128638505935669, -1.0577514171600342, -0.9868643283843994, -0.9159771800041199, -0.8450900912284851, -0.7742030024528503, -0.7033158540725708, -0.632428765296936, -0.5615416765213013, -0.4906545877456665, -0.41976746916770935, -0.3488803505897522, -0.27799326181411743, -0.20710617303848267, -0.1362190544605255, -0.06533193588256836, 0.005554914474487305, 0.07644201815128326, 0.14732912182807922, 0.21821622550487518, 0.28910332918167114, 0.3599904179573059, 0.43087753653526306, 0.5017646551132202, 0.572651743888855, 0.6435388326644897, 0.7144259214401245, 0.785313069820404, 0.8562001585960388, 0.9270872473716736, 0.9979743957519531, 1.068861484527588, 1.1397485733032227, 1.2106356620788574, 1.2815227508544922, 1.352409839630127, 1.4232969284057617, 1.4941840171813965, 1.5650712251663208, 1.6359583139419556, 1.7068454027175903, 1.777732491493225, 1.8486195802688599, 1.9195066690444946, 1.990393877029419, 2.0612809658050537, 2.1321680545806885, 2.2030551433563232, 2.273942232131958]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 9.0, 5.0, 24.0, 28.0, 58.0, 67.0, 137.0, 199.0, 332.0, 472.0, 767.0, 1159.0, 1739.0, 2823.0, 4318.0, 6322.0, 9443.0, 13741.0, 19412.0, 27325.0, 36716.0, 47635.0, 59910.0, 71428.0, 81431.0, 89062.0, 91416.0, 89418.0, 82300.0, 72935.0, 60789.0, 48772.0, 37208.0, 28021.0, 19952.0, 14287.0, 9767.0, 6516.0, 4361.0, 2902.0, 1954.0, 1210.0, 819.0, 497.0, 319.0, 208.0, 138.0, 73.0, 47.0, 36.0, 17.0, 13.0, 9.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2197265625, -1.1797943115234375, -1.139862060546875, -1.0999298095703125, -1.05999755859375, -1.0200653076171875, -0.980133056640625, -0.9402008056640625, -0.9002685546875, -0.8603363037109375, -0.820404052734375, -0.7804718017578125, -0.74053955078125, -0.7006072998046875, -0.660675048828125, -0.6207427978515625, -0.580810546875, -0.5408782958984375, -0.500946044921875, -0.4610137939453125, -0.42108154296875, -0.3811492919921875, -0.341217041015625, -0.3012847900390625, -0.2613525390625, -0.2214202880859375, -0.181488037109375, -0.1415557861328125, -0.10162353515625, -0.0616912841796875, -0.021759033203125, 0.0181732177734375, 0.05810546875, 0.0980377197265625, 0.137969970703125, 0.1779022216796875, 0.21783447265625, 0.2577667236328125, 0.297698974609375, 0.3376312255859375, 0.3775634765625, 0.4174957275390625, 0.457427978515625, 0.4973602294921875, 0.53729248046875, 0.5772247314453125, 0.617156982421875, 0.6570892333984375, 0.697021484375, 0.7369537353515625, 0.776885986328125, 0.8168182373046875, 0.85675048828125, 0.8966827392578125, 0.936614990234375, 0.9765472412109375, 1.0164794921875, 1.0564117431640625, 1.096343994140625, 1.1362762451171875, 1.17620849609375, 1.2161407470703125, 1.256072998046875, 1.2960052490234375, 1.3359375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 13.0, 11.0, 10.0, 21.0, 14.0, 13.0, 15.0, 21.0, 26.0, 29.0, 33.0, 35.0, 43.0, 31.0, 41.0, 30.0, 38.0, 45.0, 37.0, 45.0, 38.0, 40.0, 45.0, 39.0, 36.0, 24.0, 30.0, 29.0, 15.0, 24.0, 23.0, 13.0, 15.0, 11.0, 13.0, 9.0, 4.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.541015625, -2.4637451171875, -2.386474609375, -2.3092041015625, -2.23193359375, -2.1546630859375, -2.077392578125, -2.0001220703125, -1.9228515625, -1.8455810546875, -1.768310546875, -1.6910400390625, -1.61376953125, -1.5364990234375, -1.459228515625, -1.3819580078125, -1.3046875, -1.2274169921875, -1.150146484375, -1.0728759765625, -0.99560546875, -0.9183349609375, -0.841064453125, -0.7637939453125, -0.6865234375, -0.6092529296875, -0.531982421875, -0.4547119140625, -0.37744140625, -0.3001708984375, -0.222900390625, -0.1456298828125, -0.068359375, 0.0089111328125, 0.086181640625, 0.1634521484375, 0.24072265625, 0.3179931640625, 0.395263671875, 0.4725341796875, 0.5498046875, 0.6270751953125, 0.704345703125, 0.7816162109375, 0.85888671875, 0.9361572265625, 1.013427734375, 1.0906982421875, 1.16796875, 1.2452392578125, 1.322509765625, 1.3997802734375, 1.47705078125, 1.5543212890625, 1.631591796875, 1.7088623046875, 1.7861328125, 1.8634033203125, 1.940673828125, 2.0179443359375, 2.09521484375, 2.1724853515625, 2.249755859375, 2.3270263671875, 2.404296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 8.0, 9.0, 23.0, 24.0, 46.0, 82.0, 127.0, 164.0, 326.0, 501.0, 723.0, 1202.0, 1879.0, 2946.0, 4518.0, 6836.0, 10184.0, 15255.0, 21617.0, 29999.0, 41417.0, 53773.0, 66959.0, 79651.0, 89229.0, 95397.0, 94963.0, 89799.0, 79778.0, 67221.0, 54069.0, 41362.0, 30831.0, 22153.0, 15329.0, 10471.0, 6819.0, 4752.0, 2926.0, 1920.0, 1243.0, 717.0, 512.0, 298.0, 200.0, 114.0, 66.0, 49.0, 37.0, 12.0, 14.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-1.4267578125, -1.383544921875, -1.34033203125, -1.297119140625, -1.25390625, -1.210693359375, -1.16748046875, -1.124267578125, -1.0810546875, -1.037841796875, -0.99462890625, -0.951416015625, -0.908203125, -0.864990234375, -0.82177734375, -0.778564453125, -0.7353515625, -0.692138671875, -0.64892578125, -0.605712890625, -0.5625, -0.519287109375, -0.47607421875, -0.432861328125, -0.3896484375, -0.346435546875, -0.30322265625, -0.260009765625, -0.216796875, -0.173583984375, -0.13037109375, -0.087158203125, -0.0439453125, -0.000732421875, 0.04248046875, 0.085693359375, 0.12890625, 0.172119140625, 0.21533203125, 0.258544921875, 0.3017578125, 0.344970703125, 0.38818359375, 0.431396484375, 0.474609375, 0.517822265625, 0.56103515625, 0.604248046875, 0.6474609375, 0.690673828125, 0.73388671875, 0.777099609375, 0.8203125, 0.863525390625, 0.90673828125, 0.949951171875, 0.9931640625, 1.036376953125, 1.07958984375, 1.122802734375, 1.166015625, 1.209228515625, 1.25244140625, 1.295654296875, 1.3388671875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 7.0, 5.0, 6.0, 4.0, 16.0, 16.0, 24.0, 31.0, 23.0, 21.0, 35.0, 23.0, 31.0, 36.0, 24.0, 30.0, 45.0, 36.0, 36.0, 43.0, 41.0, 42.0, 40.0, 42.0, 38.0, 46.0, 30.0, 25.0, 30.0, 22.0, 17.0, 20.0, 19.0, 14.0, 17.0, 10.0, 15.0, 5.0, 9.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 4.0], "bins": [-1.6552734375, -1.6083831787109375, -1.561492919921875, -1.5146026611328125, -1.46771240234375, -1.4208221435546875, -1.373931884765625, -1.3270416259765625, -1.2801513671875, -1.2332611083984375, -1.186370849609375, -1.1394805908203125, -1.09259033203125, -1.0457000732421875, -0.998809814453125, -0.9519195556640625, -0.905029296875, -0.8581390380859375, -0.811248779296875, -0.7643585205078125, -0.71746826171875, -0.6705780029296875, -0.623687744140625, -0.5767974853515625, -0.5299072265625, -0.4830169677734375, -0.436126708984375, -0.3892364501953125, -0.34234619140625, -0.2954559326171875, -0.248565673828125, -0.2016754150390625, -0.15478515625, -0.1078948974609375, -0.061004638671875, -0.0141143798828125, 0.03277587890625, 0.0796661376953125, 0.126556396484375, 0.1734466552734375, 0.2203369140625, 0.2672271728515625, 0.314117431640625, 0.3610076904296875, 0.40789794921875, 0.4547882080078125, 0.501678466796875, 0.5485687255859375, 0.595458984375, 0.6423492431640625, 0.689239501953125, 0.7361297607421875, 0.78302001953125, 0.8299102783203125, 0.876800537109375, 0.9236907958984375, 0.9705810546875, 1.0174713134765625, 1.064361572265625, 1.1112518310546875, 1.15814208984375, 1.2050323486328125, 1.251922607421875, 1.2988128662109375, 1.345703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 16.0, 18.0, 35.0, 56.0, 67.0, 136.0, 195.0, 277.0, 441.0, 752.0, 1171.0, 1809.0, 3073.0, 4911.0, 7819.0, 12768.0, 20684.0, 31294.0, 46198.0, 65024.0, 85707.0, 104289.0, 116774.0, 117972.0, 109350.0, 92306.0, 72120.0, 53091.0, 36384.0, 23633.0, 15138.0, 9616.0, 5870.0, 3600.0, 2229.0, 1348.0, 852.0, 524.0, 344.0, 220.0, 153.0, 95.0, 65.0, 45.0, 24.0, 18.0, 13.0, 9.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.76220703125, -0.7392349243164062, -0.7162628173828125, -0.6932907104492188, -0.670318603515625, -0.6473464965820312, -0.6243743896484375, -0.6014022827148438, -0.57843017578125, -0.5554580688476562, -0.5324859619140625, -0.5095138549804688, -0.486541748046875, -0.46356964111328125, -0.4405975341796875, -0.41762542724609375, -0.3946533203125, -0.37168121337890625, -0.3487091064453125, -0.32573699951171875, -0.302764892578125, -0.27979278564453125, -0.2568206787109375, -0.23384857177734375, -0.21087646484375, -0.18790435791015625, -0.1649322509765625, -0.14196014404296875, -0.118988037109375, -0.09601593017578125, -0.0730438232421875, -0.05007171630859375, -0.027099609375, -0.00412750244140625, 0.0188446044921875, 0.04181671142578125, 0.064788818359375, 0.08776092529296875, 0.1107330322265625, 0.13370513916015625, 0.15667724609375, 0.17964935302734375, 0.2026214599609375, 0.22559356689453125, 0.248565673828125, 0.27153778076171875, 0.2945098876953125, 0.31748199462890625, 0.3404541015625, 0.36342620849609375, 0.3863983154296875, 0.40937042236328125, 0.432342529296875, 0.45531463623046875, 0.4782867431640625, 0.5012588500976562, 0.52423095703125, 0.5472030639648438, 0.5701751708984375, 0.5931472778320312, 0.616119384765625, 0.6390914916992188, 0.6620635986328125, 0.6850357055664062, 0.7080078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 9.0, 10.0, 14.0, 12.0, 15.0, 14.0, 19.0, 23.0, 19.0, 27.0, 31.0, 31.0, 47.0, 36.0, 35.0, 40.0, 39.0, 47.0, 57.0, 54.0, 39.0, 42.0, 50.0, 49.0, 30.0, 29.0, 29.0, 24.0, 22.0, 19.0, 18.0, 16.0, 8.0, 13.0, 5.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.778406143188477e-05, -7.502920925617218e-05, -7.22743570804596e-05, -6.951950490474701e-05, -6.676465272903442e-05, -6.400980055332184e-05, -6.125494837760925e-05, -5.850009620189667e-05, -5.574524402618408e-05, -5.2990391850471497e-05, -5.023553967475891e-05, -4.7480687499046326e-05, -4.472583532333374e-05, -4.1970983147621155e-05, -3.921613097190857e-05, -3.6461278796195984e-05, -3.37064266204834e-05, -3.095157444477081e-05, -2.8196722269058228e-05, -2.5441870093345642e-05, -2.2687017917633057e-05, -1.993216574192047e-05, -1.7177313566207886e-05, -1.44224613904953e-05, -1.1667609214782715e-05, -8.91275703907013e-06, -6.157904863357544e-06, -3.4030526876449585e-06, -6.48200511932373e-07, 2.1066516637802124e-06, 4.861503839492798e-06, 7.616356015205383e-06, 1.0371208190917969e-05, 1.3126060366630554e-05, 1.588091254234314e-05, 1.8635764718055725e-05, 2.139061689376831e-05, 2.4145469069480896e-05, 2.690032124519348e-05, 2.9655173420906067e-05, 3.241002559661865e-05, 3.516487777233124e-05, 3.791972994804382e-05, 4.067458212375641e-05, 4.3429434299468994e-05, 4.618428647518158e-05, 4.8939138650894165e-05, 5.169399082660675e-05, 5.4448843002319336e-05, 5.720369517803192e-05, 5.995854735374451e-05, 6.271339952945709e-05, 6.546825170516968e-05, 6.822310388088226e-05, 7.097795605659485e-05, 7.373280823230743e-05, 7.648766040802002e-05, 7.92425125837326e-05, 8.199736475944519e-05, 8.475221693515778e-05, 8.750706911087036e-05, 9.026192128658295e-05, 9.301677346229553e-05, 9.577162563800812e-05, 9.85264778137207e-05]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 16.0, 21.0, 30.0, 37.0, 61.0, 100.0, 138.0, 212.0, 378.0, 548.0, 957.0, 1466.0, 2512.0, 4045.0, 7152.0, 12209.0, 21844.0, 36953.0, 59736.0, 89391.0, 119891.0, 142460.0, 145242.0, 129061.0, 99974.0, 68303.0, 43575.0, 26191.0, 15054.0, 8518.0, 4930.0, 2922.0, 1726.0, 1023.0, 686.0, 409.0, 280.0, 151.0, 139.0, 85.0, 39.0, 30.0, 22.0, 17.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95654296875, -0.9258499145507812, -0.8951568603515625, -0.8644638061523438, -0.833770751953125, -0.8030776977539062, -0.7723846435546875, -0.7416915893554688, -0.71099853515625, -0.6803054809570312, -0.6496124267578125, -0.6189193725585938, -0.588226318359375, -0.5575332641601562, -0.5268402099609375, -0.49614715576171875, -0.4654541015625, -0.43476104736328125, -0.4040679931640625, -0.37337493896484375, -0.342681884765625, -0.31198883056640625, -0.2812957763671875, -0.25060272216796875, -0.21990966796875, -0.18921661376953125, -0.1585235595703125, -0.12783050537109375, -0.097137451171875, -0.06644439697265625, -0.0357513427734375, -0.00505828857421875, 0.025634765625, 0.05632781982421875, 0.0870208740234375, 0.11771392822265625, 0.148406982421875, 0.17910003662109375, 0.2097930908203125, 0.24048614501953125, 0.27117919921875, 0.30187225341796875, 0.3325653076171875, 0.36325836181640625, 0.393951416015625, 0.42464447021484375, 0.4553375244140625, 0.48603057861328125, 0.5167236328125, 0.5474166870117188, 0.5781097412109375, 0.6088027954101562, 0.639495849609375, 0.6701889038085938, 0.7008819580078125, 0.7315750122070312, 0.76226806640625, 0.7929611206054688, 0.8236541748046875, 0.8543472290039062, 0.885040283203125, 0.9157333374023438, 0.9464263916015625, 0.9771194458007812, 1.0078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 8.0, 5.0, 9.0, 5.0, 11.0, 6.0, 15.0, 14.0, 13.0, 24.0, 20.0, 33.0, 21.0, 31.0, 47.0, 48.0, 45.0, 39.0, 50.0, 38.0, 40.0, 41.0, 56.0, 27.0, 27.0, 41.0, 29.0, 32.0, 30.0, 23.0, 30.0, 19.0, 23.0, 13.0, 14.0, 10.0, 14.0, 3.0, 12.0, 10.0, 2.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2605476379394531, -0.25205230712890625, -0.24355697631835938, -0.2350616455078125, -0.22656631469726562, -0.21807098388671875, -0.20957565307617188, -0.201080322265625, -0.19258499145507812, -0.18408966064453125, -0.17559432983398438, -0.1670989990234375, -0.15860366821289062, -0.15010833740234375, -0.14161300659179688, -0.13311767578125, -0.12462234497070312, -0.11612701416015625, -0.10763168334960938, -0.0991363525390625, -0.09064102172851562, -0.08214569091796875, -0.07365036010742188, -0.065155029296875, -0.056659698486328125, -0.04816436767578125, -0.039669036865234375, -0.0311737060546875, -0.022678375244140625, -0.01418304443359375, -0.005687713623046875, 0.0028076171875, 0.011302947998046875, 0.01979827880859375, 0.028293609619140625, 0.0367889404296875, 0.045284271240234375, 0.05377960205078125, 0.062274932861328125, 0.070770263671875, 0.07926559448242188, 0.08776092529296875, 0.09625625610351562, 0.1047515869140625, 0.11324691772460938, 0.12174224853515625, 0.13023757934570312, 0.13873291015625, 0.14722824096679688, 0.15572357177734375, 0.16421890258789062, 0.1727142333984375, 0.18120956420898438, 0.18970489501953125, 0.19820022583007812, 0.206695556640625, 0.21519088745117188, 0.22368621826171875, 0.23218154907226562, 0.2406768798828125, 0.24917221069335938, 0.25766754150390625, 0.2661628723144531, 0.274658203125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 9.0, 9.0, 9.0, 10.0, 11.0, 14.0, 18.0, 20.0, 23.0, 29.0, 27.0, 40.0, 44.0, 37.0, 40.0, 45.0, 58.0, 58.0, 43.0, 41.0, 37.0, 58.0, 36.0, 41.0, 35.0, 38.0, 29.0, 30.0, 19.0, 20.0, 8.0, 11.0, 10.0, 5.0, 9.0, 6.0, 1.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.380751848220825, -3.2809531688690186, -3.181154727935791, -3.0813560485839844, -2.981557607650757, -2.88175892829895, -2.7819604873657227, -2.682161808013916, -2.5823631286621094, -2.4825644493103027, -2.382766008377075, -2.2829673290252686, -2.183168888092041, -2.0833702087402344, -1.9835716485977173, -1.8837730884552002, -1.7839746475219727, -1.6841760873794556, -1.5843775272369385, -1.4845788478851318, -1.3847804069519043, -1.2849817276000977, -1.1851831674575806, -1.0853846073150635, -0.9855860471725464, -0.8857874870300293, -0.7859889268875122, -0.6861903071403503, -0.5863917469978333, -0.48659318685531616, -0.3867945671081543, -0.2869960069656372, -0.18719744682312012, -0.08739887177944183, 0.01239970326423645, 0.11219829320907593, 0.21199685335159302, 0.3117954134941101, 0.411594033241272, 0.5113925933837891, 0.6111911535263062, 0.7109897136688232, 0.8107882738113403, 0.9105868935585022, 1.010385513305664, 1.1101839542388916, 1.2099826335906982, 1.3097811937332153, 1.4095797538757324, 1.5093783140182495, 1.6091768741607666, 1.7089755535125732, 1.8087739944458008, 1.9085726737976074, 2.008371353149414, 2.1081697940826416, 2.207968235015869, 2.307766914367676, 2.4075653553009033, 2.50736403465271, 2.6071624755859375, 2.706961154937744, 2.806759834289551, 2.9065582752227783, 3.006356954574585]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 8.0, 14.0, 9.0, 15.0, 18.0, 31.0, 28.0, 22.0, 22.0, 38.0, 47.0, 47.0, 39.0, 44.0, 48.0, 46.0, 47.0, 44.0, 50.0, 53.0, 43.0, 31.0, 37.0, 26.0, 35.0, 28.0, 23.0, 22.0, 13.0, 11.0, 12.0, 8.0, 12.0, 7.0, 4.0, 3.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2223832607269287, -3.131322145462036, -3.0402612686157227, -2.94920015335083, -2.8581392765045166, -2.767078161239624, -2.6760172843933105, -2.584956169128418, -2.4938952922821045, -2.402834177017212, -2.3117733001708984, -2.220712184906006, -2.1296513080596924, -2.0385901927948, -1.9475293159484863, -1.8564682006835938, -1.7654072046279907, -1.6743462085723877, -1.5832852125167847, -1.4922242164611816, -1.4011632204055786, -1.3101022243499756, -1.219041109085083, -1.1279802322387695, -1.036919116973877, -0.9458581209182739, -0.8547971248626709, -0.7637361288070679, -0.6726751327514648, -0.5816141366958618, -0.490553081035614, -0.399492084980011, -0.30843114852905273, -0.2173701524734497, -0.12630914151668549, -0.035248130559921265, 0.05581286549568176, 0.1468738615512848, 0.2379348874092102, 0.32899588346481323, 0.42005687952041626, 0.5111178755760193, 0.6021788716316223, 0.6932399272918701, 0.7843009233474731, 0.8753619194030762, 0.9664229154586792, 1.0574839115142822, 1.1485449075698853, 1.2396059036254883, 1.3306668996810913, 1.4217278957366943, 1.5127888917922974, 1.6038498878479004, 1.694911003112793, 1.7859718799591064, 1.877032995223999, 1.968093991279602, 2.059154987335205, 2.1502161026000977, 2.241276979446411, 2.3323380947113037, 2.423398971557617, 2.5144600868225098, 2.6055209636688232]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 18.0, 30.0, 33.0, 53.0, 96.0, 139.0, 209.0, 383.0, 551.0, 872.0, 1520.0, 2234.0, 3653.0, 5774.0, 9396.0, 14681.0, 23514.0, 37424.0, 58179.0, 89889.0, 135010.0, 196010.0, 273121.0, 357394.0, 433796.0, 477430.0, 476084.0, 427041.0, 348518.0, 263653.0, 188259.0, 129091.0, 86045.0, 56027.0, 35856.0, 23139.0, 14330.0, 9097.0, 5802.0, 3781.0, 2313.0, 1376.0, 912.0, 588.0, 392.0, 203.0, 140.0, 85.0, 56.0, 37.0, 23.0, 10.0, 10.0, 4.0, 0.0, 1.0], "bins": [-2.603515625, -2.526824951171875, -2.45013427734375, -2.373443603515625, -2.2967529296875, -2.220062255859375, -2.14337158203125, -2.066680908203125, -1.989990234375, -1.913299560546875, -1.83660888671875, -1.759918212890625, -1.6832275390625, -1.606536865234375, -1.52984619140625, -1.453155517578125, -1.37646484375, -1.299774169921875, -1.22308349609375, -1.146392822265625, -1.0697021484375, -0.993011474609375, -0.91632080078125, -0.839630126953125, -0.762939453125, -0.686248779296875, -0.60955810546875, -0.532867431640625, -0.4561767578125, -0.379486083984375, -0.30279541015625, -0.226104736328125, -0.1494140625, -0.072723388671875, 0.00396728515625, 0.080657958984375, 0.1573486328125, 0.234039306640625, 0.31072998046875, 0.387420654296875, 0.464111328125, 0.540802001953125, 0.61749267578125, 0.694183349609375, 0.7708740234375, 0.847564697265625, 0.92425537109375, 1.000946044921875, 1.07763671875, 1.154327392578125, 1.23101806640625, 1.307708740234375, 1.3843994140625, 1.461090087890625, 1.53778076171875, 1.614471435546875, 1.691162109375, 1.767852783203125, 1.84454345703125, 1.921234130859375, 1.9979248046875, 2.074615478515625, 2.15130615234375, 2.227996826171875, 2.3046875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 8.0, 7.0, 15.0, 12.0, 20.0, 21.0, 21.0, 28.0, 31.0, 21.0, 38.0, 36.0, 35.0, 28.0, 43.0, 44.0, 42.0, 36.0, 41.0, 36.0, 35.0, 40.0, 39.0, 43.0, 34.0, 27.0, 29.0, 27.0, 21.0, 15.0, 16.0, 20.0, 13.0, 8.0, 12.0, 9.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.51953125, -2.44488525390625, -2.3702392578125, -2.29559326171875, -2.220947265625, -2.14630126953125, -2.0716552734375, -1.99700927734375, -1.92236328125, -1.84771728515625, -1.7730712890625, -1.69842529296875, -1.623779296875, -1.54913330078125, -1.4744873046875, -1.39984130859375, -1.3251953125, -1.25054931640625, -1.1759033203125, -1.10125732421875, -1.026611328125, -0.95196533203125, -0.8773193359375, -0.80267333984375, -0.72802734375, -0.65338134765625, -0.5787353515625, -0.50408935546875, -0.429443359375, -0.35479736328125, -0.2801513671875, -0.20550537109375, -0.130859375, -0.05621337890625, 0.0184326171875, 0.09307861328125, 0.167724609375, 0.24237060546875, 0.3170166015625, 0.39166259765625, 0.46630859375, 0.54095458984375, 0.6156005859375, 0.69024658203125, 0.764892578125, 0.83953857421875, 0.9141845703125, 0.98883056640625, 1.0634765625, 1.13812255859375, 1.2127685546875, 1.28741455078125, 1.362060546875, 1.43670654296875, 1.5113525390625, 1.58599853515625, 1.66064453125, 1.73529052734375, 1.8099365234375, 1.88458251953125, 1.959228515625, 2.03387451171875, 2.1085205078125, 2.18316650390625, 2.2578125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 9.0, 17.0, 30.0, 37.0, 60.0, 150.0, 199.0, 343.0, 516.0, 971.0, 1584.0, 2661.0, 4390.0, 7488.0, 12211.0, 20286.0, 33354.0, 52782.0, 83153.0, 126253.0, 185615.0, 256432.0, 337553.0, 411129.0, 460870.0, 470288.0, 436930.0, 369702.0, 290521.0, 213802.0, 148934.0, 98340.0, 64092.0, 40372.0, 25074.0, 15222.0, 9164.0, 5486.0, 3356.0, 1996.0, 1157.0, 684.0, 459.0, 232.0, 145.0, 95.0, 57.0, 30.0, 19.0, 7.0, 10.0, 7.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.923828125, -2.83013916015625, -2.7364501953125, -2.64276123046875, -2.549072265625, -2.45538330078125, -2.3616943359375, -2.26800537109375, -2.17431640625, -2.08062744140625, -1.9869384765625, -1.89324951171875, -1.799560546875, -1.70587158203125, -1.6121826171875, -1.51849365234375, -1.4248046875, -1.33111572265625, -1.2374267578125, -1.14373779296875, -1.050048828125, -0.95635986328125, -0.8626708984375, -0.76898193359375, -0.67529296875, -0.58160400390625, -0.4879150390625, -0.39422607421875, -0.300537109375, -0.20684814453125, -0.1131591796875, -0.01947021484375, 0.07421875, 0.16790771484375, 0.2615966796875, 0.35528564453125, 0.448974609375, 0.54266357421875, 0.6363525390625, 0.73004150390625, 0.82373046875, 0.91741943359375, 1.0111083984375, 1.10479736328125, 1.198486328125, 1.29217529296875, 1.3858642578125, 1.47955322265625, 1.5732421875, 1.66693115234375, 1.7606201171875, 1.85430908203125, 1.947998046875, 2.04168701171875, 2.1353759765625, 2.22906494140625, 2.32275390625, 2.41644287109375, 2.5101318359375, 2.60382080078125, 2.697509765625, 2.79119873046875, 2.8848876953125, 2.97857666015625, 3.072265625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 11.0, 10.0, 21.0, 25.0, 37.0, 37.0, 46.0, 67.0, 77.0, 105.0, 140.0, 169.0, 193.0, 221.0, 237.0, 236.0, 261.0, 271.0, 256.0, 265.0, 249.0, 212.0, 187.0, 153.0, 144.0, 109.0, 77.0, 70.0, 56.0, 37.0, 22.0, 20.0, 16.0, 11.0, 12.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.91015625, -1.857818603515625, -1.80548095703125, -1.753143310546875, -1.7008056640625, -1.648468017578125, -1.59613037109375, -1.543792724609375, -1.491455078125, -1.439117431640625, -1.38677978515625, -1.334442138671875, -1.2821044921875, -1.229766845703125, -1.17742919921875, -1.125091552734375, -1.07275390625, -1.020416259765625, -0.96807861328125, -0.915740966796875, -0.8634033203125, -0.811065673828125, -0.75872802734375, -0.706390380859375, -0.654052734375, -0.601715087890625, -0.54937744140625, -0.497039794921875, -0.4447021484375, -0.392364501953125, -0.34002685546875, -0.287689208984375, -0.2353515625, -0.183013916015625, -0.13067626953125, -0.078338623046875, -0.0260009765625, 0.026336669921875, 0.07867431640625, 0.131011962890625, 0.183349609375, 0.235687255859375, 0.28802490234375, 0.340362548828125, 0.3927001953125, 0.445037841796875, 0.49737548828125, 0.549713134765625, 0.60205078125, 0.654388427734375, 0.70672607421875, 0.759063720703125, 0.8114013671875, 0.863739013671875, 0.91607666015625, 0.968414306640625, 1.020751953125, 1.073089599609375, 1.12542724609375, 1.177764892578125, 1.2301025390625, 1.282440185546875, 1.33477783203125, 1.387115478515625, 1.439453125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 0.0, 4.0, 7.0, 11.0, 13.0, 9.0, 26.0, 19.0, 23.0, 32.0, 36.0, 46.0, 33.0, 49.0, 54.0, 52.0, 53.0, 45.0, 43.0, 52.0, 35.0, 39.0, 44.0, 41.0, 38.0, 30.0, 21.0, 29.0, 27.0, 13.0, 17.0, 11.0, 14.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.072996139526367, -3.9328458309173584, -3.7926955223083496, -3.6525449752807617, -3.512394666671753, -3.372244358062744, -3.2320938110351562, -3.0919435024261475, -2.9517931938171387, -2.81164288520813, -2.671492576599121, -2.531342029571533, -2.3911917209625244, -2.2510414123535156, -2.1108908653259277, -1.970740556716919, -1.8305902481079102, -1.6904399394989014, -1.550289511680603, -1.4101390838623047, -1.269988775253296, -1.129838466644287, -0.9896880388259888, -0.8495376706123352, -0.7093873023986816, -0.5692369341850281, -0.4290865659713745, -0.28893619775772095, -0.14878582954406738, -0.008635461330413818, 0.13151490688323975, 0.2716652750968933, 0.4118156433105469, 0.5519660115242004, 0.692116379737854, 0.8322667479515076, 0.9724171161651611, 1.11256742477417, 1.2527178525924683, 1.3928682804107666, 1.5330185890197754, 1.6731688976287842, 1.8133193254470825, 1.9534697532653809, 2.0936200618743896, 2.2337703704833984, 2.3739209175109863, 2.514071226119995, 2.654221534729004, 2.7943718433380127, 2.9345221519470215, 3.0746726989746094, 3.214823007583618, 3.354973316192627, 3.495123863220215, 3.6352741718292236, 3.7754244804382324, 3.915574789047241, 4.05572509765625, 4.195875644683838, 4.336026191711426, 4.4761762619018555, 4.616326808929443, 4.756476879119873, 4.896627426147461]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 8.0, 6.0, 10.0, 7.0, 17.0, 19.0, 21.0, 27.0, 21.0, 23.0, 25.0, 35.0, 27.0, 33.0, 43.0, 38.0, 49.0, 49.0, 43.0, 33.0, 44.0, 41.0, 27.0, 42.0, 35.0, 33.0, 37.0, 23.0, 22.0, 23.0, 18.0, 16.0, 15.0, 16.0, 12.0, 13.0, 9.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.5045316219329834, -3.404284715652466, -3.3040378093719482, -3.2037906646728516, -3.103543758392334, -3.0032968521118164, -2.903049945831299, -2.8028030395507812, -2.7025561332702637, -2.602309226989746, -2.5020623207092285, -2.401815414428711, -2.3015682697296143, -2.2013213634490967, -2.101074457168579, -2.0008275508880615, -1.9005804061889648, -1.8003334999084473, -1.7000864744186401, -1.5998395681381226, -1.4995925426483154, -1.3993456363677979, -1.2990987300872803, -1.1988518238067627, -1.0986047983169556, -0.9983578324317932, -0.8981108665466309, -0.7978639602661133, -0.6976169943809509, -0.5973700284957886, -0.497123122215271, -0.39687615633010864, -0.2966291904449463, -0.19638223946094513, -0.09613528847694397, 0.004111647605895996, 0.10435861349105835, 0.2046055793762207, 0.3048524856567383, 0.40509945154190063, 0.505346417427063, 0.6055933833122253, 0.7058403491973877, 0.8060872554779053, 0.9063342213630676, 1.00658118724823, 1.1068280935287476, 1.2070751190185547, 1.3073220252990723, 1.4075689315795898, 1.507815957069397, 1.6080628633499146, 1.7083098888397217, 1.8085567951202393, 1.9088037014007568, 2.0090506076812744, 2.109297752380371, 2.2095446586608887, 2.3097915649414062, 2.410038471221924, 2.5102856159210205, 2.610532522201538, 2.7107794284820557, 2.8110263347625732, 2.911273241043091]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 13.0, 9.0, 23.0, 22.0, 34.0, 55.0, 73.0, 90.0, 147.0, 235.0, 343.0, 439.0, 689.0, 1109.0, 1684.0, 2623.0, 3833.0, 6033.0, 9165.0, 13924.0, 21680.0, 33252.0, 50761.0, 75719.0, 108031.0, 142434.0, 154598.0, 132006.0, 96595.0, 65967.0, 44188.0, 28847.0, 18870.0, 12162.0, 7925.0, 5136.0, 3365.0, 2198.0, 1416.0, 935.0, 663.0, 417.0, 282.0, 195.0, 108.0, 90.0, 68.0, 36.0, 19.0, 17.0, 12.0, 7.0, 10.0, 5.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.71826171875, -0.696044921875, -0.673828125, -0.651611328125, -0.62939453125, -0.607177734375, -0.5849609375, -0.562744140625, -0.54052734375, -0.518310546875, -0.49609375, -0.473876953125, -0.45166015625, -0.429443359375, -0.4072265625, -0.385009765625, -0.36279296875, -0.340576171875, -0.318359375, -0.296142578125, -0.27392578125, -0.251708984375, -0.2294921875, -0.207275390625, -0.18505859375, -0.162841796875, -0.140625, -0.118408203125, -0.09619140625, -0.073974609375, -0.0517578125, -0.029541015625, -0.00732421875, 0.014892578125, 0.037109375, 0.059326171875, 0.08154296875, 0.103759765625, 0.1259765625, 0.148193359375, 0.17041015625, 0.192626953125, 0.21484375, 0.237060546875, 0.25927734375, 0.281494140625, 0.3037109375, 0.325927734375, 0.34814453125, 0.370361328125, 0.392578125, 0.414794921875, 0.43701171875, 0.459228515625, 0.4814453125, 0.503662109375, 0.52587890625, 0.548095703125, 0.5703125, 0.592529296875, 0.61474609375, 0.636962890625, 0.6591796875, 0.681396484375, 0.70361328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 9.0, 14.0, 11.0, 22.0, 18.0, 22.0, 27.0, 30.0, 30.0, 42.0, 39.0, 37.0, 29.0, 45.0, 74.0, 59.0, 51.0, 57.0, 44.0, 53.0, 34.0, 33.0, 26.0, 34.0, 30.0, 24.0, 20.0, 13.0, 12.0, 14.0, 11.0, 6.0, 7.0, 4.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.96075439453125, -3.8316650390625, -3.70257568359375, -3.573486328125, -3.44439697265625, -3.3153076171875, -3.18621826171875, -3.05712890625, -2.92803955078125, -2.7989501953125, -2.66986083984375, -2.540771484375, -2.41168212890625, -2.2825927734375, -2.15350341796875, -2.0244140625, -1.89532470703125, -1.7662353515625, -1.63714599609375, -1.508056640625, -1.37896728515625, -1.2498779296875, -1.12078857421875, -0.99169921875, -0.86260986328125, -0.7335205078125, -0.60443115234375, -0.475341796875, -0.34625244140625, -0.2171630859375, -0.08807373046875, 0.041015625, 0.17010498046875, 0.2991943359375, 0.42828369140625, 0.557373046875, 0.68646240234375, 0.8155517578125, 0.94464111328125, 1.07373046875, 1.20281982421875, 1.3319091796875, 1.46099853515625, 1.590087890625, 1.71917724609375, 1.8482666015625, 1.97735595703125, 2.1064453125, 2.23553466796875, 2.3646240234375, 2.49371337890625, 2.622802734375, 2.75189208984375, 2.8809814453125, 3.01007080078125, 3.13916015625, 3.26824951171875, 3.3973388671875, 3.52642822265625, 3.655517578125, 3.78460693359375, 3.9136962890625, 4.04278564453125, 4.171875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 9.0, 4.0, 6.0, 5.0, 15.0, 20.0, 28.0, 26.0, 55.0, 47.0, 87.0, 128.0, 216.0, 266.0, 465.0, 709.0, 990.0, 1555.0, 2407.0, 3710.0, 6013.0, 9889.0, 16661.0, 28912.0, 50259.0, 86383.0, 141128.0, 196176.0, 187269.0, 128610.0, 77118.0, 44587.0, 25592.0, 15111.0, 8983.0, 5521.0, 3291.0, 2174.0, 1369.0, 935.0, 576.0, 389.0, 267.0, 177.0, 139.0, 87.0, 50.0, 45.0, 41.0, 18.0, 15.0, 10.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.87841796875, -0.8499832153320312, -0.8215484619140625, -0.7931137084960938, -0.764678955078125, -0.7362442016601562, -0.7078094482421875, -0.6793746948242188, -0.65093994140625, -0.6225051879882812, -0.5940704345703125, -0.5656356811523438, -0.537200927734375, -0.5087661743164062, -0.4803314208984375, -0.45189666748046875, -0.4234619140625, -0.39502716064453125, -0.3665924072265625, -0.33815765380859375, -0.309722900390625, -0.28128814697265625, -0.2528533935546875, -0.22441864013671875, -0.19598388671875, -0.16754913330078125, -0.1391143798828125, -0.11067962646484375, -0.082244873046875, -0.05381011962890625, -0.0253753662109375, 0.00305938720703125, 0.031494140625, 0.05992889404296875, 0.0883636474609375, 0.11679840087890625, 0.145233154296875, 0.17366790771484375, 0.2021026611328125, 0.23053741455078125, 0.25897216796875, 0.28740692138671875, 0.3158416748046875, 0.34427642822265625, 0.372711181640625, 0.40114593505859375, 0.4295806884765625, 0.45801544189453125, 0.4864501953125, 0.5148849487304688, 0.5433197021484375, 0.5717544555664062, 0.600189208984375, 0.6286239624023438, 0.6570587158203125, 0.6854934692382812, 0.71392822265625, 0.7423629760742188, 0.7707977294921875, 0.7992324829101562, 0.827667236328125, 0.8561019897460938, 0.8845367431640625, 0.9129714965820312, 0.94140625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 5.0, 6.0, 11.0, 3.0, 9.0, 16.0, 14.0, 18.0, 23.0, 35.0, 20.0, 29.0, 43.0, 28.0, 37.0, 34.0, 44.0, 48.0, 46.0, 46.0, 43.0, 39.0, 39.0, 46.0, 35.0, 40.0, 39.0, 22.0, 31.0, 20.0, 18.0, 22.0, 15.0, 20.0, 10.0, 12.0, 8.0, 5.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19921875, -2.129913330078125, -2.06060791015625, -1.991302490234375, -1.9219970703125, -1.852691650390625, -1.78338623046875, -1.714080810546875, -1.644775390625, -1.575469970703125, -1.50616455078125, -1.436859130859375, -1.3675537109375, -1.298248291015625, -1.22894287109375, -1.159637451171875, -1.09033203125, -1.021026611328125, -0.95172119140625, -0.882415771484375, -0.8131103515625, -0.743804931640625, -0.67449951171875, -0.605194091796875, -0.535888671875, -0.466583251953125, -0.39727783203125, -0.327972412109375, -0.2586669921875, -0.189361572265625, -0.12005615234375, -0.050750732421875, 0.0185546875, 0.087860107421875, 0.15716552734375, 0.226470947265625, 0.2957763671875, 0.365081787109375, 0.43438720703125, 0.503692626953125, 0.572998046875, 0.642303466796875, 0.71160888671875, 0.780914306640625, 0.8502197265625, 0.919525146484375, 0.98883056640625, 1.058135986328125, 1.12744140625, 1.196746826171875, 1.26605224609375, 1.335357666015625, 1.4046630859375, 1.473968505859375, 1.54327392578125, 1.612579345703125, 1.681884765625, 1.751190185546875, 1.82049560546875, 1.889801025390625, 1.9591064453125, 2.028411865234375, 2.09771728515625, 2.167022705078125, 2.236328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 12.0, 14.0, 19.0, 30.0, 27.0, 53.0, 68.0, 86.0, 121.0, 183.0, 231.0, 312.0, 435.0, 664.0, 998.0, 1571.0, 2386.0, 3781.0, 6264.0, 10953.0, 20913.0, 45324.0, 118264.0, 341696.0, 305237.0, 103039.0, 40309.0, 19148.0, 10149.0, 5838.0, 3511.0, 2320.0, 1453.0, 948.0, 661.0, 456.0, 292.0, 191.0, 162.0, 121.0, 73.0, 59.0, 48.0, 36.0, 28.0, 23.0, 10.0, 11.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.517578125, -0.5008468627929688, -0.4841156005859375, -0.46738433837890625, -0.450653076171875, -0.43392181396484375, -0.4171905517578125, -0.40045928955078125, -0.38372802734375, -0.36699676513671875, -0.3502655029296875, -0.33353424072265625, -0.316802978515625, -0.30007171630859375, -0.2833404541015625, -0.26660919189453125, -0.2498779296875, -0.23314666748046875, -0.2164154052734375, -0.19968414306640625, -0.182952880859375, -0.16622161865234375, -0.1494903564453125, -0.13275909423828125, -0.11602783203125, -0.09929656982421875, -0.0825653076171875, -0.06583404541015625, -0.049102783203125, -0.03237152099609375, -0.0156402587890625, 0.00109100341796875, 0.017822265625, 0.03455352783203125, 0.0512847900390625, 0.06801605224609375, 0.084747314453125, 0.10147857666015625, 0.1182098388671875, 0.13494110107421875, 0.15167236328125, 0.16840362548828125, 0.1851348876953125, 0.20186614990234375, 0.218597412109375, 0.23532867431640625, 0.2520599365234375, 0.26879119873046875, 0.2855224609375, 0.30225372314453125, 0.3189849853515625, 0.33571624755859375, 0.352447509765625, 0.36917877197265625, 0.3859100341796875, 0.40264129638671875, 0.41937255859375, 0.43610382080078125, 0.4528350830078125, 0.46956634521484375, 0.486297607421875, 0.5030288696289062, 0.5197601318359375, 0.5364913940429688, 0.55322265625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 9.0, 8.0, 4.0, 4.0, 12.0, 14.0, 17.0, 29.0, 24.0, 34.0, 47.0, 42.0, 55.0, 57.0, 58.0, 49.0, 61.0, 48.0, 52.0, 54.0, 41.0, 52.0, 43.0, 25.0, 29.0, 21.0, 28.0, 13.0, 22.0, 13.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4259090423583984e-05, -2.3513101041316986e-05, -2.2767111659049988e-05, -2.202112227678299e-05, -2.127513289451599e-05, -2.0529143512248993e-05, -1.9783154129981995e-05, -1.9037164747714996e-05, -1.8291175365447998e-05, -1.7545185983181e-05, -1.6799196600914e-05, -1.6053207218647003e-05, -1.5307217836380005e-05, -1.4561228454113007e-05, -1.3815239071846008e-05, -1.306924968957901e-05, -1.2323260307312012e-05, -1.1577270925045013e-05, -1.0831281542778015e-05, -1.0085292160511017e-05, -9.339302778244019e-06, -8.59331339597702e-06, -7.847324013710022e-06, -7.101334631443024e-06, -6.355345249176025e-06, -5.609355866909027e-06, -4.863366484642029e-06, -4.1173771023750305e-06, -3.3713877201080322e-06, -2.625398337841034e-06, -1.8794089555740356e-06, -1.1334195733070374e-06, -3.8743019104003906e-07, 3.5855919122695923e-07, 1.1045485734939575e-06, 1.8505379557609558e-06, 2.596527338027954e-06, 3.3425167202949524e-06, 4.088506102561951e-06, 4.834495484828949e-06, 5.580484867095947e-06, 6.3264742493629456e-06, 7.072463631629944e-06, 7.818453013896942e-06, 8.56444239616394e-06, 9.310431778430939e-06, 1.0056421160697937e-05, 1.0802410542964935e-05, 1.1548399925231934e-05, 1.2294389307498932e-05, 1.304037868976593e-05, 1.3786368072032928e-05, 1.4532357454299927e-05, 1.5278346836566925e-05, 1.6024336218833923e-05, 1.677032560110092e-05, 1.751631498336792e-05, 1.8262304365634918e-05, 1.9008293747901917e-05, 1.9754283130168915e-05, 2.0500272512435913e-05, 2.124626189470291e-05, 2.199225127696991e-05, 2.2738240659236908e-05, 2.3484230041503906e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 7.0, 15.0, 21.0, 32.0, 38.0, 64.0, 67.0, 123.0, 146.0, 231.0, 309.0, 460.0, 692.0, 952.0, 1537.0, 2281.0, 3514.0, 5741.0, 9430.0, 16148.0, 29452.0, 55141.0, 109463.0, 207699.0, 257993.0, 164112.0, 83079.0, 42523.0, 22740.0, 13112.0, 7630.0, 4728.0, 3020.0, 1964.0, 1295.0, 843.0, 580.0, 406.0, 292.0, 217.0, 135.0, 97.0, 60.0, 47.0, 40.0, 23.0, 19.0, 8.0, 3.0, 11.0, 10.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5765151977539062, -0.5568389892578125, -0.5371627807617188, -0.517486572265625, -0.49781036376953125, -0.4781341552734375, -0.45845794677734375, -0.43878173828125, -0.41910552978515625, -0.3994293212890625, -0.37975311279296875, -0.360076904296875, -0.34040069580078125, -0.3207244873046875, -0.30104827880859375, -0.2813720703125, -0.26169586181640625, -0.2420196533203125, -0.22234344482421875, -0.202667236328125, -0.18299102783203125, -0.1633148193359375, -0.14363861083984375, -0.12396240234375, -0.10428619384765625, -0.0846099853515625, -0.06493377685546875, -0.045257568359375, -0.02558135986328125, -0.0059051513671875, 0.01377105712890625, 0.033447265625, 0.05312347412109375, 0.0727996826171875, 0.09247589111328125, 0.112152099609375, 0.13182830810546875, 0.1515045166015625, 0.17118072509765625, 0.19085693359375, 0.21053314208984375, 0.2302093505859375, 0.24988555908203125, 0.269561767578125, 0.28923797607421875, 0.3089141845703125, 0.32859039306640625, 0.3482666015625, 0.36794281005859375, 0.3876190185546875, 0.40729522705078125, 0.426971435546875, 0.44664764404296875, 0.4663238525390625, 0.48600006103515625, 0.50567626953125, 0.5253524780273438, 0.5450286865234375, 0.5647048950195312, 0.584381103515625, 0.6040573120117188, 0.6237335205078125, 0.6434097290039062, 0.6630859375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 7.0, 6.0, 9.0, 13.0, 19.0, 23.0, 29.0, 40.0, 41.0, 58.0, 89.0, 102.0, 103.0, 93.0, 94.0, 63.0, 39.0, 35.0, 25.0, 29.0, 19.0, 17.0, 10.0, 10.0, 7.0, 6.0, 4.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2301025390625, -0.2238025665283203, -0.21750259399414062, -0.21120262145996094, -0.20490264892578125, -0.19860267639160156, -0.19230270385742188, -0.1860027313232422, -0.1797027587890625, -0.1734027862548828, -0.16710281372070312, -0.16080284118652344, -0.15450286865234375, -0.14820289611816406, -0.14190292358398438, -0.1356029510498047, -0.129302978515625, -0.12300300598144531, -0.11670303344726562, -0.11040306091308594, -0.10410308837890625, -0.09780311584472656, -0.09150314331054688, -0.08520317077636719, -0.0789031982421875, -0.07260322570800781, -0.06630325317382812, -0.06000328063964844, -0.05370330810546875, -0.04740333557128906, -0.041103363037109375, -0.03480339050292969, -0.02850341796875, -0.022203445434570312, -0.015903472900390625, -0.009603500366210938, -0.00330352783203125, 0.0029964447021484375, 0.009296417236328125, 0.015596389770507812, 0.0218963623046875, 0.028196334838867188, 0.034496307373046875, 0.04079627990722656, 0.04709625244140625, 0.05339622497558594, 0.059696197509765625, 0.06599617004394531, 0.072296142578125, 0.07859611511230469, 0.08489608764648438, 0.09119606018066406, 0.09749603271484375, 0.10379600524902344, 0.11009597778320312, 0.11639595031738281, 0.1226959228515625, 0.1289958953857422, 0.13529586791992188, 0.14159584045410156, 0.14789581298828125, 0.15419578552246094, 0.16049575805664062, 0.1667957305908203, 0.173095703125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 3.0, 7.0, 11.0, 14.0, 12.0, 23.0, 20.0, 20.0, 35.0, 42.0, 41.0, 43.0, 44.0, 53.0, 52.0, 54.0, 45.0, 53.0, 39.0, 37.0, 36.0, 49.0, 39.0, 34.0, 29.0, 26.0, 27.0, 24.0, 11.0, 15.0, 17.0, 12.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.080476760864258, -3.939161539077759, -3.797846555709839, -3.65653133392334, -3.51521635055542, -3.373901128768921, -3.232585906982422, -3.091270923614502, -2.949955940246582, -2.808640718460083, -2.667325735092163, -2.526010513305664, -2.384695529937744, -2.243380308151245, -2.102065086364746, -1.9607501029968262, -1.8194348812103271, -1.6781197786331177, -1.5368046760559082, -1.3954894542694092, -1.2541744709014893, -1.1128592491149902, -0.9715441465377808, -0.8302290439605713, -0.6889139413833618, -0.5475988388061523, -0.4062837064266205, -0.2649685740470886, -0.12365347146987915, 0.017661631107330322, 0.15897679328918457, 0.30029189586639404, 0.4416069984436035, 0.582922101020813, 0.7242372035980225, 0.8655523657798767, 1.0068674087524414, 1.1481826305389404, 1.28949773311615, 1.4308128356933594, 1.5721279382705688, 1.7134430408477783, 1.8547581434249878, 1.9960732460021973, 2.1373884677886963, 2.278703451156616, 2.4200186729431152, 2.561333656311035, 2.702648878097534, 2.843964099884033, 2.985279083251953, 3.126594305038452, 3.267909288406372, 3.409224510192871, 3.550539493560791, 3.69185471534729, 3.833169937133789, 3.974485158920288, 4.115800380706787, 4.257115364074707, 4.398430347442627, 4.539745330810547, 4.681060791015625, 4.822375774383545, 4.963690757751465]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 7.0, 6.0, 8.0, 10.0, 9.0, 14.0, 19.0, 25.0, 23.0, 21.0, 21.0, 28.0, 26.0, 33.0, 34.0, 37.0, 44.0, 53.0, 46.0, 44.0, 35.0, 39.0, 46.0, 31.0, 36.0, 36.0, 32.0, 39.0, 21.0, 23.0, 25.0, 16.0, 16.0, 17.0, 17.0, 8.0, 15.0, 8.0, 7.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.544121503829956, -3.4429636001586914, -3.341805934906006, -3.240648031234741, -3.1394901275634766, -3.038332223892212, -2.9371743202209473, -2.8360166549682617, -2.734858751296997, -2.6337008476257324, -2.532543182373047, -2.4313852787017822, -2.3302273750305176, -2.229069471359253, -2.1279115676879883, -2.0267539024353027, -1.925595998764038, -1.8244380950927734, -1.7232803106307983, -1.6221225261688232, -1.5209646224975586, -1.419806718826294, -1.3186489343643188, -1.2174911499023438, -1.116333246231079, -1.0151753425598145, -0.9140175580978394, -0.8128597140312195, -0.7117018699645996, -0.6105440258979797, -0.5093861818313599, -0.40822833776474, -0.3070704936981201, -0.20591264963150024, -0.10475480556488037, -0.003596961498260498, 0.09756088256835938, 0.19871872663497925, 0.2998765707015991, 0.401034414768219, 0.5021922588348389, 0.6033501029014587, 0.7045079469680786, 0.8056657910346985, 0.9068236351013184, 1.007981538772583, 1.109139323234558, 1.2102971076965332, 1.3114550113677979, 1.4126129150390625, 1.5137706995010376, 1.6149284839630127, 1.7160863876342773, 1.817244291305542, 1.918402075767517, 2.019559860229492, 2.120717763900757, 2.2218756675720215, 2.323033332824707, 2.4241912364959717, 2.5253491401672363, 2.626507043838501, 2.7276649475097656, 2.828822612762451, 2.929980516433716]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 11.0, 8.0, 18.0, 31.0, 49.0, 64.0, 105.0, 193.0, 297.0, 452.0, 777.0, 1245.0, 1996.0, 3214.0, 5219.0, 8187.0, 13202.0, 20357.0, 30115.0, 43785.0, 60437.0, 78977.0, 97139.0, 110044.0, 114605.0, 108107.0, 94781.0, 75695.0, 57701.0, 41740.0, 28295.0, 18724.0, 12187.0, 7927.0, 4833.0, 3035.0, 1904.0, 1158.0, 761.0, 446.0, 248.0, 180.0, 114.0, 69.0, 46.0, 35.0, 15.0, 12.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-2.095703125, -2.03106689453125, -1.9664306640625, -1.90179443359375, -1.837158203125, -1.77252197265625, -1.7078857421875, -1.64324951171875, -1.57861328125, -1.51397705078125, -1.4493408203125, -1.38470458984375, -1.320068359375, -1.25543212890625, -1.1907958984375, -1.12615966796875, -1.0615234375, -0.99688720703125, -0.9322509765625, -0.86761474609375, -0.802978515625, -0.73834228515625, -0.6737060546875, -0.60906982421875, -0.54443359375, -0.47979736328125, -0.4151611328125, -0.35052490234375, -0.285888671875, -0.22125244140625, -0.1566162109375, -0.09197998046875, -0.02734375, 0.03729248046875, 0.1019287109375, 0.16656494140625, 0.231201171875, 0.29583740234375, 0.3604736328125, 0.42510986328125, 0.48974609375, 0.55438232421875, 0.6190185546875, 0.68365478515625, 0.748291015625, 0.81292724609375, 0.8775634765625, 0.94219970703125, 1.0068359375, 1.07147216796875, 1.1361083984375, 1.20074462890625, 1.265380859375, 1.33001708984375, 1.3946533203125, 1.45928955078125, 1.52392578125, 1.58856201171875, 1.6531982421875, 1.71783447265625, 1.782470703125, 1.84710693359375, 1.9117431640625, 1.97637939453125, 2.041015625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 7.0, 8.0, 12.0, 14.0, 22.0, 13.0, 14.0, 22.0, 31.0, 28.0, 22.0, 29.0, 33.0, 33.0, 42.0, 33.0, 40.0, 40.0, 52.0, 35.0, 34.0, 40.0, 32.0, 31.0, 41.0, 26.0, 30.0, 20.0, 28.0, 22.0, 30.0, 16.0, 20.0, 12.0, 15.0, 9.0, 8.0, 11.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.916015625, -2.81646728515625, -2.7169189453125, -2.61737060546875, -2.517822265625, -2.41827392578125, -2.3187255859375, -2.21917724609375, -2.11962890625, -2.02008056640625, -1.9205322265625, -1.82098388671875, -1.721435546875, -1.62188720703125, -1.5223388671875, -1.42279052734375, -1.3232421875, -1.22369384765625, -1.1241455078125, -1.02459716796875, -0.925048828125, -0.82550048828125, -0.7259521484375, -0.62640380859375, -0.52685546875, -0.42730712890625, -0.3277587890625, -0.22821044921875, -0.128662109375, -0.02911376953125, 0.0704345703125, 0.16998291015625, 0.26953125, 0.36907958984375, 0.4686279296875, 0.56817626953125, 0.667724609375, 0.76727294921875, 0.8668212890625, 0.96636962890625, 1.06591796875, 1.16546630859375, 1.2650146484375, 1.36456298828125, 1.464111328125, 1.56365966796875, 1.6632080078125, 1.76275634765625, 1.8623046875, 1.96185302734375, 2.0614013671875, 2.16094970703125, 2.260498046875, 2.36004638671875, 2.4595947265625, 2.55914306640625, 2.65869140625, 2.75823974609375, 2.8577880859375, 2.95733642578125, 3.056884765625, 3.15643310546875, 3.2559814453125, 3.35552978515625, 3.455078125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 6.0, 13.0, 20.0, 28.0, 34.0, 52.0, 76.0, 122.0, 169.0, 260.0, 371.0, 561.0, 795.0, 1264.0, 1997.0, 2851.0, 4440.0, 6644.0, 10105.0, 15290.0, 22611.0, 32520.0, 46036.0, 61666.0, 78470.0, 94495.0, 105444.0, 108590.0, 102895.0, 90152.0, 73564.0, 56844.0, 41166.0, 29131.0, 19815.0, 13519.0, 9128.0, 6006.0, 3930.0, 2503.0, 1688.0, 1076.0, 753.0, 487.0, 291.0, 232.0, 140.0, 96.0, 81.0, 41.0, 30.0, 17.0, 18.0, 11.0, 8.0, 2.0, 4.0, 2.0], "bins": [-2.224609375, -2.15789794921875, -2.0911865234375, -2.02447509765625, -1.957763671875, -1.89105224609375, -1.8243408203125, -1.75762939453125, -1.69091796875, -1.62420654296875, -1.5574951171875, -1.49078369140625, -1.424072265625, -1.35736083984375, -1.2906494140625, -1.22393798828125, -1.1572265625, -1.09051513671875, -1.0238037109375, -0.95709228515625, -0.890380859375, -0.82366943359375, -0.7569580078125, -0.69024658203125, -0.62353515625, -0.55682373046875, -0.4901123046875, -0.42340087890625, -0.356689453125, -0.28997802734375, -0.2232666015625, -0.15655517578125, -0.08984375, -0.02313232421875, 0.0435791015625, 0.11029052734375, 0.177001953125, 0.24371337890625, 0.3104248046875, 0.37713623046875, 0.44384765625, 0.51055908203125, 0.5772705078125, 0.64398193359375, 0.710693359375, 0.77740478515625, 0.8441162109375, 0.91082763671875, 0.9775390625, 1.04425048828125, 1.1109619140625, 1.17767333984375, 1.244384765625, 1.31109619140625, 1.3778076171875, 1.44451904296875, 1.51123046875, 1.57794189453125, 1.6446533203125, 1.71136474609375, 1.778076171875, 1.84478759765625, 1.9114990234375, 1.97821044921875, 2.044921875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 5.0, 5.0, 10.0, 14.0, 10.0, 17.0, 9.0, 18.0, 23.0, 27.0, 21.0, 22.0, 24.0, 25.0, 35.0, 39.0, 38.0, 37.0, 34.0, 48.0, 25.0, 31.0, 50.0, 42.0, 35.0, 27.0, 42.0, 29.0, 34.0, 28.0, 17.0, 32.0, 19.0, 25.0, 19.0, 13.0, 12.0, 14.0, 4.0, 8.0, 3.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7529296875, -1.6934661865234375, -1.634002685546875, -1.5745391845703125, -1.51507568359375, -1.4556121826171875, -1.396148681640625, -1.3366851806640625, -1.2772216796875, -1.2177581787109375, -1.158294677734375, -1.0988311767578125, -1.03936767578125, -0.9799041748046875, -0.920440673828125, -0.8609771728515625, -0.801513671875, -0.7420501708984375, -0.682586669921875, -0.6231231689453125, -0.56365966796875, -0.5041961669921875, -0.444732666015625, -0.3852691650390625, -0.3258056640625, -0.2663421630859375, -0.206878662109375, -0.1474151611328125, -0.08795166015625, -0.0284881591796875, 0.030975341796875, 0.0904388427734375, 0.14990234375, 0.2093658447265625, 0.268829345703125, 0.3282928466796875, 0.38775634765625, 0.4472198486328125, 0.506683349609375, 0.5661468505859375, 0.6256103515625, 0.6850738525390625, 0.744537353515625, 0.8040008544921875, 0.86346435546875, 0.9229278564453125, 0.982391357421875, 1.0418548583984375, 1.101318359375, 1.1607818603515625, 1.220245361328125, 1.2797088623046875, 1.33917236328125, 1.3986358642578125, 1.458099365234375, 1.5175628662109375, 1.5770263671875, 1.6364898681640625, 1.695953369140625, 1.7554168701171875, 1.81488037109375, 1.8743438720703125, 1.933807373046875, 1.9932708740234375, 2.052734375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 16.0, 22.0, 30.0, 46.0, 76.0, 79.0, 131.0, 193.0, 255.0, 378.0, 536.0, 785.0, 1254.0, 1834.0, 2872.0, 4855.0, 8611.0, 16627.0, 33492.0, 67499.0, 124095.0, 183565.0, 206651.0, 170396.0, 107148.0, 56342.0, 27984.0, 13730.0, 7178.0, 4145.0, 2610.0, 1604.0, 1100.0, 774.0, 491.0, 324.0, 245.0, 167.0, 120.0, 82.0, 72.0, 46.0, 33.0, 13.0, 13.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7421875, -1.6866455078125, -1.631103515625, -1.5755615234375, -1.52001953125, -1.4644775390625, -1.408935546875, -1.3533935546875, -1.2978515625, -1.2423095703125, -1.186767578125, -1.1312255859375, -1.07568359375, -1.0201416015625, -0.964599609375, -0.9090576171875, -0.853515625, -0.7979736328125, -0.742431640625, -0.6868896484375, -0.63134765625, -0.5758056640625, -0.520263671875, -0.4647216796875, -0.4091796875, -0.3536376953125, -0.298095703125, -0.2425537109375, -0.18701171875, -0.1314697265625, -0.075927734375, -0.0203857421875, 0.03515625, 0.0906982421875, 0.146240234375, 0.2017822265625, 0.25732421875, 0.3128662109375, 0.368408203125, 0.4239501953125, 0.4794921875, 0.5350341796875, 0.590576171875, 0.6461181640625, 0.70166015625, 0.7572021484375, 0.812744140625, 0.8682861328125, 0.923828125, 0.9793701171875, 1.034912109375, 1.0904541015625, 1.14599609375, 1.2015380859375, 1.257080078125, 1.3126220703125, 1.3681640625, 1.4237060546875, 1.479248046875, 1.5347900390625, 1.59033203125, 1.6458740234375, 1.701416015625, 1.7569580078125, 1.8125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 4.0, 12.0, 10.0, 29.0, 29.0, 43.0, 40.0, 56.0, 83.0, 86.0, 82.0, 88.0, 71.0, 68.0, 81.0, 56.0, 31.0, 26.0, 28.0, 13.0, 10.0, 6.0, 9.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002448558807373047, -0.00023787468671798706, -0.00023089349269866943, -0.0002239122986793518, -0.00021693110466003418, -0.00020994991064071655, -0.00020296871662139893, -0.0001959875226020813, -0.00018900632858276367, -0.00018202513456344604, -0.00017504394054412842, -0.0001680627465248108, -0.00016108155250549316, -0.00015410035848617554, -0.0001471191644668579, -0.00014013797044754028, -0.00013315677642822266, -0.00012617558240890503, -0.0001191943883895874, -0.00011221319437026978, -0.00010523200035095215, -9.825080633163452e-05, -9.12696123123169e-05, -8.428841829299927e-05, -7.730722427368164e-05, -7.032603025436401e-05, -6.334483623504639e-05, -5.636364221572876e-05, -4.938244819641113e-05, -4.2401254177093506e-05, -3.542006015777588e-05, -2.8438866138458252e-05, -2.1457672119140625e-05, -1.4476478099822998e-05, -7.495284080505371e-06, -5.140900611877441e-07, 6.467103958129883e-06, 1.344829797744751e-05, 2.0429491996765137e-05, 2.7410686016082764e-05, 3.439188003540039e-05, 4.137307405471802e-05, 4.8354268074035645e-05, 5.533546209335327e-05, 6.23166561126709e-05, 6.929785013198853e-05, 7.627904415130615e-05, 8.326023817062378e-05, 9.02414321899414e-05, 9.722262620925903e-05, 0.00010420382022857666, 0.00011118501424789429, 0.00011816620826721191, 0.00012514740228652954, 0.00013212859630584717, 0.0001391097903251648, 0.00014609098434448242, 0.00015307217836380005, 0.00016005337238311768, 0.0001670345664024353, 0.00017401576042175293, 0.00018099695444107056, 0.00018797814846038818, 0.0001949593424797058, 0.00020194053649902344]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 8.0, 7.0, 14.0, 21.0, 30.0, 44.0, 72.0, 112.0, 151.0, 262.0, 368.0, 567.0, 883.0, 1384.0, 2350.0, 3866.0, 6887.0, 14517.0, 32230.0, 74050.0, 150913.0, 229577.0, 231993.0, 155453.0, 76619.0, 33579.0, 14847.0, 7327.0, 4049.0, 2236.0, 1453.0, 928.0, 612.0, 389.0, 279.0, 164.0, 96.0, 76.0, 40.0, 43.0, 17.0, 8.0, 11.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.205078125, -2.1383056640625, -2.071533203125, -2.0047607421875, -1.93798828125, -1.8712158203125, -1.804443359375, -1.7376708984375, -1.6708984375, -1.6041259765625, -1.537353515625, -1.4705810546875, -1.40380859375, -1.3370361328125, -1.270263671875, -1.2034912109375, -1.13671875, -1.0699462890625, -1.003173828125, -0.9364013671875, -0.86962890625, -0.8028564453125, -0.736083984375, -0.6693115234375, -0.6025390625, -0.5357666015625, -0.468994140625, -0.4022216796875, -0.33544921875, -0.2686767578125, -0.201904296875, -0.1351318359375, -0.068359375, -0.0015869140625, 0.065185546875, 0.1319580078125, 0.19873046875, 0.2655029296875, 0.332275390625, 0.3990478515625, 0.4658203125, 0.5325927734375, 0.599365234375, 0.6661376953125, 0.73291015625, 0.7996826171875, 0.866455078125, 0.9332275390625, 1.0, 1.0667724609375, 1.133544921875, 1.2003173828125, 1.26708984375, 1.3338623046875, 1.400634765625, 1.4674072265625, 1.5341796875, 1.6009521484375, 1.667724609375, 1.7344970703125, 1.80126953125, 1.8680419921875, 1.934814453125, 2.0015869140625, 2.068359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 10.0, 14.0, 16.0, 25.0, 45.0, 51.0, 45.0, 62.0, 68.0, 67.0, 81.0, 90.0, 81.0, 70.0, 52.0, 44.0, 40.0, 39.0, 22.0, 22.0, 11.0, 10.0, 8.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.5912933349609375, -0.572235107421875, -0.5531768798828125, -0.53411865234375, -0.5150604248046875, -0.496002197265625, -0.4769439697265625, -0.4578857421875, -0.4388275146484375, -0.419769287109375, -0.4007110595703125, -0.38165283203125, -0.3625946044921875, -0.343536376953125, -0.3244781494140625, -0.305419921875, -0.2863616943359375, -0.267303466796875, -0.2482452392578125, -0.22918701171875, -0.2101287841796875, -0.191070556640625, -0.1720123291015625, -0.1529541015625, -0.1338958740234375, -0.114837646484375, -0.0957794189453125, -0.07672119140625, -0.0576629638671875, -0.038604736328125, -0.0195465087890625, -0.00048828125, 0.0185699462890625, 0.037628173828125, 0.0566864013671875, 0.07574462890625, 0.0948028564453125, 0.113861083984375, 0.1329193115234375, 0.1519775390625, 0.1710357666015625, 0.190093994140625, 0.2091522216796875, 0.22821044921875, 0.2472686767578125, 0.266326904296875, 0.2853851318359375, 0.304443359375, 0.3235015869140625, 0.342559814453125, 0.3616180419921875, 0.38067626953125, 0.3997344970703125, 0.418792724609375, 0.4378509521484375, 0.4569091796875, 0.4759674072265625, 0.495025634765625, 0.5140838623046875, 0.53314208984375, 0.5522003173828125, 0.571258544921875, 0.5903167724609375, 0.609375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 6.0, 12.0, 11.0, 12.0, 11.0, 18.0, 23.0, 26.0, 28.0, 24.0, 38.0, 46.0, 50.0, 55.0, 48.0, 52.0, 54.0, 43.0, 38.0, 47.0, 36.0, 43.0, 43.0, 36.0, 25.0, 23.0, 23.0, 21.0, 21.0, 21.0, 12.0, 11.0, 12.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.149673938751221, -4.006742000579834, -3.8638100624084473, -3.7208781242370605, -3.577946186065674, -3.435014247894287, -3.2920825481414795, -3.1491506099700928, -3.006218671798706, -2.8632867336273193, -2.7203547954559326, -2.577422857284546, -2.4344911575317383, -2.2915592193603516, -2.148627281188965, -2.005695343017578, -1.8627634048461914, -1.7198314666748047, -1.576899528503418, -1.4339677095413208, -1.291035771369934, -1.1481038331985474, -1.0051720142364502, -0.8622400760650635, -0.7193081378936768, -0.57637619972229, -0.4334443211555481, -0.29051241278648376, -0.14758050441741943, -0.004648566246032715, 0.13828331232070923, 0.28121519088745117, 0.4241471290588379, 0.5670790672302246, 0.7100109457969666, 0.8529428243637085, 0.9958747625350952, 1.138806700706482, 1.281738519668579, 1.4246704578399658, 1.5676023960113525, 1.7105343341827393, 1.853466272354126, 1.9963980913162231, 2.1393299102783203, 2.282261848449707, 2.4251937866210938, 2.5681257247924805, 2.711057662963867, 2.853989601135254, 2.9969215393066406, 3.1398534774780273, 3.282785415649414, 3.425717353820801, 3.5686490535736084, 3.711580991744995, 3.854512929916382, 3.9974448680877686, 4.140376567840576, 4.283308506011963, 4.42624044418335, 4.569172382354736, 4.712104320526123, 4.85503625869751, 4.9979681968688965]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 4.0, 10.0, 11.0, 10.0, 11.0, 13.0, 18.0, 24.0, 18.0, 25.0, 27.0, 28.0, 26.0, 48.0, 37.0, 31.0, 48.0, 44.0, 43.0, 49.0, 37.0, 53.0, 33.0, 47.0, 47.0, 26.0, 26.0, 17.0, 23.0, 25.0, 17.0, 22.0, 20.0, 16.0, 8.0, 10.0, 10.0, 7.0, 5.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0], "bins": [-4.125625133514404, -4.008246421813965, -3.890867233276367, -3.7734885215759277, -3.656109571456909, -3.5387306213378906, -3.421351671218872, -3.3039727210998535, -3.186594009399414, -3.0692150592803955, -2.951836109161377, -2.8344573974609375, -2.717078447341919, -2.5996994972229004, -2.482320547103882, -2.3649415969848633, -2.2475626468658447, -2.130183696746826, -2.0128047466278076, -1.8954259157180786, -1.7780470848083496, -1.660668134689331, -1.5432891845703125, -1.425910234451294, -1.308531403541565, -1.1911524534225464, -1.0737736225128174, -0.9563946723937988, -0.839015781879425, -0.7216368913650513, -0.6042579412460327, -0.48687905073165894, -0.36950016021728516, -0.2521212697029114, -0.1347423493862152, -0.017363429069519043, 0.10001546144485474, 0.21739435195922852, 0.33477330207824707, 0.45215219259262085, 0.5695310831069946, 0.6869099736213684, 0.8042888641357422, 0.9216678142547607, 1.0390467643737793, 1.1564255952835083, 1.2738045454025269, 1.3911833763122559, 1.5085623264312744, 1.625941276550293, 1.743320107460022, 1.8606990575790405, 1.9780778884887695, 2.095456838607788, 2.2128357887268066, 2.330214738845825, 2.4475936889648438, 2.5649726390838623, 2.682351589202881, 2.7997303009033203, 2.917109251022339, 3.0344882011413574, 3.151867151260376, 3.2692461013793945, 3.386624813079834]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 12.0, 28.0, 34.0, 47.0, 92.0, 123.0, 166.0, 233.0, 398.0, 595.0, 981.0, 1544.0, 2363.0, 3999.0, 6436.0, 10950.0, 18336.0, 31499.0, 55303.0, 95817.0, 166694.0, 284017.0, 452038.0, 634462.0, 716733.0, 624006.0, 437497.0, 271210.0, 160114.0, 91545.0, 52437.0, 30475.0, 17779.0, 10376.0, 6279.0, 3676.0, 2255.0, 1442.0, 898.0, 526.0, 327.0, 211.0, 130.0, 71.0, 44.0, 24.0, 19.0, 13.0, 15.0, 3.0, 0.0, 2.0], "bins": [-5.26953125, -5.125030517578125, -4.98052978515625, -4.836029052734375, -4.6915283203125, -4.547027587890625, -4.40252685546875, -4.258026123046875, -4.113525390625, -3.969024658203125, -3.82452392578125, -3.680023193359375, -3.5355224609375, -3.391021728515625, -3.24652099609375, -3.102020263671875, -2.95751953125, -2.813018798828125, -2.66851806640625, -2.524017333984375, -2.3795166015625, -2.235015869140625, -2.09051513671875, -1.946014404296875, -1.801513671875, -1.657012939453125, -1.51251220703125, -1.368011474609375, -1.2235107421875, -1.079010009765625, -0.93450927734375, -0.790008544921875, -0.6455078125, -0.501007080078125, -0.35650634765625, -0.212005615234375, -0.0675048828125, 0.076995849609375, 0.22149658203125, 0.365997314453125, 0.510498046875, 0.654998779296875, 0.79949951171875, 0.944000244140625, 1.0885009765625, 1.233001708984375, 1.37750244140625, 1.522003173828125, 1.66650390625, 1.811004638671875, 1.95550537109375, 2.100006103515625, 2.2445068359375, 2.389007568359375, 2.53350830078125, 2.678009033203125, 2.822509765625, 2.967010498046875, 3.11151123046875, 3.256011962890625, 3.4005126953125, 3.545013427734375, 3.68951416015625, 3.834014892578125, 3.978515625]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 4.0, 6.0, 13.0, 12.0, 15.0, 17.0, 20.0, 17.0, 23.0, 28.0, 30.0, 35.0, 42.0, 32.0, 35.0, 38.0, 38.0, 47.0, 50.0, 37.0, 42.0, 37.0, 38.0, 45.0, 39.0, 32.0, 26.0, 29.0, 14.0, 18.0, 20.0, 12.0, 13.0, 17.0, 17.0, 9.0, 7.0, 7.0, 12.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.736328125, -3.61822509765625, -3.5001220703125, -3.38201904296875, -3.263916015625, -3.14581298828125, -3.0277099609375, -2.90960693359375, -2.79150390625, -2.67340087890625, -2.5552978515625, -2.43719482421875, -2.319091796875, -2.20098876953125, -2.0828857421875, -1.96478271484375, -1.8466796875, -1.72857666015625, -1.6104736328125, -1.49237060546875, -1.374267578125, -1.25616455078125, -1.1380615234375, -1.01995849609375, -0.90185546875, -0.78375244140625, -0.6656494140625, -0.54754638671875, -0.429443359375, -0.31134033203125, -0.1932373046875, -0.07513427734375, 0.04296875, 0.16107177734375, 0.2791748046875, 0.39727783203125, 0.515380859375, 0.63348388671875, 0.7515869140625, 0.86968994140625, 0.98779296875, 1.10589599609375, 1.2239990234375, 1.34210205078125, 1.460205078125, 1.57830810546875, 1.6964111328125, 1.81451416015625, 1.9326171875, 2.05072021484375, 2.1688232421875, 2.28692626953125, 2.405029296875, 2.52313232421875, 2.6412353515625, 2.75933837890625, 2.87744140625, 2.99554443359375, 3.1136474609375, 3.23175048828125, 3.349853515625, 3.46795654296875, 3.5860595703125, 3.70416259765625, 3.822265625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 12.0, 19.0, 23.0, 37.0, 65.0, 124.0, 204.0, 294.0, 531.0, 924.0, 1563.0, 2805.0, 4727.0, 8332.0, 14990.0, 27004.0, 48049.0, 86296.0, 150623.0, 250802.0, 395535.0, 558656.0, 673454.0, 642958.0, 499298.0, 337153.0, 208527.0, 123051.0, 69896.0, 38982.0, 21476.0, 11957.0, 6731.0, 3894.0, 2114.0, 1284.0, 774.0, 410.0, 256.0, 169.0, 112.0, 68.0, 48.0, 19.0, 7.0, 8.0, 11.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.4991455078125, -5.314697265625, -5.1302490234375, -4.94580078125, -4.7613525390625, -4.576904296875, -4.3924560546875, -4.2080078125, -4.0235595703125, -3.839111328125, -3.6546630859375, -3.47021484375, -3.2857666015625, -3.101318359375, -2.9168701171875, -2.732421875, -2.5479736328125, -2.363525390625, -2.1790771484375, -1.99462890625, -1.8101806640625, -1.625732421875, -1.4412841796875, -1.2568359375, -1.0723876953125, -0.887939453125, -0.7034912109375, -0.51904296875, -0.3345947265625, -0.150146484375, 0.0343017578125, 0.21875, 0.4031982421875, 0.587646484375, 0.7720947265625, 0.95654296875, 1.1409912109375, 1.325439453125, 1.5098876953125, 1.6943359375, 1.8787841796875, 2.063232421875, 2.2476806640625, 2.43212890625, 2.6165771484375, 2.801025390625, 2.9854736328125, 3.169921875, 3.3543701171875, 3.538818359375, 3.7232666015625, 3.90771484375, 4.0921630859375, 4.276611328125, 4.4610595703125, 4.6455078125, 4.8299560546875, 5.014404296875, 5.1988525390625, 5.38330078125, 5.5677490234375, 5.752197265625, 5.9366455078125, 6.12109375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 10.0, 3.0, 7.0, 9.0, 11.0, 11.0, 28.0, 32.0, 53.0, 57.0, 67.0, 74.0, 97.0, 110.0, 132.0, 141.0, 198.0, 189.0, 231.0, 230.0, 266.0, 244.0, 272.0, 229.0, 228.0, 191.0, 170.0, 145.0, 125.0, 83.0, 94.0, 79.0, 73.0, 48.0, 25.0, 35.0, 25.0, 12.0, 12.0, 4.0, 6.0, 11.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.406463623046875, -2.33441162109375, -2.262359619140625, -2.1903076171875, -2.118255615234375, -2.04620361328125, -1.974151611328125, -1.902099609375, -1.830047607421875, -1.75799560546875, -1.685943603515625, -1.6138916015625, -1.541839599609375, -1.46978759765625, -1.397735595703125, -1.32568359375, -1.253631591796875, -1.18157958984375, -1.109527587890625, -1.0374755859375, -0.965423583984375, -0.89337158203125, -0.821319580078125, -0.749267578125, -0.677215576171875, -0.60516357421875, -0.533111572265625, -0.4610595703125, -0.389007568359375, -0.31695556640625, -0.244903564453125, -0.1728515625, -0.100799560546875, -0.02874755859375, 0.043304443359375, 0.1153564453125, 0.187408447265625, 0.25946044921875, 0.331512451171875, 0.403564453125, 0.475616455078125, 0.54766845703125, 0.619720458984375, 0.6917724609375, 0.763824462890625, 0.83587646484375, 0.907928466796875, 0.97998046875, 1.052032470703125, 1.12408447265625, 1.196136474609375, 1.2681884765625, 1.340240478515625, 1.41229248046875, 1.484344482421875, 1.556396484375, 1.628448486328125, 1.70050048828125, 1.772552490234375, 1.8446044921875, 1.916656494140625, 1.98870849609375, 2.060760498046875, 2.1328125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 8.0, 5.0, 7.0, 25.0, 11.0, 23.0, 32.0, 38.0, 38.0, 55.0, 56.0, 63.0, 85.0, 72.0, 57.0, 58.0, 45.0, 53.0, 67.0, 34.0, 32.0, 28.0, 21.0, 25.0, 17.0, 9.0, 8.0, 5.0, 10.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.030409812927246, -10.74123764038086, -10.452064514160156, -10.16289234161377, -9.873720169067383, -9.58454704284668, -9.295374870300293, -9.006202697753906, -8.717029571533203, -8.427857398986816, -8.138684272766113, -7.849512100219727, -7.560339450836182, -7.271166801452637, -6.98199462890625, -6.692821979522705, -6.403649806976318, -6.114477157592773, -5.825304985046387, -5.536132335662842, -5.246959686279297, -4.95778751373291, -4.668614864349365, -4.37944221496582, -4.090270042419434, -3.8010976314544678, -3.511924982070923, -3.222752571105957, -2.933579921722412, -2.6444075107574463, -2.3552350997924805, -2.0660624504089355, -1.7768893241882324, -1.487716794013977, -1.1985442638397217, -0.9093718528747559, -0.6201993227005005, -0.3310267925262451, -0.0418543815612793, 0.24731826782226562, 0.5364906787872314, 0.8256632089614868, 1.1148357391357422, 1.404008150100708, 1.6931806802749634, 1.9823532104492188, 2.2715256214141846, 2.5606982707977295, 2.8498706817626953, 3.139043092727661, 3.428215742111206, 3.717388153076172, 4.006560802459717, 4.295733451843262, 4.584905624389648, 4.874078273773193, 5.163250923156738, 5.452423572540283, 5.74159574508667, 6.030768394470215, 6.31994104385376, 6.609113693237305, 6.898285865783691, 7.187458515167236, 7.476630687713623]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 7.0, 8.0, 11.0, 9.0, 12.0, 12.0, 20.0, 14.0, 20.0, 22.0, 30.0, 25.0, 25.0, 31.0, 39.0, 46.0, 37.0, 47.0, 54.0, 44.0, 36.0, 49.0, 37.0, 38.0, 39.0, 40.0, 33.0, 36.0, 31.0, 22.0, 14.0, 22.0, 13.0, 16.0, 10.0, 11.0, 10.0, 3.0, 4.0, 8.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.184546947479248, -5.999026775360107, -5.813506603240967, -5.627986907958984, -5.442466735839844, -5.256946563720703, -5.0714263916015625, -4.885906219482422, -4.700386047363281, -4.514865875244141, -4.329345703125, -4.143825531005859, -3.958305835723877, -3.7727856636047363, -3.5872654914855957, -3.401745319366455, -3.2162256240844727, -3.030705451965332, -2.8451855182647705, -2.65966534614563, -2.4741454124450684, -2.2886252403259277, -2.103105068206787, -1.917585015296936, -1.732064962387085, -1.5465449094772339, -1.3610248565673828, -1.1755046844482422, -0.9899846315383911, -0.80446457862854, -0.6189444065093994, -0.43342435359954834, -0.24790382385253906, -0.0623837411403656, 0.12313634157180786, 0.3086564540863037, 0.4941765069961548, 0.6796965599060059, 0.8652167320251465, 1.0507367849349976, 1.2362568378448486, 1.4217768907546997, 1.6072969436645508, 1.7928171157836914, 1.9783371686935425, 2.1638572216033936, 2.349377393722534, 2.5348973274230957, 2.7204174995422363, 2.905937671661377, 3.0914576053619385, 3.276977777481079, 3.4624977111816406, 3.6480178833007812, 3.833538055419922, 4.0190582275390625, 4.204578399658203, 4.390098571777344, 4.575618743896484, 4.761138916015625, 4.946658611297607, 5.132178783416748, 5.317698955535889, 5.503219127655029, 5.688738822937012]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 4.0, 7.0, 13.0, 23.0, 30.0, 39.0, 59.0, 62.0, 120.0, 171.0, 259.0, 464.0, 696.0, 1098.0, 1675.0, 2780.0, 4663.0, 8072.0, 14588.0, 26524.0, 50066.0, 96183.0, 182020.0, 256498.0, 187294.0, 99854.0, 51825.0, 27559.0, 15058.0, 8389.0, 4847.0, 2877.0, 1716.0, 1052.0, 639.0, 432.0, 290.0, 185.0, 137.0, 93.0, 52.0, 33.0, 30.0, 25.0, 15.0, 11.0, 11.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.62890625, -1.577239990234375, -1.52557373046875, -1.473907470703125, -1.4222412109375, -1.370574951171875, -1.31890869140625, -1.267242431640625, -1.215576171875, -1.163909912109375, -1.11224365234375, -1.060577392578125, -1.0089111328125, -0.957244873046875, -0.90557861328125, -0.853912353515625, -0.80224609375, -0.750579833984375, -0.69891357421875, -0.647247314453125, -0.5955810546875, -0.543914794921875, -0.49224853515625, -0.440582275390625, -0.388916015625, -0.337249755859375, -0.28558349609375, -0.233917236328125, -0.1822509765625, -0.130584716796875, -0.07891845703125, -0.027252197265625, 0.0244140625, 0.076080322265625, 0.12774658203125, 0.179412841796875, 0.2310791015625, 0.282745361328125, 0.33441162109375, 0.386077880859375, 0.437744140625, 0.489410400390625, 0.54107666015625, 0.592742919921875, 0.6444091796875, 0.696075439453125, 0.74774169921875, 0.799407958984375, 0.85107421875, 0.902740478515625, 0.95440673828125, 1.006072998046875, 1.0577392578125, 1.109405517578125, 1.16107177734375, 1.212738037109375, 1.264404296875, 1.316070556640625, 1.36773681640625, 1.419403076171875, 1.4710693359375, 1.522735595703125, 1.57440185546875, 1.626068115234375, 1.677734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 8.0, 8.0, 7.0, 7.0, 5.0, 11.0, 9.0, 10.0, 17.0, 21.0, 29.0, 22.0, 26.0, 39.0, 27.0, 43.0, 49.0, 43.0, 47.0, 56.0, 33.0, 39.0, 51.0, 44.0, 45.0, 52.0, 32.0, 29.0, 35.0, 24.0, 18.0, 21.0, 21.0, 14.0, 11.0, 12.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.75, -6.53973388671875, -6.3294677734375, -6.11920166015625, -5.908935546875, -5.69866943359375, -5.4884033203125, -5.27813720703125, -5.06787109375, -4.85760498046875, -4.6473388671875, -4.43707275390625, -4.226806640625, -4.01654052734375, -3.8062744140625, -3.59600830078125, -3.3857421875, -3.17547607421875, -2.9652099609375, -2.75494384765625, -2.544677734375, -2.33441162109375, -2.1241455078125, -1.91387939453125, -1.70361328125, -1.49334716796875, -1.2830810546875, -1.07281494140625, -0.862548828125, -0.65228271484375, -0.4420166015625, -0.23175048828125, -0.021484375, 0.18878173828125, 0.3990478515625, 0.60931396484375, 0.819580078125, 1.02984619140625, 1.2401123046875, 1.45037841796875, 1.66064453125, 1.87091064453125, 2.0811767578125, 2.29144287109375, 2.501708984375, 2.71197509765625, 2.9222412109375, 3.13250732421875, 3.3427734375, 3.55303955078125, 3.7633056640625, 3.97357177734375, 4.183837890625, 4.39410400390625, 4.6043701171875, 4.81463623046875, 5.02490234375, 5.23516845703125, 5.4454345703125, 5.65570068359375, 5.865966796875, 6.07623291015625, 6.2864990234375, 6.49676513671875, 6.70703125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 6.0, 8.0, 15.0, 27.0, 32.0, 60.0, 94.0, 137.0, 233.0, 357.0, 613.0, 1019.0, 1786.0, 3201.0, 6113.0, 11718.0, 23069.0, 46548.0, 95184.0, 186824.0, 272834.0, 196394.0, 101465.0, 49612.0, 24454.0, 12362.0, 6398.0, 3390.0, 1891.0, 1091.0, 624.0, 394.0, 209.0, 135.0, 93.0, 47.0, 45.0, 22.0, 22.0, 10.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5841522216796875, -1.528656005859375, -1.4731597900390625, -1.41766357421875, -1.3621673583984375, -1.306671142578125, -1.2511749267578125, -1.1956787109375, -1.1401824951171875, -1.084686279296875, -1.0291900634765625, -0.97369384765625, -0.9181976318359375, -0.862701416015625, -0.8072052001953125, -0.751708984375, -0.6962127685546875, -0.640716552734375, -0.5852203369140625, -0.52972412109375, -0.4742279052734375, -0.418731689453125, -0.3632354736328125, -0.3077392578125, -0.2522430419921875, -0.196746826171875, -0.1412506103515625, -0.08575439453125, -0.0302581787109375, 0.025238037109375, 0.0807342529296875, 0.13623046875, 0.1917266845703125, 0.247222900390625, 0.3027191162109375, 0.35821533203125, 0.4137115478515625, 0.469207763671875, 0.5247039794921875, 0.5802001953125, 0.6356964111328125, 0.691192626953125, 0.7466888427734375, 0.80218505859375, 0.8576812744140625, 0.913177490234375, 0.9686737060546875, 1.024169921875, 1.0796661376953125, 1.135162353515625, 1.1906585693359375, 1.24615478515625, 1.3016510009765625, 1.357147216796875, 1.4126434326171875, 1.4681396484375, 1.5236358642578125, 1.579132080078125, 1.6346282958984375, 1.69012451171875, 1.7456207275390625, 1.801116943359375, 1.8566131591796875, 1.912109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 3.0, 10.0, 15.0, 14.0, 11.0, 13.0, 16.0, 20.0, 23.0, 18.0, 22.0, 31.0, 35.0, 36.0, 49.0, 46.0, 42.0, 67.0, 41.0, 39.0, 45.0, 47.0, 50.0, 42.0, 41.0, 41.0, 23.0, 22.0, 24.0, 20.0, 16.0, 10.0, 11.0, 10.0, 14.0, 6.0, 4.0, 1.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.1484375, -4.0252685546875, -3.902099609375, -3.7789306640625, -3.65576171875, -3.5325927734375, -3.409423828125, -3.2862548828125, -3.1630859375, -3.0399169921875, -2.916748046875, -2.7935791015625, -2.67041015625, -2.5472412109375, -2.424072265625, -2.3009033203125, -2.177734375, -2.0545654296875, -1.931396484375, -1.8082275390625, -1.68505859375, -1.5618896484375, -1.438720703125, -1.3155517578125, -1.1923828125, -1.0692138671875, -0.946044921875, -0.8228759765625, -0.69970703125, -0.5765380859375, -0.453369140625, -0.3302001953125, -0.20703125, -0.0838623046875, 0.039306640625, 0.1624755859375, 0.28564453125, 0.4088134765625, 0.531982421875, 0.6551513671875, 0.7783203125, 0.9014892578125, 1.024658203125, 1.1478271484375, 1.27099609375, 1.3941650390625, 1.517333984375, 1.6405029296875, 1.763671875, 1.8868408203125, 2.010009765625, 2.1331787109375, 2.25634765625, 2.3795166015625, 2.502685546875, 2.6258544921875, 2.7490234375, 2.8721923828125, 2.995361328125, 3.1185302734375, 3.24169921875, 3.3648681640625, 3.488037109375, 3.6112060546875, 3.734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 10.0, 13.0, 11.0, 20.0, 26.0, 52.0, 56.0, 79.0, 140.0, 209.0, 273.0, 449.0, 654.0, 1029.0, 1695.0, 2896.0, 5786.0, 14046.0, 44699.0, 204230.0, 546031.0, 163951.0, 37355.0, 12350.0, 5326.0, 2665.0, 1592.0, 1002.0, 644.0, 405.0, 274.0, 196.0, 134.0, 74.0, 72.0, 30.0, 24.0, 16.0, 13.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8901824951171875, -0.860931396484375, -0.8316802978515625, -0.80242919921875, -0.7731781005859375, -0.743927001953125, -0.7146759033203125, -0.6854248046875, -0.6561737060546875, -0.626922607421875, -0.5976715087890625, -0.56842041015625, -0.5391693115234375, -0.509918212890625, -0.4806671142578125, -0.451416015625, -0.4221649169921875, -0.392913818359375, -0.3636627197265625, -0.33441162109375, -0.3051605224609375, -0.275909423828125, -0.2466583251953125, -0.2174072265625, -0.1881561279296875, -0.158905029296875, -0.1296539306640625, -0.10040283203125, -0.0711517333984375, -0.041900634765625, -0.0126495361328125, 0.0166015625, 0.0458526611328125, 0.075103759765625, 0.1043548583984375, 0.13360595703125, 0.1628570556640625, 0.192108154296875, 0.2213592529296875, 0.2506103515625, 0.2798614501953125, 0.309112548828125, 0.3383636474609375, 0.36761474609375, 0.3968658447265625, 0.426116943359375, 0.4553680419921875, 0.484619140625, 0.5138702392578125, 0.543121337890625, 0.5723724365234375, 0.60162353515625, 0.6308746337890625, 0.660125732421875, 0.6893768310546875, 0.7186279296875, 0.7478790283203125, 0.777130126953125, 0.8063812255859375, 0.83563232421875, 0.8648834228515625, 0.894134521484375, 0.9233856201171875, 0.95263671875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 0.0, 6.0, 4.0, 6.0, 10.0, 8.0, 17.0, 28.0, 24.0, 28.0, 40.0, 39.0, 50.0, 64.0, 63.0, 66.0, 83.0, 91.0, 71.0, 60.0, 45.0, 41.0, 28.0, 27.0, 21.0, 24.0, 14.0, 20.0, 11.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8014183044433594e-05, -2.690032124519348e-05, -2.578645944595337e-05, -2.4672597646713257e-05, -2.3558735847473145e-05, -2.2444874048233032e-05, -2.133101224899292e-05, -2.0217150449752808e-05, -1.9103288650512695e-05, -1.7989426851272583e-05, -1.687556505203247e-05, -1.576170325279236e-05, -1.4647841453552246e-05, -1.3533979654312134e-05, -1.2420117855072021e-05, -1.130625605583191e-05, -1.0192394256591797e-05, -9.078532457351685e-06, -7.964670658111572e-06, -6.85080885887146e-06, -5.736947059631348e-06, -4.623085260391235e-06, -3.509223461151123e-06, -2.3953616619110107e-06, -1.2814998626708984e-06, -1.6763806343078613e-07, 9.462237358093262e-07, 2.0600855350494385e-06, 3.1739473342895508e-06, 4.287809133529663e-06, 5.401670932769775e-06, 6.515532732009888e-06, 7.62939453125e-06, 8.743256330490112e-06, 9.857118129730225e-06, 1.0970979928970337e-05, 1.208484172821045e-05, 1.3198703527450562e-05, 1.4312565326690674e-05, 1.5426427125930786e-05, 1.65402889251709e-05, 1.765415072441101e-05, 1.8768012523651123e-05, 1.9881874322891235e-05, 2.0995736122131348e-05, 2.210959792137146e-05, 2.3223459720611572e-05, 2.4337321519851685e-05, 2.5451183319091797e-05, 2.656504511833191e-05, 2.767890691757202e-05, 2.8792768716812134e-05, 2.9906630516052246e-05, 3.102049231529236e-05, 3.213435411453247e-05, 3.324821591377258e-05, 3.4362077713012695e-05, 3.547593951225281e-05, 3.658980131149292e-05, 3.770366311073303e-05, 3.8817524909973145e-05, 3.993138670921326e-05, 4.104524850845337e-05, 4.215911030769348e-05, 4.3272972106933594e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 10.0, 10.0, 16.0, 26.0, 41.0, 45.0, 46.0, 88.0, 136.0, 192.0, 253.0, 363.0, 502.0, 707.0, 1031.0, 1625.0, 2540.0, 4288.0, 7792.0, 15232.0, 34280.0, 84491.0, 220237.0, 360009.0, 184037.0, 70444.0, 28963.0, 13379.0, 6794.0, 3890.0, 2383.0, 1496.0, 940.0, 709.0, 418.0, 313.0, 233.0, 164.0, 126.0, 83.0, 69.0, 53.0, 26.0, 20.0, 20.0, 4.0, 13.0, 8.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.89892578125, -0.87030029296875, -0.8416748046875, -0.81304931640625, -0.784423828125, -0.75579833984375, -0.7271728515625, -0.69854736328125, -0.669921875, -0.64129638671875, -0.6126708984375, -0.58404541015625, -0.555419921875, -0.52679443359375, -0.4981689453125, -0.46954345703125, -0.44091796875, -0.41229248046875, -0.3836669921875, -0.35504150390625, -0.326416015625, -0.29779052734375, -0.2691650390625, -0.24053955078125, -0.2119140625, -0.18328857421875, -0.1546630859375, -0.12603759765625, -0.097412109375, -0.06878662109375, -0.0401611328125, -0.01153564453125, 0.01708984375, 0.04571533203125, 0.0743408203125, 0.10296630859375, 0.131591796875, 0.16021728515625, 0.1888427734375, 0.21746826171875, 0.24609375, 0.27471923828125, 0.3033447265625, 0.33197021484375, 0.360595703125, 0.38922119140625, 0.4178466796875, 0.44647216796875, 0.47509765625, 0.50372314453125, 0.5323486328125, 0.56097412109375, 0.589599609375, 0.61822509765625, 0.6468505859375, 0.67547607421875, 0.7041015625, 0.73272705078125, 0.7613525390625, 0.78997802734375, 0.818603515625, 0.84722900390625, 0.8758544921875, 0.90447998046875, 0.93310546875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 15.0, 18.0, 24.0, 26.0, 47.0, 91.0, 99.0, 127.0, 137.0, 110.0, 83.0, 62.0, 61.0, 19.0, 19.0, 16.0, 7.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4033203125, -0.3915367126464844, -0.37975311279296875, -0.3679695129394531, -0.3561859130859375, -0.3444023132324219, -0.33261871337890625, -0.3208351135253906, -0.309051513671875, -0.2972679138183594, -0.28548431396484375, -0.2737007141113281, -0.2619171142578125, -0.2501335144042969, -0.23834991455078125, -0.22656631469726562, -0.21478271484375, -0.20299911499023438, -0.19121551513671875, -0.17943191528320312, -0.1676483154296875, -0.15586471557617188, -0.14408111572265625, -0.13229751586914062, -0.120513916015625, -0.10873031616210938, -0.09694671630859375, -0.08516311645507812, -0.0733795166015625, -0.061595916748046875, -0.04981231689453125, -0.038028717041015625, -0.0262451171875, -0.014461517333984375, -0.00267791748046875, 0.009105682373046875, 0.0208892822265625, 0.032672882080078125, 0.04445648193359375, 0.056240081787109375, 0.068023681640625, 0.07980728149414062, 0.09159088134765625, 0.10337448120117188, 0.1151580810546875, 0.12694168090820312, 0.13872528076171875, 0.15050888061523438, 0.16229248046875, 0.17407608032226562, 0.18585968017578125, 0.19764328002929688, 0.2094268798828125, 0.22121047973632812, 0.23299407958984375, 0.24477767944335938, 0.256561279296875, 0.2683448791503906, 0.28012847900390625, 0.2919120788574219, 0.3036956787109375, 0.3154792785644531, 0.32726287841796875, 0.3390464782714844, 0.350830078125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 5.0, 24.0, 10.0, 21.0, 32.0, 37.0, 38.0, 50.0, 58.0, 60.0, 72.0, 78.0, 65.0, 54.0, 52.0, 49.0, 63.0, 39.0, 36.0, 26.0, 21.0, 28.0, 21.0, 9.0, 5.0, 8.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.094508171081543, -10.80483341217041, -10.515158653259277, -10.225483894348145, -9.935808181762695, -9.646133422851562, -9.35645866394043, -9.066783905029297, -8.777109146118164, -8.487434387207031, -8.197759628295898, -7.908084392547607, -7.618409633636475, -7.328734874725342, -7.039059638977051, -6.749384880065918, -6.459710121154785, -6.170035362243652, -5.8803606033325195, -5.5906853675842285, -5.301010608673096, -5.011335849761963, -4.721660614013672, -4.431985855102539, -4.142311096191406, -3.8526363372802734, -3.5629613399505615, -3.2732863426208496, -2.983611583709717, -2.693936824798584, -2.404261827468872, -2.11458683013916, -1.8249125480651855, -1.5352376699447632, -1.2455627918243408, -0.9558879137039185, -0.6662130355834961, -0.37653815746307373, -0.08686327934265137, 0.20281171798706055, 0.49248647689819336, 0.7821613550186157, 1.071836233139038, 1.3615111112594604, 1.6511859893798828, 1.9408608675003052, 2.2305357456207275, 2.5202107429504395, 2.8098855018615723, 3.099560260772705, 3.389235258102417, 3.678910255432129, 3.9685850143432617, 4.2582597732543945, 4.547934532165527, 4.837609767913818, 5.127284526824951, 5.416959285736084, 5.706634521484375, 5.996309280395508, 6.285984039306641, 6.575658798217773, 6.865333557128906, 7.155008792877197, 7.44468355178833]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 4.0, 11.0, 8.0, 13.0, 8.0, 14.0, 19.0, 16.0, 16.0, 26.0, 30.0, 27.0, 23.0, 31.0, 37.0, 37.0, 47.0, 43.0, 58.0, 40.0, 46.0, 41.0, 37.0, 42.0, 41.0, 40.0, 36.0, 37.0, 26.0, 19.0, 16.0, 19.0, 13.0, 17.0, 12.0, 9.0, 9.0, 5.0, 3.0, 8.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.316371440887451, -6.126894950866699, -5.937417984008789, -5.747941017150879, -5.558464527130127, -5.368988037109375, -5.179511070251465, -4.990034103393555, -4.800557613372803, -4.611081123352051, -4.421604156494141, -4.2321271896362305, -4.0426506996154785, -3.8531739711761475, -3.6636972427368164, -3.4742205142974854, -3.2847437858581543, -3.0952670574188232, -2.905790328979492, -2.716313600540161, -2.52683687210083, -2.337360143661499, -2.147883415222168, -1.958406686782837, -1.7689299583435059, -1.5794532299041748, -1.3899765014648438, -1.2004997730255127, -1.0110230445861816, -0.8215463161468506, -0.6320695877075195, -0.4425928592681885, -0.2531156539916992, -0.06363892555236816, 0.1258378028869629, 0.31531453132629395, 0.504791259765625, 0.694267988204956, 0.8837447166442871, 1.0732214450836182, 1.2626981735229492, 1.4521749019622803, 1.6416516304016113, 1.8311283588409424, 2.0206050872802734, 2.2100818157196045, 2.3995585441589355, 2.5890352725982666, 2.7785120010375977, 2.9679887294769287, 3.1574654579162598, 3.346942186355591, 3.536418914794922, 3.725895643234253, 3.915372371673584, 4.104848861694336, 4.294325828552246, 4.483802795410156, 4.673279285430908, 4.86275577545166, 5.05223274230957, 5.2417097091674805, 5.431186199188232, 5.620662689208984, 5.8101396560668945]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 11.0, 7.0, 27.0, 21.0, 49.0, 54.0, 114.0, 163.0, 171.0, 290.0, 458.0, 666.0, 975.0, 1629.0, 2531.0, 4060.0, 6616.0, 11381.0, 19757.0, 35304.0, 62042.0, 104007.0, 152196.0, 179576.0, 166154.0, 121463.0, 75861.0, 43701.0, 24282.0, 13994.0, 7868.0, 4834.0, 2899.0, 1894.0, 1222.0, 747.0, 511.0, 304.0, 257.0, 141.0, 102.0, 65.0, 57.0, 32.0, 22.0, 12.0, 10.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3359375, -5.17266845703125, -5.0093994140625, -4.84613037109375, -4.682861328125, -4.51959228515625, -4.3563232421875, -4.19305419921875, -4.02978515625, -3.86651611328125, -3.7032470703125, -3.53997802734375, -3.376708984375, -3.21343994140625, -3.0501708984375, -2.88690185546875, -2.7236328125, -2.56036376953125, -2.3970947265625, -2.23382568359375, -2.070556640625, -1.90728759765625, -1.7440185546875, -1.58074951171875, -1.41748046875, -1.25421142578125, -1.0909423828125, -0.92767333984375, -0.764404296875, -0.60113525390625, -0.4378662109375, -0.27459716796875, -0.111328125, 0.05194091796875, 0.2152099609375, 0.37847900390625, 0.541748046875, 0.70501708984375, 0.8682861328125, 1.03155517578125, 1.19482421875, 1.35809326171875, 1.5213623046875, 1.68463134765625, 1.847900390625, 2.01116943359375, 2.1744384765625, 2.33770751953125, 2.5009765625, 2.66424560546875, 2.8275146484375, 2.99078369140625, 3.154052734375, 3.31732177734375, 3.4805908203125, 3.64385986328125, 3.80712890625, 3.97039794921875, 4.1336669921875, 4.29693603515625, 4.460205078125, 4.62347412109375, 4.7867431640625, 4.95001220703125, 5.11328125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 4.0, 3.0, 8.0, 13.0, 12.0, 12.0, 22.0, 19.0, 24.0, 21.0, 24.0, 28.0, 35.0, 29.0, 33.0, 34.0, 40.0, 45.0, 50.0, 45.0, 50.0, 37.0, 43.0, 46.0, 38.0, 31.0, 36.0, 36.0, 22.0, 20.0, 22.0, 24.0, 15.0, 8.0, 12.0, 9.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.59765625, -6.400146484375, -6.20263671875, -6.005126953125, -5.8076171875, -5.610107421875, -5.41259765625, -5.215087890625, -5.017578125, -4.820068359375, -4.62255859375, -4.425048828125, -4.2275390625, -4.030029296875, -3.83251953125, -3.635009765625, -3.4375, -3.239990234375, -3.04248046875, -2.844970703125, -2.6474609375, -2.449951171875, -2.25244140625, -2.054931640625, -1.857421875, -1.659912109375, -1.46240234375, -1.264892578125, -1.0673828125, -0.869873046875, -0.67236328125, -0.474853515625, -0.27734375, -0.079833984375, 0.11767578125, 0.315185546875, 0.5126953125, 0.710205078125, 0.90771484375, 1.105224609375, 1.302734375, 1.500244140625, 1.69775390625, 1.895263671875, 2.0927734375, 2.290283203125, 2.48779296875, 2.685302734375, 2.8828125, 3.080322265625, 3.27783203125, 3.475341796875, 3.6728515625, 3.870361328125, 4.06787109375, 4.265380859375, 4.462890625, 4.660400390625, 4.85791015625, 5.055419921875, 5.2529296875, 5.450439453125, 5.64794921875, 5.845458984375, 6.04296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 7.0, 8.0, 18.0, 32.0, 32.0, 51.0, 70.0, 120.0, 132.0, 213.0, 335.0, 539.0, 752.0, 1185.0, 1851.0, 3014.0, 4721.0, 7716.0, 12466.0, 20804.0, 35708.0, 62572.0, 111614.0, 176604.0, 206782.0, 164834.0, 99424.0, 55959.0, 32040.0, 18758.0, 11333.0, 6772.0, 4347.0, 2789.0, 1727.0, 1056.0, 699.0, 473.0, 298.0, 229.0, 134.0, 101.0, 62.0, 63.0, 34.0, 15.0, 12.0, 13.0, 5.0, 7.0, 1.0, 8.0, 1.0, 2.0, 4.0, 3.0, 2.0], "bins": [-7.9921875, -7.7376708984375, -7.483154296875, -7.2286376953125, -6.97412109375, -6.7196044921875, -6.465087890625, -6.2105712890625, -5.9560546875, -5.7015380859375, -5.447021484375, -5.1925048828125, -4.93798828125, -4.6834716796875, -4.428955078125, -4.1744384765625, -3.919921875, -3.6654052734375, -3.410888671875, -3.1563720703125, -2.90185546875, -2.6473388671875, -2.392822265625, -2.1383056640625, -1.8837890625, -1.6292724609375, -1.374755859375, -1.1202392578125, -0.86572265625, -0.6112060546875, -0.356689453125, -0.1021728515625, 0.15234375, 0.4068603515625, 0.661376953125, 0.9158935546875, 1.17041015625, 1.4249267578125, 1.679443359375, 1.9339599609375, 2.1884765625, 2.4429931640625, 2.697509765625, 2.9520263671875, 3.20654296875, 3.4610595703125, 3.715576171875, 3.9700927734375, 4.224609375, 4.4791259765625, 4.733642578125, 4.9881591796875, 5.24267578125, 5.4971923828125, 5.751708984375, 6.0062255859375, 6.2607421875, 6.5152587890625, 6.769775390625, 7.0242919921875, 7.27880859375, 7.5333251953125, 7.787841796875, 8.0423583984375, 8.296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 7.0, 8.0, 12.0, 8.0, 18.0, 18.0, 21.0, 31.0, 34.0, 28.0, 27.0, 27.0, 33.0, 33.0, 34.0, 40.0, 47.0, 43.0, 31.0, 40.0, 47.0, 46.0, 29.0, 35.0, 32.0, 28.0, 30.0, 33.0, 38.0, 31.0, 19.0, 15.0, 14.0, 9.0, 15.0, 6.0, 9.0, 4.0, 3.0, 6.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1796875, -4.05987548828125, -3.9400634765625, -3.82025146484375, -3.700439453125, -3.58062744140625, -3.4608154296875, -3.34100341796875, -3.22119140625, -3.10137939453125, -2.9815673828125, -2.86175537109375, -2.741943359375, -2.62213134765625, -2.5023193359375, -2.38250732421875, -2.2626953125, -2.14288330078125, -2.0230712890625, -1.90325927734375, -1.783447265625, -1.66363525390625, -1.5438232421875, -1.42401123046875, -1.30419921875, -1.18438720703125, -1.0645751953125, -0.94476318359375, -0.824951171875, -0.70513916015625, -0.5853271484375, -0.46551513671875, -0.345703125, -0.22589111328125, -0.1060791015625, 0.01373291015625, 0.133544921875, 0.25335693359375, 0.3731689453125, 0.49298095703125, 0.61279296875, 0.73260498046875, 0.8524169921875, 0.97222900390625, 1.092041015625, 1.21185302734375, 1.3316650390625, 1.45147705078125, 1.5712890625, 1.69110107421875, 1.8109130859375, 1.93072509765625, 2.050537109375, 2.17034912109375, 2.2901611328125, 2.40997314453125, 2.52978515625, 2.64959716796875, 2.7694091796875, 2.88922119140625, 3.009033203125, 3.12884521484375, 3.2486572265625, 3.36846923828125, 3.48828125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 4.0, 11.0, 17.0, 16.0, 42.0, 42.0, 93.0, 86.0, 176.0, 254.0, 354.0, 596.0, 946.0, 1402.0, 2262.0, 3653.0, 5933.0, 9872.0, 16166.0, 26282.0, 41607.0, 63102.0, 89169.0, 114388.0, 132332.0, 133759.0, 119219.0, 95489.0, 68855.0, 46245.0, 29492.0, 18039.0, 10982.0, 6656.0, 4097.0, 2533.0, 1492.0, 1055.0, 594.0, 403.0, 286.0, 166.0, 140.0, 77.0, 64.0, 46.0, 22.0, 15.0, 7.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.4638671875, -1.4196624755859375, -1.375457763671875, -1.3312530517578125, -1.28704833984375, -1.2428436279296875, -1.198638916015625, -1.1544342041015625, -1.1102294921875, -1.0660247802734375, -1.021820068359375, -0.9776153564453125, -0.93341064453125, -0.8892059326171875, -0.845001220703125, -0.8007965087890625, -0.756591796875, -0.7123870849609375, -0.668182373046875, -0.6239776611328125, -0.57977294921875, -0.5355682373046875, -0.491363525390625, -0.4471588134765625, -0.4029541015625, -0.3587493896484375, -0.314544677734375, -0.2703399658203125, -0.22613525390625, -0.1819305419921875, -0.137725830078125, -0.0935211181640625, -0.04931640625, -0.0051116943359375, 0.039093017578125, 0.0832977294921875, 0.12750244140625, 0.1717071533203125, 0.215911865234375, 0.2601165771484375, 0.3043212890625, 0.3485260009765625, 0.392730712890625, 0.4369354248046875, 0.48114013671875, 0.5253448486328125, 0.569549560546875, 0.6137542724609375, 0.657958984375, 0.7021636962890625, 0.746368408203125, 0.7905731201171875, 0.83477783203125, 0.8789825439453125, 0.923187255859375, 0.9673919677734375, 1.0115966796875, 1.0558013916015625, 1.100006103515625, 1.1442108154296875, 1.18841552734375, 1.2326202392578125, 1.276824951171875, 1.3210296630859375, 1.365234375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 13.0, 12.0, 20.0, 21.0, 21.0, 34.0, 47.0, 36.0, 42.0, 55.0, 45.0, 62.0, 65.0, 57.0, 47.0, 59.0, 66.0, 50.0, 47.0, 38.0, 26.0, 25.0, 17.0, 26.0, 14.0, 10.0, 9.0, 6.0, 5.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019788742065429688, -0.0001915767788887024, -0.0001852661371231079, -0.00017895549535751343, -0.00017264485359191895, -0.00016633421182632446, -0.00016002357006072998, -0.0001537129282951355, -0.00014740228652954102, -0.00014109164476394653, -0.00013478100299835205, -0.00012847036123275757, -0.00012215971946716309, -0.0001158490777015686, -0.00010953843593597412, -0.00010322779417037964, -9.691715240478516e-05, -9.060651063919067e-05, -8.429586887359619e-05, -7.798522710800171e-05, -7.167458534240723e-05, -6.536394357681274e-05, -5.905330181121826e-05, -5.274266004562378e-05, -4.64320182800293e-05, -4.0121376514434814e-05, -3.381073474884033e-05, -2.750009298324585e-05, -2.1189451217651367e-05, -1.4878809452056885e-05, -8.568167686462402e-06, -2.25752592086792e-06, 4.0531158447265625e-06, 1.0363757610321045e-05, 1.6674399375915527e-05, 2.298504114151001e-05, 2.9295682907104492e-05, 3.5606324672698975e-05, 4.191696643829346e-05, 4.822760820388794e-05, 5.453824996948242e-05, 6.0848891735076904e-05, 6.715953350067139e-05, 7.347017526626587e-05, 7.978081703186035e-05, 8.609145879745483e-05, 9.240210056304932e-05, 9.87127423286438e-05, 0.00010502338409423828, 0.00011133402585983276, 0.00011764466762542725, 0.00012395530939102173, 0.0001302659511566162, 0.0001365765929222107, 0.00014288723468780518, 0.00014919787645339966, 0.00015550851821899414, 0.00016181915998458862, 0.0001681298017501831, 0.0001744404435157776, 0.00018075108528137207, 0.00018706172704696655, 0.00019337236881256104, 0.00019968301057815552, 0.00020599365234375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 9.0, 7.0, 18.0, 23.0, 48.0, 58.0, 90.0, 139.0, 252.0, 383.0, 573.0, 999.0, 1628.0, 2790.0, 4603.0, 8160.0, 13796.0, 23291.0, 38158.0, 59980.0, 87228.0, 115249.0, 135668.0, 139778.0, 125858.0, 99780.0, 71202.0, 47053.0, 29118.0, 17613.0, 10173.0, 6042.0, 3546.0, 2042.0, 1280.0, 736.0, 458.0, 286.0, 181.0, 99.0, 53.0, 54.0, 26.0, 13.0, 9.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3470306396484375, -1.302459716796875, -1.2578887939453125, -1.21331787109375, -1.1687469482421875, -1.124176025390625, -1.0796051025390625, -1.0350341796875, -0.9904632568359375, -0.945892333984375, -0.9013214111328125, -0.85675048828125, -0.8121795654296875, -0.767608642578125, -0.7230377197265625, -0.678466796875, -0.6338958740234375, -0.589324951171875, -0.5447540283203125, -0.50018310546875, -0.4556121826171875, -0.411041259765625, -0.3664703369140625, -0.3218994140625, -0.2773284912109375, -0.232757568359375, -0.1881866455078125, -0.14361572265625, -0.0990447998046875, -0.054473876953125, -0.0099029541015625, 0.03466796875, 0.0792388916015625, 0.123809814453125, 0.1683807373046875, 0.21295166015625, 0.2575225830078125, 0.302093505859375, 0.3466644287109375, 0.3912353515625, 0.4358062744140625, 0.480377197265625, 0.5249481201171875, 0.56951904296875, 0.6140899658203125, 0.658660888671875, 0.7032318115234375, 0.747802734375, 0.7923736572265625, 0.836944580078125, 0.8815155029296875, 0.92608642578125, 0.9706573486328125, 1.015228271484375, 1.0597991943359375, 1.1043701171875, 1.1489410400390625, 1.193511962890625, 1.2380828857421875, 1.28265380859375, 1.3272247314453125, 1.371795654296875, 1.4163665771484375, 1.4609375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 6.0, 8.0, 7.0, 10.0, 8.0, 7.0, 14.0, 18.0, 17.0, 31.0, 28.0, 25.0, 31.0, 40.0, 30.0, 48.0, 46.0, 37.0, 50.0, 44.0, 48.0, 43.0, 43.0, 43.0, 42.0, 32.0, 37.0, 27.0, 24.0, 24.0, 22.0, 14.0, 25.0, 12.0, 9.0, 9.0, 4.0, 8.0, 3.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4423828125, -0.42792510986328125, -0.4134674072265625, -0.39900970458984375, -0.384552001953125, -0.37009429931640625, -0.3556365966796875, -0.34117889404296875, -0.32672119140625, -0.31226348876953125, -0.2978057861328125, -0.28334808349609375, -0.268890380859375, -0.25443267822265625, -0.2399749755859375, -0.22551727294921875, -0.2110595703125, -0.19660186767578125, -0.1821441650390625, -0.16768646240234375, -0.153228759765625, -0.13877105712890625, -0.1243133544921875, -0.10985565185546875, -0.09539794921875, -0.08094024658203125, -0.0664825439453125, -0.05202484130859375, -0.037567138671875, -0.02310943603515625, -0.0086517333984375, 0.00580596923828125, 0.020263671875, 0.03472137451171875, 0.0491790771484375, 0.06363677978515625, 0.078094482421875, 0.09255218505859375, 0.1070098876953125, 0.12146759033203125, 0.13592529296875, 0.15038299560546875, 0.1648406982421875, 0.17929840087890625, 0.193756103515625, 0.20821380615234375, 0.2226715087890625, 0.23712921142578125, 0.2515869140625, 0.26604461669921875, 0.2805023193359375, 0.29496002197265625, 0.309417724609375, 0.32387542724609375, 0.3383331298828125, 0.35279083251953125, 0.36724853515625, 0.38170623779296875, 0.3961639404296875, 0.41062164306640625, 0.425079345703125, 0.43953704833984375, 0.4539947509765625, 0.46845245361328125, 0.48291015625]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 5.0, 10.0, 19.0, 16.0, 16.0, 30.0, 32.0, 34.0, 37.0, 40.0, 51.0, 38.0, 63.0, 57.0, 72.0, 60.0, 55.0, 54.0, 47.0, 42.0, 29.0, 29.0, 29.0, 23.0, 15.0, 24.0, 16.0, 14.0, 11.0, 2.0, 3.0, 9.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.497963905334473, -9.224068641662598, -8.950172424316406, -8.676277160644531, -8.40238094329834, -8.128485679626465, -7.854589939117432, -7.580694198608398, -7.306798934936523, -7.03290319442749, -6.759007453918457, -6.485112190246582, -6.211216449737549, -5.937320709228516, -5.663424968719482, -5.389529228210449, -5.115633487701416, -4.841737747192383, -4.56784200668335, -4.293946266174316, -4.020051002502441, -3.746155261993408, -3.472259521484375, -3.198363780975342, -2.9244682788848877, -2.6505725383758545, -2.3766770362854004, -2.102781295776367, -1.8288856744766235, -1.5549900531768799, -1.2810943126678467, -1.007198691368103, -0.7333030700683594, -0.45940741896629333, -0.1855117678642273, 0.08838391304016113, 0.3622795343399048, 0.6361751556396484, 0.9100708961486816, 1.1839665174484253, 1.457862138748169, 1.7317577600479126, 2.0056533813476562, 2.2795491218566895, 2.5534448623657227, 2.8273403644561768, 3.10123610496521, 3.375131607055664, 3.6490273475646973, 3.9229230880737305, 4.196818828582764, 4.470714569091797, 4.744609832763672, 5.018505573272705, 5.292401313781738, 5.5662970542907715, 5.840192794799805, 6.114088535308838, 6.387984275817871, 6.661879539489746, 6.935775279998779, 7.2096710205078125, 7.483566761016846, 7.757462501525879, 8.031357765197754]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 10.0, 14.0, 10.0, 17.0, 20.0, 30.0, 18.0, 24.0, 29.0, 38.0, 30.0, 47.0, 41.0, 43.0, 63.0, 58.0, 38.0, 44.0, 44.0, 51.0, 38.0, 26.0, 35.0, 36.0, 37.0, 25.0, 28.0, 15.0, 19.0, 14.0, 11.0, 7.0, 5.0, 2.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.619253158569336, -8.35822868347168, -8.097204208374023, -7.836179733276367, -7.575155258178711, -7.314130783081055, -7.053106307983398, -6.792081832885742, -6.531057357788086, -6.27003288269043, -6.009008407592773, -5.747983932495117, -5.486959457397461, -5.225934982299805, -4.964910507202148, -4.703886032104492, -4.442862033843994, -4.181837558746338, -3.9208130836486816, -3.6597886085510254, -3.398764133453369, -3.137739658355713, -2.8767154216766357, -2.6156909465789795, -2.3546664714813232, -2.093641996383667, -1.8326175212860107, -1.571593165397644, -1.3105686902999878, -1.0495442152023315, -0.7885198593139648, -0.5274953842163086, -0.26647090911865234, -0.0054464638233184814, 0.2555779814720154, 0.5166023969650269, 0.7776268720626831, 1.0386513471603394, 1.299675703048706, 1.5607001781463623, 1.8217246532440186, 2.082749128341675, 2.343773603439331, 2.604797840118408, 2.8658223152160645, 3.1268467903137207, 3.387871265411377, 3.648895740509033, 3.9099202156066895, 4.170944690704346, 4.431969165802002, 4.692993640899658, 4.9540181159973145, 5.215042591094971, 5.476066589355469, 5.737091064453125, 5.998115539550781, 6.2591400146484375, 6.520164489746094, 6.78118896484375, 7.042213439941406, 7.3032379150390625, 7.564262390136719, 7.825286865234375, 8.086311340332031]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 11.0, 7.0, 5.0, 16.0, 18.0, 21.0, 31.0, 42.0, 48.0, 65.0, 81.0, 119.0, 137.0, 225.0, 301.0, 390.0, 566.0, 793.0, 1131.0, 1655.0, 2295.0, 3183.0, 4330.0, 488572.0, 5585.0, 4059.0, 3035.0, 2148.0, 1544.0, 1086.0, 749.0, 554.0, 396.0, 265.0, 222.0, 142.0, 96.0, 83.0, 60.0, 46.0, 33.0, 28.0, 26.0, 14.0, 22.0, 7.0, 5.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-71.41798400878906, -69.10797119140625, -66.79795837402344, -64.48794555664062, -62.17793273925781, -59.867919921875, -57.55790328979492, -55.24789047241211, -52.9378776550293, -50.627864837646484, -48.31785202026367, -46.00783920288086, -43.69782257080078, -41.38780975341797, -39.077796936035156, -36.767784118652344, -34.45777130126953, -32.14775848388672, -29.837745666503906, -27.52773094177246, -25.21771812438965, -22.907705307006836, -20.59769058227539, -18.287677764892578, -15.977664947509766, -13.667652130126953, -11.357638359069824, -9.047624588012695, -6.737611770629883, -4.42759895324707, -2.1175851821899414, 0.1924285888671875, 2.50244140625, 4.812454700469971, 7.122467994689941, 9.43248176574707, 11.742494583129883, 14.052507400512695, 16.36252212524414, 18.672534942626953, 20.982547760009766, 23.292560577392578, 25.60257339477539, 27.912588119506836, 30.22260093688965, 32.532615661621094, 34.842628479003906, 37.15264129638672, 39.46265411376953, 41.772666931152344, 44.082679748535156, 46.39269256591797, 48.70270538330078, 51.012718200683594, 53.32273483276367, 55.632747650146484, 57.9427604675293, 60.25277328491211, 62.56278610229492, 64.872802734375, 67.18281555175781, 69.49282836914062, 71.80284118652344, 74.11285400390625, 76.42286682128906]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 12.0, 11.0, 12.0, 15.0, 22.0, 30.0, 16.0, 24.0, 29.0, 41.0, 28.0, 45.0, 43.0, 46.0, 64.0, 1080.0, 43.0, 42.0, 46.0, 50.0, 34.0, 28.0, 40.0, 36.0, 33.0, 27.0, 27.0, 12.0, 18.0, 14.0, 12.0, 6.0, 4.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-265.3472595214844, -257.3047790527344, -249.26229858398438, -241.21981811523438, -233.17733764648438, -225.13485717773438, -217.09237670898438, -209.04989624023438, -201.00741577148438, -192.96493530273438, -184.92245483398438, -176.87997436523438, -168.83749389648438, -160.79501342773438, -152.75253295898438, -144.71005249023438, -136.66758728027344, -128.62510681152344, -120.58262634277344, -112.54014587402344, -104.49766540527344, -96.45518493652344, -88.41271209716797, -80.37023162841797, -72.32775115966797, -64.28527069091797, -56.24279022216797, -48.200313568115234, -40.157833099365234, -32.115352630615234, -24.0728759765625, -16.0303955078125, -7.9879150390625, 0.054564476013183594, 8.097043991088867, 16.139522552490234, 24.182003021240234, 32.224483489990234, 40.26696014404297, 48.30944061279297, 56.35192108154297, 64.39440155029297, 72.43688201904297, 80.47935485839844, 88.52183532714844, 96.56431579589844, 104.60679626464844, 112.64927673339844, 120.69175720214844, 128.73423767089844, 136.77671813964844, 144.81919860839844, 152.86167907714844, 160.90415954589844, 168.94662475585938, 176.98910522460938, 185.03158569335938, 193.07406616210938, 201.11654663085938, 209.15902709960938, 217.20150756835938, 225.24398803710938, 233.28646850585938, 241.32894897460938, 249.37142944335938]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 13.0, 6.0, 13.0, 21.0, 21.0, 26.0, 39.0, 51.0, 80.0, 67.0, 123.0, 156.0, 178.0, 264.0, 373.0, 523.0, 687.0, 1038.0, 1566.0, 2346.0, 3328.0, 4723.0, 6289.0, 8418.0, 10499.0, 13807.0, 20183.0, 390907.0, 30684016.0, 34277.0, 31096.0, 16687.0, 8575.0, 5095.0, 3060.0, 1958.0, 1258.0, 808.0, 584.0, 378.0, 297.0, 229.0, 168.0, 119.0, 75.0, 36.0, 22.0, 12.0, 9.0, 5.0, 5.0, 2.0], "bins": [-91.87071228027344, -89.57714080810547, -87.2835693359375, -84.989990234375, -82.69641876220703, -80.40284729003906, -78.1092758178711, -75.81570434570312, -73.52213287353516, -71.22856140136719, -68.93498992919922, -66.64141845703125, -64.34783935546875, -62.05426788330078, -59.76069641113281, -57.467124938964844, -55.17354965209961, -52.87997817993164, -50.586402893066406, -48.29283142089844, -45.99925994873047, -43.7056884765625, -41.412113189697266, -39.1185417175293, -36.82496643066406, -34.531394958496094, -32.23781967163086, -29.94424819946289, -27.650676727294922, -25.35710334777832, -23.06352996826172, -20.76995849609375, -18.47638702392578, -16.18281364440918, -13.889242172241211, -11.59566879272461, -9.302096366882324, -7.008523941040039, -4.7149505615234375, -2.4213790893554688, -0.1278057098388672, 2.165766954421997, 4.459339618682861, 6.752912521362305, 9.04648494720459, 11.340057373046875, 13.633630752563477, 15.927202224731445, 18.220775604248047, 20.51434898376465, 22.807920455932617, 25.10149383544922, 27.395065307617188, 29.68863868713379, 31.98221206665039, 34.27578353881836, 36.569358825683594, 38.86293029785156, 41.1565055847168, 43.450077056884766, 45.743648529052734, 48.03722381591797, 50.33079528808594, 52.624366760253906, 54.917938232421875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 7.0, 15.0, 35.0, 47.0, 60.0, 73.0, 116.0, 167.0, 315.0, 509.0, 803.0, 1318.0, 2134.0, 3665.0, 6640.0, 12180.0, 24035.0, 51122.0, 117466.0, 302918.0, 946099.0, 3192008.0, 1063741.0, 330040.0, 126212.0, 54654.0, 25465.0, 12773.0, 6922.0, 3912.0, 2294.0, 1376.0, 862.0, 532.0, 323.0, 204.0, 118.0, 89.0, 55.0, 45.0, 26.0, 19.0, 13.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.6171875, -5.44970703125, -5.2822265625, -5.11474609375, -4.947265625, -4.77978515625, -4.6123046875, -4.44482421875, -4.27734375, -4.10986328125, -3.9423828125, -3.77490234375, -3.607421875, -3.43994140625, -3.2724609375, -3.10498046875, -2.9375, -2.77001953125, -2.6025390625, -2.43505859375, -2.267578125, -2.10009765625, -1.9326171875, -1.76513671875, -1.59765625, -1.43017578125, -1.2626953125, -1.09521484375, -0.927734375, -0.76025390625, -0.5927734375, -0.42529296875, -0.2578125, -0.09033203125, 0.0771484375, 0.24462890625, 0.412109375, 0.57958984375, 0.7470703125, 0.91455078125, 1.08203125, 1.24951171875, 1.4169921875, 1.58447265625, 1.751953125, 1.91943359375, 2.0869140625, 2.25439453125, 2.421875, 2.58935546875, 2.7568359375, 2.92431640625, 3.091796875, 3.25927734375, 3.4267578125, 3.59423828125, 3.76171875, 3.92919921875, 4.0966796875, 4.26416015625, 4.431640625, 4.59912109375, 4.7666015625, 4.93408203125, 5.1015625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 3.0, 9.0, 6.0, 7.0, 9.0, 14.0, 14.0, 20.0, 21.0, 20.0, 27.0, 28.0, 34.0, 36.0, 38.0, 41.0, 44.0, 77.0, 149.0, 205.0, 258.0, 241.0, 146.0, 112.0, 74.0, 56.0, 44.0, 36.0, 35.0, 32.0, 27.0, 21.0, 24.0, 21.0, 14.0, 8.0, 17.0, 8.0, 9.0, 5.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.91796875, -3.79302978515625, -3.6680908203125, -3.54315185546875, -3.418212890625, -3.29327392578125, -3.1683349609375, -3.04339599609375, -2.91845703125, -2.79351806640625, -2.6685791015625, -2.54364013671875, -2.418701171875, -2.29376220703125, -2.1688232421875, -2.04388427734375, -1.9189453125, -1.79400634765625, -1.6690673828125, -1.54412841796875, -1.419189453125, -1.29425048828125, -1.1693115234375, -1.04437255859375, -0.91943359375, -0.79449462890625, -0.6695556640625, -0.54461669921875, -0.419677734375, -0.29473876953125, -0.1697998046875, -0.04486083984375, 0.080078125, 0.20501708984375, 0.3299560546875, 0.45489501953125, 0.579833984375, 0.70477294921875, 0.8297119140625, 0.95465087890625, 1.07958984375, 1.20452880859375, 1.3294677734375, 1.45440673828125, 1.579345703125, 1.70428466796875, 1.8292236328125, 1.95416259765625, 2.0791015625, 2.20404052734375, 2.3289794921875, 2.45391845703125, 2.578857421875, 2.70379638671875, 2.8287353515625, 2.95367431640625, 3.07861328125, 3.20355224609375, 3.3284912109375, 3.45343017578125, 3.578369140625, 3.70330810546875, 3.8282470703125, 3.95318603515625, 4.078125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 5.0, 4.0, 14.0, 15.0, 16.0, 32.0, 56.0, 73.0, 81.0, 111.0, 158.0, 181.0, 267.0, 364.0, 510.0, 795.0, 1273.0, 1989.0, 3325.0, 5704.0, 9669.0, 17815.0, 33305.0, 64494.0, 130528.0, 279611.0, 702793.0, 3070359.0, 1223262.0, 388281.0, 175235.0, 85214.0, 43114.0, 22472.0, 12227.0, 6925.0, 3987.0, 2479.0, 1454.0, 1012.0, 668.0, 478.0, 318.0, 241.0, 164.0, 89.0, 60.0, 43.0, 42.0, 20.0, 20.0, 13.0, 18.0, 11.0, 10.0, 6.0, 8.0, 7.0, 7.0, 4.0, 3.0], "bins": [-3.26171875, -3.15545654296875, -3.0491943359375, -2.94293212890625, -2.836669921875, -2.73040771484375, -2.6241455078125, -2.51788330078125, -2.41162109375, -2.30535888671875, -2.1990966796875, -2.09283447265625, -1.986572265625, -1.88031005859375, -1.7740478515625, -1.66778564453125, -1.5615234375, -1.45526123046875, -1.3489990234375, -1.24273681640625, -1.136474609375, -1.03021240234375, -0.9239501953125, -0.81768798828125, -0.71142578125, -0.60516357421875, -0.4989013671875, -0.39263916015625, -0.286376953125, -0.18011474609375, -0.0738525390625, 0.03240966796875, 0.138671875, 0.24493408203125, 0.3511962890625, 0.45745849609375, 0.563720703125, 0.66998291015625, 0.7762451171875, 0.88250732421875, 0.98876953125, 1.09503173828125, 1.2012939453125, 1.30755615234375, 1.413818359375, 1.52008056640625, 1.6263427734375, 1.73260498046875, 1.8388671875, 1.94512939453125, 2.0513916015625, 2.15765380859375, 2.263916015625, 2.37017822265625, 2.4764404296875, 2.58270263671875, 2.68896484375, 2.79522705078125, 2.9014892578125, 3.00775146484375, 3.114013671875, 3.22027587890625, 3.3265380859375, 3.43280029296875, 3.5390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 5.0, 5.0, 16.0, 12.0, 16.0, 23.0, 26.0, 58.0, 45.0, 69.0, 88.0, 201.0, 454.0, 409.0, 172.0, 108.0, 76.0, 51.0, 40.0, 38.0, 28.0, 27.0, 11.0, 4.0, 6.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.078125, -7.8463134765625, -7.614501953125, -7.3826904296875, -7.15087890625, -6.9190673828125, -6.687255859375, -6.4554443359375, -6.2236328125, -5.9918212890625, -5.760009765625, -5.5281982421875, -5.29638671875, -5.0645751953125, -4.832763671875, -4.6009521484375, -4.369140625, -4.1373291015625, -3.905517578125, -3.6737060546875, -3.44189453125, -3.2100830078125, -2.978271484375, -2.7464599609375, -2.5146484375, -2.2828369140625, -2.051025390625, -1.8192138671875, -1.58740234375, -1.3555908203125, -1.123779296875, -0.8919677734375, -0.66015625, -0.4283447265625, -0.196533203125, 0.0352783203125, 0.26708984375, 0.4989013671875, 0.730712890625, 0.9625244140625, 1.1943359375, 1.4261474609375, 1.657958984375, 1.8897705078125, 2.12158203125, 2.3533935546875, 2.585205078125, 2.8170166015625, 3.048828125, 3.2806396484375, 3.512451171875, 3.7442626953125, 3.97607421875, 4.2078857421875, 4.439697265625, 4.6715087890625, 4.9033203125, 5.1351318359375, 5.366943359375, 5.5987548828125, 5.83056640625, 6.0623779296875, 6.294189453125, 6.5260009765625, 6.7578125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 6.0, 0.0, 6.0, 7.0, 13.0, 10.0, 21.0, 16.0, 24.0, 37.0, 41.0, 27.0, 38.0, 54.0, 96.0, 120.0, 154.0, 214.0, 303.0, 524.0, 736.0, 1145.0, 1915.0, 3715.0, 8078.0, 21912.0, 94092.0, 5988706.0, 124753.0, 25506.0, 9146.0, 4035.0, 2220.0, 1231.0, 813.0, 519.0, 313.0, 269.0, 139.0, 135.0, 91.0, 57.0, 46.0, 29.0, 32.0, 25.0, 21.0, 17.0, 15.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0], "bins": [-25.90625, -25.085693359375, -24.26513671875, -23.444580078125, -22.6240234375, -21.803466796875, -20.98291015625, -20.162353515625, -19.341796875, -18.521240234375, -17.70068359375, -16.880126953125, -16.0595703125, -15.239013671875, -14.41845703125, -13.597900390625, -12.77734375, -11.956787109375, -11.13623046875, -10.315673828125, -9.4951171875, -8.674560546875, -7.85400390625, -7.033447265625, -6.212890625, -5.392333984375, -4.57177734375, -3.751220703125, -2.9306640625, -2.110107421875, -1.28955078125, -0.468994140625, 0.3515625, 1.172119140625, 1.99267578125, 2.813232421875, 3.6337890625, 4.454345703125, 5.27490234375, 6.095458984375, 6.916015625, 7.736572265625, 8.55712890625, 9.377685546875, 10.1982421875, 11.018798828125, 11.83935546875, 12.659912109375, 13.48046875, 14.301025390625, 15.12158203125, 15.942138671875, 16.7626953125, 17.583251953125, 18.40380859375, 19.224365234375, 20.044921875, 20.865478515625, 21.68603515625, 22.506591796875, 23.3271484375, 24.147705078125, 24.96826171875, 25.788818359375, 26.609375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 15.0, 11.0, 14.0, 17.0, 18.0, 32.0, 37.0, 47.0, 49.0, 72.0, 102.0, 328.0, 542.0, 242.0, 136.0, 70.0, 52.0, 38.0, 32.0, 26.0, 22.0, 17.0, 13.0, 16.0, 8.0, 10.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.3609619140625, -8.042236328125, -7.7235107421875, -7.40478515625, -7.0860595703125, -6.767333984375, -6.4486083984375, -6.1298828125, -5.8111572265625, -5.492431640625, -5.1737060546875, -4.85498046875, -4.5362548828125, -4.217529296875, -3.8988037109375, -3.580078125, -3.2613525390625, -2.942626953125, -2.6239013671875, -2.30517578125, -1.9864501953125, -1.667724609375, -1.3489990234375, -1.0302734375, -0.7115478515625, -0.392822265625, -0.0740966796875, 0.24462890625, 0.5633544921875, 0.882080078125, 1.2008056640625, 1.51953125, 1.8382568359375, 2.156982421875, 2.4757080078125, 2.79443359375, 3.1131591796875, 3.431884765625, 3.7506103515625, 4.0693359375, 4.3880615234375, 4.706787109375, 5.0255126953125, 5.34423828125, 5.6629638671875, 5.981689453125, 6.3004150390625, 6.619140625, 6.9378662109375, 7.256591796875, 7.5753173828125, 7.89404296875, 8.2127685546875, 8.531494140625, 8.8502197265625, 9.1689453125, 9.4876708984375, 9.806396484375, 10.1251220703125, 10.44384765625, 10.7625732421875, 11.081298828125, 11.4000244140625, 11.71875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 19.0, 94.0, 839.0, 33.0, 12.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-727.3897705078125, -708.3659057617188, -689.342041015625, -670.3181762695312, -651.2943115234375, -632.2704467773438, -613.24658203125, -594.2227172851562, -575.1988525390625, -556.1749877929688, -537.151123046875, -518.1272583007812, -499.1033935546875, -480.07952880859375, -461.0556640625, -442.03179931640625, -423.0079650878906, -403.9841003417969, -384.9602355957031, -365.9363708496094, -346.9125061035156, -327.8886413574219, -308.86480712890625, -289.8409423828125, -270.81707763671875, -251.793212890625, -232.76934814453125, -213.7454833984375, -194.72161865234375, -175.69775390625, -156.6739044189453, -137.65003967285156, -118.62615966796875, -99.602294921875, -80.57843017578125, -61.55457305908203, -42.53070831298828, -23.50684356689453, -4.4829864501953125, 14.540878295898438, 33.56474304199219, 52.58860778808594, 71.61247253417969, 90.6363296508789, 109.66019439697266, 128.68405151367188, 147.70791625976562, 166.73178100585938, 185.75564575195312, 204.77951049804688, 223.80337524414062, 242.82723999023438, 261.8511047363281, 280.8749694824219, 299.8988037109375, 318.92266845703125, 337.946533203125, 356.97039794921875, 375.9942626953125, 395.01812744140625, 414.0419921875, 433.06585693359375, 452.0897216796875, 471.11358642578125, 490.137451171875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 13.0, 17.0, 45.0, 533.0, 282.0, 38.0, 15.0, 19.0, 3.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-514.69970703125, -501.1358337402344, -487.57196044921875, -474.00811767578125, -460.4442443847656, -446.88037109375, -433.3164978027344, -419.75262451171875, -406.1887512207031, -392.6248779296875, -379.0610046386719, -365.49713134765625, -351.93328857421875, -338.3694152832031, -324.8055419921875, -311.2416687011719, -297.67779541015625, -284.1139221191406, -270.550048828125, -256.9862060546875, -243.4223175048828, -229.85845947265625, -216.29458618164062, -202.730712890625, -189.1668701171875, -175.60299682617188, -162.0391387939453, -148.4752655029297, -134.91139221191406, -121.34752655029297, -107.78366088867188, -94.21978759765625, -80.65591430664062, -67.09204864501953, -53.528175354003906, -39.96430969238281, -26.400440216064453, -12.836570739746094, 0.727294921875, 14.291168212890625, 27.85503387451172, 41.41890335083008, 54.98277282714844, 68.54663848876953, 82.11050415039062, 95.67437744140625, 109.23824310302734, 122.80211639404297, 136.36598205566406, 149.9298553466797, 163.49371337890625, 177.05758666992188, 190.6214599609375, 204.18533325195312, 217.7491912841797, 231.3130645751953, 244.87692260742188, 258.4407958984375, 272.0046691894531, 285.56854248046875, 299.13238525390625, 312.6962585449219, 326.2601318359375, 339.8240051269531, 353.38787841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 4.0, 3.0, 8.0, 11.0, 15.0, 18.0, 27.0, 30.0, 49.0, 80.0, 122.0, 171.0, 248.0, 430.0, 646.0, 976.0, 1678.0, 2917.0, 5915.0, 13237.0, 33525.0, 111659.0, 3505025.0, 419214.0, 56362.0, 22007.0, 9832.0, 4626.0, 2323.0, 1223.0, 714.0, 410.0, 249.0, 157.0, 91.0, 86.0, 53.0, 29.0, 28.0, 25.0, 22.0, 8.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3037109375, -1.2613372802734375, -1.218963623046875, -1.1765899658203125, -1.13421630859375, -1.0918426513671875, -1.049468994140625, -1.0070953369140625, -0.9647216796875, -0.9223480224609375, -0.879974365234375, -0.8376007080078125, -0.79522705078125, -0.7528533935546875, -0.710479736328125, -0.6681060791015625, -0.625732421875, -0.5833587646484375, -0.540985107421875, -0.4986114501953125, -0.45623779296875, -0.4138641357421875, -0.371490478515625, -0.3291168212890625, -0.2867431640625, -0.2443695068359375, -0.201995849609375, -0.1596221923828125, -0.11724853515625, -0.0748748779296875, -0.032501220703125, 0.0098724365234375, 0.05224609375, 0.0946197509765625, 0.136993408203125, 0.1793670654296875, 0.22174072265625, 0.2641143798828125, 0.306488037109375, 0.3488616943359375, 0.3912353515625, 0.4336090087890625, 0.475982666015625, 0.5183563232421875, 0.56072998046875, 0.6031036376953125, 0.645477294921875, 0.6878509521484375, 0.730224609375, 0.7725982666015625, 0.814971923828125, 0.8573455810546875, 0.89971923828125, 0.9420928955078125, 0.984466552734375, 1.0268402099609375, 1.0692138671875, 1.1115875244140625, 1.153961181640625, 1.1963348388671875, 1.23870849609375, 1.2810821533203125, 1.323455810546875, 1.3658294677734375, 1.408203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 13.0, 13.0, 12.0, 26.0, 113.0, 277.0, 306.0, 133.0, 33.0, 16.0, 11.0, 11.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.130126953125, -0.12723207473754883, -0.12433719635009766, -0.12144231796264648, -0.11854743957519531, -0.11565256118774414, -0.11275768280029297, -0.1098628044128418, -0.10696792602539062, -0.10407304763793945, -0.10117816925048828, -0.09828329086303711, -0.09538841247558594, -0.09249353408813477, -0.0895986557006836, -0.08670377731323242, -0.08380889892578125, -0.08091402053833008, -0.0780191421508789, -0.07512426376342773, -0.07222938537597656, -0.06933450698852539, -0.06643962860107422, -0.06354475021362305, -0.060649871826171875, -0.0577549934387207, -0.05486011505126953, -0.05196523666381836, -0.04907035827636719, -0.046175479888916016, -0.043280601501464844, -0.04038572311401367, -0.0374908447265625, -0.03459596633911133, -0.031701087951660156, -0.028806209564208984, -0.025911331176757812, -0.02301645278930664, -0.02012157440185547, -0.017226696014404297, -0.014331817626953125, -0.011436939239501953, -0.008542060852050781, -0.005647182464599609, -0.0027523040771484375, 0.00014257431030273438, 0.0030374526977539062, 0.005932331085205078, 0.00882720947265625, 0.011722087860107422, 0.014616966247558594, 0.017511844635009766, 0.020406723022460938, 0.02330160140991211, 0.02619647979736328, 0.029091358184814453, 0.031986236572265625, 0.0348811149597168, 0.03777599334716797, 0.04067087173461914, 0.04356575012207031, 0.046460628509521484, 0.049355506896972656, 0.05225038528442383, 0.055145263671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 6.0, 8.0, 8.0, 10.0, 21.0, 24.0, 34.0, 38.0, 57.0, 90.0, 110.0, 179.0, 334.0, 629.0, 1480.0, 3641.0, 10836.0, 44320.0, 290256.0, 2905048.0, 810971.0, 96440.0, 19518.0, 5926.0, 2181.0, 955.0, 463.0, 233.0, 134.0, 86.0, 59.0, 54.0, 27.0, 26.0, 9.0, 14.0, 8.0, 11.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3857421875, -1.3433837890625, -1.301025390625, -1.2586669921875, -1.21630859375, -1.1739501953125, -1.131591796875, -1.0892333984375, -1.046875, -1.0045166015625, -0.962158203125, -0.9197998046875, -0.87744140625, -0.8350830078125, -0.792724609375, -0.7503662109375, -0.7080078125, -0.6656494140625, -0.623291015625, -0.5809326171875, -0.53857421875, -0.4962158203125, -0.453857421875, -0.4114990234375, -0.369140625, -0.3267822265625, -0.284423828125, -0.2420654296875, -0.19970703125, -0.1573486328125, -0.114990234375, -0.0726318359375, -0.0302734375, 0.0120849609375, 0.054443359375, 0.0968017578125, 0.13916015625, 0.1815185546875, 0.223876953125, 0.2662353515625, 0.30859375, 0.3509521484375, 0.393310546875, 0.4356689453125, 0.47802734375, 0.5203857421875, 0.562744140625, 0.6051025390625, 0.6474609375, 0.6898193359375, 0.732177734375, 0.7745361328125, 0.81689453125, 0.8592529296875, 0.901611328125, 0.9439697265625, 0.986328125, 1.0286865234375, 1.071044921875, 1.1134033203125, 1.15576171875, 1.1981201171875, 1.240478515625, 1.2828369140625, 1.3251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 10.0, 10.0, 12.0, 19.0, 21.0, 29.0, 37.0, 55.0, 66.0, 95.0, 107.0, 149.0, 193.0, 258.0, 266.0, 341.0, 451.0, 400.0, 297.0, 261.0, 196.0, 167.0, 131.0, 99.0, 100.0, 69.0, 51.0, 35.0, 33.0, 27.0, 23.0, 19.0, 11.0, 12.0, 8.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17529296875, -0.16959571838378906, -0.16389846801757812, -0.1582012176513672, -0.15250396728515625, -0.1468067169189453, -0.14110946655273438, -0.13541221618652344, -0.1297149658203125, -0.12401771545410156, -0.11832046508789062, -0.11262321472167969, -0.10692596435546875, -0.10122871398925781, -0.09553146362304688, -0.08983421325683594, -0.084136962890625, -0.07843971252441406, -0.07274246215820312, -0.06704521179199219, -0.06134796142578125, -0.05565071105957031, -0.049953460693359375, -0.04425621032714844, -0.0385589599609375, -0.03286170959472656, -0.027164459228515625, -0.021467208862304688, -0.01576995849609375, -0.010072708129882812, -0.004375457763671875, 0.0013217926025390625, 0.00701904296875, 0.012716293334960938, 0.018413543701171875, 0.024110794067382812, 0.02980804443359375, 0.03550529479980469, 0.041202545166015625, 0.04689979553222656, 0.0525970458984375, 0.05829429626464844, 0.06399154663085938, 0.06968879699707031, 0.07538604736328125, 0.08108329772949219, 0.08678054809570312, 0.09247779846191406, 0.098175048828125, 0.10387229919433594, 0.10956954956054688, 0.11526679992675781, 0.12096405029296875, 0.1266613006591797, 0.13235855102539062, 0.13805580139160156, 0.1437530517578125, 0.14945030212402344, 0.15514755249023438, 0.1608448028564453, 0.16654205322265625, 0.1722393035888672, 0.17793655395507812, 0.18363380432128906, 0.1893310546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 15.0, 59.0, 160.0, 326.0, 254.0, 104.0, 50.0, 24.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.431906223297119, -4.1932783126831055, -3.954650640487671, -3.7160229682922363, -3.4773950576782227, -3.238767385482788, -3.0001397132873535, -2.76151180267334, -2.5228841304779053, -2.2842564582824707, -2.045628547668457, -1.8070008754730225, -1.5683730840682983, -1.3297452926635742, -1.0911176204681396, -0.8524898290634155, -0.6138620376586914, -0.3752342760562897, -0.13660651445388794, 0.1020212173461914, 0.3406490087509155, 0.5792768001556396, 0.8179044723510742, 1.0565322637557983, 1.2951600551605225, 1.5337878465652466, 1.7724156379699707, 2.0110433101654053, 2.24967098236084, 2.4882988929748535, 2.726926565170288, 2.9655542373657227, 3.204181671142578, 3.4428093433380127, 3.6814372539520264, 3.920064926147461, 4.158692836761475, 4.397320747375488, 4.635948181152344, 4.874576091766357, 5.113204002380371, 5.351831912994385, 5.59045934677124, 5.829087257385254, 6.067715167999268, 6.306343078613281, 6.544970512390137, 6.78359842300415, 7.022225856781006, 7.2608537673950195, 7.499481201171875, 7.738109111785889, 7.976737022399902, 8.215364456176758, 8.45399284362793, 8.692620277404785, 8.93124771118164, 9.169875144958496, 9.408503532409668, 9.647130966186523, 9.885758399963379, 10.12438678741455, 10.363014221191406, 10.601641654968262, 10.840270042419434]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 16.0, 9.0, 11.0, 12.0, 24.0, 31.0, 43.0, 57.0, 46.0, 54.0, 67.0, 67.0, 55.0, 60.0, 48.0, 55.0, 47.0, 42.0, 57.0, 37.0, 26.0, 26.0, 17.0, 19.0, 14.0, 11.0, 11.0, 7.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5127581357955933, -1.460258960723877, -1.4077597856521606, -1.3552606105804443, -1.302761435508728, -1.2502622604370117, -1.197763204574585, -1.145263910293579, -1.0927648544311523, -1.040265679359436, -0.9877665042877197, -0.9352673292160034, -0.8827681541442871, -0.8302689790725708, -0.7777698636054993, -0.725270688533783, -0.6727714538574219, -0.6202722787857056, -0.5677731037139893, -0.515273928642273, -0.46277478337287903, -0.4102756083011627, -0.3577764630317688, -0.3052772879600525, -0.2527781128883362, -0.20027893781661987, -0.14777977764606476, -0.09528061747550964, -0.042781442403793335, 0.009717732667922974, 0.062216877937316895, 0.1147160530090332, 0.16721510887145996, 0.21971428394317627, 0.2722134590148926, 0.3247126042842865, 0.3772117793560028, 0.4297109544277191, 0.48221009969711304, 0.5347092747688293, 0.5872084498405457, 0.639707624912262, 0.6922067999839783, 0.7447059154510498, 0.7972050905227661, 0.8497042655944824, 0.9022034406661987, 0.954702615737915, 1.0072017908096313, 1.0597009658813477, 1.112200140953064, 1.1646993160247803, 1.2171984910964966, 1.269697666168213, 1.3221967220306396, 1.3746960163116455, 1.4271950721740723, 1.4796942472457886, 1.5321934223175049, 1.5846925973892212, 1.6371917724609375, 1.6896909475326538, 1.7421901226043701, 1.7946891784667969, 1.8471884727478027]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 6.0, 15.0, 13.0, 22.0, 24.0, 54.0, 70.0, 79.0, 121.0, 193.0, 275.0, 441.0, 710.0, 1224.0, 2177.0, 4329.0, 9928.0, 29971.0, 170070.0, 680147.0, 108899.0, 23101.0, 8164.0, 3674.0, 1913.0, 1071.0, 648.0, 357.0, 241.0, 197.0, 112.0, 82.0, 55.0, 31.0, 28.0, 28.0, 23.0, 13.0, 11.0, 9.0, 3.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.802734375, -0.7806777954101562, -0.7586212158203125, -0.7365646362304688, -0.714508056640625, -0.6924514770507812, -0.6703948974609375, -0.6483383178710938, -0.62628173828125, -0.6042251586914062, -0.5821685791015625, -0.5601119995117188, -0.538055419921875, -0.5159988403320312, -0.4939422607421875, -0.47188568115234375, -0.4498291015625, -0.42777252197265625, -0.4057159423828125, -0.38365936279296875, -0.361602783203125, -0.33954620361328125, -0.3174896240234375, -0.29543304443359375, -0.27337646484375, -0.25131988525390625, -0.2292633056640625, -0.20720672607421875, -0.185150146484375, -0.16309356689453125, -0.1410369873046875, -0.11898040771484375, -0.096923828125, -0.07486724853515625, -0.0528106689453125, -0.03075408935546875, -0.008697509765625, 0.01335906982421875, 0.0354156494140625, 0.05747222900390625, 0.07952880859375, 0.10158538818359375, 0.1236419677734375, 0.14569854736328125, 0.167755126953125, 0.18981170654296875, 0.2118682861328125, 0.23392486572265625, 0.2559814453125, 0.27803802490234375, 0.3000946044921875, 0.32215118408203125, 0.344207763671875, 0.36626434326171875, 0.3883209228515625, 0.41037750244140625, 0.43243408203125, 0.45449066162109375, 0.4765472412109375, 0.49860382080078125, 0.520660400390625, 0.5427169799804688, 0.5647735595703125, 0.5868301391601562, 0.60888671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 20.0, 20.0, 21.0, 44.0, 50.0, 66.0, 79.0, 86.0, 95.0, 107.0, 88.0, 78.0, 68.0, 44.0, 26.0, 19.0, 21.0, 9.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0706787109375, -0.06875371932983398, -0.06682872772216797, -0.06490373611450195, -0.06297874450683594, -0.06105375289916992, -0.059128761291503906, -0.05720376968383789, -0.055278778076171875, -0.05335378646850586, -0.051428794860839844, -0.04950380325317383, -0.04757881164550781, -0.0456538200378418, -0.04372882843017578, -0.041803836822509766, -0.03987884521484375, -0.037953853607177734, -0.03602886199951172, -0.0341038703918457, -0.03217887878417969, -0.030253887176513672, -0.028328895568847656, -0.02640390396118164, -0.024478912353515625, -0.02255392074584961, -0.020628929138183594, -0.018703937530517578, -0.016778945922851562, -0.014853954315185547, -0.012928962707519531, -0.011003971099853516, -0.0090789794921875, -0.007153987884521484, -0.005228996276855469, -0.003304004669189453, -0.0013790130615234375, 0.0005459785461425781, 0.0024709701538085938, 0.004395961761474609, 0.006320953369140625, 0.00824594497680664, 0.010170936584472656, 0.012095928192138672, 0.014020919799804688, 0.015945911407470703, 0.01787090301513672, 0.019795894622802734, 0.02172088623046875, 0.023645877838134766, 0.02557086944580078, 0.027495861053466797, 0.029420852661132812, 0.03134584426879883, 0.033270835876464844, 0.03519582748413086, 0.037120819091796875, 0.03904581069946289, 0.040970802307128906, 0.04289579391479492, 0.04482078552246094, 0.04674577713012695, 0.04867076873779297, 0.050595760345458984, 0.052520751953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 0.0, 8.0, 10.0, 6.0, 10.0, 15.0, 21.0, 34.0, 48.0, 47.0, 85.0, 117.0, 185.0, 338.0, 537.0, 971.0, 2105.0, 5476.0, 20586.0, 167761.0, 739844.0, 88627.0, 13708.0, 4220.0, 1683.0, 875.0, 455.0, 264.0, 175.0, 81.0, 83.0, 51.0, 33.0, 28.0, 20.0, 12.0, 12.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0087890625, -0.9744415283203125, -0.940093994140625, -0.9057464599609375, -0.87139892578125, -0.8370513916015625, -0.802703857421875, -0.7683563232421875, -0.7340087890625, -0.6996612548828125, -0.665313720703125, -0.6309661865234375, -0.59661865234375, -0.5622711181640625, -0.527923583984375, -0.4935760498046875, -0.459228515625, -0.4248809814453125, -0.390533447265625, -0.3561859130859375, -0.32183837890625, -0.2874908447265625, -0.253143310546875, -0.2187957763671875, -0.1844482421875, -0.1501007080078125, -0.115753173828125, -0.0814056396484375, -0.04705810546875, -0.0127105712890625, 0.021636962890625, 0.0559844970703125, 0.09033203125, 0.1246795654296875, 0.159027099609375, 0.1933746337890625, 0.22772216796875, 0.2620697021484375, 0.296417236328125, 0.3307647705078125, 0.3651123046875, 0.3994598388671875, 0.433807373046875, 0.4681549072265625, 0.50250244140625, 0.5368499755859375, 0.571197509765625, 0.6055450439453125, 0.639892578125, 0.6742401123046875, 0.708587646484375, 0.7429351806640625, 0.77728271484375, 0.8116302490234375, 0.845977783203125, 0.8803253173828125, 0.9146728515625, 0.9490203857421875, 0.983367919921875, 1.0177154541015625, 1.05206298828125, 1.0864105224609375, 1.120758056640625, 1.1551055908203125, 1.189453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 5.0, 5.0, 5.0, 9.0, 5.0, 15.0, 8.0, 11.0, 13.0, 21.0, 21.0, 23.0, 35.0, 25.0, 30.0, 19.0, 34.0, 42.0, 28.0, 43.0, 49.0, 42.0, 40.0, 41.0, 41.0, 33.0, 37.0, 26.0, 35.0, 32.0, 25.0, 31.0, 14.0, 22.0, 18.0, 13.0, 18.0, 15.0, 9.0, 10.0, 6.0, 11.0, 10.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.2391357421875, -0.23168373107910156, -0.22423171997070312, -0.2167797088623047, -0.20932769775390625, -0.2018756866455078, -0.19442367553710938, -0.18697166442871094, -0.1795196533203125, -0.17206764221191406, -0.16461563110351562, -0.1571636199951172, -0.14971160888671875, -0.1422595977783203, -0.13480758666992188, -0.12735557556152344, -0.119903564453125, -0.11245155334472656, -0.10499954223632812, -0.09754753112792969, -0.09009552001953125, -0.08264350891113281, -0.07519149780273438, -0.06773948669433594, -0.0602874755859375, -0.05283546447753906, -0.045383453369140625, -0.03793144226074219, -0.03047943115234375, -0.023027420043945312, -0.015575408935546875, -0.008123397827148438, -0.00067138671875, 0.0067806243896484375, 0.014232635498046875, 0.021684646606445312, 0.02913665771484375, 0.03658866882324219, 0.044040679931640625, 0.05149269104003906, 0.0589447021484375, 0.06639671325683594, 0.07384872436523438, 0.08130073547363281, 0.08875274658203125, 0.09620475769042969, 0.10365676879882812, 0.11110877990722656, 0.118560791015625, 0.12601280212402344, 0.13346481323242188, 0.1409168243408203, 0.14836883544921875, 0.1558208465576172, 0.16327285766601562, 0.17072486877441406, 0.1781768798828125, 0.18562889099121094, 0.19308090209960938, 0.2005329132080078, 0.20798492431640625, 0.2154369354248047, 0.22288894653320312, 0.23034095764160156, 0.23779296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 23.0, 14.0, 27.0, 56.0, 81.0, 180.0, 394.0, 952.0, 3808.0, 63288.0, 968521.0, 8546.0, 1610.0, 527.0, 234.0, 115.0, 61.0, 29.0, 28.0, 15.0, 10.0, 8.0, 8.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.2777099609375, -6.082763671875, -5.8878173828125, -5.69287109375, -5.4979248046875, -5.302978515625, -5.1080322265625, -4.9130859375, -4.7181396484375, -4.523193359375, -4.3282470703125, -4.13330078125, -3.9383544921875, -3.743408203125, -3.5484619140625, -3.353515625, -3.1585693359375, -2.963623046875, -2.7686767578125, -2.57373046875, -2.3787841796875, -2.183837890625, -1.9888916015625, -1.7939453125, -1.5989990234375, -1.404052734375, -1.2091064453125, -1.01416015625, -0.8192138671875, -0.624267578125, -0.4293212890625, -0.234375, -0.0394287109375, 0.155517578125, 0.3504638671875, 0.54541015625, 0.7403564453125, 0.935302734375, 1.1302490234375, 1.3251953125, 1.5201416015625, 1.715087890625, 1.9100341796875, 2.10498046875, 2.2999267578125, 2.494873046875, 2.6898193359375, 2.884765625, 3.0797119140625, 3.274658203125, 3.4696044921875, 3.66455078125, 3.8594970703125, 4.054443359375, 4.2493896484375, 4.4443359375, 4.6392822265625, 4.834228515625, 5.0291748046875, 5.22412109375, 5.4190673828125, 5.614013671875, 5.8089599609375, 6.00390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 2.0, 12.0, 6.0, 4.0, 16.0, 12.0, 15.0, 17.0, 24.0, 42.0, 48.0, 73.0, 139.0, 190.0, 115.0, 58.0, 41.0, 30.0, 30.0, 27.0, 16.0, 15.0, 11.0, 8.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.000701904296875, -0.0006814450025558472, -0.0006609857082366943, -0.0006405264139175415, -0.0006200671195983887, -0.0005996078252792358, -0.000579148530960083, -0.0005586892366409302, -0.0005382299423217773, -0.0005177706480026245, -0.0004973113536834717, -0.00047685205936431885, -0.000456392765045166, -0.0004359334707260132, -0.00041547417640686035, -0.0003950148820877075, -0.0003745555877685547, -0.00035409629344940186, -0.000333636999130249, -0.0003131777048110962, -0.00029271841049194336, -0.00027225911617279053, -0.0002517998218536377, -0.00023134052753448486, -0.00021088123321533203, -0.0001904219388961792, -0.00016996264457702637, -0.00014950335025787354, -0.0001290440559387207, -0.00010858476161956787, -8.812546730041504e-05, -6.766617298126221e-05, -4.7206878662109375e-05, -2.6747584342956543e-05, -6.288290023803711e-06, 1.4171004295349121e-05, 3.463029861450195e-05, 5.5089592933654785e-05, 7.554888725280762e-05, 9.600818157196045e-05, 0.00011646747589111328, 0.0001369267702102661, 0.00015738606452941895, 0.00017784535884857178, 0.0001983046531677246, 0.00021876394748687744, 0.00023922324180603027, 0.0002596825361251831, 0.00028014183044433594, 0.00030060112476348877, 0.0003210604190826416, 0.00034151971340179443, 0.00036197900772094727, 0.0003824383020401001, 0.00040289759635925293, 0.00042335689067840576, 0.0004438161849975586, 0.0004642754793167114, 0.00048473477363586426, 0.0005051940679550171, 0.0005256533622741699, 0.0005461126565933228, 0.0005665719509124756, 0.0005870312452316284, 0.0006074905395507812]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 6.0, 11.0, 15.0, 13.0, 17.0, 32.0, 31.0, 49.0, 53.0, 78.0, 125.0, 182.0, 282.0, 445.0, 804.0, 1377.0, 3028.0, 8091.0, 34165.0, 791428.0, 178050.0, 19378.0, 5666.0, 2339.0, 1143.0, 582.0, 356.0, 233.0, 165.0, 113.0, 80.0, 62.0, 32.0, 25.0, 22.0, 12.0, 14.0, 10.0, 16.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.048828125, -2.953033447265625, -2.85723876953125, -2.761444091796875, -2.6656494140625, -2.569854736328125, -2.47406005859375, -2.378265380859375, -2.282470703125, -2.186676025390625, -2.09088134765625, -1.995086669921875, -1.8992919921875, -1.803497314453125, -1.70770263671875, -1.611907958984375, -1.51611328125, -1.420318603515625, -1.32452392578125, -1.228729248046875, -1.1329345703125, -1.037139892578125, -0.94134521484375, -0.845550537109375, -0.749755859375, -0.653961181640625, -0.55816650390625, -0.462371826171875, -0.3665771484375, -0.270782470703125, -0.17498779296875, -0.079193115234375, 0.0166015625, 0.112396240234375, 0.20819091796875, 0.303985595703125, 0.3997802734375, 0.495574951171875, 0.59136962890625, 0.687164306640625, 0.782958984375, 0.878753662109375, 0.97454833984375, 1.070343017578125, 1.1661376953125, 1.261932373046875, 1.35772705078125, 1.453521728515625, 1.54931640625, 1.645111083984375, 1.74090576171875, 1.836700439453125, 1.9324951171875, 2.028289794921875, 2.12408447265625, 2.219879150390625, 2.315673828125, 2.411468505859375, 2.50726318359375, 2.603057861328125, 2.6988525390625, 2.794647216796875, 2.89044189453125, 2.986236572265625, 3.08203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 7.0, 2.0, 14.0, 7.0, 15.0, 13.0, 25.0, 24.0, 42.0, 54.0, 85.0, 189.0, 177.0, 97.0, 67.0, 35.0, 24.0, 29.0, 18.0, 10.0, 12.0, 11.0, 3.0, 9.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0458984375, -1.0160903930664062, -0.9862823486328125, -0.9564743041992188, -0.926666259765625, -0.8968582153320312, -0.8670501708984375, -0.8372421264648438, -0.80743408203125, -0.7776260375976562, -0.7478179931640625, -0.7180099487304688, -0.688201904296875, -0.6583938598632812, -0.6285858154296875, -0.5987777709960938, -0.5689697265625, -0.5391616821289062, -0.5093536376953125, -0.47954559326171875, -0.449737548828125, -0.41992950439453125, -0.3901214599609375, -0.36031341552734375, -0.33050537109375, -0.30069732666015625, -0.2708892822265625, -0.24108123779296875, -0.211273193359375, -0.18146514892578125, -0.1516571044921875, -0.12184906005859375, -0.092041015625, -0.06223297119140625, -0.0324249267578125, -0.00261688232421875, 0.027191162109375, 0.05699920654296875, 0.0868072509765625, 0.11661529541015625, 0.14642333984375, 0.17623138427734375, 0.2060394287109375, 0.23584747314453125, 0.265655517578125, 0.29546356201171875, 0.3252716064453125, 0.35507965087890625, 0.3848876953125, 0.41469573974609375, 0.4445037841796875, 0.47431182861328125, 0.504119873046875, 0.5339279174804688, 0.5637359619140625, 0.5935440063476562, 0.62335205078125, 0.6531600952148438, 0.6829681396484375, 0.7127761840820312, 0.742584228515625, 0.7723922729492188, 0.8022003173828125, 0.8320083618164062, 0.86181640625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 14.0, 21.0, 49.0, 116.0, 256.0, 320.0, 127.0, 61.0, 25.0, 10.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.086206436157227, -9.68289852142334, -9.27959156036377, -8.876283645629883, -8.472975730895996, -8.069668769836426, -7.666360855102539, -7.2630534172058105, -6.859745979309082, -6.4564385414123535, -6.053130626678467, -5.649823188781738, -5.24651575088501, -4.843208312988281, -4.4399003982543945, -4.036592960357666, -3.6332850456237793, -3.2299773693084717, -2.826669931411743, -2.4233622550964355, -2.020054817199707, -1.6167471408843994, -1.2134394645690918, -0.8101320266723633, -0.40682435035705566, -0.00351676344871521, 0.39979082345962524, 0.8030984401702881, 1.2064059972763062, 1.6097135543823242, 2.013021230697632, 2.4163286685943604, 2.819636344909668, 3.2229440212249756, 3.626251459121704, 4.029559135437012, 4.43286657333374, 4.836174011230469, 5.2394819259643555, 5.642789363861084, 6.0460968017578125, 6.449404239654541, 6.852712154388428, 7.256019592285156, 7.659327030181885, 8.062634468078613, 8.4659423828125, 8.86924934387207, 9.272558212280273, 9.67586612701416, 10.07917308807373, 10.482481002807617, 10.885788917541504, 11.289095878601074, 11.692403793334961, 12.095710754394531, 12.499018669128418, 12.902326583862305, 13.305633544921875, 13.708941459655762, 14.112249374389648, 14.515556335449219, 14.918864250183105, 15.322172164916992, 15.725479125976562]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 9.0, 28.0, 36.0, 49.0, 89.0, 93.0, 118.0, 123.0, 97.0, 106.0, 71.0, 43.0, 22.0, 29.0, 15.0, 10.0, 8.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.885300636291504, -4.714145660400391, -4.5429911613464355, -4.371836185455322, -4.200681209564209, -4.029526233673096, -3.8583717346191406, -3.6872167587280273, -3.516061782836914, -3.34490704536438, -3.1737520694732666, -3.0025973320007324, -2.831442356109619, -2.660287618637085, -2.489132881164551, -2.3179779052734375, -2.1468231678009033, -1.9756683111190796, -1.8045134544372559, -1.6333587169647217, -1.4622037410736084, -1.2910490036010742, -1.1198941469192505, -0.9487392902374268, -0.777584433555603, -0.6064295768737793, -0.43527474999427795, -0.2641199231147766, -0.09296506643295288, 0.07818979024887085, 0.2493445873260498, 0.42049944400787354, 0.5916543006896973, 0.762809157371521, 0.9339640140533447, 1.105118751525879, 1.2762737274169922, 1.4474284648895264, 1.61858332157135, 1.7897381782531738, 1.9608930349349976, 2.1320478916168213, 2.3032026290893555, 2.4743576049804688, 2.645512342453003, 2.816667318344116, 2.9878220558166504, 3.1589770317077637, 3.330131769180298, 3.501286506652832, 3.6724414825439453, 3.8435962200164795, 4.014750957489014, 4.185905933380127, 4.35706090927124, 4.528215408325195, 4.699370384216309, 4.870525360107422, 5.041679859161377, 5.21283483505249, 5.3839898109436035, 5.555144786834717, 5.726299285888672, 5.897454261779785, 6.068609237670898]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 18.0, 27.0, 36.0, 122.0, 493.0, 8569.0, 4177163.0, 7429.0, 281.0, 57.0, 26.0, 13.0, 14.0, 4.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.734375, -23.234619140625, -22.73486328125, -22.235107421875, -21.7353515625, -21.235595703125, -20.73583984375, -20.236083984375, -19.736328125, -19.236572265625, -18.73681640625, -18.237060546875, -17.7373046875, -17.237548828125, -16.73779296875, -16.238037109375, -15.73828125, -15.238525390625, -14.73876953125, -14.239013671875, -13.7392578125, -13.239501953125, -12.73974609375, -12.239990234375, -11.740234375, -11.240478515625, -10.74072265625, -10.240966796875, -9.7412109375, -9.241455078125, -8.74169921875, -8.241943359375, -7.7421875, -7.242431640625, -6.74267578125, -6.242919921875, -5.7431640625, -5.243408203125, -4.74365234375, -4.243896484375, -3.744140625, -3.244384765625, -2.74462890625, -2.244873046875, -1.7451171875, -1.245361328125, -0.74560546875, -0.245849609375, 0.25390625, 0.753662109375, 1.25341796875, 1.753173828125, 2.2529296875, 2.752685546875, 3.25244140625, 3.752197265625, 4.251953125, 4.751708984375, 5.25146484375, 5.751220703125, 6.2509765625, 6.750732421875, 7.25048828125, 7.750244140625, 8.25]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 8.0, 6.0, 20.0, 26.0, 31.0, 39.0, 59.0, 59.0, 75.0, 84.0, 94.0, 90.0, 92.0, 69.0, 59.0, 51.0, 32.0, 27.0, 15.0, 17.0, 9.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06982421875, -0.06776952743530273, -0.06571483612060547, -0.0636601448059082, -0.06160545349121094, -0.05955076217651367, -0.057496070861816406, -0.05544137954711914, -0.053386688232421875, -0.05133199691772461, -0.049277305603027344, -0.04722261428833008, -0.04516792297363281, -0.04311323165893555, -0.04105854034423828, -0.039003849029541016, -0.03694915771484375, -0.034894466400146484, -0.03283977508544922, -0.030785083770751953, -0.028730392456054688, -0.026675701141357422, -0.024621009826660156, -0.02256631851196289, -0.020511627197265625, -0.01845693588256836, -0.016402244567871094, -0.014347553253173828, -0.012292861938476562, -0.010238170623779297, -0.008183479309082031, -0.006128787994384766, -0.0040740966796875, -0.0020194053649902344, 3.528594970703125e-05, 0.002089977264404297, 0.0041446685791015625, 0.006199359893798828, 0.008254051208496094, 0.01030874252319336, 0.012363433837890625, 0.01441812515258789, 0.016472816467285156, 0.018527507781982422, 0.020582199096679688, 0.022636890411376953, 0.02469158172607422, 0.026746273040771484, 0.02880096435546875, 0.030855655670166016, 0.03291034698486328, 0.03496503829956055, 0.03701972961425781, 0.03907442092895508, 0.041129112243652344, 0.04318380355834961, 0.045238494873046875, 0.04729318618774414, 0.049347877502441406, 0.05140256881713867, 0.05345726013183594, 0.0555119514465332, 0.05756664276123047, 0.059621334075927734, 0.061676025390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 14.0, 16.0, 24.0, 37.0, 92.0, 139.0, 327.0, 739.0, 2096.0, 7842.0, 40602.0, 474716.0, 3550703.0, 96640.0, 14585.0, 3471.0, 1137.0, 488.0, 230.0, 137.0, 97.0, 42.0, 32.0, 16.0, 15.0, 16.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.142578125, -3.05072021484375, -2.9588623046875, -2.86700439453125, -2.775146484375, -2.68328857421875, -2.5914306640625, -2.49957275390625, -2.40771484375, -2.31585693359375, -2.2239990234375, -2.13214111328125, -2.040283203125, -1.94842529296875, -1.8565673828125, -1.76470947265625, -1.6728515625, -1.58099365234375, -1.4891357421875, -1.39727783203125, -1.305419921875, -1.21356201171875, -1.1217041015625, -1.02984619140625, -0.93798828125, -0.84613037109375, -0.7542724609375, -0.66241455078125, -0.570556640625, -0.47869873046875, -0.3868408203125, -0.29498291015625, -0.203125, -0.11126708984375, -0.0194091796875, 0.07244873046875, 0.164306640625, 0.25616455078125, 0.3480224609375, 0.43988037109375, 0.53173828125, 0.62359619140625, 0.7154541015625, 0.80731201171875, 0.899169921875, 0.99102783203125, 1.0828857421875, 1.17474365234375, 1.2666015625, 1.35845947265625, 1.4503173828125, 1.54217529296875, 1.634033203125, 1.72589111328125, 1.8177490234375, 1.90960693359375, 2.00146484375, 2.09332275390625, 2.1851806640625, 2.27703857421875, 2.368896484375, 2.46075439453125, 2.5526123046875, 2.64447021484375, 2.736328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 6.0, 1.0, 8.0, 8.0, 8.0, 14.0, 12.0, 10.0, 14.0, 22.0, 35.0, 37.0, 57.0, 80.0, 121.0, 161.0, 428.0, 1493.0, 716.0, 272.0, 171.0, 110.0, 72.0, 66.0, 28.0, 39.0, 17.0, 13.0, 17.0, 14.0, 6.0, 8.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2154541015625, -0.20940017700195312, -0.20334625244140625, -0.19729232788085938, -0.1912384033203125, -0.18518447875976562, -0.17913055419921875, -0.17307662963867188, -0.167022705078125, -0.16096878051757812, -0.15491485595703125, -0.14886093139648438, -0.1428070068359375, -0.13675308227539062, -0.13069915771484375, -0.12464523315429688, -0.11859130859375, -0.11253738403320312, -0.10648345947265625, -0.10042953491210938, -0.0943756103515625, -0.08832168579101562, -0.08226776123046875, -0.07621383666992188, -0.070159912109375, -0.06410598754882812, -0.05805206298828125, -0.051998138427734375, -0.0459442138671875, -0.039890289306640625, -0.03383636474609375, -0.027782440185546875, -0.021728515625, -0.015674591064453125, -0.00962066650390625, -0.003566741943359375, 0.0024871826171875, 0.008541107177734375, 0.01459503173828125, 0.020648956298828125, 0.026702880859375, 0.032756805419921875, 0.03881072998046875, 0.044864654541015625, 0.0509185791015625, 0.056972503662109375, 0.06302642822265625, 0.06908035278320312, 0.07513427734375, 0.08118820190429688, 0.08724212646484375, 0.09329605102539062, 0.0993499755859375, 0.10540390014648438, 0.11145782470703125, 0.11751174926757812, 0.123565673828125, 0.12961959838867188, 0.13567352294921875, 0.14172744750976562, 0.1477813720703125, 0.15383529663085938, 0.15988922119140625, 0.16594314575195312, 0.1719970703125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 11.0, 42.0, 276.0, 547.0, 111.0, 15.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.924245834350586, -6.611834526062012, -6.2994232177734375, -5.9870123863220215, -5.674601078033447, -5.362189769744873, -5.049778938293457, -4.737367630004883, -4.424956321716309, -4.112545013427734, -3.8001339435577393, -3.487722873687744, -3.17531156539917, -2.8629002571105957, -2.5504891872406006, -2.2380781173706055, -1.9256668090820312, -1.6132556200027466, -1.300844430923462, -0.9884332418441772, -0.6760220527648926, -0.3636108636856079, -0.05119967460632324, 0.2612113952636719, 0.5736227035522461, 0.8860338926315308, 1.1984450817108154, 1.5108562707901, 1.8232674598693848, 2.135678768157959, 2.448089838027954, 2.760500907897949, 3.0729122161865234, 3.3853235244750977, 3.6977345943450928, 4.010145664215088, 4.322556972503662, 4.634968280792236, 4.947379112243652, 5.259790420532227, 5.572201728820801, 5.884613037109375, 6.197024345397949, 6.509435176849365, 6.8218464851379395, 7.134257793426514, 7.44666862487793, 7.759079933166504, 8.071491241455078, 8.383902549743652, 8.696313858032227, 9.0087251663208, 9.321136474609375, 9.633546829223633, 9.945958137512207, 10.258369445800781, 10.570780754089355, 10.88319206237793, 11.195603370666504, 11.508014678955078, 11.820425033569336, 12.13283634185791, 12.445247650146484, 12.757658958435059, 13.070070266723633]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 13.0, 16.0, 29.0, 45.0, 69.0, 87.0, 97.0, 95.0, 116.0, 104.0, 90.0, 66.0, 62.0, 30.0, 29.0, 11.0, 15.0, 3.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.533045768737793, -1.4771573543548584, -1.4212690591812134, -1.3653806447982788, -1.3094923496246338, -1.2536039352416992, -1.1977155208587646, -1.14182710647583, -1.085938811302185, -1.0300503969192505, -0.9741621017456055, -0.9182736873626709, -0.8623853325843811, -0.8064969778060913, -0.7506085634231567, -0.6947202086448669, -0.6388318538665771, -0.5829434990882874, -0.5270551443099976, -0.471166729927063, -0.4152783751487732, -0.3593900203704834, -0.3035016357898712, -0.24761325120925903, -0.19172489643096924, -0.13583652675151825, -0.07994815707206726, -0.024059787392616272, 0.03182858228683472, 0.08771693706512451, 0.1436053216457367, 0.19949370622634888, 0.25538206100463867, 0.31127041578292847, 0.36715880036354065, 0.42304718494415283, 0.4789355397224426, 0.5348238945007324, 0.590712308883667, 0.6466006636619568, 0.7024890184402466, 0.7583773732185364, 0.8142657279968262, 0.8701541423797607, 0.9260424971580505, 0.9819308519363403, 1.037819266319275, 1.09370756149292, 1.1495959758758545, 1.205484390258789, 1.261372685432434, 1.3172610998153687, 1.3731493949890137, 1.4290378093719482, 1.4849262237548828, 1.5408146381378174, 1.5967029333114624, 1.652591347694397, 1.708479642868042, 1.7643680572509766, 1.8202564716339111, 1.8761447668075562, 1.9320331811904907, 1.9879214763641357, 2.0438098907470703]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 4.0, 5.0, 5.0, 11.0, 10.0, 25.0, 25.0, 52.0, 69.0, 150.0, 299.0, 907.0, 3223.0, 17463.0, 344660.0, 650381.0, 25542.0, 3887.0, 1085.0, 367.0, 158.0, 82.0, 36.0, 33.0, 16.0, 11.0, 14.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.35546875, -3.25701904296875, -3.1585693359375, -3.06011962890625, -2.961669921875, -2.86322021484375, -2.7647705078125, -2.66632080078125, -2.56787109375, -2.46942138671875, -2.3709716796875, -2.27252197265625, -2.174072265625, -2.07562255859375, -1.9771728515625, -1.87872314453125, -1.7802734375, -1.68182373046875, -1.5833740234375, -1.48492431640625, -1.386474609375, -1.28802490234375, -1.1895751953125, -1.09112548828125, -0.99267578125, -0.89422607421875, -0.7957763671875, -0.69732666015625, -0.598876953125, -0.50042724609375, -0.4019775390625, -0.30352783203125, -0.205078125, -0.10662841796875, -0.0081787109375, 0.09027099609375, 0.188720703125, 0.28717041015625, 0.3856201171875, 0.48406982421875, 0.58251953125, 0.68096923828125, 0.7794189453125, 0.87786865234375, 0.976318359375, 1.07476806640625, 1.1732177734375, 1.27166748046875, 1.3701171875, 1.46856689453125, 1.5670166015625, 1.66546630859375, 1.763916015625, 1.86236572265625, 1.9608154296875, 2.05926513671875, 2.15771484375, 2.25616455078125, 2.3546142578125, 2.45306396484375, 2.551513671875, 2.64996337890625, 2.7484130859375, 2.84686279296875, 2.9453125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 6.0, 14.0, 35.0, 67.0, 103.0, 153.0, 171.0, 157.0, 135.0, 68.0, 36.0, 27.0, 12.0, 5.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.06515979766845703, -0.06043434143066406, -0.055708885192871094, -0.050983428955078125, -0.046257972717285156, -0.04153251647949219, -0.03680706024169922, -0.03208160400390625, -0.02735614776611328, -0.022630691528320312, -0.017905235290527344, -0.013179779052734375, -0.008454322814941406, -0.0037288665771484375, 0.0009965896606445312, 0.0057220458984375, 0.010447502136230469, 0.015172958374023438, 0.019898414611816406, 0.024623870849609375, 0.029349327087402344, 0.03407478332519531, 0.03880023956298828, 0.04352569580078125, 0.04825115203857422, 0.05297660827636719, 0.057702064514160156, 0.062427520751953125, 0.0671529769897461, 0.07187843322753906, 0.07660388946533203, 0.081329345703125, 0.08605480194091797, 0.09078025817871094, 0.0955057144165039, 0.10023117065429688, 0.10495662689208984, 0.10968208312988281, 0.11440753936767578, 0.11913299560546875, 0.12385845184326172, 0.1285839080810547, 0.13330936431884766, 0.13803482055664062, 0.1427602767944336, 0.14748573303222656, 0.15221118927001953, 0.1569366455078125, 0.16166210174560547, 0.16638755798339844, 0.1711130142211914, 0.17583847045898438, 0.18056392669677734, 0.1852893829345703, 0.19001483917236328, 0.19474029541015625, 0.19946575164794922, 0.2041912078857422, 0.20891666412353516, 0.21364212036132812, 0.2183675765991211, 0.22309303283691406, 0.22781848907470703, 0.2325439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 7.0, 2.0, 4.0, 7.0, 2.0, 4.0, 8.0, 12.0, 8.0, 11.0, 17.0, 24.0, 18.0, 25.0, 39.0, 109.0, 505.0, 5170.0, 628767.0, 408917.0, 4182.0, 456.0, 66.0, 38.0, 29.0, 20.0, 15.0, 9.0, 13.0, 12.0, 11.0, 5.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-4.66015625, -4.53057861328125, -4.4010009765625, -4.27142333984375, -4.141845703125, -4.01226806640625, -3.8826904296875, -3.75311279296875, -3.62353515625, -3.49395751953125, -3.3643798828125, -3.23480224609375, -3.105224609375, -2.97564697265625, -2.8460693359375, -2.71649169921875, -2.5869140625, -2.45733642578125, -2.3277587890625, -2.19818115234375, -2.068603515625, -1.93902587890625, -1.8094482421875, -1.67987060546875, -1.55029296875, -1.42071533203125, -1.2911376953125, -1.16156005859375, -1.031982421875, -0.90240478515625, -0.7728271484375, -0.64324951171875, -0.513671875, -0.38409423828125, -0.2545166015625, -0.12493896484375, 0.004638671875, 0.13421630859375, 0.2637939453125, 0.39337158203125, 0.52294921875, 0.65252685546875, 0.7821044921875, 0.91168212890625, 1.041259765625, 1.17083740234375, 1.3004150390625, 1.42999267578125, 1.5595703125, 1.68914794921875, 1.8187255859375, 1.94830322265625, 2.077880859375, 2.20745849609375, 2.3370361328125, 2.46661376953125, 2.59619140625, 2.72576904296875, 2.8553466796875, 2.98492431640625, 3.114501953125, 3.24407958984375, 3.3736572265625, 3.50323486328125, 3.6328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 9.0, 3.0, 12.0, 17.0, 7.0, 14.0, 22.0, 22.0, 28.0, 38.0, 36.0, 39.0, 51.0, 66.0, 43.0, 54.0, 51.0, 52.0, 50.0, 60.0, 44.0, 45.0, 38.0, 31.0, 35.0, 26.0, 11.0, 22.0, 19.0, 9.0, 12.0, 5.0, 9.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.313720703125, -0.3027229309082031, -0.29172515869140625, -0.2807273864746094, -0.2697296142578125, -0.2587318420410156, -0.24773406982421875, -0.23673629760742188, -0.225738525390625, -0.21474075317382812, -0.20374298095703125, -0.19274520874023438, -0.1817474365234375, -0.17074966430664062, -0.15975189208984375, -0.14875411987304688, -0.13775634765625, -0.12675857543945312, -0.11576080322265625, -0.10476303100585938, -0.0937652587890625, -0.08276748657226562, -0.07176971435546875, -0.060771942138671875, -0.049774169921875, -0.038776397705078125, -0.02777862548828125, -0.016780853271484375, -0.0057830810546875, 0.005214691162109375, 0.01621246337890625, 0.027210235595703125, 0.0382080078125, 0.049205780029296875, 0.06020355224609375, 0.07120132446289062, 0.0821990966796875, 0.09319686889648438, 0.10419464111328125, 0.11519241333007812, 0.126190185546875, 0.13718795776367188, 0.14818572998046875, 0.15918350219726562, 0.1701812744140625, 0.18117904663085938, 0.19217681884765625, 0.20317459106445312, 0.21417236328125, 0.22517013549804688, 0.23616790771484375, 0.24716567993164062, 0.2581634521484375, 0.2691612243652344, 0.28015899658203125, 0.2911567687988281, 0.302154541015625, 0.3131523132324219, 0.32415008544921875, 0.3351478576660156, 0.3461456298828125, 0.3571434020996094, 0.36814117431640625, 0.3791389465332031, 0.39013671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 2.0, 7.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 7.0, 7.0, 11.0, 11.0, 18.0, 31.0, 79.0, 346.0, 3258.0, 1012672.0, 30883.0, 907.0, 139.0, 40.0, 26.0, 12.0, 18.0, 11.0, 7.0, 6.0, 11.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.09375, -12.6044921875, -12.115234375, -11.6259765625, -11.13671875, -10.6474609375, -10.158203125, -9.6689453125, -9.1796875, -8.6904296875, -8.201171875, -7.7119140625, -7.22265625, -6.7333984375, -6.244140625, -5.7548828125, -5.265625, -4.7763671875, -4.287109375, -3.7978515625, -3.30859375, -2.8193359375, -2.330078125, -1.8408203125, -1.3515625, -0.8623046875, -0.373046875, 0.1162109375, 0.60546875, 1.0947265625, 1.583984375, 2.0732421875, 2.5625, 3.0517578125, 3.541015625, 4.0302734375, 4.51953125, 5.0087890625, 5.498046875, 5.9873046875, 6.4765625, 6.9658203125, 7.455078125, 7.9443359375, 8.43359375, 8.9228515625, 9.412109375, 9.9013671875, 10.390625, 10.8798828125, 11.369140625, 11.8583984375, 12.34765625, 12.8369140625, 13.326171875, 13.8154296875, 14.3046875, 14.7939453125, 15.283203125, 15.7724609375, 16.26171875, 16.7509765625, 17.240234375, 17.7294921875, 18.21875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 5.0, 5.0, 5.0, 9.0, 6.0, 7.0, 9.0, 13.0, 46.0, 275.0, 439.0, 82.0, 22.0, 9.0, 4.0, 3.0, 11.0, 7.0, 9.0, 1.0, 6.0, 2.0, 3.0, 1.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022125244140625, -0.0021167993545532227, -0.0020210742950439453, -0.001925349235534668, -0.0018296241760253906, -0.0017338991165161133, -0.001638174057006836, -0.0015424489974975586, -0.0014467239379882812, -0.001350998878479004, -0.0012552738189697266, -0.0011595487594604492, -0.0010638236999511719, -0.0009680986404418945, -0.0008723735809326172, -0.0007766485214233398, -0.0006809234619140625, -0.0005851984024047852, -0.0004894733428955078, -0.00039374828338623047, -0.0002980232238769531, -0.00020229816436767578, -0.00010657310485839844, -1.0848045349121094e-05, 8.487701416015625e-05, 0.0001806020736694336, 0.00027632713317871094, 0.0003720521926879883, 0.0004677772521972656, 0.000563502311706543, 0.0006592273712158203, 0.0007549524307250977, 0.000850677490234375, 0.0009464025497436523, 0.0010421276092529297, 0.001137852668762207, 0.0012335777282714844, 0.0013293027877807617, 0.001425027847290039, 0.0015207529067993164, 0.0016164779663085938, 0.001712203025817871, 0.0018079280853271484, 0.0019036531448364258, 0.001999378204345703, 0.0020951032638549805, 0.002190828323364258, 0.002286553382873535, 0.0023822784423828125, 0.00247800350189209, 0.002573728561401367, 0.0026694536209106445, 0.002765178680419922, 0.0028609037399291992, 0.0029566287994384766, 0.003052353858947754, 0.0031480789184570312, 0.0032438039779663086, 0.003339529037475586, 0.0034352540969848633, 0.0035309791564941406, 0.003626704216003418, 0.0037224292755126953, 0.0038181543350219727, 0.00391387939453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 2.0, 9.0, 9.0, 5.0, 13.0, 22.0, 21.0, 54.0, 52.0, 75.0, 126.0, 201.0, 266.0, 410.0, 733.0, 1268.0, 2222.0, 4205.0, 8595.0, 21763.0, 95944.0, 795824.0, 78667.0, 20337.0, 8253.0, 3928.0, 2159.0, 1159.0, 722.0, 480.0, 301.0, 219.0, 154.0, 105.0, 63.0, 48.0, 37.0, 25.0, 26.0, 14.0, 6.0, 11.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.499481201171875, -3.37200927734375, -3.244537353515625, -3.1170654296875, -2.989593505859375, -2.86212158203125, -2.734649658203125, -2.607177734375, -2.479705810546875, -2.35223388671875, -2.224761962890625, -2.0972900390625, -1.969818115234375, -1.84234619140625, -1.714874267578125, -1.58740234375, -1.459930419921875, -1.33245849609375, -1.204986572265625, -1.0775146484375, -0.950042724609375, -0.82257080078125, -0.695098876953125, -0.567626953125, -0.440155029296875, -0.31268310546875, -0.185211181640625, -0.0577392578125, 0.069732666015625, 0.19720458984375, 0.324676513671875, 0.4521484375, 0.579620361328125, 0.70709228515625, 0.834564208984375, 0.9620361328125, 1.089508056640625, 1.21697998046875, 1.344451904296875, 1.471923828125, 1.599395751953125, 1.72686767578125, 1.854339599609375, 1.9818115234375, 2.109283447265625, 2.23675537109375, 2.364227294921875, 2.49169921875, 2.619171142578125, 2.74664306640625, 2.874114990234375, 3.0015869140625, 3.129058837890625, 3.25653076171875, 3.384002685546875, 3.511474609375, 3.638946533203125, 3.76641845703125, 3.893890380859375, 4.0213623046875, 4.148834228515625, 4.27630615234375, 4.403778076171875, 4.53125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 4.0, 10.0, 16.0, 28.0, 30.0, 103.0, 190.0, 263.0, 158.0, 44.0, 32.0, 20.0, 18.0, 13.0, 9.0, 5.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.640625, -1.57037353515625, -1.5001220703125, -1.42987060546875, -1.359619140625, -1.28936767578125, -1.2191162109375, -1.14886474609375, -1.07861328125, -1.00836181640625, -0.9381103515625, -0.86785888671875, -0.797607421875, -0.72735595703125, -0.6571044921875, -0.58685302734375, -0.5166015625, -0.44635009765625, -0.3760986328125, -0.30584716796875, -0.235595703125, -0.16534423828125, -0.0950927734375, -0.02484130859375, 0.04541015625, 0.11566162109375, 0.1859130859375, 0.25616455078125, 0.326416015625, 0.39666748046875, 0.4669189453125, 0.53717041015625, 0.607421875, 0.67767333984375, 0.7479248046875, 0.81817626953125, 0.888427734375, 0.95867919921875, 1.0289306640625, 1.09918212890625, 1.16943359375, 1.23968505859375, 1.3099365234375, 1.38018798828125, 1.450439453125, 1.52069091796875, 1.5909423828125, 1.66119384765625, 1.7314453125, 1.80169677734375, 1.8719482421875, 1.94219970703125, 2.012451171875, 2.08270263671875, 2.1529541015625, 2.22320556640625, 2.29345703125, 2.36370849609375, 2.4339599609375, 2.50421142578125, 2.574462890625, 2.64471435546875, 2.7149658203125, 2.78521728515625, 2.85546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 13.0, 18.0, 30.0, 61.0, 109.0, 160.0, 235.0, 160.0, 104.0, 54.0, 22.0, 12.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.40109634399414, -13.04529094696045, -12.689485549926758, -12.333680152893066, -11.977874755859375, -11.6220703125, -11.266263961791992, -10.910459518432617, -10.554654121398926, -10.198848724365234, -9.843043327331543, -9.487237930297852, -9.13143253326416, -8.775627136230469, -8.419822692871094, -8.064017295837402, -7.708211421966553, -7.352406024932861, -6.99660062789917, -6.640795707702637, -6.284990310668945, -5.929184913635254, -5.5733795166015625, -5.217574119567871, -4.86176872253418, -4.505963325500488, -4.150157928466797, -3.7943527698516846, -3.4385476112365723, -3.082742214202881, -2.7269368171691895, -2.371131658554077, -2.015326499938965, -1.659521222114563, -1.3037159442901611, -0.9479105472564697, -0.5921052694320679, -0.23629999160766602, 0.11950540542602539, 0.4753105640411377, 0.8311159610748291, 1.186921238899231, 1.5427265167236328, 1.8985319137573242, 2.2543373107910156, 2.610142469406128, 2.9659478664398193, 3.3217530250549316, 3.677558422088623, 4.0333638191223145, 4.389169216156006, 4.744974136352539, 5.1007795333862305, 5.456584930419922, 5.812390327453613, 6.168195724487305, 6.524001121520996, 6.8798065185546875, 7.235611915588379, 7.59141731262207, 7.9472222328186035, 8.303028106689453, 8.658832550048828, 9.01463794708252, 9.370443344116211]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 5.0, 8.0, 13.0, 9.0, 13.0, 12.0, 16.0, 17.0, 19.0, 23.0, 30.0, 39.0, 26.0, 46.0, 46.0, 44.0, 47.0, 40.0, 50.0, 48.0, 44.0, 45.0, 48.0, 39.0, 35.0, 34.0, 27.0, 29.0, 34.0, 19.0, 16.0, 17.0, 8.0, 21.0, 11.0, 4.0, 9.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.948370933532715, -2.8556225299835205, -2.7628743648529053, -2.670125961303711, -2.5773775577545166, -2.4846293926239014, -2.391880989074707, -2.299132823944092, -2.2063844203948975, -2.113636016845703, -2.020887851715088, -1.9281394481658936, -1.8353911638259888, -1.742642879486084, -1.6498944759368896, -1.5571461915969849, -1.4643977880477905, -1.3716495037078857, -1.2789011001586914, -1.1861528158187866, -1.0934045314788818, -1.0006561279296875, -0.9079078435897827, -0.8151595592498779, -0.7224112153053284, -0.6296628713607788, -0.536914587020874, -0.44416624307632446, -0.3514179289340973, -0.2586696147918701, -0.16592127084732056, -0.07317298650741577, 0.01957535743713379, 0.11232367902994156, 0.20507200062274933, 0.2978203296661377, 0.39056864380836487, 0.48331695795059204, 0.5760653018951416, 0.6688135862350464, 0.761561930179596, 0.8543102741241455, 0.9470585584640503, 1.039806842803955, 1.1325552463531494, 1.2253035306930542, 1.318051815032959, 1.4108002185821533, 1.503548502922058, 1.596296787261963, 1.6890451908111572, 1.781793475151062, 1.8745417594909668, 1.9672901630401611, 2.0600385665893555, 2.1527867317199707, 2.245535135269165, 2.3382835388183594, 2.4310317039489746, 2.523780107498169, 2.6165285110473633, 2.7092766761779785, 2.802025079727173, 2.894773483276367, 2.9875216484069824]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 7.0, 7.0, 8.0, 17.0, 33.0, 35.0, 37.0, 69.0, 129.0, 295.0, 982.0, 5318.0, 68001.0, 4050005.0, 62216.0, 5372.0, 1001.0, 294.0, 149.0, 71.0, 59.0, 37.0, 33.0, 29.0, 15.0, 16.0, 13.0, 8.0, 8.0, 8.0, 2.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.19451904296875, -4.9984130859375, -4.80230712890625, -4.606201171875, -4.41009521484375, -4.2139892578125, -4.01788330078125, -3.82177734375, -3.62567138671875, -3.4295654296875, -3.23345947265625, -3.037353515625, -2.84124755859375, -2.6451416015625, -2.44903564453125, -2.2529296875, -2.05682373046875, -1.8607177734375, -1.66461181640625, -1.468505859375, -1.27239990234375, -1.0762939453125, -0.88018798828125, -0.68408203125, -0.48797607421875, -0.2918701171875, -0.09576416015625, 0.100341796875, 0.29644775390625, 0.4925537109375, 0.68865966796875, 0.884765625, 1.08087158203125, 1.2769775390625, 1.47308349609375, 1.669189453125, 1.86529541015625, 2.0614013671875, 2.25750732421875, 2.45361328125, 2.64971923828125, 2.8458251953125, 3.04193115234375, 3.238037109375, 3.43414306640625, 3.6302490234375, 3.82635498046875, 4.0224609375, 4.21856689453125, 4.4146728515625, 4.61077880859375, 4.806884765625, 5.00299072265625, 5.1990966796875, 5.39520263671875, 5.59130859375, 5.78741455078125, 5.9835205078125, 6.17962646484375, 6.375732421875, 6.57183837890625, 6.7679443359375, 6.96405029296875, 7.16015625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 9.0, 10.0, 12.0, 20.0, 15.0, 19.0, 36.0, 42.0, 58.0, 57.0, 53.0, 55.0, 55.0, 70.0, 57.0, 58.0, 55.0, 42.0, 53.0, 41.0, 36.0, 32.0, 23.0, 27.0, 21.0, 8.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07086181640625, -0.06856441497802734, -0.06626701354980469, -0.06396961212158203, -0.061672210693359375, -0.05937480926513672, -0.05707740783691406, -0.054780006408691406, -0.05248260498046875, -0.050185203552246094, -0.04788780212402344, -0.04559040069580078, -0.043292999267578125, -0.04099559783935547, -0.03869819641113281, -0.036400794982910156, -0.0341033935546875, -0.031805992126464844, -0.029508590698242188, -0.02721118927001953, -0.024913787841796875, -0.02261638641357422, -0.020318984985351562, -0.018021583557128906, -0.01572418212890625, -0.013426780700683594, -0.011129379272460938, -0.008831977844238281, -0.006534576416015625, -0.004237174987792969, -0.0019397735595703125, 0.00035762786865234375, 0.002655029296875, 0.004952430725097656, 0.0072498321533203125, 0.009547233581542969, 0.011844635009765625, 0.014142036437988281, 0.016439437866210938, 0.018736839294433594, 0.02103424072265625, 0.023331642150878906, 0.025629043579101562, 0.02792644500732422, 0.030223846435546875, 0.03252124786376953, 0.03481864929199219, 0.037116050720214844, 0.0394134521484375, 0.041710853576660156, 0.04400825500488281, 0.04630565643310547, 0.048603057861328125, 0.05090045928955078, 0.05319786071777344, 0.055495262145996094, 0.05779266357421875, 0.060090065002441406, 0.06238746643066406, 0.06468486785888672, 0.06698226928710938, 0.06927967071533203, 0.07157707214355469, 0.07387447357177734, 0.076171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 12.0, 12.0, 25.0, 27.0, 46.0, 100.0, 256.0, 1112.0, 41931.0, 4140417.0, 9423.0, 553.0, 161.0, 81.0, 44.0, 29.0, 10.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.433349609375, -8.99169921875, -8.550048828125, -8.1083984375, -7.666748046875, -7.22509765625, -6.783447265625, -6.341796875, -5.900146484375, -5.45849609375, -5.016845703125, -4.5751953125, -4.133544921875, -3.69189453125, -3.250244140625, -2.80859375, -2.366943359375, -1.92529296875, -1.483642578125, -1.0419921875, -0.600341796875, -0.15869140625, 0.282958984375, 0.724609375, 1.166259765625, 1.60791015625, 2.049560546875, 2.4912109375, 2.932861328125, 3.37451171875, 3.816162109375, 4.2578125, 4.699462890625, 5.14111328125, 5.582763671875, 6.0244140625, 6.466064453125, 6.90771484375, 7.349365234375, 7.791015625, 8.232666015625, 8.67431640625, 9.115966796875, 9.5576171875, 9.999267578125, 10.44091796875, 10.882568359375, 11.32421875, 11.765869140625, 12.20751953125, 12.649169921875, 13.0908203125, 13.532470703125, 13.97412109375, 14.415771484375, 14.857421875, 15.299072265625, 15.74072265625, 16.182373046875, 16.6240234375, 17.065673828125, 17.50732421875, 17.948974609375, 18.390625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 9.0, 8.0, 19.0, 33.0, 35.0, 59.0, 71.0, 118.0, 195.0, 400.0, 1504.0, 775.0, 299.0, 201.0, 115.0, 59.0, 46.0, 41.0, 15.0, 21.0, 13.0, 8.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.35433197021484375, -0.3441619873046875, -0.33399200439453125, -0.323822021484375, -0.31365203857421875, -0.3034820556640625, -0.29331207275390625, -0.28314208984375, -0.27297210693359375, -0.2628021240234375, -0.25263214111328125, -0.242462158203125, -0.23229217529296875, -0.2221221923828125, -0.21195220947265625, -0.2017822265625, -0.19161224365234375, -0.1814422607421875, -0.17127227783203125, -0.161102294921875, -0.15093231201171875, -0.1407623291015625, -0.13059234619140625, -0.12042236328125, -0.11025238037109375, -0.1000823974609375, -0.08991241455078125, -0.079742431640625, -0.06957244873046875, -0.0594024658203125, -0.04923248291015625, -0.0390625, -0.02889251708984375, -0.0187225341796875, -0.00855255126953125, 0.001617431640625, 0.01178741455078125, 0.0219573974609375, 0.03212738037109375, 0.04229736328125, 0.05246734619140625, 0.0626373291015625, 0.07280731201171875, 0.082977294921875, 0.09314727783203125, 0.1033172607421875, 0.11348724365234375, 0.1236572265625, 0.13382720947265625, 0.1439971923828125, 0.15416717529296875, 0.164337158203125, 0.17450714111328125, 0.1846771240234375, 0.19484710693359375, 0.20501708984375, 0.21518707275390625, 0.2253570556640625, 0.23552703857421875, 0.245697021484375, 0.25586700439453125, 0.2660369873046875, 0.27620697021484375, 0.286376953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 27.0, 189.0, 477.0, 269.0, 36.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.40032196044922, -20.019495010375977, -19.638669967651367, -19.257843017578125, -18.877017974853516, -18.496191024780273, -18.115365982055664, -17.734539031982422, -17.353713989257812, -16.97288703918457, -16.59206199645996, -16.21123504638672, -15.83041000366211, -15.449584007263184, -15.068758010864258, -14.687931060791016, -14.30710506439209, -13.926279067993164, -13.545453071594238, -13.164627075195312, -12.783801078796387, -12.402975082397461, -12.022148132324219, -11.64132308959961, -11.260496139526367, -10.879670143127441, -10.498844146728516, -10.11801815032959, -9.737192153930664, -9.356366157531738, -8.975540161132812, -8.59471321105957, -8.213887214660645, -7.833061218261719, -7.452235221862793, -7.071409225463867, -6.690583229064941, -6.309757232666016, -5.928930759429932, -5.548104763031006, -5.167279243469238, -4.7864532470703125, -4.405627250671387, -4.024801254272461, -3.643975019454956, -3.2631490230560303, -2.8823227882385254, -2.5014967918395996, -2.1206705570220947, -1.739844560623169, -1.3590184450149536, -0.9781923294067383, -0.5973663330078125, -0.21654033660888672, 0.16428589820861816, 0.545111894607544, 0.9259378910064697, 1.3067638874053955, 1.6875900030136108, 2.068416118621826, 2.449242115020752, 2.8300681114196777, 3.2108943462371826, 3.5917203426361084, 3.972546339035034]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 7.0, 14.0, 4.0, 9.0, 9.0, 14.0, 14.0, 22.0, 18.0, 28.0, 38.0, 27.0, 30.0, 31.0, 31.0, 32.0, 55.0, 51.0, 42.0, 57.0, 48.0, 44.0, 48.0, 43.0, 33.0, 28.0, 23.0, 30.0, 31.0, 23.0, 24.0, 11.0, 16.0, 11.0, 6.0, 11.0, 4.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.947307825088501, -0.9157190918922424, -0.8841303586959839, -0.8525416254997253, -0.8209528923034668, -0.7893641591072083, -0.7577754259109497, -0.7261867523193359, -0.6945979595184326, -0.6630092263221741, -0.6314204931259155, -0.599831759929657, -0.5682430267333984, -0.5366542935371399, -0.5050655603408813, -0.4734768569469452, -0.44188815355300903, -0.4102994203567505, -0.37871068716049194, -0.3471219539642334, -0.31553322076797485, -0.2839444875717163, -0.25235578417778015, -0.2207670509815216, -0.18917831778526306, -0.15758958458900452, -0.12600085139274597, -0.09441213309764862, -0.06282339990139008, -0.03123466670513153, 0.0003540515899658203, 0.031942784786224365, 0.06353151798248291, 0.09512025117874146, 0.126708984375, 0.15829770267009735, 0.1898864358663559, 0.22147516906261444, 0.2530638873577118, 0.28465262055397034, 0.3162413537502289, 0.3478300869464874, 0.37941882014274597, 0.41100752353668213, 0.4425962567329407, 0.4741849899291992, 0.5057737231254578, 0.5373624563217163, 0.5689511895179749, 0.6005399227142334, 0.6321286559104919, 0.6637173891067505, 0.695306122303009, 0.7268948554992676, 0.7584835290908813, 0.7900723218917847, 0.8216609954833984, 0.853249728679657, 0.8848384618759155, 0.9164271950721741, 0.9480159282684326, 0.9796046614646912, 1.0111933946609497, 1.0427820682525635, 1.0743708610534668]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 4.0, 6.0, 10.0, 15.0, 12.0, 20.0, 21.0, 27.0, 38.0, 38.0, 59.0, 108.0, 1651.0, 195599.0, 839217.0, 11018.0, 349.0, 81.0, 62.0, 50.0, 39.0, 25.0, 20.0, 24.0, 15.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.48046875, -5.304931640625, -5.12939453125, -4.953857421875, -4.7783203125, -4.602783203125, -4.42724609375, -4.251708984375, -4.076171875, -3.900634765625, -3.72509765625, -3.549560546875, -3.3740234375, -3.198486328125, -3.02294921875, -2.847412109375, -2.671875, -2.496337890625, -2.32080078125, -2.145263671875, -1.9697265625, -1.794189453125, -1.61865234375, -1.443115234375, -1.267578125, -1.092041015625, -0.91650390625, -0.740966796875, -0.5654296875, -0.389892578125, -0.21435546875, -0.038818359375, 0.13671875, 0.312255859375, 0.48779296875, 0.663330078125, 0.8388671875, 1.014404296875, 1.18994140625, 1.365478515625, 1.541015625, 1.716552734375, 1.89208984375, 2.067626953125, 2.2431640625, 2.418701171875, 2.59423828125, 2.769775390625, 2.9453125, 3.120849609375, 3.29638671875, 3.471923828125, 3.6474609375, 3.822998046875, 3.99853515625, 4.174072265625, 4.349609375, 4.525146484375, 4.70068359375, 4.876220703125, 5.0517578125, 5.227294921875, 5.40283203125, 5.578369140625, 5.75390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 14.0, 21.0, 16.0, 18.0, 24.0, 26.0, 27.0, 46.0, 24.0, 37.0, 49.0, 53.0, 52.0, 46.0, 43.0, 62.0, 41.0, 44.0, 55.0, 44.0, 37.0, 43.0, 27.0, 28.0, 21.0, 21.0, 14.0, 16.0, 1.0, 14.0, 8.0, 4.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0753173828125, -0.07300186157226562, -0.07068634033203125, -0.06837081909179688, -0.0660552978515625, -0.06373977661132812, -0.06142425537109375, -0.059108734130859375, -0.056793212890625, -0.054477691650390625, -0.05216217041015625, -0.049846649169921875, -0.0475311279296875, -0.045215606689453125, -0.04290008544921875, -0.040584564208984375, -0.03826904296875, -0.035953521728515625, -0.03363800048828125, -0.031322479248046875, -0.0290069580078125, -0.026691436767578125, -0.02437591552734375, -0.022060394287109375, -0.019744873046875, -0.017429351806640625, -0.01511383056640625, -0.012798309326171875, -0.0104827880859375, -0.008167266845703125, -0.00585174560546875, -0.003536224365234375, -0.001220703125, 0.001094818115234375, 0.00341033935546875, 0.005725860595703125, 0.0080413818359375, 0.010356903076171875, 0.01267242431640625, 0.014987945556640625, 0.017303466796875, 0.019618988037109375, 0.02193450927734375, 0.024250030517578125, 0.0265655517578125, 0.028881072998046875, 0.03119659423828125, 0.033512115478515625, 0.03582763671875, 0.038143157958984375, 0.04045867919921875, 0.042774200439453125, 0.0450897216796875, 0.047405242919921875, 0.04972076416015625, 0.052036285400390625, 0.054351806640625, 0.056667327880859375, 0.05898284912109375, 0.061298370361328125, 0.0636138916015625, 0.06592941284179688, 0.06824493408203125, 0.07056045532226562, 0.0728759765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 6.0, 5.0, 10.0, 13.0, 15.0, 15.0, 21.0, 42.0, 59.0, 84.0, 96.0, 159.0, 231.0, 289.0, 499.0, 764.0, 1314.0, 2464.0, 5284.0, 13613.0, 40183.0, 121345.0, 295639.0, 331863.0, 152119.0, 51497.0, 17388.0, 6508.0, 3009.0, 1473.0, 862.0, 572.0, 342.0, 208.0, 154.0, 103.0, 80.0, 60.0, 36.0, 37.0, 22.0, 22.0, 17.0, 10.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.3984375, -1.354888916015625, -1.31134033203125, -1.267791748046875, -1.2242431640625, -1.180694580078125, -1.13714599609375, -1.093597412109375, -1.050048828125, -1.006500244140625, -0.96295166015625, -0.919403076171875, -0.8758544921875, -0.832305908203125, -0.78875732421875, -0.745208740234375, -0.70166015625, -0.658111572265625, -0.61456298828125, -0.571014404296875, -0.5274658203125, -0.483917236328125, -0.44036865234375, -0.396820068359375, -0.353271484375, -0.309722900390625, -0.26617431640625, -0.222625732421875, -0.1790771484375, -0.135528564453125, -0.09197998046875, -0.048431396484375, -0.0048828125, 0.038665771484375, 0.08221435546875, 0.125762939453125, 0.1693115234375, 0.212860107421875, 0.25640869140625, 0.299957275390625, 0.343505859375, 0.387054443359375, 0.43060302734375, 0.474151611328125, 0.5177001953125, 0.561248779296875, 0.60479736328125, 0.648345947265625, 0.69189453125, 0.735443115234375, 0.77899169921875, 0.822540283203125, 0.8660888671875, 0.909637451171875, 0.95318603515625, 0.996734619140625, 1.040283203125, 1.083831787109375, 1.12738037109375, 1.170928955078125, 1.2144775390625, 1.258026123046875, 1.30157470703125, 1.345123291015625, 1.388671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 11.0, 9.0, 15.0, 11.0, 17.0, 18.0, 22.0, 33.0, 44.0, 41.0, 49.0, 62.0, 57.0, 55.0, 70.0, 72.0, 48.0, 50.0, 53.0, 37.0, 36.0, 36.0, 30.0, 23.0, 21.0, 21.0, 11.0, 13.0, 15.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.640625, -0.621734619140625, -0.60284423828125, -0.583953857421875, -0.5650634765625, -0.546173095703125, -0.52728271484375, -0.508392333984375, -0.489501953125, -0.470611572265625, -0.45172119140625, -0.432830810546875, -0.4139404296875, -0.395050048828125, -0.37615966796875, -0.357269287109375, -0.33837890625, -0.319488525390625, -0.30059814453125, -0.281707763671875, -0.2628173828125, -0.243927001953125, -0.22503662109375, -0.206146240234375, -0.187255859375, -0.168365478515625, -0.14947509765625, -0.130584716796875, -0.1116943359375, -0.092803955078125, -0.07391357421875, -0.055023193359375, -0.0361328125, -0.017242431640625, 0.00164794921875, 0.020538330078125, 0.0394287109375, 0.058319091796875, 0.07720947265625, 0.096099853515625, 0.114990234375, 0.133880615234375, 0.15277099609375, 0.171661376953125, 0.1905517578125, 0.209442138671875, 0.22833251953125, 0.247222900390625, 0.26611328125, 0.285003662109375, 0.30389404296875, 0.322784423828125, 0.3416748046875, 0.360565185546875, 0.37945556640625, 0.398345947265625, 0.417236328125, 0.436126708984375, 0.45501708984375, 0.473907470703125, 0.4927978515625, 0.511688232421875, 0.53057861328125, 0.549468994140625, 0.568359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 14.0, 24.0, 22.0, 45.0, 56.0, 78.0, 116.0, 184.0, 322.0, 597.0, 1214.0, 2652.0, 7086.0, 21608.0, 83277.0, 322944.0, 424135.0, 134427.0, 33028.0, 9830.0, 3593.0, 1574.0, 710.0, 347.0, 205.0, 150.0, 96.0, 59.0, 36.0, 26.0, 29.0, 16.0, 14.0, 10.0, 8.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.666259765625, -1.61279296875, -1.559326171875, -1.505859375, -1.452392578125, -1.39892578125, -1.345458984375, -1.2919921875, -1.238525390625, -1.18505859375, -1.131591796875, -1.078125, -1.024658203125, -0.97119140625, -0.917724609375, -0.8642578125, -0.810791015625, -0.75732421875, -0.703857421875, -0.650390625, -0.596923828125, -0.54345703125, -0.489990234375, -0.4365234375, -0.383056640625, -0.32958984375, -0.276123046875, -0.22265625, -0.169189453125, -0.11572265625, -0.062255859375, -0.0087890625, 0.044677734375, 0.09814453125, 0.151611328125, 0.205078125, 0.258544921875, 0.31201171875, 0.365478515625, 0.4189453125, 0.472412109375, 0.52587890625, 0.579345703125, 0.6328125, 0.686279296875, 0.73974609375, 0.793212890625, 0.8466796875, 0.900146484375, 0.95361328125, 1.007080078125, 1.060546875, 1.114013671875, 1.16748046875, 1.220947265625, 1.2744140625, 1.327880859375, 1.38134765625, 1.434814453125, 1.48828125, 1.541748046875, 1.59521484375, 1.648681640625, 1.7021484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 1.0, 6.0, 6.0, 9.0, 16.0, 15.0, 19.0, 20.0, 28.0, 28.0, 42.0, 47.0, 67.0, 79.0, 85.0, 91.0, 88.0, 72.0, 72.0, 37.0, 36.0, 22.0, 22.0, 16.0, 15.0, 7.0, 8.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00026607513427734375, -0.0002579018473625183, -0.00024972856044769287, -0.00024155527353286743, -0.000233381986618042, -0.00022520869970321655, -0.0002170354127883911, -0.00020886212587356567, -0.00020068883895874023, -0.0001925155520439148, -0.00018434226512908936, -0.00017616897821426392, -0.00016799569129943848, -0.00015982240438461304, -0.0001516491174697876, -0.00014347583055496216, -0.00013530254364013672, -0.00012712925672531128, -0.00011895596981048584, -0.0001107826828956604, -0.00010260939598083496, -9.443610906600952e-05, -8.626282215118408e-05, -7.808953523635864e-05, -6.99162483215332e-05, -6.174296140670776e-05, -5.3569674491882324e-05, -4.5396387577056885e-05, -3.7223100662231445e-05, -2.9049813747406006e-05, -2.0876526832580566e-05, -1.2703239917755127e-05, -4.5299530029296875e-06, 3.643333911895752e-06, 1.1816620826721191e-05, 1.998990774154663e-05, 2.816319465637207e-05, 3.633648157119751e-05, 4.450976848602295e-05, 5.268305540084839e-05, 6.085634231567383e-05, 6.902962923049927e-05, 7.720291614532471e-05, 8.537620306015015e-05, 9.354948997497559e-05, 0.00010172277688980103, 0.00010989606380462646, 0.0001180693507194519, 0.00012624263763427734, 0.00013441592454910278, 0.00014258921146392822, 0.00015076249837875366, 0.0001589357852935791, 0.00016710907220840454, 0.00017528235912322998, 0.00018345564603805542, 0.00019162893295288086, 0.0001998022198677063, 0.00020797550678253174, 0.00021614879369735718, 0.00022432208061218262, 0.00023249536752700806, 0.0002406686544418335, 0.00024884194135665894, 0.0002570152282714844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 12.0, 15.0, 35.0, 39.0, 69.0, 117.0, 223.0, 454.0, 954.0, 2575.0, 8851.0, 50048.0, 398278.0, 500715.0, 69774.0, 11145.0, 3046.0, 1148.0, 472.0, 263.0, 125.0, 73.0, 25.0, 28.0, 19.0, 9.0, 7.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.80078125, -2.725250244140625, -2.64971923828125, -2.574188232421875, -2.4986572265625, -2.423126220703125, -2.34759521484375, -2.272064208984375, -2.196533203125, -2.121002197265625, -2.04547119140625, -1.969940185546875, -1.8944091796875, -1.818878173828125, -1.74334716796875, -1.667816162109375, -1.59228515625, -1.516754150390625, -1.44122314453125, -1.365692138671875, -1.2901611328125, -1.214630126953125, -1.13909912109375, -1.063568115234375, -0.988037109375, -0.912506103515625, -0.83697509765625, -0.761444091796875, -0.6859130859375, -0.610382080078125, -0.53485107421875, -0.459320068359375, -0.3837890625, -0.308258056640625, -0.23272705078125, -0.157196044921875, -0.0816650390625, -0.006134033203125, 0.06939697265625, 0.144927978515625, 0.220458984375, 0.295989990234375, 0.37152099609375, 0.447052001953125, 0.5225830078125, 0.598114013671875, 0.67364501953125, 0.749176025390625, 0.82470703125, 0.900238037109375, 0.97576904296875, 1.051300048828125, 1.1268310546875, 1.202362060546875, 1.27789306640625, 1.353424072265625, 1.428955078125, 1.504486083984375, 1.58001708984375, 1.655548095703125, 1.7310791015625, 1.806610107421875, 1.88214111328125, 1.957672119140625, 2.033203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 8.0, 18.0, 16.0, 14.0, 22.0, 31.0, 29.0, 40.0, 38.0, 50.0, 66.0, 65.0, 49.0, 45.0, 44.0, 62.0, 55.0, 51.0, 47.0, 46.0, 35.0, 27.0, 28.0, 20.0, 13.0, 10.0, 9.0, 7.0, 9.0, 7.0, 5.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59765625, -0.5804367065429688, -0.5632171630859375, -0.5459976196289062, -0.528778076171875, -0.5115585327148438, -0.4943389892578125, -0.47711944580078125, -0.45989990234375, -0.44268035888671875, -0.4254608154296875, -0.40824127197265625, -0.391021728515625, -0.37380218505859375, -0.3565826416015625, -0.33936309814453125, -0.3221435546875, -0.30492401123046875, -0.2877044677734375, -0.27048492431640625, -0.253265380859375, -0.23604583740234375, -0.2188262939453125, -0.20160675048828125, -0.18438720703125, -0.16716766357421875, -0.1499481201171875, -0.13272857666015625, -0.115509033203125, -0.09828948974609375, -0.0810699462890625, -0.06385040283203125, -0.046630859375, -0.02941131591796875, -0.0121917724609375, 0.00502777099609375, 0.022247314453125, 0.03946685791015625, 0.0566864013671875, 0.07390594482421875, 0.09112548828125, 0.10834503173828125, 0.1255645751953125, 0.14278411865234375, 0.160003662109375, 0.17722320556640625, 0.1944427490234375, 0.21166229248046875, 0.2288818359375, 0.24610137939453125, 0.2633209228515625, 0.28054046630859375, 0.297760009765625, 0.31497955322265625, 0.3321990966796875, 0.34941864013671875, 0.36663818359375, 0.38385772705078125, 0.4010772705078125, 0.41829681396484375, 0.435516357421875, 0.45273590087890625, 0.4699554443359375, 0.48717498779296875, 0.50439453125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 19.0, 86.0, 249.0, 376.0, 191.0, 56.0, 23.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.846235752105713, -4.9172163009643555, -3.9881973266601562, -3.059178113937378, -2.1301589012145996, -1.2011399269104004, -0.27212047576904297, 0.6568989753723145, 1.5859179496765137, 2.514937162399292, 3.4439563751220703, 4.3729753494262695, 5.301994800567627, 6.231013774871826, 7.160033226013184, 8.089052200317383, 9.018072128295898, 9.947091102600098, 10.876110076904297, 11.805130004882812, 12.734148979187012, 13.663167953491211, 14.592187881469727, 15.521206855773926, 16.450225830078125, 17.37924575805664, 18.308263778686523, 19.23728370666504, 20.166301727294922, 21.095321655273438, 22.024341583251953, 22.95336151123047, 23.88237762451172, 24.811397552490234, 25.740415573120117, 26.669435501098633, 27.598453521728516, 28.52747344970703, 29.456493377685547, 30.385513305664062, 31.314531326293945, 32.24354934692383, 33.172569274902344, 34.10158920288086, 35.030609130859375, 35.959625244140625, 36.88864517211914, 37.817665100097656, 38.74668502807617, 39.67570495605469, 40.6047248840332, 41.53374099731445, 42.46276092529297, 43.391780853271484, 44.32080078125, 45.249820709228516, 46.17884063720703, 47.10786056518555, 48.03688049316406, 48.96589660644531, 49.89491653442383, 50.823936462402344, 51.75295639038086, 52.681976318359375, 53.610992431640625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 4.0, 15.0, 20.0, 14.0, 28.0, 36.0, 39.0, 38.0, 44.0, 46.0, 53.0, 53.0, 58.0, 48.0, 55.0, 67.0, 46.0, 46.0, 45.0, 42.0, 31.0, 29.0, 33.0, 20.0, 19.0, 11.0, 9.0, 12.0, 7.0, 4.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.695977210998535, -4.55609130859375, -4.416205883026123, -4.276319980621338, -4.136434078216553, -3.9965484142303467, -3.8566627502441406, -3.7167768478393555, -3.5768909454345703, -3.4370052814483643, -3.297119379043579, -3.157233715057373, -3.017347812652588, -2.877462148666382, -2.737576484680176, -2.5976905822753906, -2.4578049182891846, -2.3179192543029785, -2.1780333518981934, -2.0381476879119873, -1.8982617855072021, -1.758376121520996, -1.6184903383255005, -1.4786045551300049, -1.3387187719345093, -1.1988329887390137, -1.058947205543518, -0.9190614819526672, -0.7791756987571716, -0.639289915561676, -0.4994041919708252, -0.3595184087753296, -0.21963262557983398, -0.07974685728549957, 0.06013891100883484, 0.20002466440200806, 0.33991044759750366, 0.47979623079299927, 0.6196819543838501, 0.7595677375793457, 0.8994535207748413, 1.039339303970337, 1.1792250871658325, 1.3191108703613281, 1.4589965343475342, 1.5988824367523193, 1.7387681007385254, 1.878653883934021, 2.0185396671295166, 2.1584253311157227, 2.298311233520508, 2.438196897506714, 2.578082799911499, 2.717968463897705, 2.8578543663024902, 2.9977400302886963, 3.1376256942749023, 3.2775113582611084, 3.4173972606658936, 3.5572829246520996, 3.6971688270568848, 3.837054491043091, 3.976940155029297, 4.116826057434082, 4.256711959838867]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 13.0, 13.0, 17.0, 35.0, 33.0, 65.0, 88.0, 146.0, 355.0, 1182.0, 8371.0, 210532.0, 3937903.0, 31464.0, 2849.0, 615.0, 222.0, 102.0, 76.0, 40.0, 24.0, 25.0, 15.0, 17.0, 10.0, 11.0, 8.0, 6.0, 3.0, 3.0, 10.0, 2.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.2734375, -8.0386962890625, -7.803955078125, -7.5692138671875, -7.33447265625, -7.0997314453125, -6.864990234375, -6.6302490234375, -6.3955078125, -6.1607666015625, -5.926025390625, -5.6912841796875, -5.45654296875, -5.2218017578125, -4.987060546875, -4.7523193359375, -4.517578125, -4.2828369140625, -4.048095703125, -3.8133544921875, -3.57861328125, -3.3438720703125, -3.109130859375, -2.8743896484375, -2.6396484375, -2.4049072265625, -2.170166015625, -1.9354248046875, -1.70068359375, -1.4659423828125, -1.231201171875, -0.9964599609375, -0.76171875, -0.5269775390625, -0.292236328125, -0.0574951171875, 0.17724609375, 0.4119873046875, 0.646728515625, 0.8814697265625, 1.1162109375, 1.3509521484375, 1.585693359375, 1.8204345703125, 2.05517578125, 2.2899169921875, 2.524658203125, 2.7593994140625, 2.994140625, 3.2288818359375, 3.463623046875, 3.6983642578125, 3.93310546875, 4.1678466796875, 4.402587890625, 4.6373291015625, 4.8720703125, 5.1068115234375, 5.341552734375, 5.5762939453125, 5.81103515625, 6.0457763671875, 6.280517578125, 6.5152587890625, 6.75]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 9.0, 19.0, 22.0, 33.0, 33.0, 50.0, 54.0, 73.0, 63.0, 84.0, 88.0, 80.0, 80.0, 74.0, 53.0, 34.0, 31.0, 26.0, 24.0, 20.0, 6.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1724853515625, -0.1677417755126953, -0.16299819946289062, -0.15825462341308594, -0.15351104736328125, -0.14876747131347656, -0.14402389526367188, -0.1392803192138672, -0.1345367431640625, -0.1297931671142578, -0.12504959106445312, -0.12030601501464844, -0.11556243896484375, -0.11081886291503906, -0.10607528686523438, -0.10133171081542969, -0.096588134765625, -0.09184455871582031, -0.08710098266601562, -0.08235740661621094, -0.07761383056640625, -0.07287025451660156, -0.06812667846679688, -0.06338310241699219, -0.0586395263671875, -0.05389595031738281, -0.049152374267578125, -0.04440879821777344, -0.03966522216796875, -0.03492164611816406, -0.030178070068359375, -0.025434494018554688, -0.02069091796875, -0.015947341918945312, -0.011203765869140625, -0.0064601898193359375, -0.00171661376953125, 0.0030269622802734375, 0.007770538330078125, 0.012514114379882812, 0.0172576904296875, 0.022001266479492188, 0.026744842529296875, 0.03148841857910156, 0.03623199462890625, 0.04097557067871094, 0.045719146728515625, 0.05046272277832031, 0.055206298828125, 0.05994987487792969, 0.06469345092773438, 0.06943702697753906, 0.07418060302734375, 0.07892417907714844, 0.08366775512695312, 0.08841133117675781, 0.0931549072265625, 0.09789848327636719, 0.10264205932617188, 0.10738563537597656, 0.11212921142578125, 0.11687278747558594, 0.12161636352539062, 0.1263599395751953, 0.131103515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 11.0, 23.0, 28.0, 60.0, 116.0, 144.0, 256.0, 388.0, 1713.0, 4179879.0, 10853.0, 363.0, 202.0, 113.0, 80.0, 35.0, 17.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.90625, -30.06298828125, -29.2197265625, -28.37646484375, -27.533203125, -26.68994140625, -25.8466796875, -25.00341796875, -24.16015625, -23.31689453125, -22.4736328125, -21.63037109375, -20.787109375, -19.94384765625, -19.1005859375, -18.25732421875, -17.4140625, -16.57080078125, -15.7275390625, -14.88427734375, -14.041015625, -13.19775390625, -12.3544921875, -11.51123046875, -10.66796875, -9.82470703125, -8.9814453125, -8.13818359375, -7.294921875, -6.45166015625, -5.6083984375, -4.76513671875, -3.921875, -3.07861328125, -2.2353515625, -1.39208984375, -0.548828125, 0.29443359375, 1.1376953125, 1.98095703125, 2.82421875, 3.66748046875, 4.5107421875, 5.35400390625, 6.197265625, 7.04052734375, 7.8837890625, 8.72705078125, 9.5703125, 10.41357421875, 11.2568359375, 12.10009765625, 12.943359375, 13.78662109375, 14.6298828125, 15.47314453125, 16.31640625, 17.15966796875, 18.0029296875, 18.84619140625, 19.689453125, 20.53271484375, 21.3759765625, 22.21923828125, 23.0625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 21.0, 95.0, 790.0, 2891.0, 246.0, 32.0, 10.0], "bins": [-4.74609375, -4.667285919189453, -4.588478088378906, -4.509670257568359, -4.4308624267578125, -4.352054595947266, -4.273246765136719, -4.194438934326172, -4.115631103515625, -4.036823272705078, -3.9580154418945312, -3.8792076110839844, -3.8003997802734375, -3.7215919494628906, -3.6427841186523438, -3.563976287841797, -3.48516845703125, -3.406360626220703, -3.3275527954101562, -3.2487449645996094, -3.1699371337890625, -3.0911293029785156, -3.0123214721679688, -2.933513641357422, -2.854705810546875, -2.775897979736328, -2.6970901489257812, -2.6182823181152344, -2.5394744873046875, -2.4606666564941406, -2.3818588256835938, -2.303050994873047, -2.2242431640625, -2.145435333251953, -2.0666275024414062, -1.9878196716308594, -1.9090118408203125, -1.8302040100097656, -1.7513961791992188, -1.6725883483886719, -1.593780517578125, -1.5149726867675781, -1.4361648559570312, -1.3573570251464844, -1.2785491943359375, -1.1997413635253906, -1.1209335327148438, -1.0421257019042969, -0.96331787109375, -0.8845100402832031, -0.8057022094726562, -0.7268943786621094, -0.6480865478515625, -0.5692787170410156, -0.49047088623046875, -0.4116630554199219, -0.332855224609375, -0.2540473937988281, -0.17523956298828125, -0.09643173217773438, -0.0176239013671875, 0.061183929443359375, 0.13999176025390625, 0.21879959106445312, 0.297607421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 33.0, 143.0, 544.0, 230.0, 36.0, 12.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.44783020019531, -42.63691711425781, -41.82600402832031, -41.01509094238281, -40.20417785644531, -39.39326858520508, -38.58235549926758, -37.77144241333008, -36.96052932739258, -36.14961624145508, -35.33870315551758, -34.52779006958008, -33.716880798339844, -32.905967712402344, -32.095054626464844, -31.284141540527344, -30.473228454589844, -29.662315368652344, -28.851402282714844, -28.040491104125977, -27.229578018188477, -26.418664932250977, -25.60775375366211, -24.79684066772461, -23.98592758178711, -23.17501449584961, -22.36410140991211, -21.553190231323242, -20.742277145385742, -19.931364059448242, -19.120452880859375, -18.309539794921875, -17.498624801635742, -16.687711715698242, -15.876799583435059, -15.065887451171875, -14.254974365234375, -13.444061279296875, -12.633149147033691, -11.822237014770508, -11.011323928833008, -10.200410842895508, -9.389498710632324, -8.57858657836914, -7.767673492431641, -6.956760883331299, -6.145848274230957, -5.334935665130615, -4.524023056030273, -3.7131104469299316, -2.90219783782959, -2.091285228729248, -1.2803726196289062, -0.46946001052856445, 0.34145259857177734, 1.1523652076721191, 1.963277816772461, 2.7741904258728027, 3.5851030349731445, 4.396015644073486, 5.206928253173828, 6.01784086227417, 6.828753471374512, 7.6396660804748535, 8.450578689575195]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 18.0, 37.0, 44.0, 76.0, 109.0, 135.0, 160.0, 130.0, 87.0, 82.0, 63.0, 35.0, 10.0, 10.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.518835067749023, -12.085025787353516, -11.651217460632324, -11.217408180236816, -10.783599853515625, -10.349790573120117, -9.91598129272461, -9.482172012329102, -9.04836368560791, -8.614554405212402, -8.180746078491211, -7.746936798095703, -7.3131279945373535, -6.879319190979004, -6.445509910583496, -6.0117011070251465, -5.577892303466797, -5.144083499908447, -4.710274696350098, -4.27646541595459, -3.8426566123962402, -3.4088478088378906, -2.975038766860962, -2.541229724884033, -2.1074209213256836, -1.6736119985580444, -1.2398030757904053, -0.8059941530227661, -0.37218523025512695, 0.061623573303222656, 0.49543261528015137, 0.9292416572570801, 1.363051414489746, 1.7968603372573853, 2.2306692600250244, 2.664478302001953, 3.0982871055603027, 3.5320959091186523, 3.965904951095581, 4.39971399307251, 4.833522796630859, 5.267331600189209, 5.701140403747559, 6.134949684143066, 6.568758487701416, 7.002567291259766, 7.436376571655273, 7.870185375213623, 8.303994178771973, 8.73780345916748, 9.171611785888672, 9.60542106628418, 10.039230346679688, 10.473038673400879, 10.906847953796387, 11.340656280517578, 11.774465560913086, 12.208274841308594, 12.642083168029785, 13.075892448425293, 13.509700775146484, 13.943510055541992, 14.3773193359375, 14.811128616333008, 15.2449369430542]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 0.0, 6.0, 9.0, 5.0, 2.0, 9.0, 15.0, 16.0, 17.0, 27.0, 40.0, 53.0, 62.0, 120.0, 233.0, 555.0, 1343.0, 5495.0, 52407.0, 611332.0, 347556.0, 23936.0, 3339.0, 1019.0, 448.0, 178.0, 103.0, 57.0, 46.0, 29.0, 17.0, 20.0, 9.0, 8.0, 7.0, 8.0, 8.0, 3.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.53424072265625, -4.3653564453125, -4.19647216796875, -4.027587890625, -3.85870361328125, -3.6898193359375, -3.52093505859375, -3.35205078125, -3.18316650390625, -3.0142822265625, -2.84539794921875, -2.676513671875, -2.50762939453125, -2.3387451171875, -2.16986083984375, -2.0009765625, -1.83209228515625, -1.6632080078125, -1.49432373046875, -1.325439453125, -1.15655517578125, -0.9876708984375, -0.81878662109375, -0.64990234375, -0.48101806640625, -0.3121337890625, -0.14324951171875, 0.025634765625, 0.19451904296875, 0.3634033203125, 0.53228759765625, 0.701171875, 0.87005615234375, 1.0389404296875, 1.20782470703125, 1.376708984375, 1.54559326171875, 1.7144775390625, 1.88336181640625, 2.05224609375, 2.22113037109375, 2.3900146484375, 2.55889892578125, 2.727783203125, 2.89666748046875, 3.0655517578125, 3.23443603515625, 3.4033203125, 3.57220458984375, 3.7410888671875, 3.90997314453125, 4.078857421875, 4.24774169921875, 4.4166259765625, 4.58551025390625, 4.75439453125, 4.92327880859375, 5.0921630859375, 5.26104736328125, 5.429931640625, 5.59881591796875, 5.7677001953125, 5.93658447265625, 6.10546875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 16.0, 24.0, 30.0, 33.0, 45.0, 45.0, 68.0, 71.0, 81.0, 86.0, 81.0, 79.0, 61.0, 51.0, 48.0, 48.0, 33.0, 25.0, 14.0, 16.0, 11.0, 9.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.41552734375, -0.404205322265625, -0.39288330078125, -0.381561279296875, -0.3702392578125, -0.358917236328125, -0.34759521484375, -0.336273193359375, -0.324951171875, -0.313629150390625, -0.30230712890625, -0.290985107421875, -0.2796630859375, -0.268341064453125, -0.25701904296875, -0.245697021484375, -0.234375, -0.223052978515625, -0.21173095703125, -0.200408935546875, -0.1890869140625, -0.177764892578125, -0.16644287109375, -0.155120849609375, -0.143798828125, -0.132476806640625, -0.12115478515625, -0.109832763671875, -0.0985107421875, -0.087188720703125, -0.07586669921875, -0.064544677734375, -0.05322265625, -0.041900634765625, -0.03057861328125, -0.019256591796875, -0.0079345703125, 0.003387451171875, 0.01470947265625, 0.026031494140625, 0.037353515625, 0.048675537109375, 0.05999755859375, 0.071319580078125, 0.0826416015625, 0.093963623046875, 0.10528564453125, 0.116607666015625, 0.1279296875, 0.139251708984375, 0.15057373046875, 0.161895751953125, 0.1732177734375, 0.184539794921875, 0.19586181640625, 0.207183837890625, 0.218505859375, 0.229827880859375, 0.24114990234375, 0.252471923828125, 0.2637939453125, 0.275115966796875, 0.28643798828125, 0.297760009765625, 0.30908203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 7.0, 15.0, 18.0, 25.0, 35.0, 46.0, 73.0, 82.0, 166.0, 201.0, 313.0, 523.0, 822.0, 1582.0, 3747.0, 11602.0, 47103.0, 195655.0, 440874.0, 256103.0, 64525.0, 15642.0, 4794.0, 1868.0, 1015.0, 600.0, 366.0, 227.0, 174.0, 97.0, 84.0, 42.0, 28.0, 25.0, 18.0, 12.0, 10.0, 6.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7978515625, -1.7303009033203125, -1.662750244140625, -1.5951995849609375, -1.52764892578125, -1.4600982666015625, -1.392547607421875, -1.3249969482421875, -1.2574462890625, -1.1898956298828125, -1.122344970703125, -1.0547943115234375, -0.98724365234375, -0.9196929931640625, -0.852142333984375, -0.7845916748046875, -0.717041015625, -0.6494903564453125, -0.581939697265625, -0.5143890380859375, -0.44683837890625, -0.3792877197265625, -0.311737060546875, -0.2441864013671875, -0.1766357421875, -0.1090850830078125, -0.041534423828125, 0.0260162353515625, 0.09356689453125, 0.1611175537109375, 0.228668212890625, 0.2962188720703125, 0.36376953125, 0.4313201904296875, 0.498870849609375, 0.5664215087890625, 0.63397216796875, 0.7015228271484375, 0.769073486328125, 0.8366241455078125, 0.9041748046875, 0.9717254638671875, 1.039276123046875, 1.1068267822265625, 1.17437744140625, 1.2419281005859375, 1.309478759765625, 1.3770294189453125, 1.444580078125, 1.5121307373046875, 1.579681396484375, 1.6472320556640625, 1.71478271484375, 1.7823333740234375, 1.849884033203125, 1.9174346923828125, 1.9849853515625, 2.0525360107421875, 2.120086669921875, 2.1876373291015625, 2.25518798828125, 2.3227386474609375, 2.390289306640625, 2.4578399658203125, 2.525390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 8.0, 7.0, 7.0, 10.0, 12.0, 17.0, 18.0, 24.0, 30.0, 31.0, 27.0, 33.0, 34.0, 39.0, 39.0, 44.0, 45.0, 50.0, 45.0, 35.0, 44.0, 52.0, 41.0, 40.0, 33.0, 46.0, 30.0, 23.0, 24.0, 23.0, 12.0, 11.0, 12.0, 10.0, 4.0, 5.0, 4.0, 6.0, 0.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0032958984375, -0.970458984375, -0.9376220703125, -0.90478515625, -0.8719482421875, -0.839111328125, -0.8062744140625, -0.7734375, -0.7406005859375, -0.707763671875, -0.6749267578125, -0.64208984375, -0.6092529296875, -0.576416015625, -0.5435791015625, -0.5107421875, -0.4779052734375, -0.445068359375, -0.4122314453125, -0.37939453125, -0.3465576171875, -0.313720703125, -0.2808837890625, -0.248046875, -0.2152099609375, -0.182373046875, -0.1495361328125, -0.11669921875, -0.0838623046875, -0.051025390625, -0.0181884765625, 0.0146484375, 0.0474853515625, 0.080322265625, 0.1131591796875, 0.14599609375, 0.1788330078125, 0.211669921875, 0.2445068359375, 0.27734375, 0.3101806640625, 0.343017578125, 0.3758544921875, 0.40869140625, 0.4415283203125, 0.474365234375, 0.5072021484375, 0.5400390625, 0.5728759765625, 0.605712890625, 0.6385498046875, 0.67138671875, 0.7042236328125, 0.737060546875, 0.7698974609375, 0.802734375, 0.8355712890625, 0.868408203125, 0.9012451171875, 0.93408203125, 0.9669189453125, 0.999755859375, 1.0325927734375, 1.0654296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 6.0, 10.0, 15.0, 21.0, 29.0, 52.0, 82.0, 107.0, 160.0, 309.0, 576.0, 1321.0, 3083.0, 9398.0, 36609.0, 220565.0, 582758.0, 153678.0, 27491.0, 7217.0, 2544.0, 1142.0, 528.0, 311.0, 164.0, 109.0, 85.0, 54.0, 36.0, 27.0, 16.0, 11.0, 8.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7534027099609375, -1.689422607421875, -1.6254425048828125, -1.56146240234375, -1.4974822998046875, -1.433502197265625, -1.3695220947265625, -1.3055419921875, -1.2415618896484375, -1.177581787109375, -1.1136016845703125, -1.04962158203125, -0.9856414794921875, -0.921661376953125, -0.8576812744140625, -0.793701171875, -0.7297210693359375, -0.665740966796875, -0.6017608642578125, -0.53778076171875, -0.4738006591796875, -0.409820556640625, -0.3458404541015625, -0.2818603515625, -0.2178802490234375, -0.153900146484375, -0.0899200439453125, -0.02593994140625, 0.0380401611328125, 0.102020263671875, 0.1660003662109375, 0.22998046875, 0.2939605712890625, 0.357940673828125, 0.4219207763671875, 0.48590087890625, 0.5498809814453125, 0.613861083984375, 0.6778411865234375, 0.7418212890625, 0.8058013916015625, 0.869781494140625, 0.9337615966796875, 0.99774169921875, 1.0617218017578125, 1.125701904296875, 1.1896820068359375, 1.253662109375, 1.3176422119140625, 1.381622314453125, 1.4456024169921875, 1.50958251953125, 1.5735626220703125, 1.637542724609375, 1.7015228271484375, 1.7655029296875, 1.8294830322265625, 1.893463134765625, 1.9574432373046875, 2.02142333984375, 2.0854034423828125, 2.149383544921875, 2.2133636474609375, 2.27734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 9.0, 11.0, 9.0, 10.0, 18.0, 17.0, 19.0, 27.0, 32.0, 35.0, 48.0, 55.0, 76.0, 61.0, 69.0, 68.0, 74.0, 53.0, 56.0, 50.0, 44.0, 33.0, 27.0, 27.0, 14.0, 17.0, 17.0, 5.0, 9.0, 4.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019943714141845703, -0.00019270740449428558, -0.00018597766757011414, -0.0001792479306459427, -0.00017251819372177124, -0.0001657884567975998, -0.00015905871987342834, -0.0001523289829492569, -0.00014559924602508545, -0.000138869509100914, -0.00013213977217674255, -0.0001254100352525711, -0.00011868029832839966, -0.00011195056140422821, -0.00010522082448005676, -9.849108755588531e-05, -9.176135063171387e-05, -8.503161370754242e-05, -7.830187678337097e-05, -7.157213985919952e-05, -6.484240293502808e-05, -5.811266601085663e-05, -5.138292908668518e-05, -4.465319216251373e-05, -3.7923455238342285e-05, -3.119371831417084e-05, -2.446398138999939e-05, -1.7734244465827942e-05, -1.1004507541656494e-05, -4.274770617485046e-06, 2.4549663066864014e-06, 9.184703230857849e-06, 1.5914440155029297e-05, 2.2644177079200745e-05, 2.9373914003372192e-05, 3.610365092754364e-05, 4.283338785171509e-05, 4.9563124775886536e-05, 5.6292861700057983e-05, 6.302259862422943e-05, 6.975233554840088e-05, 7.648207247257233e-05, 8.321180939674377e-05, 8.994154632091522e-05, 9.667128324508667e-05, 0.00010340102016925812, 0.00011013075709342957, 0.00011686049401760101, 0.00012359023094177246, 0.0001303199678659439, 0.00013704970479011536, 0.0001437794417142868, 0.00015050917863845825, 0.0001572389155626297, 0.00016396865248680115, 0.0001706983894109726, 0.00017742812633514404, 0.0001841578632593155, 0.00019088760018348694, 0.00019761733710765839, 0.00020434707403182983, 0.00021107681095600128, 0.00021780654788017273, 0.00022453628480434418, 0.00023126602172851562]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 16.0, 24.0, 38.0, 73.0, 135.0, 218.0, 478.0, 1184.0, 3787.0, 20397.0, 240860.0, 688856.0, 78732.0, 9704.0, 2340.0, 850.0, 397.0, 192.0, 109.0, 44.0, 37.0, 21.0, 16.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.896484375, -2.806793212890625, -2.71710205078125, -2.627410888671875, -2.5377197265625, -2.448028564453125, -2.35833740234375, -2.268646240234375, -2.178955078125, -2.089263916015625, -1.99957275390625, -1.909881591796875, -1.8201904296875, -1.730499267578125, -1.64080810546875, -1.551116943359375, -1.46142578125, -1.371734619140625, -1.28204345703125, -1.192352294921875, -1.1026611328125, -1.012969970703125, -0.92327880859375, -0.833587646484375, -0.743896484375, -0.654205322265625, -0.56451416015625, -0.474822998046875, -0.3851318359375, -0.295440673828125, -0.20574951171875, -0.116058349609375, -0.0263671875, 0.063323974609375, 0.15301513671875, 0.242706298828125, 0.3323974609375, 0.422088623046875, 0.51177978515625, 0.601470947265625, 0.691162109375, 0.780853271484375, 0.87054443359375, 0.960235595703125, 1.0499267578125, 1.139617919921875, 1.22930908203125, 1.319000244140625, 1.40869140625, 1.498382568359375, 1.58807373046875, 1.677764892578125, 1.7674560546875, 1.857147216796875, 1.94683837890625, 2.036529541015625, 2.126220703125, 2.215911865234375, 2.30560302734375, 2.395294189453125, 2.4849853515625, 2.574676513671875, 2.66436767578125, 2.754058837890625, 2.84375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 9.0, 11.0, 15.0, 22.0, 18.0, 33.0, 45.0, 58.0, 71.0, 77.0, 78.0, 87.0, 87.0, 80.0, 70.0, 61.0, 43.0, 39.0, 14.0, 21.0, 20.0, 9.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8310546875, -0.7998809814453125, -0.768707275390625, -0.7375335693359375, -0.70635986328125, -0.6751861572265625, -0.644012451171875, -0.6128387451171875, -0.5816650390625, -0.5504913330078125, -0.519317626953125, -0.4881439208984375, -0.45697021484375, -0.4257965087890625, -0.394622802734375, -0.3634490966796875, -0.332275390625, -0.3011016845703125, -0.269927978515625, -0.2387542724609375, -0.20758056640625, -0.1764068603515625, -0.145233154296875, -0.1140594482421875, -0.0828857421875, -0.0517120361328125, -0.020538330078125, 0.0106353759765625, 0.04180908203125, 0.0729827880859375, 0.104156494140625, 0.1353302001953125, 0.16650390625, 0.1976776123046875, 0.228851318359375, 0.2600250244140625, 0.29119873046875, 0.3223724365234375, 0.353546142578125, 0.3847198486328125, 0.4158935546875, 0.4470672607421875, 0.478240966796875, 0.5094146728515625, 0.54058837890625, 0.5717620849609375, 0.602935791015625, 0.6341094970703125, 0.665283203125, 0.6964569091796875, 0.727630615234375, 0.7588043212890625, 0.78997802734375, 0.8211517333984375, 0.852325439453125, 0.8834991455078125, 0.9146728515625, 0.9458465576171875, 0.977020263671875, 1.0081939697265625, 1.03936767578125, 1.0705413818359375, 1.101715087890625, 1.1328887939453125, 1.1640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 10.0, 24.0, 107.0, 218.0, 318.0, 208.0, 79.0, 26.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.307259559631348, -11.382889747619629, -10.458520889282227, -9.534151077270508, -8.609781265258789, -7.68541145324707, -6.76104211807251, -5.836672782897949, -4.9123029708862305, -3.987933397293091, -3.063563823699951, -2.1391942501068115, -1.2148246765136719, -0.2904548645019531, 0.6339144706726074, 1.558283805847168, 2.4826536178588867, 3.4070231914520264, 4.331392765045166, 5.255762100219727, 6.180131912231445, 7.104501724243164, 8.028871536254883, 8.953240394592285, 9.877610206604004, 10.801980018615723, 11.726348876953125, 12.650718688964844, 13.575088500976562, 14.499458312988281, 15.423828125, 16.34819793701172, 17.272567749023438, 18.196937561035156, 19.121307373046875, 20.045677185058594, 20.970046997070312, 21.89441680908203, 22.818784713745117, 23.743154525756836, 24.667524337768555, 25.591894149780273, 26.516263961791992, 27.44063377380371, 28.365001678466797, 29.289371490478516, 30.213741302490234, 31.138111114501953, 32.06248092651367, 32.98685073852539, 33.91122055053711, 34.83559036254883, 35.75996017456055, 36.684329986572266, 37.608699798583984, 38.53306579589844, 39.457435607910156, 40.381805419921875, 41.306175231933594, 42.23054504394531, 43.15491485595703, 44.07928466796875, 45.00365447998047, 45.92802429199219, 46.852394104003906]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 4.0, 3.0, 11.0, 11.0, 6.0, 11.0, 16.0, 19.0, 19.0, 19.0, 37.0, 34.0, 42.0, 38.0, 38.0, 44.0, 46.0, 52.0, 48.0, 38.0, 54.0, 41.0, 42.0, 35.0, 46.0, 36.0, 31.0, 22.0, 29.0, 30.0, 26.0, 10.0, 8.0, 9.0, 8.0, 8.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.671116352081299, -7.450446128845215, -7.229775905609131, -7.009105682373047, -6.788434982299805, -6.567764759063721, -6.347094535827637, -6.126424312591553, -5.905754089355469, -5.685083866119385, -5.464413642883301, -5.243742942810059, -5.023072719573975, -4.802402496337891, -4.581732273101807, -4.361062049865723, -4.1403913497924805, -3.9197211265563965, -3.6990506649017334, -3.4783804416656494, -3.2577099800109863, -3.0370397567749023, -2.8163695335388184, -2.5956993103027344, -2.3750288486480713, -2.1543586254119873, -1.9336881637573242, -1.7130179405212402, -1.4923475980758667, -1.2716772556304932, -1.0510070323944092, -0.8303366899490356, -0.6096658706665039, -0.38899555802345276, -0.1683252453804016, 0.05234503746032715, 0.2730153799057007, 0.4936857223510742, 0.7143559455871582, 0.9350262880325317, 1.1556966304779053, 1.3763669729232788, 1.5970373153686523, 1.8177075386047363, 2.0383777618408203, 2.2590482234954834, 2.4797184467315674, 2.7003889083862305, 2.9210591316223145, 3.1417293548583984, 3.3623998165130615, 3.5830700397491455, 3.8037405014038086, 4.024410724639893, 4.245080947875977, 4.4657511711120605, 4.6864213943481445, 4.9070916175842285, 5.1277618408203125, 5.348432540893555, 5.569102764129639, 5.789772987365723, 6.010443210601807, 6.231113433837891, 6.451784133911133]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 5.0, 7.0, 10.0, 3.0, 8.0, 15.0, 15.0, 13.0, 25.0, 28.0, 39.0, 49.0, 94.0, 127.0, 242.0, 510.0, 1122.0, 3793.0, 19237.0, 296440.0, 3790170.0, 70435.0, 8806.0, 1928.0, 637.0, 253.0, 101.0, 52.0, 34.0, 16.0, 12.0, 7.0, 13.0, 6.0, 6.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.06597900390625, -5.8780517578125, -5.69012451171875, -5.502197265625, -5.31427001953125, -5.1263427734375, -4.93841552734375, -4.75048828125, -4.56256103515625, -4.3746337890625, -4.18670654296875, -3.998779296875, -3.81085205078125, -3.6229248046875, -3.43499755859375, -3.2470703125, -3.05914306640625, -2.8712158203125, -2.68328857421875, -2.495361328125, -2.30743408203125, -2.1195068359375, -1.93157958984375, -1.74365234375, -1.55572509765625, -1.3677978515625, -1.17987060546875, -0.991943359375, -0.80401611328125, -0.6160888671875, -0.42816162109375, -0.240234375, -0.05230712890625, 0.1356201171875, 0.32354736328125, 0.511474609375, 0.69940185546875, 0.8873291015625, 1.07525634765625, 1.26318359375, 1.45111083984375, 1.6390380859375, 1.82696533203125, 2.014892578125, 2.20281982421875, 2.3907470703125, 2.57867431640625, 2.7666015625, 2.95452880859375, 3.1424560546875, 3.33038330078125, 3.518310546875, 3.70623779296875, 3.8941650390625, 4.08209228515625, 4.27001953125, 4.45794677734375, 4.6458740234375, 4.83380126953125, 5.021728515625, 5.20965576171875, 5.3975830078125, 5.58551025390625, 5.7734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 9.0, 19.0, 16.0, 18.0, 47.0, 23.0, 41.0, 49.0, 81.0, 79.0, 75.0, 98.0, 76.0, 83.0, 51.0, 51.0, 34.0, 29.0, 25.0, 28.0, 19.0, 13.0, 11.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4599609375, -0.44878387451171875, -0.4376068115234375, -0.42642974853515625, -0.415252685546875, -0.40407562255859375, -0.3928985595703125, -0.38172149658203125, -0.37054443359375, -0.35936737060546875, -0.3481903076171875, -0.33701324462890625, -0.325836181640625, -0.31465911865234375, -0.3034820556640625, -0.29230499267578125, -0.2811279296875, -0.26995086669921875, -0.2587738037109375, -0.24759674072265625, -0.236419677734375, -0.22524261474609375, -0.2140655517578125, -0.20288848876953125, -0.19171142578125, -0.18053436279296875, -0.1693572998046875, -0.15818023681640625, -0.147003173828125, -0.13582611083984375, -0.1246490478515625, -0.11347198486328125, -0.102294921875, -0.09111785888671875, -0.0799407958984375, -0.06876373291015625, -0.057586669921875, -0.04640960693359375, -0.0352325439453125, -0.02405548095703125, -0.01287841796875, -0.00170135498046875, 0.0094757080078125, 0.02065277099609375, 0.031829833984375, 0.04300689697265625, 0.0541839599609375, 0.06536102294921875, 0.0765380859375, 0.08771514892578125, 0.0988922119140625, 0.11006927490234375, 0.121246337890625, 0.13242340087890625, 0.1436004638671875, 0.15477752685546875, 0.16595458984375, 0.17713165283203125, 0.1883087158203125, 0.19948577880859375, 0.210662841796875, 0.22183990478515625, 0.2330169677734375, 0.24419403076171875, 0.25537109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 12.0, 14.0, 31.0, 53.0, 112.0, 229.0, 876.0, 28119.0, 4160066.0, 4183.0, 365.0, 102.0, 59.0, 35.0, 12.0, 8.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -28.2078857421875, -27.525146484375, -26.8424072265625, -26.15966796875, -25.4769287109375, -24.794189453125, -24.1114501953125, -23.4287109375, -22.7459716796875, -22.063232421875, -21.3804931640625, -20.69775390625, -20.0150146484375, -19.332275390625, -18.6495361328125, -17.966796875, -17.2840576171875, -16.601318359375, -15.9185791015625, -15.23583984375, -14.5531005859375, -13.870361328125, -13.1876220703125, -12.5048828125, -11.8221435546875, -11.139404296875, -10.4566650390625, -9.77392578125, -9.0911865234375, -8.408447265625, -7.7257080078125, -7.04296875, -6.3602294921875, -5.677490234375, -4.9947509765625, -4.31201171875, -3.6292724609375, -2.946533203125, -2.2637939453125, -1.5810546875, -0.8983154296875, -0.215576171875, 0.4671630859375, 1.14990234375, 1.8326416015625, 2.515380859375, 3.1981201171875, 3.880859375, 4.5635986328125, 5.246337890625, 5.9290771484375, 6.61181640625, 7.2945556640625, 7.977294921875, 8.6600341796875, 9.3427734375, 10.0255126953125, 10.708251953125, 11.3909912109375, 12.07373046875, 12.7564697265625, 13.439208984375, 14.1219482421875, 14.8046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 24.0, 63.0, 183.0, 856.0, 2329.0, 412.0, 116.0, 39.0, 20.0, 9.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.0078125, -2.9491729736328125, -2.890533447265625, -2.8318939208984375, -2.77325439453125, -2.7146148681640625, -2.655975341796875, -2.5973358154296875, -2.5386962890625, -2.4800567626953125, -2.421417236328125, -2.3627777099609375, -2.30413818359375, -2.2454986572265625, -2.186859130859375, -2.1282196044921875, -2.069580078125, -2.0109405517578125, -1.952301025390625, -1.8936614990234375, -1.83502197265625, -1.7763824462890625, -1.717742919921875, -1.6591033935546875, -1.6004638671875, -1.5418243408203125, -1.483184814453125, -1.4245452880859375, -1.36590576171875, -1.3072662353515625, -1.248626708984375, -1.1899871826171875, -1.13134765625, -1.0727081298828125, -1.014068603515625, -0.9554290771484375, -0.89678955078125, -0.8381500244140625, -0.779510498046875, -0.7208709716796875, -0.6622314453125, -0.6035919189453125, -0.544952392578125, -0.4863128662109375, -0.42767333984375, -0.3690338134765625, -0.310394287109375, -0.2517547607421875, -0.193115234375, -0.1344757080078125, -0.075836181640625, -0.0171966552734375, 0.04144287109375, 0.1000823974609375, 0.158721923828125, 0.2173614501953125, 0.2760009765625, 0.3346405029296875, 0.393280029296875, 0.4519195556640625, 0.51055908203125, 0.5691986083984375, 0.627838134765625, 0.6864776611328125, 0.7451171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 23.0, 64.0, 568.0, 318.0, 32.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.848087310791016, -42.86951446533203, -41.89094543457031, -40.91237258911133, -39.93380355834961, -38.955230712890625, -37.976661682128906, -36.99808883666992, -36.01951599121094, -35.04094314575195, -34.062374114990234, -33.08380126953125, -32.10523223876953, -31.126659393310547, -30.148088455200195, -29.169517517089844, -28.190948486328125, -27.212377548217773, -26.233806610107422, -25.255233764648438, -24.276662826538086, -23.298091888427734, -22.319520950317383, -21.34095001220703, -20.362377166748047, -19.383806228637695, -18.405235290527344, -17.42666244506836, -16.448091506958008, -15.469520568847656, -14.490949630737305, -13.512378692626953, -12.533807754516602, -11.55523681640625, -10.576664924621582, -9.59809398651123, -8.619523048400879, -7.640951633453369, -6.662380218505859, -5.683809280395508, -4.705237865447998, -3.7266666889190674, -2.7480955123901367, -1.769524097442627, -0.7909529209136963, 0.18761825561523438, 1.1661896705627441, 2.1447606086730957, 3.1233320236206055, 4.101903438568115, 5.080474376678467, 6.059045791625977, 7.037616729736328, 8.01618766784668, 8.994759559631348, 9.9733304977417, 10.951902389526367, 11.930473327636719, 12.909045219421387, 13.887616157531738, 14.86618709564209, 15.844758987426758, 16.82332992553711, 17.80190086364746, 18.780471801757812]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 10.0, 5.0, 8.0, 18.0, 17.0, 34.0, 34.0, 62.0, 77.0, 63.0, 74.0, 86.0, 81.0, 73.0, 81.0, 68.0, 56.0, 57.0, 47.0, 21.0, 10.0, 9.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.372196197509766, -6.1926469802856445, -6.013097286224365, -5.833547592163086, -5.653998374938965, -5.474449157714844, -5.2948994636535645, -5.115349769592285, -4.935800552368164, -4.756251335144043, -4.576701641082764, -4.397151947021484, -4.217602729797363, -4.038053512573242, -3.858503818511963, -3.6789543628692627, -3.4994049072265625, -3.3198554515838623, -3.140305995941162, -2.960756540298462, -2.7812070846557617, -2.6016576290130615, -2.4221081733703613, -2.242558717727661, -2.063009262084961, -1.8834598064422607, -1.7039103507995605, -1.5243608951568604, -1.3448114395141602, -1.16526198387146, -0.9857125282287598, -0.8061630725860596, -0.6266131401062012, -0.447063684463501, -0.2675142288208008, -0.08796477317810059, 0.09158468246459961, 0.2711341381072998, 0.45068359375, 0.6302330493927002, 0.8097825050354004, 0.9893319606781006, 1.1688814163208008, 1.348430871963501, 1.5279803276062012, 1.7075297832489014, 1.8870792388916016, 2.0666286945343018, 2.246178150177002, 2.425727605819702, 2.6052770614624023, 2.7848265171051025, 2.9643759727478027, 3.143925428390503, 3.323474884033203, 3.5030243396759033, 3.6825737953186035, 3.8621232509613037, 4.041672706604004, 4.221221923828125, 4.400771617889404, 4.580321311950684, 4.759870529174805, 4.939419746398926, 5.118969440460205]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 3.0, 6.0, 9.0, 18.0, 18.0, 25.0, 33.0, 41.0, 59.0, 115.0, 182.0, 364.0, 856.0, 2969.0, 17148.0, 203980.0, 708904.0, 100276.0, 10002.0, 2069.0, 706.0, 299.0, 164.0, 103.0, 62.0, 39.0, 19.0, 19.0, 11.0, 10.0, 5.0, 8.0, 2.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-5.63671875, -5.4935302734375, -5.350341796875, -5.2071533203125, -5.06396484375, -4.9207763671875, -4.777587890625, -4.6343994140625, -4.4912109375, -4.3480224609375, -4.204833984375, -4.0616455078125, -3.91845703125, -3.7752685546875, -3.632080078125, -3.4888916015625, -3.345703125, -3.2025146484375, -3.059326171875, -2.9161376953125, -2.77294921875, -2.6297607421875, -2.486572265625, -2.3433837890625, -2.2001953125, -2.0570068359375, -1.913818359375, -1.7706298828125, -1.62744140625, -1.4842529296875, -1.341064453125, -1.1978759765625, -1.0546875, -0.9114990234375, -0.768310546875, -0.6251220703125, -0.48193359375, -0.3387451171875, -0.195556640625, -0.0523681640625, 0.0908203125, 0.2340087890625, 0.377197265625, 0.5203857421875, 0.66357421875, 0.8067626953125, 0.949951171875, 1.0931396484375, 1.236328125, 1.3795166015625, 1.522705078125, 1.6658935546875, 1.80908203125, 1.9522705078125, 2.095458984375, 2.2386474609375, 2.3818359375, 2.5250244140625, 2.668212890625, 2.8114013671875, 2.95458984375, 3.0977783203125, 3.240966796875, 3.3841552734375, 3.52734375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 10.0, 9.0, 13.0, 19.0, 23.0, 36.0, 34.0, 60.0, 63.0, 90.0, 69.0, 85.0, 89.0, 68.0, 77.0, 64.0, 37.0, 40.0, 38.0, 31.0, 10.0, 7.0, 10.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.53955078125, -0.5252456665039062, -0.5109405517578125, -0.49663543701171875, -0.482330322265625, -0.46802520751953125, -0.4537200927734375, -0.43941497802734375, -0.42510986328125, -0.41080474853515625, -0.3964996337890625, -0.38219451904296875, -0.367889404296875, -0.35358428955078125, -0.3392791748046875, -0.32497406005859375, -0.3106689453125, -0.29636383056640625, -0.2820587158203125, -0.26775360107421875, -0.253448486328125, -0.23914337158203125, -0.2248382568359375, -0.21053314208984375, -0.19622802734375, -0.18192291259765625, -0.1676177978515625, -0.15331268310546875, -0.139007568359375, -0.12470245361328125, -0.1103973388671875, -0.09609222412109375, -0.081787109375, -0.06748199462890625, -0.0531768798828125, -0.03887176513671875, -0.024566650390625, -0.01026153564453125, 0.0040435791015625, 0.01834869384765625, 0.03265380859375, 0.04695892333984375, 0.0612640380859375, 0.07556915283203125, 0.089874267578125, 0.10417938232421875, 0.1184844970703125, 0.13278961181640625, 0.1470947265625, 0.16139984130859375, 0.1757049560546875, 0.19001007080078125, 0.204315185546875, 0.21862030029296875, 0.2329254150390625, 0.24723052978515625, 0.26153564453125, 0.27584075927734375, 0.2901458740234375, 0.30445098876953125, 0.318756103515625, 0.33306121826171875, 0.3473663330078125, 0.36167144775390625, 0.3759765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 10.0, 10.0, 21.0, 20.0, 28.0, 37.0, 56.0, 74.0, 113.0, 145.0, 179.0, 305.0, 434.0, 730.0, 1274.0, 2426.0, 5536.0, 15307.0, 52112.0, 186801.0, 403862.0, 262675.0, 79392.0, 22339.0, 7479.0, 3124.0, 1549.0, 857.0, 491.0, 347.0, 236.0, 139.0, 132.0, 72.0, 64.0, 47.0, 30.0, 22.0, 17.0, 15.0, 10.0, 15.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.88671875, -1.828948974609375, -1.77117919921875, -1.713409423828125, -1.6556396484375, -1.597869873046875, -1.54010009765625, -1.482330322265625, -1.424560546875, -1.366790771484375, -1.30902099609375, -1.251251220703125, -1.1934814453125, -1.135711669921875, -1.07794189453125, -1.020172119140625, -0.96240234375, -0.904632568359375, -0.84686279296875, -0.789093017578125, -0.7313232421875, -0.673553466796875, -0.61578369140625, -0.558013916015625, -0.500244140625, -0.442474365234375, -0.38470458984375, -0.326934814453125, -0.2691650390625, -0.211395263671875, -0.15362548828125, -0.095855712890625, -0.0380859375, 0.019683837890625, 0.07745361328125, 0.135223388671875, 0.1929931640625, 0.250762939453125, 0.30853271484375, 0.366302490234375, 0.424072265625, 0.481842041015625, 0.53961181640625, 0.597381591796875, 0.6551513671875, 0.712921142578125, 0.77069091796875, 0.828460693359375, 0.88623046875, 0.944000244140625, 1.00177001953125, 1.059539794921875, 1.1173095703125, 1.175079345703125, 1.23284912109375, 1.290618896484375, 1.348388671875, 1.406158447265625, 1.46392822265625, 1.521697998046875, 1.5794677734375, 1.637237548828125, 1.69500732421875, 1.752777099609375, 1.810546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 1.0, 7.0, 10.0, 16.0, 9.0, 10.0, 13.0, 12.0, 18.0, 18.0, 24.0, 13.0, 25.0, 37.0, 33.0, 31.0, 42.0, 39.0, 39.0, 44.0, 30.0, 50.0, 36.0, 39.0, 33.0, 40.0, 44.0, 30.0, 34.0, 31.0, 23.0, 21.0, 26.0, 19.0, 14.0, 13.0, 13.0, 11.0, 8.0, 5.0, 8.0, 10.0, 6.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.984375, -0.949249267578125, -0.91412353515625, -0.878997802734375, -0.8438720703125, -0.808746337890625, -0.77362060546875, -0.738494873046875, -0.703369140625, -0.668243408203125, -0.63311767578125, -0.597991943359375, -0.5628662109375, -0.527740478515625, -0.49261474609375, -0.457489013671875, -0.42236328125, -0.387237548828125, -0.35211181640625, -0.316986083984375, -0.2818603515625, -0.246734619140625, -0.21160888671875, -0.176483154296875, -0.141357421875, -0.106231689453125, -0.07110595703125, -0.035980224609375, -0.0008544921875, 0.034271240234375, 0.06939697265625, 0.104522705078125, 0.1396484375, 0.174774169921875, 0.20989990234375, 0.245025634765625, 0.2801513671875, 0.315277099609375, 0.35040283203125, 0.385528564453125, 0.420654296875, 0.455780029296875, 0.49090576171875, 0.526031494140625, 0.5611572265625, 0.596282958984375, 0.63140869140625, 0.666534423828125, 0.70166015625, 0.736785888671875, 0.77191162109375, 0.807037353515625, 0.8421630859375, 0.877288818359375, 0.91241455078125, 0.947540283203125, 0.982666015625, 1.017791748046875, 1.05291748046875, 1.088043212890625, 1.1231689453125, 1.158294677734375, 1.19342041015625, 1.228546142578125, 1.263671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 12.0, 16.0, 23.0, 43.0, 61.0, 99.0, 168.0, 319.0, 644.0, 1464.0, 3880.0, 13165.0, 64097.0, 358201.0, 477047.0, 101658.0, 19122.0, 5088.0, 1745.0, 778.0, 381.0, 219.0, 103.0, 88.0, 42.0, 23.0, 21.0, 15.0, 13.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.2764892578125, -1.232666015625, -1.1888427734375, -1.14501953125, -1.1011962890625, -1.057373046875, -1.0135498046875, -0.9697265625, -0.9259033203125, -0.882080078125, -0.8382568359375, -0.79443359375, -0.7506103515625, -0.706787109375, -0.6629638671875, -0.619140625, -0.5753173828125, -0.531494140625, -0.4876708984375, -0.44384765625, -0.4000244140625, -0.356201171875, -0.3123779296875, -0.2685546875, -0.2247314453125, -0.180908203125, -0.1370849609375, -0.09326171875, -0.0494384765625, -0.005615234375, 0.0382080078125, 0.08203125, 0.1258544921875, 0.169677734375, 0.2135009765625, 0.25732421875, 0.3011474609375, 0.344970703125, 0.3887939453125, 0.4326171875, 0.4764404296875, 0.520263671875, 0.5640869140625, 0.60791015625, 0.6517333984375, 0.695556640625, 0.7393798828125, 0.783203125, 0.8270263671875, 0.870849609375, 0.9146728515625, 0.95849609375, 1.0023193359375, 1.046142578125, 1.0899658203125, 1.1337890625, 1.1776123046875, 1.221435546875, 1.2652587890625, 1.30908203125, 1.3529052734375, 1.396728515625, 1.4405517578125, 1.484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 11.0, 13.0, 7.0, 23.0, 20.0, 21.0, 27.0, 37.0, 37.0, 56.0, 53.0, 60.0, 66.0, 83.0, 69.0, 54.0, 52.0, 47.0, 46.0, 37.0, 27.0, 18.0, 18.0, 18.0, 18.0, 11.0, 12.0, 4.0, 10.0, 6.0, 9.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013363361358642578, -0.0001293141394853592, -0.0001249946653842926, -0.00012067519128322601, -0.00011635571718215942, -0.00011203624308109283, -0.00010771676898002625, -0.00010339729487895966, -9.907782077789307e-05, -9.475834667682648e-05, -9.043887257575989e-05, -8.61193984746933e-05, -8.179992437362671e-05, -7.748045027256012e-05, -7.316097617149353e-05, -6.884150207042694e-05, -6.452202796936035e-05, -6.020255386829376e-05, -5.588307976722717e-05, -5.1563605666160583e-05, -4.7244131565093994e-05, -4.2924657464027405e-05, -3.8605183362960815e-05, -3.4285709261894226e-05, -2.9966235160827637e-05, -2.5646761059761047e-05, -2.1327286958694458e-05, -1.700781285762787e-05, -1.268833875656128e-05, -8.36886465549469e-06, -4.049390554428101e-06, 2.7008354663848877e-07, 4.589557647705078e-06, 8.909031748771667e-06, 1.3228505849838257e-05, 1.7547979950904846e-05, 2.1867454051971436e-05, 2.6186928153038025e-05, 3.0506402254104614e-05, 3.4825876355171204e-05, 3.914535045623779e-05, 4.346482455730438e-05, 4.778429865837097e-05, 5.210377275943756e-05, 5.642324686050415e-05, 6.074272096157074e-05, 6.506219506263733e-05, 6.938166916370392e-05, 7.370114326477051e-05, 7.80206173658371e-05, 8.234009146690369e-05, 8.665956556797028e-05, 9.097903966903687e-05, 9.529851377010345e-05, 9.961798787117004e-05, 0.00010393746197223663, 0.00010825693607330322, 0.00011257641017436981, 0.0001168958842754364, 0.00012121535837650299, 0.00012553483247756958, 0.00012985430657863617, 0.00013417378067970276, 0.00013849325478076935, 0.00014281272888183594]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 10.0, 4.0, 16.0, 23.0, 21.0, 30.0, 41.0, 56.0, 88.0, 130.0, 198.0, 317.0, 571.0, 1016.0, 1921.0, 3949.0, 9542.0, 27774.0, 103135.0, 346768.0, 380272.0, 120629.0, 31951.0, 10848.0, 4475.0, 2038.0, 1099.0, 617.0, 315.0, 184.0, 167.0, 77.0, 82.0, 39.0, 29.0, 35.0, 17.0, 12.0, 13.0, 5.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0274658203125, -0.994384765625, -0.9613037109375, -0.92822265625, -0.8951416015625, -0.862060546875, -0.8289794921875, -0.7958984375, -0.7628173828125, -0.729736328125, -0.6966552734375, -0.66357421875, -0.6304931640625, -0.597412109375, -0.5643310546875, -0.53125, -0.4981689453125, -0.465087890625, -0.4320068359375, -0.39892578125, -0.3658447265625, -0.332763671875, -0.2996826171875, -0.2666015625, -0.2335205078125, -0.200439453125, -0.1673583984375, -0.13427734375, -0.1011962890625, -0.068115234375, -0.0350341796875, -0.001953125, 0.0311279296875, 0.064208984375, 0.0972900390625, 0.13037109375, 0.1634521484375, 0.196533203125, 0.2296142578125, 0.2626953125, 0.2957763671875, 0.328857421875, 0.3619384765625, 0.39501953125, 0.4281005859375, 0.461181640625, 0.4942626953125, 0.52734375, 0.5604248046875, 0.593505859375, 0.6265869140625, 0.65966796875, 0.6927490234375, 0.725830078125, 0.7589111328125, 0.7919921875, 0.8250732421875, 0.858154296875, 0.8912353515625, 0.92431640625, 0.9573974609375, 0.990478515625, 1.0235595703125, 1.056640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 10.0, 21.0, 20.0, 20.0, 32.0, 24.0, 57.0, 51.0, 54.0, 53.0, 75.0, 76.0, 81.0, 70.0, 71.0, 63.0, 32.0, 36.0, 31.0, 29.0, 17.0, 12.0, 11.0, 5.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69287109375, -0.667724609375, -0.642578125, -0.617431640625, -0.59228515625, -0.567138671875, -0.5419921875, -0.516845703125, -0.49169921875, -0.466552734375, -0.44140625, -0.416259765625, -0.39111328125, -0.365966796875, -0.3408203125, -0.315673828125, -0.29052734375, -0.265380859375, -0.240234375, -0.215087890625, -0.18994140625, -0.164794921875, -0.1396484375, -0.114501953125, -0.08935546875, -0.064208984375, -0.0390625, -0.013916015625, 0.01123046875, 0.036376953125, 0.0615234375, 0.086669921875, 0.11181640625, 0.136962890625, 0.162109375, 0.187255859375, 0.21240234375, 0.237548828125, 0.2626953125, 0.287841796875, 0.31298828125, 0.338134765625, 0.36328125, 0.388427734375, 0.41357421875, 0.438720703125, 0.4638671875, 0.489013671875, 0.51416015625, 0.539306640625, 0.564453125, 0.589599609375, 0.61474609375, 0.639892578125, 0.6650390625, 0.690185546875, 0.71533203125, 0.740478515625, 0.765625, 0.790771484375, 0.81591796875, 0.841064453125, 0.8662109375, 0.891357421875, 0.91650390625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 21.0, 67.0, 157.0, 245.0, 231.0, 144.0, 70.0, 32.0, 14.0, 9.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53908348083496, -22.84380531311035, -22.148527145385742, -21.453248977661133, -20.75796890258789, -20.06269073486328, -19.367412567138672, -18.672134399414062, -17.976856231689453, -17.281578063964844, -16.586299896240234, -15.891020774841309, -15.1957426071167, -14.50046443939209, -13.805185317993164, -13.109907150268555, -12.414628982543945, -11.719350814819336, -11.024072647094727, -10.3287935256958, -9.633515357971191, -8.938237190246582, -8.242958068847656, -7.547679901123047, -6.8524017333984375, -6.157123565673828, -5.4618449211120605, -4.766566276550293, -4.071288108825684, -3.376009702682495, -2.6807312965393066, -1.985452651977539, -1.2901725769042969, -0.5948941707611084, 0.10038423538208008, 0.7956626415252686, 1.490941047668457, 2.1862194538116455, 2.881497859954834, 3.5767765045166016, 4.272054672241211, 4.96733283996582, 5.662611484527588, 6.3578901290893555, 7.053168296813965, 7.748446464538574, 8.4437255859375, 9.13900375366211, 9.834281921386719, 10.529560089111328, 11.224838256835938, 11.920117378234863, 12.615395545959473, 13.310673713684082, 14.005952835083008, 14.701231002807617, 15.396509170532227, 16.091787338256836, 16.787065505981445, 17.482343673706055, 18.177623748779297, 18.872901916503906, 19.568180084228516, 20.263458251953125, 20.958736419677734]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 5.0, 12.0, 12.0, 12.0, 11.0, 17.0, 11.0, 25.0, 27.0, 23.0, 32.0, 34.0, 36.0, 58.0, 38.0, 45.0, 59.0, 63.0, 49.0, 51.0, 40.0, 34.0, 40.0, 31.0, 34.0, 41.0, 26.0, 26.0, 12.0, 11.0, 21.0, 12.0, 10.0, 9.0, 6.0, 2.0, 8.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.7847723960876465, -6.530965805053711, -6.277159214019775, -6.02335262298584, -5.7695465087890625, -5.515739440917969, -5.261933326721191, -5.008126735687256, -4.75432014465332, -4.500513553619385, -4.246706962585449, -3.9929006099700928, -3.7390940189361572, -3.4852874279022217, -3.2314810752868652, -2.9776744842529297, -2.723867893218994, -2.4700613021850586, -2.216254711151123, -1.9624483585357666, -1.708641767501831, -1.4548351764678955, -1.2010287046432495, -0.9472222328186035, -0.693415641784668, -0.4396091103553772, -0.18580257892608643, 0.06800395250320435, 0.3218104839324951, 0.5756170749664307, 0.8294235467910767, 1.0832300186157227, 1.3370361328125, 1.5908427238464355, 1.8446491956710815, 2.0984556674957275, 2.352262258529663, 2.6060688495635986, 2.859875202178955, 3.1136817932128906, 3.367488384246826, 3.6212949752807617, 3.8751015663146973, 4.128908157348633, 4.38271427154541, 4.636521339416504, 4.890327453613281, 5.144134044647217, 5.397940635681152, 5.651747226715088, 5.905553817749023, 6.159360408782959, 6.4131669998168945, 6.666973114013672, 6.920779705047607, 7.174586296081543, 7.4283928871154785, 7.682199478149414, 7.93600606918335, 8.189812660217285, 8.443618774414062, 8.697425842285156, 8.951231956481934, 9.205038070678711, 9.458845138549805]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 14.0, 5.0, 10.0, 10.0, 21.0, 25.0, 30.0, 43.0, 65.0, 78.0, 109.0, 155.0, 248.0, 484.0, 1247.0, 3750.0, 16202.0, 177915.0, 3886101.0, 91308.0, 11649.0, 2917.0, 993.0, 415.0, 181.0, 111.0, 66.0, 27.0, 26.0, 18.0, 6.0, 5.0, 14.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.90234375, -4.75555419921875, -4.6087646484375, -4.46197509765625, -4.315185546875, -4.16839599609375, -4.0216064453125, -3.87481689453125, -3.72802734375, -3.58123779296875, -3.4344482421875, -3.28765869140625, -3.140869140625, -2.99407958984375, -2.8472900390625, -2.70050048828125, -2.5537109375, -2.40692138671875, -2.2601318359375, -2.11334228515625, -1.966552734375, -1.81976318359375, -1.6729736328125, -1.52618408203125, -1.37939453125, -1.23260498046875, -1.0858154296875, -0.93902587890625, -0.792236328125, -0.64544677734375, -0.4986572265625, -0.35186767578125, -0.205078125, -0.05828857421875, 0.0885009765625, 0.23529052734375, 0.382080078125, 0.52886962890625, 0.6756591796875, 0.82244873046875, 0.96923828125, 1.11602783203125, 1.2628173828125, 1.40960693359375, 1.556396484375, 1.70318603515625, 1.8499755859375, 1.99676513671875, 2.1435546875, 2.29034423828125, 2.4371337890625, 2.58392333984375, 2.730712890625, 2.87750244140625, 3.0242919921875, 3.17108154296875, 3.31787109375, 3.46466064453125, 3.6114501953125, 3.75823974609375, 3.905029296875, 4.05181884765625, 4.1986083984375, 4.34539794921875, 4.4921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 3.0, 8.0, 19.0, 18.0, 25.0, 44.0, 51.0, 59.0, 58.0, 69.0, 81.0, 79.0, 82.0, 59.0, 70.0, 53.0, 49.0, 39.0, 32.0, 27.0, 15.0, 14.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.54248046875, -0.5287551879882812, -0.5150299072265625, -0.5013046264648438, -0.487579345703125, -0.47385406494140625, -0.4601287841796875, -0.44640350341796875, -0.43267822265625, -0.41895294189453125, -0.4052276611328125, -0.39150238037109375, -0.377777099609375, -0.36405181884765625, -0.3503265380859375, -0.33660125732421875, -0.3228759765625, -0.30915069580078125, -0.2954254150390625, -0.28170013427734375, -0.267974853515625, -0.25424957275390625, -0.2405242919921875, -0.22679901123046875, -0.21307373046875, -0.19934844970703125, -0.1856231689453125, -0.17189788818359375, -0.158172607421875, -0.14444732666015625, -0.1307220458984375, -0.11699676513671875, -0.103271484375, -0.08954620361328125, -0.0758209228515625, -0.06209564208984375, -0.048370361328125, -0.03464508056640625, -0.0209197998046875, -0.00719451904296875, 0.00653076171875, 0.02025604248046875, 0.0339813232421875, 0.04770660400390625, 0.061431884765625, 0.07515716552734375, 0.0888824462890625, 0.10260772705078125, 0.1163330078125, 0.13005828857421875, 0.1437835693359375, 0.15750885009765625, 0.171234130859375, 0.18495941162109375, 0.1986846923828125, 0.21240997314453125, 0.22613525390625, 0.23986053466796875, 0.2535858154296875, 0.26731109619140625, 0.281036376953125, 0.29476165771484375, 0.3084869384765625, 0.32221221923828125, 0.3359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 3.0, 10.0, 15.0, 19.0, 23.0, 48.0, 65.0, 93.0, 125.0, 175.0, 507.0, 5117.0, 3762717.0, 421604.0, 2862.0, 345.0, 153.0, 108.0, 70.0, 60.0, 33.0, 37.0, 37.0, 22.0, 12.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.25, -7.8896484375, -7.529296875, -7.1689453125, -6.80859375, -6.4482421875, -6.087890625, -5.7275390625, -5.3671875, -5.0068359375, -4.646484375, -4.2861328125, -3.92578125, -3.5654296875, -3.205078125, -2.8447265625, -2.484375, -2.1240234375, -1.763671875, -1.4033203125, -1.04296875, -0.6826171875, -0.322265625, 0.0380859375, 0.3984375, 0.7587890625, 1.119140625, 1.4794921875, 1.83984375, 2.2001953125, 2.560546875, 2.9208984375, 3.28125, 3.6416015625, 4.001953125, 4.3623046875, 4.72265625, 5.0830078125, 5.443359375, 5.8037109375, 6.1640625, 6.5244140625, 6.884765625, 7.2451171875, 7.60546875, 7.9658203125, 8.326171875, 8.6865234375, 9.046875, 9.4072265625, 9.767578125, 10.1279296875, 10.48828125, 10.8486328125, 11.208984375, 11.5693359375, 11.9296875, 12.2900390625, 12.650390625, 13.0107421875, 13.37109375, 13.7314453125, 14.091796875, 14.4521484375, 14.8125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 16.0, 41.0, 315.0, 3052.0, 544.0, 84.0, 19.0, 12.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.483154296875, -2.38623046875, -2.289306640625, -2.1923828125, -2.095458984375, -1.99853515625, -1.901611328125, -1.8046875, -1.707763671875, -1.61083984375, -1.513916015625, -1.4169921875, -1.320068359375, -1.22314453125, -1.126220703125, -1.029296875, -0.932373046875, -0.83544921875, -0.738525390625, -0.6416015625, -0.544677734375, -0.44775390625, -0.350830078125, -0.25390625, -0.156982421875, -0.06005859375, 0.036865234375, 0.1337890625, 0.230712890625, 0.32763671875, 0.424560546875, 0.521484375, 0.618408203125, 0.71533203125, 0.812255859375, 0.9091796875, 1.006103515625, 1.10302734375, 1.199951171875, 1.296875, 1.393798828125, 1.49072265625, 1.587646484375, 1.6845703125, 1.781494140625, 1.87841796875, 1.975341796875, 2.072265625, 2.169189453125, 2.26611328125, 2.363037109375, 2.4599609375, 2.556884765625, 2.65380859375, 2.750732421875, 2.84765625, 2.944580078125, 3.04150390625, 3.138427734375, 3.2353515625, 3.332275390625, 3.42919921875, 3.526123046875, 3.623046875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 13.0, 148.0, 590.0, 212.0, 33.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.634317874908447, -5.9419779777526855, -5.249637603759766, -4.557297706604004, -3.864957809448242, -3.1726179122924805, -2.4802775382995605, -1.7879376411437988, -1.095597743988037, -0.40325772762298584, 0.28908228874206543, 0.9814224243164062, 1.673762321472168, 2.3661022186279297, 3.0584425926208496, 3.7507824897766113, 4.443122386932373, 5.135462284088135, 5.827802658081055, 6.520142555236816, 7.212482452392578, 7.90482234954834, 8.597162246704102, 9.28950309753418, 9.981842041015625, 10.674181938171387, 11.366521835327148, 12.058862686157227, 12.751201629638672, 13.44354248046875, 14.135882377624512, 14.828222274780273, 15.520561218261719, 16.212902069091797, 16.905241012573242, 17.59758186340332, 18.289920806884766, 18.982261657714844, 19.674602508544922, 20.366941452026367, 21.059280395507812, 21.75162124633789, 22.443960189819336, 23.136301040649414, 23.82863998413086, 24.520980834960938, 25.213321685791016, 25.90566062927246, 26.59800148010254, 27.290342330932617, 27.982681274414062, 28.67502212524414, 29.367361068725586, 30.059701919555664, 30.75204086303711, 31.444381713867188, 32.136722564697266, 32.829063415527344, 33.52140426635742, 34.213741302490234, 34.90608215332031, 35.59842300415039, 36.29076385498047, 36.98310089111328, 37.67544174194336]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 8.0, 10.0, 17.0, 23.0, 45.0, 68.0, 98.0, 112.0, 124.0, 118.0, 96.0, 110.0, 66.0, 46.0, 34.0, 14.0, 11.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.434198379516602, -8.22624397277832, -8.018289566040039, -7.810335159301758, -7.602380752563477, -7.394426345825195, -7.186471939086914, -6.978517532348633, -6.770563125610352, -6.56260871887207, -6.354654312133789, -6.146699905395508, -5.938745498657227, -5.730791091918945, -5.522836685180664, -5.314882278442383, -5.106927871704102, -4.89897346496582, -4.691019058227539, -4.483064651489258, -4.275110244750977, -4.067155838012695, -3.859201431274414, -3.651247024536133, -3.4432926177978516, -3.2353382110595703, -3.027383804321289, -2.819429397583008, -2.6114749908447266, -2.4035205841064453, -2.195566177368164, -1.9876117706298828, -1.7796573638916016, -1.5717029571533203, -1.363748550415039, -1.1557941436767578, -0.9478397369384766, -0.7398853302001953, -0.5319309234619141, -0.3239765167236328, -0.11602210998535156, 0.09193229675292969, 0.29988670349121094, 0.5078411102294922, 0.7157955169677734, 0.9237499237060547, 1.131704330444336, 1.3396587371826172, 1.5476131439208984, 1.7555675506591797, 1.963521957397461, 2.171476364135742, 2.3794307708740234, 2.5873851776123047, 2.795339584350586, 3.003293991088867, 3.2112483978271484, 3.4192028045654297, 3.627157211303711, 3.835111618041992, 4.043066024780273, 4.251020431518555, 4.458974838256836, 4.666929244995117, 4.874883651733398]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 18.0, 26.0, 49.0, 91.0, 171.0, 412.0, 1472.0, 9789.0, 267981.0, 734818.0, 29902.0, 2654.0, 669.0, 243.0, 103.0, 52.0, 30.0, 25.0, 13.0, 11.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.5302734375, -4.326171875, -4.1220703125, -3.91796875, -3.7138671875, -3.509765625, -3.3056640625, -3.1015625, -2.8974609375, -2.693359375, -2.4892578125, -2.28515625, -2.0810546875, -1.876953125, -1.6728515625, -1.46875, -1.2646484375, -1.060546875, -0.8564453125, -0.65234375, -0.4482421875, -0.244140625, -0.0400390625, 0.1640625, 0.3681640625, 0.572265625, 0.7763671875, 0.98046875, 1.1845703125, 1.388671875, 1.5927734375, 1.796875, 2.0009765625, 2.205078125, 2.4091796875, 2.61328125, 2.8173828125, 3.021484375, 3.2255859375, 3.4296875, 3.6337890625, 3.837890625, 4.0419921875, 4.24609375, 4.4501953125, 4.654296875, 4.8583984375, 5.0625, 5.2666015625, 5.470703125, 5.6748046875, 5.87890625, 6.0830078125, 6.287109375, 6.4912109375, 6.6953125, 6.8994140625, 7.103515625, 7.3076171875, 7.51171875, 7.7158203125, 7.919921875, 8.1240234375, 8.328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 10.0, 17.0, 10.0, 16.0, 31.0, 30.0, 39.0, 31.0, 53.0, 64.0, 50.0, 60.0, 70.0, 68.0, 52.0, 56.0, 53.0, 57.0, 39.0, 39.0, 30.0, 19.0, 17.0, 18.0, 12.0, 12.0, 0.0, 6.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.372314453125, -0.36093902587890625, -0.3495635986328125, -0.33818817138671875, -0.326812744140625, -0.31543731689453125, -0.3040618896484375, -0.29268646240234375, -0.28131103515625, -0.26993560791015625, -0.2585601806640625, -0.24718475341796875, -0.235809326171875, -0.22443389892578125, -0.2130584716796875, -0.20168304443359375, -0.1903076171875, -0.17893218994140625, -0.1675567626953125, -0.15618133544921875, -0.144805908203125, -0.13343048095703125, -0.1220550537109375, -0.11067962646484375, -0.09930419921875, -0.08792877197265625, -0.0765533447265625, -0.06517791748046875, -0.053802490234375, -0.04242706298828125, -0.0310516357421875, -0.01967620849609375, -0.00830078125, 0.00307464599609375, 0.0144500732421875, 0.02582550048828125, 0.037200927734375, 0.04857635498046875, 0.0599517822265625, 0.07132720947265625, 0.08270263671875, 0.09407806396484375, 0.1054534912109375, 0.11682891845703125, 0.128204345703125, 0.13957977294921875, 0.1509552001953125, 0.16233062744140625, 0.1737060546875, 0.18508148193359375, 0.1964569091796875, 0.20783233642578125, 0.219207763671875, 0.23058319091796875, 0.2419586181640625, 0.25333404541015625, 0.26470947265625, 0.27608489990234375, 0.2874603271484375, 0.29883575439453125, 0.310211181640625, 0.32158660888671875, 0.3329620361328125, 0.34433746337890625, 0.355712890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 12.0, 18.0, 27.0, 25.0, 33.0, 50.0, 76.0, 109.0, 126.0, 212.0, 295.0, 451.0, 724.0, 1302.0, 2612.0, 5857.0, 16768.0, 62589.0, 240845.0, 440559.0, 200452.0, 50634.0, 14204.0, 4969.0, 2334.0, 1216.0, 672.0, 421.0, 266.0, 217.0, 110.0, 85.0, 74.0, 48.0, 52.0, 31.0, 20.0, 16.0, 7.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.087890625, -2.02349853515625, -1.9591064453125, -1.89471435546875, -1.830322265625, -1.76593017578125, -1.7015380859375, -1.63714599609375, -1.57275390625, -1.50836181640625, -1.4439697265625, -1.37957763671875, -1.315185546875, -1.25079345703125, -1.1864013671875, -1.12200927734375, -1.0576171875, -0.99322509765625, -0.9288330078125, -0.86444091796875, -0.800048828125, -0.73565673828125, -0.6712646484375, -0.60687255859375, -0.54248046875, -0.47808837890625, -0.4136962890625, -0.34930419921875, -0.284912109375, -0.22052001953125, -0.1561279296875, -0.09173583984375, -0.02734375, 0.03704833984375, 0.1014404296875, 0.16583251953125, 0.230224609375, 0.29461669921875, 0.3590087890625, 0.42340087890625, 0.48779296875, 0.55218505859375, 0.6165771484375, 0.68096923828125, 0.745361328125, 0.80975341796875, 0.8741455078125, 0.93853759765625, 1.0029296875, 1.06732177734375, 1.1317138671875, 1.19610595703125, 1.260498046875, 1.32489013671875, 1.3892822265625, 1.45367431640625, 1.51806640625, 1.58245849609375, 1.6468505859375, 1.71124267578125, 1.775634765625, 1.84002685546875, 1.9044189453125, 1.96881103515625, 2.033203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 13.0, 5.0, 8.0, 14.0, 7.0, 19.0, 21.0, 30.0, 21.0, 22.0, 35.0, 35.0, 40.0, 48.0, 45.0, 64.0, 55.0, 54.0, 60.0, 53.0, 40.0, 44.0, 54.0, 35.0, 22.0, 30.0, 22.0, 19.0, 15.0, 22.0, 8.0, 11.0, 7.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.9658203125, -1.914215087890625, -1.86260986328125, -1.811004638671875, -1.7593994140625, -1.707794189453125, -1.65618896484375, -1.604583740234375, -1.552978515625, -1.501373291015625, -1.44976806640625, -1.398162841796875, -1.3465576171875, -1.294952392578125, -1.24334716796875, -1.191741943359375, -1.14013671875, -1.088531494140625, -1.03692626953125, -0.985321044921875, -0.9337158203125, -0.882110595703125, -0.83050537109375, -0.778900146484375, -0.727294921875, -0.675689697265625, -0.62408447265625, -0.572479248046875, -0.5208740234375, -0.469268798828125, -0.41766357421875, -0.366058349609375, -0.314453125, -0.262847900390625, -0.21124267578125, -0.159637451171875, -0.1080322265625, -0.056427001953125, -0.00482177734375, 0.046783447265625, 0.098388671875, 0.149993896484375, 0.20159912109375, 0.253204345703125, 0.3048095703125, 0.356414794921875, 0.40802001953125, 0.459625244140625, 0.51123046875, 0.562835693359375, 0.61444091796875, 0.666046142578125, 0.7176513671875, 0.769256591796875, 0.82086181640625, 0.872467041015625, 0.924072265625, 0.975677490234375, 1.02728271484375, 1.078887939453125, 1.1304931640625, 1.182098388671875, 1.23370361328125, 1.285308837890625, 1.3369140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 10.0, 7.0, 23.0, 36.0, 42.0, 63.0, 84.0, 169.0, 279.0, 459.0, 1057.0, 2330.0, 6425.0, 23757.0, 109620.0, 451595.0, 351656.0, 74982.0, 17107.0, 5041.0, 1870.0, 856.0, 452.0, 238.0, 132.0, 88.0, 55.0, 37.0, 30.0, 8.0, 13.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.330078125, -1.2896270751953125, -1.249176025390625, -1.2087249755859375, -1.16827392578125, -1.1278228759765625, -1.087371826171875, -1.0469207763671875, -1.0064697265625, -0.9660186767578125, -0.925567626953125, -0.8851165771484375, -0.84466552734375, -0.8042144775390625, -0.763763427734375, -0.7233123779296875, -0.682861328125, -0.6424102783203125, -0.601959228515625, -0.5615081787109375, -0.52105712890625, -0.4806060791015625, -0.440155029296875, -0.3997039794921875, -0.3592529296875, -0.3188018798828125, -0.278350830078125, -0.2378997802734375, -0.19744873046875, -0.1569976806640625, -0.116546630859375, -0.0760955810546875, -0.03564453125, 0.0048065185546875, 0.045257568359375, 0.0857086181640625, 0.12615966796875, 0.1666107177734375, 0.207061767578125, 0.2475128173828125, 0.2879638671875, 0.3284149169921875, 0.368865966796875, 0.4093170166015625, 0.44976806640625, 0.4902191162109375, 0.530670166015625, 0.5711212158203125, 0.611572265625, 0.6520233154296875, 0.692474365234375, 0.7329254150390625, 0.77337646484375, 0.8138275146484375, 0.854278564453125, 0.8947296142578125, 0.9351806640625, 0.9756317138671875, 1.016082763671875, 1.0565338134765625, 1.09698486328125, 1.1374359130859375, 1.177886962890625, 1.2183380126953125, 1.2587890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 15.0, 9.0, 12.0, 16.0, 21.0, 34.0, 33.0, 46.0, 54.0, 75.0, 87.0, 106.0, 88.0, 74.0, 67.0, 47.0, 40.0, 45.0, 40.0, 21.0, 14.0, 15.0, 9.0, 6.0, 7.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025582313537597656, -0.0002496875822544098, -0.00024355202913284302, -0.00023741647601127625, -0.00023128092288970947, -0.0002251453697681427, -0.00021900981664657593, -0.00021287426352500916, -0.00020673871040344238, -0.0002006031572818756, -0.00019446760416030884, -0.00018833205103874207, -0.0001821964979171753, -0.00017606094479560852, -0.00016992539167404175, -0.00016378983855247498, -0.0001576542854309082, -0.00015151873230934143, -0.00014538317918777466, -0.00013924762606620789, -0.0001331120729446411, -0.00012697651982307434, -0.00012084096670150757, -0.0001147054135799408, -0.00010856986045837402, -0.00010243430733680725, -9.629875421524048e-05, -9.01632010936737e-05, -8.402764797210693e-05, -7.789209485054016e-05, -7.175654172897339e-05, -6.562098860740662e-05, -5.9485435485839844e-05, -5.334988236427307e-05, -4.72143292427063e-05, -4.1078776121139526e-05, -3.4943222999572754e-05, -2.880766987800598e-05, -2.267211675643921e-05, -1.6536563634872437e-05, -1.0401010513305664e-05, -4.265457391738892e-06, 1.8700957298278809e-06, 8.005648851394653e-06, 1.4141201972961426e-05, 2.0276755094528198e-05, 2.641230821609497e-05, 3.254786133766174e-05, 3.8683414459228516e-05, 4.481896758079529e-05, 5.095452070236206e-05, 5.709007382392883e-05, 6.32256269454956e-05, 6.936118006706238e-05, 7.549673318862915e-05, 8.163228631019592e-05, 8.77678394317627e-05, 9.390339255332947e-05, 0.00010003894567489624, 0.00010617449879646301, 0.00011231005191802979, 0.00011844560503959656, 0.00012458115816116333, 0.0001307167112827301, 0.00013685226440429688]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 10.0, 8.0, 21.0, 23.0, 29.0, 51.0, 94.0, 140.0, 222.0, 347.0, 625.0, 1236.0, 2533.0, 6153.0, 18152.0, 68614.0, 294202.0, 466605.0, 138793.0, 33151.0, 10028.0, 3792.0, 1668.0, 852.0, 423.0, 293.0, 169.0, 92.0, 68.0, 49.0, 33.0, 13.0, 12.0, 13.0, 12.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.12109375, -1.085205078125, -1.04931640625, -1.013427734375, -0.9775390625, -0.941650390625, -0.90576171875, -0.869873046875, -0.833984375, -0.798095703125, -0.76220703125, -0.726318359375, -0.6904296875, -0.654541015625, -0.61865234375, -0.582763671875, -0.546875, -0.510986328125, -0.47509765625, -0.439208984375, -0.4033203125, -0.367431640625, -0.33154296875, -0.295654296875, -0.259765625, -0.223876953125, -0.18798828125, -0.152099609375, -0.1162109375, -0.080322265625, -0.04443359375, -0.008544921875, 0.02734375, 0.063232421875, 0.09912109375, 0.135009765625, 0.1708984375, 0.206787109375, 0.24267578125, 0.278564453125, 0.314453125, 0.350341796875, 0.38623046875, 0.422119140625, 0.4580078125, 0.493896484375, 0.52978515625, 0.565673828125, 0.6015625, 0.637451171875, 0.67333984375, 0.709228515625, 0.7451171875, 0.781005859375, 0.81689453125, 0.852783203125, 0.888671875, 0.924560546875, 0.96044921875, 0.996337890625, 1.0322265625, 1.068115234375, 1.10400390625, 1.139892578125, 1.17578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 6.0, 6.0, 16.0, 14.0, 35.0, 35.0, 48.0, 47.0, 52.0, 74.0, 93.0, 97.0, 92.0, 83.0, 70.0, 50.0, 42.0, 25.0, 25.0, 24.0, 17.0, 11.0, 6.0, 5.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.998046875, -0.9664154052734375, -0.934783935546875, -0.9031524658203125, -0.87152099609375, -0.8398895263671875, -0.808258056640625, -0.7766265869140625, -0.7449951171875, -0.7133636474609375, -0.681732177734375, -0.6501007080078125, -0.61846923828125, -0.5868377685546875, -0.555206298828125, -0.5235748291015625, -0.491943359375, -0.4603118896484375, -0.428680419921875, -0.3970489501953125, -0.36541748046875, -0.3337860107421875, -0.302154541015625, -0.2705230712890625, -0.2388916015625, -0.2072601318359375, -0.175628662109375, -0.1439971923828125, -0.11236572265625, -0.0807342529296875, -0.049102783203125, -0.0174713134765625, 0.01416015625, 0.0457916259765625, 0.077423095703125, 0.1090545654296875, 0.14068603515625, 0.1723175048828125, 0.203948974609375, 0.2355804443359375, 0.2672119140625, 0.2988433837890625, 0.330474853515625, 0.3621063232421875, 0.39373779296875, 0.4253692626953125, 0.457000732421875, 0.4886322021484375, 0.520263671875, 0.5518951416015625, 0.583526611328125, 0.6151580810546875, 0.64678955078125, 0.6784210205078125, 0.710052490234375, 0.7416839599609375, 0.7733154296875, 0.8049468994140625, 0.836578369140625, 0.8682098388671875, 0.89984130859375, 0.9314727783203125, 0.963104248046875, 0.9947357177734375, 1.0263671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 25.0, 27.0, 60.0, 108.0, 137.0, 176.0, 148.0, 102.0, 93.0, 45.0, 27.0, 21.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.19582748413086, -17.657377243041992, -17.118927001953125, -16.580474853515625, -16.042024612426758, -15.50357437133789, -14.965124130249023, -14.426673889160156, -13.888222694396973, -13.349772453308105, -12.811321258544922, -12.272871017456055, -11.734420776367188, -11.195969581604004, -10.657519340515137, -10.119068145751953, -9.580617904663086, -9.042167663574219, -8.503716468811035, -7.965266227722168, -7.426815509796143, -6.888364791870117, -6.34991455078125, -5.811463832855225, -5.273013114929199, -4.734562397003174, -4.196111679077148, -3.6576614379882812, -3.119210720062256, -2.5807600021362305, -2.042309522628784, -1.503859043121338, -0.9654083251953125, -0.42695772647857666, 0.11149287223815918, 0.649943470954895, 1.1883940696716309, 1.7268447875976562, 2.2652952671051025, 2.803745746612549, 3.342196464538574, 3.8806471824645996, 4.419097900390625, 4.957548141479492, 5.495998859405518, 6.034449577331543, 6.57289981842041, 7.1113505363464355, 7.649801254272461, 8.188251495361328, 8.726702690124512, 9.265152931213379, 9.803604125976562, 10.34205436706543, 10.880504608154297, 11.418954849243164, 11.957406044006348, 12.495856285095215, 13.034307479858398, 13.572757720947266, 14.111207962036133, 14.649659156799316, 15.188109397888184, 15.726560592651367, 16.265010833740234]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 6.0, 1.0, 7.0, 6.0, 9.0, 20.0, 20.0, 27.0, 21.0, 28.0, 29.0, 18.0, 38.0, 34.0, 40.0, 45.0, 38.0, 45.0, 53.0, 50.0, 46.0, 53.0, 49.0, 43.0, 43.0, 33.0, 35.0, 26.0, 15.0, 23.0, 15.0, 22.0, 13.0, 8.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.792655944824219, -8.506147384643555, -8.219637870788574, -7.93312931060791, -7.646620750427246, -7.360111713409424, -7.073602676391602, -6.7870941162109375, -6.500585556030273, -6.214076519012451, -5.927567958831787, -5.641058921813965, -5.354550361633301, -5.0680413246154785, -4.781532287597656, -4.495023727416992, -4.20851469039917, -3.9220058917999268, -3.6354970932006836, -3.3489880561828613, -3.0624794960021973, -2.775970458984375, -2.489461660385132, -2.2029528617858887, -1.9164440631866455, -1.6299352645874023, -1.3434264659881592, -1.0569175481796265, -0.7704087495803833, -0.48389995098114014, -0.19739103317260742, 0.08911776542663574, 0.3756265640258789, 0.6621353626251221, 0.94864422082901, 1.235153079032898, 1.5216618776321411, 1.8081706762313843, 2.094679594039917, 2.38118839263916, 2.6676971912384033, 2.9542059898376465, 3.2407147884368896, 3.527223587036133, 3.813732624053955, 4.100241184234619, 4.386750221252441, 4.6732587814331055, 4.959767818450928, 5.24627685546875, 5.532785415649414, 5.819294452667236, 6.1058030128479, 6.392312049865723, 6.678820610046387, 6.965329647064209, 7.251838684082031, 7.5383477210998535, 7.824856281280518, 8.11136531829834, 8.397873878479004, 8.684382438659668, 8.970891952514648, 9.257400512695312, 9.543909072875977]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 5.0, 8.0, 12.0, 10.0, 24.0, 29.0, 48.0, 53.0, 77.0, 119.0, 169.0, 274.0, 521.0, 1055.0, 2608.0, 7992.0, 35873.0, 350709.0, 3607440.0, 154926.0, 22482.0, 6071.0, 2073.0, 849.0, 400.0, 189.0, 96.0, 54.0, 29.0, 18.0, 18.0, 7.0, 7.0, 10.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.261688232421875, -4.14447021484375, -4.027252197265625, -3.9100341796875, -3.792816162109375, -3.67559814453125, -3.558380126953125, -3.441162109375, -3.323944091796875, -3.20672607421875, -3.089508056640625, -2.9722900390625, -2.855072021484375, -2.73785400390625, -2.620635986328125, -2.50341796875, -2.386199951171875, -2.26898193359375, -2.151763916015625, -2.0345458984375, -1.917327880859375, -1.80010986328125, -1.682891845703125, -1.565673828125, -1.448455810546875, -1.33123779296875, -1.214019775390625, -1.0968017578125, -0.979583740234375, -0.86236572265625, -0.745147705078125, -0.6279296875, -0.510711669921875, -0.39349365234375, -0.276275634765625, -0.1590576171875, -0.041839599609375, 0.07537841796875, 0.192596435546875, 0.309814453125, 0.427032470703125, 0.54425048828125, 0.661468505859375, 0.7786865234375, 0.895904541015625, 1.01312255859375, 1.130340576171875, 1.24755859375, 1.364776611328125, 1.48199462890625, 1.599212646484375, 1.7164306640625, 1.833648681640625, 1.95086669921875, 2.068084716796875, 2.185302734375, 2.302520751953125, 2.41973876953125, 2.536956787109375, 2.6541748046875, 2.771392822265625, 2.88861083984375, 3.005828857421875, 3.123046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 9.0, 11.0, 8.0, 10.0, 15.0, 21.0, 22.0, 38.0, 37.0, 40.0, 44.0, 55.0, 59.0, 52.0, 63.0, 59.0, 63.0, 59.0, 62.0, 42.0, 35.0, 41.0, 26.0, 38.0, 27.0, 20.0, 12.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396728515625, -0.3847236633300781, -0.37271881103515625, -0.3607139587402344, -0.3487091064453125, -0.3367042541503906, -0.32469940185546875, -0.3126945495605469, -0.300689697265625, -0.2886848449707031, -0.27667999267578125, -0.2646751403808594, -0.2526702880859375, -0.24066543579101562, -0.22866058349609375, -0.21665573120117188, -0.20465087890625, -0.19264602661132812, -0.18064117431640625, -0.16863632202148438, -0.1566314697265625, -0.14462661743164062, -0.13262176513671875, -0.12061691284179688, -0.108612060546875, -0.09660720825195312, -0.08460235595703125, -0.07259750366210938, -0.0605926513671875, -0.048587799072265625, -0.03658294677734375, -0.024578094482421875, -0.0125732421875, -0.000568389892578125, 0.01143646240234375, 0.023441314697265625, 0.0354461669921875, 0.047451019287109375, 0.05945587158203125, 0.07146072387695312, 0.083465576171875, 0.09547042846679688, 0.10747528076171875, 0.11948013305664062, 0.1314849853515625, 0.14348983764648438, 0.15549468994140625, 0.16749954223632812, 0.17950439453125, 0.19150924682617188, 0.20351409912109375, 0.21551895141601562, 0.2275238037109375, 0.23952865600585938, 0.25153350830078125, 0.2635383605957031, 0.275543212890625, 0.2875480651855469, 0.29955291748046875, 0.3115577697753906, 0.3235626220703125, 0.3355674743652344, 0.34757232666015625, 0.3595771789550781, 0.37158203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 11.0, 9.0, 16.0, 25.0, 30.0, 50.0, 55.0, 76.0, 132.0, 204.0, 331.0, 672.0, 1892.0, 8303.0, 325949.0, 3835483.0, 16371.0, 2611.0, 849.0, 406.0, 239.0, 142.0, 132.0, 84.0, 50.0, 55.0, 29.0, 20.0, 10.0, 16.0, 13.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.21875, -10.899658203125, -10.58056640625, -10.261474609375, -9.9423828125, -9.623291015625, -9.30419921875, -8.985107421875, -8.666015625, -8.346923828125, -8.02783203125, -7.708740234375, -7.3896484375, -7.070556640625, -6.75146484375, -6.432373046875, -6.11328125, -5.794189453125, -5.47509765625, -5.156005859375, -4.8369140625, -4.517822265625, -4.19873046875, -3.879638671875, -3.560546875, -3.241455078125, -2.92236328125, -2.603271484375, -2.2841796875, -1.965087890625, -1.64599609375, -1.326904296875, -1.0078125, -0.688720703125, -0.36962890625, -0.050537109375, 0.2685546875, 0.587646484375, 0.90673828125, 1.225830078125, 1.544921875, 1.864013671875, 2.18310546875, 2.502197265625, 2.8212890625, 3.140380859375, 3.45947265625, 3.778564453125, 4.09765625, 4.416748046875, 4.73583984375, 5.054931640625, 5.3740234375, 5.693115234375, 6.01220703125, 6.331298828125, 6.650390625, 6.969482421875, 7.28857421875, 7.607666015625, 7.9267578125, 8.245849609375, 8.56494140625, 8.884033203125, 9.203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 11.0, 24.0, 32.0, 108.0, 486.0, 2227.0, 881.0, 194.0, 49.0, 20.0, 13.0, 12.0, 7.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6005859375, -1.5149383544921875, -1.429290771484375, -1.3436431884765625, -1.25799560546875, -1.1723480224609375, -1.086700439453125, -1.0010528564453125, -0.9154052734375, -0.8297576904296875, -0.744110107421875, -0.6584625244140625, -0.57281494140625, -0.4871673583984375, -0.401519775390625, -0.3158721923828125, -0.230224609375, -0.1445770263671875, -0.058929443359375, 0.0267181396484375, 0.11236572265625, 0.1980133056640625, 0.283660888671875, 0.3693084716796875, 0.4549560546875, 0.5406036376953125, 0.626251220703125, 0.7118988037109375, 0.79754638671875, 0.8831939697265625, 0.968841552734375, 1.0544891357421875, 1.14013671875, 1.2257843017578125, 1.311431884765625, 1.3970794677734375, 1.48272705078125, 1.5683746337890625, 1.654022216796875, 1.7396697998046875, 1.8253173828125, 1.9109649658203125, 1.996612548828125, 2.0822601318359375, 2.16790771484375, 2.2535552978515625, 2.339202880859375, 2.4248504638671875, 2.510498046875, 2.5961456298828125, 2.681793212890625, 2.7674407958984375, 2.85308837890625, 2.9387359619140625, 3.024383544921875, 3.1100311279296875, 3.1956787109375, 3.2813262939453125, 3.366973876953125, 3.4526214599609375, 3.53826904296875, 3.6239166259765625, 3.709564208984375, 3.7952117919921875, 3.880859375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 11.0, 32.0, 101.0, 272.0, 309.0, 171.0, 62.0, 21.0, 9.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.170495986938477, -28.445274353027344, -27.72005271911621, -26.994831085205078, -26.269609451293945, -25.544387817382812, -24.81916618347168, -24.093944549560547, -23.368722915649414, -22.64350128173828, -21.91827964782715, -21.193058013916016, -20.467836380004883, -19.74261474609375, -19.017393112182617, -18.292171478271484, -17.56694984436035, -16.84172821044922, -16.116506576538086, -15.391284942626953, -14.66606330871582, -13.940841674804688, -13.215620040893555, -12.490398406982422, -11.765176773071289, -11.039955139160156, -10.314733505249023, -9.58951187133789, -8.864290237426758, -8.139068603515625, -7.413846969604492, -6.688625335693359, -5.963405609130859, -5.238183975219727, -4.512962341308594, -3.787740707397461, -3.062519073486328, -2.3372974395751953, -1.6120758056640625, -0.8868541717529297, -0.16163253784179688, 0.5635890960693359, 1.2888107299804688, 2.0140323638916016, 2.7392539978027344, 3.464475631713867, 4.189697265625, 4.914918899536133, 5.640140533447266, 6.365362167358398, 7.090583801269531, 7.815805435180664, 8.541027069091797, 9.26624870300293, 9.991470336914062, 10.716691970825195, 11.441913604736328, 12.167135238647461, 12.892356872558594, 13.617578506469727, 14.34280014038086, 15.068021774291992, 15.793243408203125, 16.518465042114258, 17.24368667602539]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 4.0, 11.0, 14.0, 10.0, 18.0, 38.0, 31.0, 26.0, 38.0, 70.0, 58.0, 67.0, 77.0, 65.0, 61.0, 60.0, 49.0, 44.0, 49.0, 34.0, 37.0, 19.0, 29.0, 20.0, 11.0, 19.0, 5.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.304987907409668, -6.130555152893066, -5.956122398376465, -5.781689643859863, -5.607256889343262, -5.43282413482666, -5.258391380310059, -5.083958625793457, -4.9095258712768555, -4.735093116760254, -4.560660362243652, -4.386227607727051, -4.211794853210449, -4.037362098693848, -3.862929105758667, -3.6884963512420654, -3.5140633583068848, -3.339630603790283, -3.1651978492736816, -2.99076509475708, -2.8163323402404785, -2.641899585723877, -2.4674665927886963, -2.2930338382720947, -2.118601083755493, -1.9441683292388916, -1.76973557472229, -1.595302700996399, -1.4208699464797974, -1.2464371919631958, -1.0720043182373047, -0.8975715637207031, -0.7231383323669434, -0.5487055778503418, -0.37427276372909546, -0.19983994960784912, -0.02540719509124756, 0.149025559425354, 0.3234584331512451, 0.4978911876678467, 0.6723239421844482, 0.8467566967010498, 1.0211894512176514, 1.1956223249435425, 1.370055079460144, 1.5444878339767456, 1.7189207077026367, 1.8933534622192383, 2.06778621673584, 2.2422189712524414, 2.416651725769043, 2.5910844802856445, 2.765517234802246, 2.9399499893188477, 3.1143829822540283, 3.28881573677063, 3.4632484912872314, 3.637681245803833, 3.8121140003204346, 3.9865469932556152, 4.160979747772217, 4.335412502288818, 4.50984525680542, 4.6842780113220215, 4.858710765838623]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 10.0, 4.0, 17.0, 19.0, 27.0, 34.0, 60.0, 67.0, 89.0, 170.0, 306.0, 488.0, 885.0, 1800.0, 4098.0, 11437.0, 41076.0, 169566.0, 478468.0, 252309.0, 61066.0, 16148.0, 5419.0, 2297.0, 1100.0, 582.0, 341.0, 219.0, 143.0, 84.0, 72.0, 40.0, 33.0, 16.0, 19.0, 11.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.642578125, -2.553436279296875, -2.46429443359375, -2.375152587890625, -2.2860107421875, -2.196868896484375, -2.10772705078125, -2.018585205078125, -1.929443359375, -1.840301513671875, -1.75115966796875, -1.662017822265625, -1.5728759765625, -1.483734130859375, -1.39459228515625, -1.305450439453125, -1.21630859375, -1.127166748046875, -1.03802490234375, -0.948883056640625, -0.8597412109375, -0.770599365234375, -0.68145751953125, -0.592315673828125, -0.503173828125, -0.414031982421875, -0.32489013671875, -0.235748291015625, -0.1466064453125, -0.057464599609375, 0.03167724609375, 0.120819091796875, 0.2099609375, 0.299102783203125, 0.38824462890625, 0.477386474609375, 0.5665283203125, 0.655670166015625, 0.74481201171875, 0.833953857421875, 0.923095703125, 1.012237548828125, 1.10137939453125, 1.190521240234375, 1.2796630859375, 1.368804931640625, 1.45794677734375, 1.547088623046875, 1.63623046875, 1.725372314453125, 1.81451416015625, 1.903656005859375, 1.9927978515625, 2.081939697265625, 2.17108154296875, 2.260223388671875, 2.349365234375, 2.438507080078125, 2.52764892578125, 2.616790771484375, 2.7059326171875, 2.795074462890625, 2.88421630859375, 2.973358154296875, 3.0625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 3.0, 6.0, 9.0, 15.0, 24.0, 24.0, 40.0, 39.0, 54.0, 56.0, 62.0, 70.0, 75.0, 70.0, 67.0, 68.0, 60.0, 58.0, 50.0, 42.0, 32.0, 16.0, 19.0, 9.0, 9.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49755859375, -0.4821281433105469, -0.46669769287109375, -0.4512672424316406, -0.4358367919921875, -0.4204063415527344, -0.40497589111328125, -0.3895454406738281, -0.374114990234375, -0.3586845397949219, -0.34325408935546875, -0.3278236389160156, -0.3123931884765625, -0.2969627380371094, -0.28153228759765625, -0.2661018371582031, -0.25067138671875, -0.23524093627929688, -0.21981048583984375, -0.20438003540039062, -0.1889495849609375, -0.17351913452148438, -0.15808868408203125, -0.14265823364257812, -0.127227783203125, -0.11179733276367188, -0.09636688232421875, -0.08093643188476562, -0.0655059814453125, -0.050075531005859375, -0.03464508056640625, -0.019214630126953125, -0.0037841796875, 0.011646270751953125, 0.02707672119140625, 0.042507171630859375, 0.0579376220703125, 0.07336807250976562, 0.08879852294921875, 0.10422897338867188, 0.119659423828125, 0.13508987426757812, 0.15052032470703125, 0.16595077514648438, 0.1813812255859375, 0.19681167602539062, 0.21224212646484375, 0.22767257690429688, 0.24310302734375, 0.2585334777832031, 0.27396392822265625, 0.2893943786621094, 0.3048248291015625, 0.3202552795410156, 0.33568572998046875, 0.3511161804199219, 0.366546630859375, 0.3819770812988281, 0.39740753173828125, 0.4128379821777344, 0.4282684326171875, 0.4436988830566406, 0.45912933349609375, 0.4745597839355469, 0.489990234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 22.0, 14.0, 32.0, 45.0, 55.0, 95.0, 127.0, 210.0, 345.0, 481.0, 922.0, 1856.0, 4280.0, 11506.0, 38635.0, 135895.0, 369441.0, 326233.0, 109876.0, 31288.0, 9632.0, 3754.0, 1607.0, 871.0, 419.0, 289.0, 201.0, 134.0, 89.0, 49.0, 52.0, 19.0, 23.0, 16.0, 13.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.607421875, -1.549835205078125, -1.49224853515625, -1.434661865234375, -1.3770751953125, -1.319488525390625, -1.26190185546875, -1.204315185546875, -1.146728515625, -1.089141845703125, -1.03155517578125, -0.973968505859375, -0.9163818359375, -0.858795166015625, -0.80120849609375, -0.743621826171875, -0.68603515625, -0.628448486328125, -0.57086181640625, -0.513275146484375, -0.4556884765625, -0.398101806640625, -0.34051513671875, -0.282928466796875, -0.225341796875, -0.167755126953125, -0.11016845703125, -0.052581787109375, 0.0050048828125, 0.062591552734375, 0.12017822265625, 0.177764892578125, 0.2353515625, 0.292938232421875, 0.35052490234375, 0.408111572265625, 0.4656982421875, 0.523284912109375, 0.58087158203125, 0.638458251953125, 0.696044921875, 0.753631591796875, 0.81121826171875, 0.868804931640625, 0.9263916015625, 0.983978271484375, 1.04156494140625, 1.099151611328125, 1.15673828125, 1.214324951171875, 1.27191162109375, 1.329498291015625, 1.3870849609375, 1.444671630859375, 1.50225830078125, 1.559844970703125, 1.617431640625, 1.675018310546875, 1.73260498046875, 1.790191650390625, 1.8477783203125, 1.905364990234375, 1.96295166015625, 2.020538330078125, 2.078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 2.0, 6.0, 11.0, 14.0, 9.0, 17.0, 28.0, 23.0, 24.0, 36.0, 38.0, 40.0, 32.0, 41.0, 42.0, 56.0, 48.0, 42.0, 61.0, 52.0, 42.0, 42.0, 41.0, 36.0, 29.0, 37.0, 30.0, 19.0, 20.0, 16.0, 17.0, 14.0, 10.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.88671875, -1.8379058837890625, -1.789093017578125, -1.7402801513671875, -1.69146728515625, -1.6426544189453125, -1.593841552734375, -1.5450286865234375, -1.4962158203125, -1.4474029541015625, -1.398590087890625, -1.3497772216796875, -1.30096435546875, -1.2521514892578125, -1.203338623046875, -1.1545257568359375, -1.105712890625, -1.0569000244140625, -1.008087158203125, -0.9592742919921875, -0.91046142578125, -0.8616485595703125, -0.812835693359375, -0.7640228271484375, -0.7152099609375, -0.6663970947265625, -0.617584228515625, -0.5687713623046875, -0.51995849609375, -0.4711456298828125, -0.422332763671875, -0.3735198974609375, -0.32470703125, -0.2758941650390625, -0.227081298828125, -0.1782684326171875, -0.12945556640625, -0.0806427001953125, -0.031829833984375, 0.0169830322265625, 0.0657958984375, 0.1146087646484375, 0.163421630859375, 0.2122344970703125, 0.26104736328125, 0.3098602294921875, 0.358673095703125, 0.4074859619140625, 0.456298828125, 0.5051116943359375, 0.553924560546875, 0.6027374267578125, 0.65155029296875, 0.7003631591796875, 0.749176025390625, 0.7979888916015625, 0.8468017578125, 0.8956146240234375, 0.944427490234375, 0.9932403564453125, 1.04205322265625, 1.0908660888671875, 1.139678955078125, 1.1884918212890625, 1.2373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 2.0, 8.0, 10.0, 11.0, 15.0, 32.0, 49.0, 73.0, 135.0, 201.0, 449.0, 920.0, 2404.0, 7916.0, 45350.0, 729111.0, 236670.0, 17795.0, 4504.0, 1520.0, 643.0, 312.0, 149.0, 89.0, 56.0, 29.0, 18.0, 20.0, 15.0, 5.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.857421875, -2.761444091796875, -2.66546630859375, -2.569488525390625, -2.4735107421875, -2.377532958984375, -2.28155517578125, -2.185577392578125, -2.089599609375, -1.993621826171875, -1.89764404296875, -1.801666259765625, -1.7056884765625, -1.609710693359375, -1.51373291015625, -1.417755126953125, -1.32177734375, -1.225799560546875, -1.12982177734375, -1.033843994140625, -0.9378662109375, -0.841888427734375, -0.74591064453125, -0.649932861328125, -0.553955078125, -0.457977294921875, -0.36199951171875, -0.266021728515625, -0.1700439453125, -0.074066162109375, 0.02191162109375, 0.117889404296875, 0.2138671875, 0.309844970703125, 0.40582275390625, 0.501800537109375, 0.5977783203125, 0.693756103515625, 0.78973388671875, 0.885711669921875, 0.981689453125, 1.077667236328125, 1.17364501953125, 1.269622802734375, 1.3656005859375, 1.461578369140625, 1.55755615234375, 1.653533935546875, 1.74951171875, 1.845489501953125, 1.94146728515625, 2.037445068359375, 2.1334228515625, 2.229400634765625, 2.32537841796875, 2.421356201171875, 2.517333984375, 2.613311767578125, 2.70928955078125, 2.805267333984375, 2.9012451171875, 2.997222900390625, 3.09320068359375, 3.189178466796875, 3.28515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 9.0, 18.0, 20.0, 26.0, 34.0, 41.0, 56.0, 62.0, 80.0, 83.0, 106.0, 87.0, 61.0, 63.0, 34.0, 29.0, 29.0, 34.0, 20.0, 15.0, 15.0, 8.0, 10.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001633167266845703, -0.00015825405716896057, -0.00015319138765335083, -0.0001481287181377411, -0.00014306604862213135, -0.0001380033791065216, -0.00013294070959091187, -0.00012787804007530212, -0.00012281537055969238, -0.00011775270104408264, -0.0001126900315284729, -0.00010762736201286316, -0.00010256469249725342, -9.750202298164368e-05, -9.243935346603394e-05, -8.73766839504242e-05, -8.231401443481445e-05, -7.725134491920471e-05, -7.218867540359497e-05, -6.712600588798523e-05, -6.206333637237549e-05, -5.700066685676575e-05, -5.1937997341156006e-05, -4.6875327825546265e-05, -4.1812658309936523e-05, -3.674998879432678e-05, -3.168731927871704e-05, -2.66246497631073e-05, -2.156198024749756e-05, -1.6499310731887817e-05, -1.1436641216278076e-05, -6.373971700668335e-06, -1.3113021850585938e-06, 3.7513673305511475e-06, 8.814036846160889e-06, 1.387670636177063e-05, 1.893937587738037e-05, 2.4002045392990112e-05, 2.9064714908599854e-05, 3.4127384424209595e-05, 3.9190053939819336e-05, 4.425272345542908e-05, 4.931539297103882e-05, 5.437806248664856e-05, 5.94407320022583e-05, 6.450340151786804e-05, 6.956607103347778e-05, 7.462874054908752e-05, 7.969141006469727e-05, 8.475407958030701e-05, 8.981674909591675e-05, 9.487941861152649e-05, 9.994208812713623e-05, 0.00010500475764274597, 0.00011006742715835571, 0.00011513009667396545, 0.0001201927661895752, 0.00012525543570518494, 0.00013031810522079468, 0.00013538077473640442, 0.00014044344425201416, 0.0001455061137676239, 0.00015056878328323364, 0.00015563145279884338, 0.00016069412231445312]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 9.0, 8.0, 8.0, 10.0, 20.0, 21.0, 37.0, 58.0, 89.0, 131.0, 226.0, 350.0, 670.0, 1182.0, 2261.0, 4989.0, 16840.0, 255302.0, 713861.0, 38289.0, 7497.0, 3127.0, 1513.0, 760.0, 494.0, 280.0, 186.0, 101.0, 64.0, 54.0, 34.0, 22.0, 12.0, 9.0, 8.0, 5.0, 1.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.595703125, -2.500274658203125, -2.40484619140625, -2.309417724609375, -2.2139892578125, -2.118560791015625, -2.02313232421875, -1.927703857421875, -1.832275390625, -1.736846923828125, -1.64141845703125, -1.545989990234375, -1.4505615234375, -1.355133056640625, -1.25970458984375, -1.164276123046875, -1.06884765625, -0.973419189453125, -0.87799072265625, -0.782562255859375, -0.6871337890625, -0.591705322265625, -0.49627685546875, -0.400848388671875, -0.305419921875, -0.209991455078125, -0.11456298828125, -0.019134521484375, 0.0762939453125, 0.171722412109375, 0.26715087890625, 0.362579345703125, 0.4580078125, 0.553436279296875, 0.64886474609375, 0.744293212890625, 0.8397216796875, 0.935150146484375, 1.03057861328125, 1.126007080078125, 1.221435546875, 1.316864013671875, 1.41229248046875, 1.507720947265625, 1.6031494140625, 1.698577880859375, 1.79400634765625, 1.889434814453125, 1.98486328125, 2.080291748046875, 2.17572021484375, 2.271148681640625, 2.3665771484375, 2.462005615234375, 2.55743408203125, 2.652862548828125, 2.748291015625, 2.843719482421875, 2.93914794921875, 3.034576416015625, 3.1300048828125, 3.225433349609375, 3.32086181640625, 3.416290283203125, 3.51171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 9.0, 15.0, 51.0, 137.0, 267.0, 247.0, 134.0, 61.0, 24.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.341094970703125, -3.24273681640625, -3.144378662109375, -3.0460205078125, -2.947662353515625, -2.84930419921875, -2.750946044921875, -2.652587890625, -2.554229736328125, -2.45587158203125, -2.357513427734375, -2.2591552734375, -2.160797119140625, -2.06243896484375, -1.964080810546875, -1.86572265625, -1.767364501953125, -1.66900634765625, -1.570648193359375, -1.4722900390625, -1.373931884765625, -1.27557373046875, -1.177215576171875, -1.078857421875, -0.980499267578125, -0.88214111328125, -0.783782958984375, -0.6854248046875, -0.587066650390625, -0.48870849609375, -0.390350341796875, -0.2919921875, -0.193634033203125, -0.09527587890625, 0.003082275390625, 0.1014404296875, 0.199798583984375, 0.29815673828125, 0.396514892578125, 0.494873046875, 0.593231201171875, 0.69158935546875, 0.789947509765625, 0.8883056640625, 0.986663818359375, 1.08502197265625, 1.183380126953125, 1.28173828125, 1.380096435546875, 1.47845458984375, 1.576812744140625, 1.6751708984375, 1.773529052734375, 1.87188720703125, 1.970245361328125, 2.068603515625, 2.166961669921875, 2.26531982421875, 2.363677978515625, 2.4620361328125, 2.560394287109375, 2.65875244140625, 2.757110595703125, 2.85546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 12.0, 15.0, 17.0, 23.0, 49.0, 78.0, 127.0, 157.0, 167.0, 135.0, 93.0, 57.0, 28.0, 15.0, 9.0, 8.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.375171661376953, -18.81422233581543, -18.253273010253906, -17.692323684692383, -17.13137435913086, -16.570425033569336, -16.009475708007812, -15.448526382446289, -14.887577056884766, -14.326627731323242, -13.765678405761719, -13.204729080200195, -12.643779754638672, -12.082830429077148, -11.521881103515625, -10.960931777954102, -10.399982452392578, -9.839033126831055, -9.278083801269531, -8.717134475708008, -8.156185150146484, -7.595235824584961, -7.0342864990234375, -6.473337173461914, -5.912387847900391, -5.351438522338867, -4.790489196777344, -4.22953987121582, -3.668590545654297, -3.1076412200927734, -2.54669189453125, -1.9857425689697266, -1.4247913360595703, -0.8638420104980469, -0.30289268493652344, 0.258056640625, 0.8190059661865234, 1.3799552917480469, 1.9409046173095703, 2.5018539428710938, 3.062803268432617, 3.6237525939941406, 4.184701919555664, 4.7456512451171875, 5.306600570678711, 5.867549896240234, 6.428499221801758, 6.989448547363281, 7.550397872924805, 8.111347198486328, 8.672296524047852, 9.233245849609375, 9.794195175170898, 10.355144500732422, 10.916093826293945, 11.477043151855469, 12.037992477416992, 12.598941802978516, 13.159891128540039, 13.720840454101562, 14.281789779663086, 14.84273910522461, 15.403688430786133, 15.964637756347656, 16.52558708190918]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 10.0, 9.0, 17.0, 30.0, 21.0, 27.0, 26.0, 42.0, 47.0, 68.0, 45.0, 52.0, 54.0, 59.0, 56.0, 53.0, 57.0, 39.0, 55.0, 34.0, 43.0, 32.0, 19.0, 19.0, 14.0, 12.0, 10.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.465709686279297, -9.090006828308105, -8.714303970336914, -8.338601112365723, -7.962898254394531, -7.58719539642334, -7.211493015289307, -6.835790157318115, -6.460087299346924, -6.084384441375732, -5.708681583404541, -5.332979202270508, -4.957276344299316, -4.581573486328125, -4.205870628356934, -3.830167770385742, -3.454464912414551, -3.0787620544433594, -2.703059196472168, -2.3273565769195557, -1.9516537189483643, -1.5759508609771729, -1.2002482414245605, -0.8245453834533691, -0.44884252548217773, -0.0731397271156311, 0.3025630712509155, 0.6782658100128174, 1.0539686679840088, 1.4296715259552002, 1.8053741455078125, 2.181077003479004, 2.556778907775879, 2.9324817657470703, 3.3081846237182617, 3.683887243270874, 4.0595903396606445, 4.435293197631836, 4.810995578765869, 5.1866984367370605, 5.562401294708252, 5.938104152679443, 6.313807010650635, 6.689509391784668, 7.065212249755859, 7.440915107727051, 7.816617965698242, 8.192320823669434, 8.568023681640625, 8.943726539611816, 9.319429397583008, 9.6951322555542, 10.07083511352539, 10.446537971496582, 10.822240829467773, 11.197942733764648, 11.573646545410156, 11.949349403381348, 12.325052261352539, 12.70075511932373, 13.076457977294922, 13.452160835266113, 13.827863693237305, 14.20356559753418, 14.579268455505371]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 16.0, 35.0, 65.0, 88.0, 183.0, 338.0, 772.0, 2481.0, 14309.0, 988862.0, 3164369.0, 17926.0, 3165.0, 911.0, 356.0, 179.0, 85.0, 41.0, 32.0, 12.0, 15.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6796875, -7.46051025390625, -7.2413330078125, -7.02215576171875, -6.802978515625, -6.58380126953125, -6.3646240234375, -6.14544677734375, -5.92626953125, -5.70709228515625, -5.4879150390625, -5.26873779296875, -5.049560546875, -4.83038330078125, -4.6112060546875, -4.39202880859375, -4.1728515625, -3.95367431640625, -3.7344970703125, -3.51531982421875, -3.296142578125, -3.07696533203125, -2.8577880859375, -2.63861083984375, -2.41943359375, -2.20025634765625, -1.9810791015625, -1.76190185546875, -1.542724609375, -1.32354736328125, -1.1043701171875, -0.88519287109375, -0.666015625, -0.44683837890625, -0.2276611328125, -0.00848388671875, 0.210693359375, 0.42987060546875, 0.6490478515625, 0.86822509765625, 1.08740234375, 1.30657958984375, 1.5257568359375, 1.74493408203125, 1.964111328125, 2.18328857421875, 2.4024658203125, 2.62164306640625, 2.8408203125, 3.05999755859375, 3.2791748046875, 3.49835205078125, 3.717529296875, 3.93670654296875, 4.1558837890625, 4.37506103515625, 4.59423828125, 4.81341552734375, 5.0325927734375, 5.25177001953125, 5.470947265625, 5.69012451171875, 5.9093017578125, 6.12847900390625, 6.34765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 4.0, 8.0, 8.0, 13.0, 15.0, 9.0, 26.0, 30.0, 30.0, 44.0, 63.0, 51.0, 53.0, 53.0, 61.0, 71.0, 73.0, 54.0, 60.0, 37.0, 41.0, 44.0, 41.0, 22.0, 27.0, 8.0, 12.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.484619140625, -0.47092437744140625, -0.4572296142578125, -0.44353485107421875, -0.429840087890625, -0.41614532470703125, -0.4024505615234375, -0.38875579833984375, -0.37506103515625, -0.36136627197265625, -0.3476715087890625, -0.33397674560546875, -0.320281982421875, -0.30658721923828125, -0.2928924560546875, -0.27919769287109375, -0.2655029296875, -0.25180816650390625, -0.2381134033203125, -0.22441864013671875, -0.210723876953125, -0.19702911376953125, -0.1833343505859375, -0.16963958740234375, -0.15594482421875, -0.14225006103515625, -0.1285552978515625, -0.11486053466796875, -0.101165771484375, -0.08747100830078125, -0.0737762451171875, -0.06008148193359375, -0.04638671875, -0.03269195556640625, -0.0189971923828125, -0.00530242919921875, 0.008392333984375, 0.02208709716796875, 0.0357818603515625, 0.04947662353515625, 0.06317138671875, 0.07686614990234375, 0.0905609130859375, 0.10425567626953125, 0.117950439453125, 0.13164520263671875, 0.1453399658203125, 0.15903472900390625, 0.1727294921875, 0.18642425537109375, 0.2001190185546875, 0.21381378173828125, 0.227508544921875, 0.24120330810546875, 0.2548980712890625, 0.26859283447265625, 0.28228759765625, 0.29598236083984375, 0.3096771240234375, 0.32337188720703125, 0.337066650390625, 0.35076141357421875, 0.3644561767578125, 0.37815093994140625, 0.391845703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 9.0, 5.0, 7.0, 5.0, 6.0, 14.0, 20.0, 8.0, 36.0, 29.0, 31.0, 57.0, 87.0, 143.0, 261.0, 560.0, 1596.0, 6263.0, 44340.0, 3544291.0, 568293.0, 22310.0, 3836.0, 1019.0, 427.0, 216.0, 118.0, 49.0, 61.0, 43.0, 36.0, 25.0, 23.0, 8.0, 18.0, 4.0, 7.0, 12.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.2685546875, -4.115234375, -3.9619140625, -3.80859375, -3.6552734375, -3.501953125, -3.3486328125, -3.1953125, -3.0419921875, -2.888671875, -2.7353515625, -2.58203125, -2.4287109375, -2.275390625, -2.1220703125, -1.96875, -1.8154296875, -1.662109375, -1.5087890625, -1.35546875, -1.2021484375, -1.048828125, -0.8955078125, -0.7421875, -0.5888671875, -0.435546875, -0.2822265625, -0.12890625, 0.0244140625, 0.177734375, 0.3310546875, 0.484375, 0.6376953125, 0.791015625, 0.9443359375, 1.09765625, 1.2509765625, 1.404296875, 1.5576171875, 1.7109375, 1.8642578125, 2.017578125, 2.1708984375, 2.32421875, 2.4775390625, 2.630859375, 2.7841796875, 2.9375, 3.0908203125, 3.244140625, 3.3974609375, 3.55078125, 3.7041015625, 3.857421875, 4.0107421875, 4.1640625, 4.3173828125, 4.470703125, 4.6240234375, 4.77734375, 4.9306640625, 5.083984375, 5.2373046875, 5.390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 10.0, 14.0, 8.0, 37.0, 42.0, 106.0, 241.0, 668.0, 1865.0, 611.0, 201.0, 98.0, 52.0, 37.0, 26.0, 18.0, 8.0, 14.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1163482666015625, -1.078399658203125, -1.0404510498046875, -1.00250244140625, -0.9645538330078125, -0.926605224609375, -0.8886566162109375, -0.8507080078125, -0.8127593994140625, -0.774810791015625, -0.7368621826171875, -0.69891357421875, -0.6609649658203125, -0.623016357421875, -0.5850677490234375, -0.547119140625, -0.5091705322265625, -0.471221923828125, -0.4332733154296875, -0.39532470703125, -0.3573760986328125, -0.319427490234375, -0.2814788818359375, -0.2435302734375, -0.2055816650390625, -0.167633056640625, -0.1296844482421875, -0.09173583984375, -0.0537872314453125, -0.015838623046875, 0.0221099853515625, 0.06005859375, 0.0980072021484375, 0.135955810546875, 0.1739044189453125, 0.21185302734375, 0.2498016357421875, 0.287750244140625, 0.3256988525390625, 0.3636474609375, 0.4015960693359375, 0.439544677734375, 0.4774932861328125, 0.51544189453125, 0.5533905029296875, 0.591339111328125, 0.6292877197265625, 0.667236328125, 0.7051849365234375, 0.743133544921875, 0.7810821533203125, 0.81903076171875, 0.8569793701171875, 0.894927978515625, 0.9328765869140625, 0.9708251953125, 1.0087738037109375, 1.046722412109375, 1.0846710205078125, 1.12261962890625, 1.1605682373046875, 1.198516845703125, 1.2364654541015625, 1.2744140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 19.0, 57.0, 167.0, 270.0, 258.0, 135.0, 59.0, 13.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.97625160217285, -17.565088272094727, -17.1539249420166, -16.742759704589844, -16.33159637451172, -15.920433044433594, -15.509268760681152, -15.098105430603027, -14.686941146850586, -14.275777816772461, -13.86461353302002, -13.453450202941895, -13.042285919189453, -12.631122589111328, -12.219958305358887, -11.808794975280762, -11.39763069152832, -10.986467361450195, -10.575303077697754, -10.164139747619629, -9.752975463867188, -9.341812133789062, -8.930647850036621, -8.519484519958496, -8.108321189880371, -7.697157382965088, -7.285993576049805, -6.8748297691345215, -6.463665962219238, -6.052502632141113, -5.641338348388672, -5.230175018310547, -4.8190107345581055, -4.407846927642822, -3.996683120727539, -3.585519313812256, -3.1743555068969727, -2.7631919384002686, -2.3520281314849854, -1.9408643245697021, -1.529700517654419, -1.1185367107391357, -0.7073729634284973, -0.2962092161178589, 0.11495459079742432, 0.526118278503418, 0.9372820854187012, 1.3484458923339844, 1.7596096992492676, 2.170773506164551, 2.581937313079834, 2.993101119995117, 3.4042649269104004, 3.8154284954071045, 4.226592063903809, 4.63775634765625, 5.048919677734375, 5.460083484649658, 5.871247291564941, 6.282411098480225, 6.693574905395508, 7.104738235473633, 7.515902519226074, 7.927065849304199, 8.33823013305664]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 6.0, 10.0, 22.0, 18.0, 23.0, 31.0, 41.0, 52.0, 41.0, 65.0, 63.0, 56.0, 72.0, 73.0, 57.0, 51.0, 58.0, 48.0, 44.0, 47.0, 33.0, 28.0, 13.0, 19.0, 8.0, 8.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.697535037994385, -4.567294597625732, -4.43705415725708, -4.306813716888428, -4.176573753356934, -4.046333312988281, -3.916092872619629, -3.7858524322509766, -3.655611991882324, -3.525371551513672, -3.3951311111450195, -3.2648909091949463, -3.134650468826294, -3.0044100284576416, -2.8741698265075684, -2.743929386138916, -2.6136889457702637, -2.4834485054016113, -2.353208065032959, -2.2229678630828857, -2.0927274227142334, -1.962486982345581, -1.8322466611862183, -1.7020063400268555, -1.5717658996582031, -1.4415254592895508, -1.311285138130188, -1.1810448169708252, -1.0508043766021729, -0.9205639958381653, -0.7903236150741577, -0.6600832343101501, -0.5298428535461426, -0.399602472782135, -0.26936209201812744, -0.13912171125411987, -0.008881330490112305, 0.12135905027389526, 0.25159943103790283, 0.3818398118019104, 0.512080192565918, 0.6423205733299255, 0.7725609540939331, 0.9028013348579407, 1.0330417156219482, 1.1632821559906006, 1.2935224771499634, 1.4237627983093262, 1.5540032386779785, 1.6842436790466309, 1.8144840002059937, 1.9447243213653564, 2.074964761734009, 2.205205202102661, 2.3354454040527344, 2.4656858444213867, 2.595926284790039, 2.7261667251586914, 2.8564071655273438, 2.986647367477417, 3.1168878078460693, 3.2471282482147217, 3.377368450164795, 3.5076088905334473, 3.6378493309020996]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 4.0, 10.0, 11.0, 7.0, 26.0, 18.0, 32.0, 29.0, 42.0, 59.0, 89.0, 128.0, 184.0, 281.0, 525.0, 817.0, 1504.0, 2934.0, 6530.0, 16793.0, 52565.0, 188764.0, 438792.0, 237120.0, 65571.0, 20448.0, 7675.0, 3486.0, 1691.0, 920.0, 490.0, 305.0, 232.0, 153.0, 95.0, 67.0, 41.0, 31.0, 22.0, 16.0, 4.0, 11.0, 11.0, 8.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.44921875, -2.363555908203125, -2.27789306640625, -2.192230224609375, -2.1065673828125, -2.020904541015625, -1.93524169921875, -1.849578857421875, -1.763916015625, -1.678253173828125, -1.59259033203125, -1.506927490234375, -1.4212646484375, -1.335601806640625, -1.24993896484375, -1.164276123046875, -1.07861328125, -0.992950439453125, -0.90728759765625, -0.821624755859375, -0.7359619140625, -0.650299072265625, -0.56463623046875, -0.478973388671875, -0.393310546875, -0.307647705078125, -0.22198486328125, -0.136322021484375, -0.0506591796875, 0.035003662109375, 0.12066650390625, 0.206329345703125, 0.2919921875, 0.377655029296875, 0.46331787109375, 0.548980712890625, 0.6346435546875, 0.720306396484375, 0.80596923828125, 0.891632080078125, 0.977294921875, 1.062957763671875, 1.14862060546875, 1.234283447265625, 1.3199462890625, 1.405609130859375, 1.49127197265625, 1.576934814453125, 1.66259765625, 1.748260498046875, 1.83392333984375, 1.919586181640625, 2.0052490234375, 2.090911865234375, 2.17657470703125, 2.262237548828125, 2.347900390625, 2.433563232421875, 2.51922607421875, 2.604888916015625, 2.6905517578125, 2.776214599609375, 2.86187744140625, 2.947540283203125, 3.033203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 10.0, 11.0, 17.0, 19.0, 21.0, 25.0, 32.0, 51.0, 37.0, 46.0, 44.0, 73.0, 62.0, 70.0, 64.0, 53.0, 57.0, 48.0, 39.0, 42.0, 39.0, 19.0, 24.0, 22.0, 18.0, 13.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.4853515625, -0.471771240234375, -0.45819091796875, -0.444610595703125, -0.4310302734375, -0.417449951171875, -0.40386962890625, -0.390289306640625, -0.376708984375, -0.363128662109375, -0.34954833984375, -0.335968017578125, -0.3223876953125, -0.308807373046875, -0.29522705078125, -0.281646728515625, -0.26806640625, -0.254486083984375, -0.24090576171875, -0.227325439453125, -0.2137451171875, -0.200164794921875, -0.18658447265625, -0.173004150390625, -0.159423828125, -0.145843505859375, -0.13226318359375, -0.118682861328125, -0.1051025390625, -0.091522216796875, -0.07794189453125, -0.064361572265625, -0.05078125, -0.037200927734375, -0.02362060546875, -0.010040283203125, 0.0035400390625, 0.017120361328125, 0.03070068359375, 0.044281005859375, 0.057861328125, 0.071441650390625, 0.08502197265625, 0.098602294921875, 0.1121826171875, 0.125762939453125, 0.13934326171875, 0.152923583984375, 0.16650390625, 0.180084228515625, 0.19366455078125, 0.207244873046875, 0.2208251953125, 0.234405517578125, 0.24798583984375, 0.261566162109375, 0.275146484375, 0.288726806640625, 0.30230712890625, 0.315887451171875, 0.3294677734375, 0.343048095703125, 0.35662841796875, 0.370208740234375, 0.3837890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 0.0, 10.0, 13.0, 13.0, 16.0, 18.0, 35.0, 41.0, 85.0, 108.0, 137.0, 208.0, 314.0, 478.0, 810.0, 1683.0, 4631.0, 17033.0, 76282.0, 304845.0, 444864.0, 149870.0, 33519.0, 8167.0, 2556.0, 1111.0, 624.0, 327.0, 241.0, 155.0, 88.0, 70.0, 51.0, 39.0, 44.0, 17.0, 13.0, 11.0, 9.0, 8.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.115234375, -2.045257568359375, -1.97528076171875, -1.905303955078125, -1.8353271484375, -1.765350341796875, -1.69537353515625, -1.625396728515625, -1.555419921875, -1.485443115234375, -1.41546630859375, -1.345489501953125, -1.2755126953125, -1.205535888671875, -1.13555908203125, -1.065582275390625, -0.99560546875, -0.925628662109375, -0.85565185546875, -0.785675048828125, -0.7156982421875, -0.645721435546875, -0.57574462890625, -0.505767822265625, -0.435791015625, -0.365814208984375, -0.29583740234375, -0.225860595703125, -0.1558837890625, -0.085906982421875, -0.01593017578125, 0.054046630859375, 0.1240234375, 0.194000244140625, 0.26397705078125, 0.333953857421875, 0.4039306640625, 0.473907470703125, 0.54388427734375, 0.613861083984375, 0.683837890625, 0.753814697265625, 0.82379150390625, 0.893768310546875, 0.9637451171875, 1.033721923828125, 1.10369873046875, 1.173675537109375, 1.24365234375, 1.313629150390625, 1.38360595703125, 1.453582763671875, 1.5235595703125, 1.593536376953125, 1.66351318359375, 1.733489990234375, 1.803466796875, 1.873443603515625, 1.94342041015625, 2.013397216796875, 2.0833740234375, 2.153350830078125, 2.22332763671875, 2.293304443359375, 2.36328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 9.0, 4.0, 18.0, 13.0, 17.0, 11.0, 21.0, 35.0, 19.0, 25.0, 31.0, 36.0, 31.0, 34.0, 45.0, 40.0, 37.0, 43.0, 41.0, 38.0, 37.0, 47.0, 42.0, 36.0, 35.0, 32.0, 25.0, 26.0, 23.0, 28.0, 25.0, 23.0, 18.0, 13.0, 10.0, 8.0, 6.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3828125, -1.3404998779296875, -1.298187255859375, -1.2558746337890625, -1.21356201171875, -1.1712493896484375, -1.128936767578125, -1.0866241455078125, -1.0443115234375, -1.0019989013671875, -0.959686279296875, -0.9173736572265625, -0.87506103515625, -0.8327484130859375, -0.790435791015625, -0.7481231689453125, -0.705810546875, -0.6634979248046875, -0.621185302734375, -0.5788726806640625, -0.53656005859375, -0.4942474365234375, -0.451934814453125, -0.4096221923828125, -0.3673095703125, -0.3249969482421875, -0.282684326171875, -0.2403717041015625, -0.19805908203125, -0.1557464599609375, -0.113433837890625, -0.0711212158203125, -0.02880859375, 0.0135040283203125, 0.055816650390625, 0.0981292724609375, 0.14044189453125, 0.1827545166015625, 0.225067138671875, 0.2673797607421875, 0.3096923828125, 0.3520050048828125, 0.394317626953125, 0.4366302490234375, 0.47894287109375, 0.5212554931640625, 0.563568115234375, 0.6058807373046875, 0.648193359375, 0.6905059814453125, 0.732818603515625, 0.7751312255859375, 0.81744384765625, 0.8597564697265625, 0.902069091796875, 0.9443817138671875, 0.9866943359375, 1.0290069580078125, 1.071319580078125, 1.1136322021484375, 1.15594482421875, 1.1982574462890625, 1.240570068359375, 1.2828826904296875, 1.3251953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 11.0, 14.0, 30.0, 46.0, 75.0, 131.0, 205.0, 379.0, 853.0, 1882.0, 5329.0, 20163.0, 145867.0, 720438.0, 126114.0, 18413.0, 5112.0, 1811.0, 811.0, 403.0, 181.0, 107.0, 63.0, 39.0, 25.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.37890625, -2.307830810546875, -2.23675537109375, -2.165679931640625, -2.0946044921875, -2.023529052734375, -1.95245361328125, -1.881378173828125, -1.810302734375, -1.739227294921875, -1.66815185546875, -1.597076416015625, -1.5260009765625, -1.454925537109375, -1.38385009765625, -1.312774658203125, -1.24169921875, -1.170623779296875, -1.09954833984375, -1.028472900390625, -0.9573974609375, -0.886322021484375, -0.81524658203125, -0.744171142578125, -0.673095703125, -0.602020263671875, -0.53094482421875, -0.459869384765625, -0.3887939453125, -0.317718505859375, -0.24664306640625, -0.175567626953125, -0.1044921875, -0.033416748046875, 0.03765869140625, 0.108734130859375, 0.1798095703125, 0.250885009765625, 0.32196044921875, 0.393035888671875, 0.464111328125, 0.535186767578125, 0.60626220703125, 0.677337646484375, 0.7484130859375, 0.819488525390625, 0.89056396484375, 0.961639404296875, 1.03271484375, 1.103790283203125, 1.17486572265625, 1.245941162109375, 1.3170166015625, 1.388092041015625, 1.45916748046875, 1.530242919921875, 1.601318359375, 1.672393798828125, 1.74346923828125, 1.814544677734375, 1.8856201171875, 1.956695556640625, 2.02777099609375, 2.098846435546875, 2.169921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 7.0, 11.0, 13.0, 14.0, 16.0, 18.0, 22.0, 37.0, 32.0, 55.0, 93.0, 115.0, 126.0, 97.0, 66.0, 61.0, 57.0, 41.0, 20.0, 22.0, 11.0, 8.0, 13.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002562999725341797, -0.00024925172328948975, -0.0002422034740447998, -0.00023515522480010986, -0.00022810697555541992, -0.00022105872631072998, -0.00021401047706604004, -0.0002069622278213501, -0.00019991397857666016, -0.00019286572933197021, -0.00018581748008728027, -0.00017876923084259033, -0.0001717209815979004, -0.00016467273235321045, -0.0001576244831085205, -0.00015057623386383057, -0.00014352798461914062, -0.00013647973537445068, -0.00012943148612976074, -0.0001223832368850708, -0.00011533498764038086, -0.00010828673839569092, -0.00010123848915100098, -9.419023990631104e-05, -8.71419906616211e-05, -8.009374141693115e-05, -7.304549217224121e-05, -6.599724292755127e-05, -5.894899368286133e-05, -5.190074443817139e-05, -4.4852495193481445e-05, -3.7804245948791504e-05, -3.075599670410156e-05, -2.370774745941162e-05, -1.665949821472168e-05, -9.611248970031738e-06, -2.562999725341797e-06, 4.4852495193481445e-06, 1.1533498764038086e-05, 1.8581748008728027e-05, 2.562999725341797e-05, 3.267824649810791e-05, 3.972649574279785e-05, 4.677474498748779e-05, 5.3822994232177734e-05, 6.0871243476867676e-05, 6.791949272155762e-05, 7.496774196624756e-05, 8.20159912109375e-05, 8.906424045562744e-05, 9.611248970031738e-05, 0.00010316073894500732, 0.00011020898818969727, 0.00011725723743438721, 0.00012430548667907715, 0.0001313537359237671, 0.00013840198516845703, 0.00014545023441314697, 0.00015249848365783691, 0.00015954673290252686, 0.0001665949821472168, 0.00017364323139190674, 0.00018069148063659668, 0.00018773972988128662, 0.00019478797912597656]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 10.0, 16.0, 29.0, 37.0, 53.0, 109.0, 212.0, 383.0, 890.0, 2919.0, 14384.0, 223354.0, 766518.0, 32189.0, 5015.0, 1365.0, 504.0, 235.0, 128.0, 73.0, 46.0, 29.0, 12.0, 14.0, 4.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.53515625, -3.418060302734375, -3.30096435546875, -3.183868408203125, -3.0667724609375, -2.949676513671875, -2.83258056640625, -2.715484619140625, -2.598388671875, -2.481292724609375, -2.36419677734375, -2.247100830078125, -2.1300048828125, -2.012908935546875, -1.89581298828125, -1.778717041015625, -1.66162109375, -1.544525146484375, -1.42742919921875, -1.310333251953125, -1.1932373046875, -1.076141357421875, -0.95904541015625, -0.841949462890625, -0.724853515625, -0.607757568359375, -0.49066162109375, -0.373565673828125, -0.2564697265625, -0.139373779296875, -0.02227783203125, 0.094818115234375, 0.2119140625, 0.329010009765625, 0.44610595703125, 0.563201904296875, 0.6802978515625, 0.797393798828125, 0.91448974609375, 1.031585693359375, 1.148681640625, 1.265777587890625, 1.38287353515625, 1.499969482421875, 1.6170654296875, 1.734161376953125, 1.85125732421875, 1.968353271484375, 2.08544921875, 2.202545166015625, 2.31964111328125, 2.436737060546875, 2.5538330078125, 2.670928955078125, 2.78802490234375, 2.905120849609375, 3.022216796875, 3.139312744140625, 3.25640869140625, 3.373504638671875, 3.4906005859375, 3.607696533203125, 3.72479248046875, 3.841888427734375, 3.958984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 10.0, 12.0, 14.0, 29.0, 48.0, 60.0, 108.0, 163.0, 186.0, 128.0, 80.0, 51.0, 26.0, 15.0, 17.0, 13.0, 7.0, 5.0, 6.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9208984375, -1.8647308349609375, -1.808563232421875, -1.7523956298828125, -1.69622802734375, -1.6400604248046875, -1.583892822265625, -1.5277252197265625, -1.4715576171875, -1.4153900146484375, -1.359222412109375, -1.3030548095703125, -1.24688720703125, -1.1907196044921875, -1.134552001953125, -1.0783843994140625, -1.022216796875, -0.9660491943359375, -0.909881591796875, -0.8537139892578125, -0.79754638671875, -0.7413787841796875, -0.685211181640625, -0.6290435791015625, -0.5728759765625, -0.5167083740234375, -0.460540771484375, -0.4043731689453125, -0.34820556640625, -0.2920379638671875, -0.235870361328125, -0.1797027587890625, -0.12353515625, -0.0673675537109375, -0.011199951171875, 0.0449676513671875, 0.10113525390625, 0.1573028564453125, 0.213470458984375, 0.2696380615234375, 0.3258056640625, 0.3819732666015625, 0.438140869140625, 0.4943084716796875, 0.55047607421875, 0.6066436767578125, 0.662811279296875, 0.7189788818359375, 0.775146484375, 0.8313140869140625, 0.887481689453125, 0.9436492919921875, 0.99981689453125, 1.0559844970703125, 1.112152099609375, 1.1683197021484375, 1.2244873046875, 1.2806549072265625, 1.336822509765625, 1.3929901123046875, 1.44915771484375, 1.5053253173828125, 1.561492919921875, 1.6176605224609375, 1.673828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 11.0, 63.0, 151.0, 295.0, 276.0, 148.0, 33.0, 19.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.460739135742188, -25.25513458251953, -24.049531936645508, -22.84392738342285, -21.638324737548828, -20.432720184326172, -19.227115631103516, -18.021512985229492, -16.81591033935547, -15.610306739807129, -14.404703140258789, -13.199098587036133, -11.99349594116211, -10.787891387939453, -9.582287788391113, -8.376684188842773, -7.171079635620117, -5.965476036071777, -4.7598724365234375, -3.5542683601379395, -2.3486647605895996, -1.1430611610412598, 0.06254291534423828, 1.2681465148925781, 2.473750114440918, 3.679353713989258, 4.884957313537598, 6.090561389923096, 7.2961649894714355, 8.501768112182617, 9.707372665405273, 10.912976264953613, 12.118579864501953, 13.324183464050293, 14.529787063598633, 15.735391616821289, 16.940994262695312, 18.14659881591797, 19.352203369140625, 20.55780601501465, 21.763408660888672, 22.969013214111328, 24.17461585998535, 25.380220413208008, 26.58582305908203, 27.791427612304688, 28.997032165527344, 30.202634811401367, 31.408239364624023, 32.61384201049805, 33.8194465637207, 35.02505111694336, 36.230655670166016, 37.436256408691406, 38.64186096191406, 39.84746551513672, 41.053070068359375, 42.25867462158203, 43.46427917480469, 44.66987991333008, 45.875484466552734, 47.08108901977539, 48.28669357299805, 49.49229431152344, 50.697898864746094]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 11.0, 11.0, 24.0, 15.0, 24.0, 25.0, 18.0, 33.0, 38.0, 25.0, 37.0, 35.0, 42.0, 39.0, 40.0, 38.0, 52.0, 34.0, 41.0, 27.0, 31.0, 40.0, 50.0, 34.0, 27.0, 44.0, 21.0, 16.0, 13.0, 16.0, 12.0, 15.0, 9.0, 8.0, 6.0, 6.0, 0.0, 5.0, 4.0, 2.0, 2.0, 4.0], "bins": [-9.608081817626953, -9.353487014770508, -9.098893165588379, -8.844298362731934, -8.589704513549805, -8.33510971069336, -8.08051586151123, -7.825921058654785, -7.571327209472656, -7.316732883453369, -7.062138557434082, -6.807544231414795, -6.552949905395508, -6.298355579376221, -6.043761253356934, -5.789166450500488, -5.534572124481201, -5.279977798461914, -5.025383472442627, -4.77078914642334, -4.516194820404053, -4.261600494384766, -4.00700569152832, -3.7524116039276123, -3.497817277908325, -3.243222951889038, -2.988628625869751, -2.7340340614318848, -2.4794397354125977, -2.2248454093933105, -1.9702510833740234, -1.7156567573547363, -1.4610624313354492, -1.206468105316162, -0.9518737196922302, -0.6972793340682983, -0.44268500804901123, -0.18809068202972412, 0.06650376319885254, 0.32109808921813965, 0.5756924152374268, 0.8302867412567139, 1.084881067276001, 1.3394755125045776, 1.5940698385238647, 1.8486641645431519, 2.1032586097717285, 2.3578529357910156, 2.6124472618103027, 2.86704158782959, 3.121635913848877, 3.376230239868164, 3.630824565887451, 3.8854188919067383, 4.140013694763184, 4.3946075439453125, 4.649202346801758, 4.903796672821045, 5.158390998840332, 5.412985324859619, 5.667579650878906, 5.922173976898193, 6.1767683029174805, 6.431363105773926, 6.685956954956055]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 11.0, 11.0, 12.0, 17.0, 20.0, 22.0, 42.0, 49.0, 68.0, 85.0, 124.0, 177.0, 273.0, 443.0, 720.0, 1403.0, 3060.0, 6505.0, 18102.0, 76773.0, 2534349.0, 1454108.0, 67883.0, 17055.0, 6383.0, 2983.0, 1478.0, 868.0, 469.0, 271.0, 173.0, 122.0, 59.0, 47.0, 28.0, 31.0, 12.0, 12.0, 10.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.71875, -3.612396240234375, -3.50604248046875, -3.399688720703125, -3.2933349609375, -3.186981201171875, -3.08062744140625, -2.974273681640625, -2.867919921875, -2.761566162109375, -2.65521240234375, -2.548858642578125, -2.4425048828125, -2.336151123046875, -2.22979736328125, -2.123443603515625, -2.01708984375, -1.910736083984375, -1.80438232421875, -1.698028564453125, -1.5916748046875, -1.485321044921875, -1.37896728515625, -1.272613525390625, -1.166259765625, -1.059906005859375, -0.95355224609375, -0.847198486328125, -0.7408447265625, -0.634490966796875, -0.52813720703125, -0.421783447265625, -0.3154296875, -0.209075927734375, -0.10272216796875, 0.003631591796875, 0.1099853515625, 0.216339111328125, 0.32269287109375, 0.429046630859375, 0.535400390625, 0.641754150390625, 0.74810791015625, 0.854461669921875, 0.9608154296875, 1.067169189453125, 1.17352294921875, 1.279876708984375, 1.38623046875, 1.492584228515625, 1.59893798828125, 1.705291748046875, 1.8116455078125, 1.917999267578125, 2.02435302734375, 2.130706787109375, 2.237060546875, 2.343414306640625, 2.44976806640625, 2.556121826171875, 2.6624755859375, 2.768829345703125, 2.87518310546875, 2.981536865234375, 3.087890625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 11.0, 6.0, 10.0, 18.0, 21.0, 28.0, 31.0, 35.0, 47.0, 37.0, 57.0, 50.0, 58.0, 73.0, 56.0, 63.0, 51.0, 64.0, 53.0, 36.0, 36.0, 24.0, 35.0, 21.0, 10.0, 13.0, 6.0, 15.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.509765625, -0.4956817626953125, -0.481597900390625, -0.4675140380859375, -0.45343017578125, -0.4393463134765625, -0.425262451171875, -0.4111785888671875, -0.3970947265625, -0.3830108642578125, -0.368927001953125, -0.3548431396484375, -0.34075927734375, -0.3266754150390625, -0.312591552734375, -0.2985076904296875, -0.284423828125, -0.2703399658203125, -0.256256103515625, -0.2421722412109375, -0.22808837890625, -0.2140045166015625, -0.199920654296875, -0.1858367919921875, -0.1717529296875, -0.1576690673828125, -0.143585205078125, -0.1295013427734375, -0.11541748046875, -0.1013336181640625, -0.087249755859375, -0.0731658935546875, -0.05908203125, -0.0449981689453125, -0.030914306640625, -0.0168304443359375, -0.00274658203125, 0.0113372802734375, 0.025421142578125, 0.0395050048828125, 0.0535888671875, 0.0676727294921875, 0.081756591796875, 0.0958404541015625, 0.10992431640625, 0.1240081787109375, 0.138092041015625, 0.1521759033203125, 0.166259765625, 0.1803436279296875, 0.194427490234375, 0.2085113525390625, 0.22259521484375, 0.2366790771484375, 0.250762939453125, 0.2648468017578125, 0.2789306640625, 0.2930145263671875, 0.307098388671875, 0.3211822509765625, 0.33526611328125, 0.3493499755859375, 0.363433837890625, 0.3775177001953125, 0.3916015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 6.0, 9.0, 15.0, 15.0, 29.0, 24.0, 33.0, 62.0, 103.0, 162.0, 265.0, 621.0, 1471.0, 4492.0, 24172.0, 493295.0, 3589376.0, 67082.0, 8791.0, 2367.0, 921.0, 365.0, 222.0, 96.0, 60.0, 52.0, 27.0, 26.0, 26.0, 19.0, 8.0, 11.0, 13.0, 8.0, 2.0, 6.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.76666259765625, -4.6231689453125, -4.47967529296875, -4.336181640625, -4.19268798828125, -4.0491943359375, -3.90570068359375, -3.76220703125, -3.61871337890625, -3.4752197265625, -3.33172607421875, -3.188232421875, -3.04473876953125, -2.9012451171875, -2.75775146484375, -2.6142578125, -2.47076416015625, -2.3272705078125, -2.18377685546875, -2.040283203125, -1.89678955078125, -1.7532958984375, -1.60980224609375, -1.46630859375, -1.32281494140625, -1.1793212890625, -1.03582763671875, -0.892333984375, -0.74884033203125, -0.6053466796875, -0.46185302734375, -0.318359375, -0.17486572265625, -0.0313720703125, 0.11212158203125, 0.255615234375, 0.39910888671875, 0.5426025390625, 0.68609619140625, 0.82958984375, 0.97308349609375, 1.1165771484375, 1.26007080078125, 1.403564453125, 1.54705810546875, 1.6905517578125, 1.83404541015625, 1.9775390625, 2.12103271484375, 2.2645263671875, 2.40802001953125, 2.551513671875, 2.69500732421875, 2.8385009765625, 2.98199462890625, 3.12548828125, 3.26898193359375, 3.4124755859375, 3.55596923828125, 3.699462890625, 3.84295654296875, 3.9864501953125, 4.12994384765625, 4.2734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 4.0, 8.0, 11.0, 23.0, 35.0, 60.0, 125.0, 298.0, 784.0, 1721.0, 580.0, 217.0, 101.0, 41.0, 15.0, 17.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.634765625, -1.5857696533203125, -1.536773681640625, -1.4877777099609375, -1.43878173828125, -1.3897857666015625, -1.340789794921875, -1.2917938232421875, -1.2427978515625, -1.1938018798828125, -1.144805908203125, -1.0958099365234375, -1.04681396484375, -0.9978179931640625, -0.948822021484375, -0.8998260498046875, -0.850830078125, -0.8018341064453125, -0.752838134765625, -0.7038421630859375, -0.65484619140625, -0.6058502197265625, -0.556854248046875, -0.5078582763671875, -0.4588623046875, -0.4098663330078125, -0.360870361328125, -0.3118743896484375, -0.26287841796875, -0.2138824462890625, -0.164886474609375, -0.1158905029296875, -0.06689453125, -0.0178985595703125, 0.031097412109375, 0.0800933837890625, 0.12908935546875, 0.1780853271484375, 0.227081298828125, 0.2760772705078125, 0.3250732421875, 0.3740692138671875, 0.423065185546875, 0.4720611572265625, 0.52105712890625, 0.5700531005859375, 0.619049072265625, 0.6680450439453125, 0.717041015625, 0.7660369873046875, 0.815032958984375, 0.8640289306640625, 0.91302490234375, 0.9620208740234375, 1.011016845703125, 1.0600128173828125, 1.1090087890625, 1.1580047607421875, 1.207000732421875, 1.2559967041015625, 1.30499267578125, 1.3539886474609375, 1.402984619140625, 1.4519805908203125, 1.5009765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 6.0, 16.0, 18.0, 27.0, 55.0, 79.0, 93.0, 147.0, 116.0, 143.0, 113.0, 55.0, 47.0, 34.0, 18.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21065616607666, -5.977004051208496, -5.743351936340332, -5.509699821472168, -5.276047706604004, -5.04239559173584, -4.808743476867676, -4.575091361999512, -4.341439247131348, -4.107787132263184, -3.8741350173950195, -3.6404829025268555, -3.4068307876586914, -3.1731786727905273, -2.9395267963409424, -2.7058746814727783, -2.4722228050231934, -2.2385706901550293, -2.0049185752868652, -1.7712665796279907, -1.5376144647598267, -1.3039623498916626, -1.070310354232788, -0.836658239364624, -0.60300612449646, -0.3693540394306183, -0.1357019543647766, 0.09795010089874268, 0.33160221576690674, 0.5652543306350708, 0.7989063262939453, 1.0325584411621094, 1.2662105560302734, 1.4998626708984375, 1.7335147857666016, 1.967166781425476, 2.2008190155029297, 2.4344711303710938, 2.6681230068206787, 2.9017751216888428, 3.135427236557007, 3.369079351425171, 3.602731466293335, 3.83638334274292, 4.070035457611084, 4.303687572479248, 4.537339687347412, 4.770991802215576, 5.00464391708374, 5.238296031951904, 5.471948146820068, 5.705600261688232, 5.9392523765563965, 6.1729044914245605, 6.406556129455566, 6.6402082443237305, 6.8738603591918945, 7.107512474060059, 7.341164588928223, 7.574816703796387, 7.808468818664551, 8.042120933532715, 8.275773048400879, 8.509425163269043, 8.743077278137207]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 13.0, 11.0, 12.0, 17.0, 21.0, 22.0, 27.0, 35.0, 47.0, 47.0, 46.0, 50.0, 45.0, 79.0, 53.0, 52.0, 52.0, 62.0, 52.0, 45.0, 38.0, 39.0, 24.0, 24.0, 24.0, 15.0, 12.0, 5.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4587721824645996, -3.318309783935547, -3.177847385406494, -3.0373847484588623, -2.8969223499298096, -2.756459951400757, -2.615997314453125, -2.4755349159240723, -2.3350725173950195, -2.194610118865967, -2.054147720336914, -1.9136850833892822, -1.7732226848602295, -1.6327602863311768, -1.4922977685928345, -1.3518352508544922, -1.2113728523254395, -1.0709104537963867, -0.9304479360580444, -0.7899854779243469, -0.6495230197906494, -0.5090605616569519, -0.3685981035232544, -0.22813564538955688, -0.08767318725585938, 0.052789270877838135, 0.19325172901153564, 0.33371418714523315, 0.47417664527893066, 0.6146391034126282, 0.7551015615463257, 0.8955640196800232, 1.0360264778137207, 1.1764888763427734, 1.3169513940811157, 1.457413911819458, 1.5978763103485107, 1.7383387088775635, 1.8788012266159058, 2.019263744354248, 2.159726142883301, 2.3001885414123535, 2.4406509399414062, 2.581113576889038, 2.721575975418091, 2.8620383739471436, 3.0025010108947754, 3.142963409423828, 3.283425807952881, 3.4238882064819336, 3.5643506050109863, 3.704813241958618, 3.845275640487671, 3.9857380390167236, 4.1262006759643555, 4.266663074493408, 4.407125473022461, 4.547587871551514, 4.688050270080566, 4.828512668609619, 4.968975067138672, 5.109437942504883, 5.2499003410339355, 5.390362739562988, 5.530825138092041]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 7.0, 5.0, 18.0, 30.0, 47.0, 69.0, 151.0, 278.0, 631.0, 1575.0, 4364.0, 18520.0, 119148.0, 705327.0, 165860.0, 23880.0, 5434.0, 1788.0, 748.0, 319.0, 159.0, 85.0, 38.0, 28.0, 17.0, 18.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.0987548828125, -3.955322265625, -3.8118896484375, -3.66845703125, -3.5250244140625, -3.381591796875, -3.2381591796875, -3.0947265625, -2.9512939453125, -2.807861328125, -2.6644287109375, -2.52099609375, -2.3775634765625, -2.234130859375, -2.0906982421875, -1.947265625, -1.8038330078125, -1.660400390625, -1.5169677734375, -1.37353515625, -1.2301025390625, -1.086669921875, -0.9432373046875, -0.7998046875, -0.6563720703125, -0.512939453125, -0.3695068359375, -0.22607421875, -0.0826416015625, 0.060791015625, 0.2042236328125, 0.34765625, 0.4910888671875, 0.634521484375, 0.7779541015625, 0.92138671875, 1.0648193359375, 1.208251953125, 1.3516845703125, 1.4951171875, 1.6385498046875, 1.781982421875, 1.9254150390625, 2.06884765625, 2.2122802734375, 2.355712890625, 2.4991455078125, 2.642578125, 2.7860107421875, 2.929443359375, 3.0728759765625, 3.21630859375, 3.3597412109375, 3.503173828125, 3.6466064453125, 3.7900390625, 3.9334716796875, 4.076904296875, 4.2203369140625, 4.36376953125, 4.5072021484375, 4.650634765625, 4.7940673828125, 4.9375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 10.0, 10.0, 19.0, 10.0, 33.0, 33.0, 24.0, 37.0, 58.0, 57.0, 54.0, 62.0, 59.0, 65.0, 65.0, 57.0, 58.0, 49.0, 48.0, 37.0, 34.0, 27.0, 11.0, 21.0, 16.0, 10.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5498046875, -0.5346870422363281, -0.5195693969726562, -0.5044517517089844, -0.4893341064453125, -0.4742164611816406, -0.45909881591796875, -0.4439811706542969, -0.428863525390625, -0.4137458801269531, -0.39862823486328125, -0.3835105895996094, -0.3683929443359375, -0.3532752990722656, -0.33815765380859375, -0.3230400085449219, -0.30792236328125, -0.2928047180175781, -0.27768707275390625, -0.2625694274902344, -0.2474517822265625, -0.23233413696289062, -0.21721649169921875, -0.20209884643554688, -0.186981201171875, -0.17186355590820312, -0.15674591064453125, -0.14162826538085938, -0.1265106201171875, -0.11139297485351562, -0.09627532958984375, -0.08115768432617188, -0.0660400390625, -0.050922393798828125, -0.03580474853515625, -0.020687103271484375, -0.0055694580078125, 0.009548187255859375, 0.02466583251953125, 0.039783477783203125, 0.054901123046875, 0.07001876831054688, 0.08513641357421875, 0.10025405883789062, 0.1153717041015625, 0.13048934936523438, 0.14560699462890625, 0.16072463989257812, 0.17584228515625, 0.19095993041992188, 0.20607757568359375, 0.22119522094726562, 0.2363128662109375, 0.2514305114746094, 0.26654815673828125, 0.2816658020019531, 0.296783447265625, 0.3119010925292969, 0.32701873779296875, 0.3421363830566406, 0.3572540283203125, 0.3723716735839844, 0.38748931884765625, 0.4026069641113281, 0.417724609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 6.0, 8.0, 13.0, 8.0, 25.0, 37.0, 32.0, 52.0, 82.0, 109.0, 136.0, 222.0, 340.0, 628.0, 1072.0, 2268.0, 6080.0, 19562.0, 74596.0, 340462.0, 458312.0, 103999.0, 26340.0, 8087.0, 2872.0, 1313.0, 654.0, 360.0, 256.0, 163.0, 117.0, 87.0, 61.0, 44.0, 28.0, 21.0, 22.0, 23.0, 11.0, 14.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.408203125, -2.333221435546875, -2.25823974609375, -2.183258056640625, -2.1082763671875, -2.033294677734375, -1.95831298828125, -1.883331298828125, -1.808349609375, -1.733367919921875, -1.65838623046875, -1.583404541015625, -1.5084228515625, -1.433441162109375, -1.35845947265625, -1.283477783203125, -1.20849609375, -1.133514404296875, -1.05853271484375, -0.983551025390625, -0.9085693359375, -0.833587646484375, -0.75860595703125, -0.683624267578125, -0.608642578125, -0.533660888671875, -0.45867919921875, -0.383697509765625, -0.3087158203125, -0.233734130859375, -0.15875244140625, -0.083770751953125, -0.0087890625, 0.066192626953125, 0.14117431640625, 0.216156005859375, 0.2911376953125, 0.366119384765625, 0.44110107421875, 0.516082763671875, 0.591064453125, 0.666046142578125, 0.74102783203125, 0.816009521484375, 0.8909912109375, 0.965972900390625, 1.04095458984375, 1.115936279296875, 1.19091796875, 1.265899658203125, 1.34088134765625, 1.415863037109375, 1.4908447265625, 1.565826416015625, 1.64080810546875, 1.715789794921875, 1.790771484375, 1.865753173828125, 1.94073486328125, 2.015716552734375, 2.0906982421875, 2.165679931640625, 2.24066162109375, 2.315643310546875, 2.390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 8.0, 4.0, 12.0, 14.0, 25.0, 16.0, 28.0, 23.0, 53.0, 52.0, 50.0, 51.0, 39.0, 55.0, 52.0, 72.0, 55.0, 47.0, 55.0, 54.0, 37.0, 42.0, 32.0, 20.0, 28.0, 19.0, 13.0, 11.0, 7.0, 6.0, 8.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.02734375, -1.96722412109375, -1.9071044921875, -1.84698486328125, -1.786865234375, -1.72674560546875, -1.6666259765625, -1.60650634765625, -1.54638671875, -1.48626708984375, -1.4261474609375, -1.36602783203125, -1.305908203125, -1.24578857421875, -1.1856689453125, -1.12554931640625, -1.0654296875, -1.00531005859375, -0.9451904296875, -0.88507080078125, -0.824951171875, -0.76483154296875, -0.7047119140625, -0.64459228515625, -0.58447265625, -0.52435302734375, -0.4642333984375, -0.40411376953125, -0.343994140625, -0.28387451171875, -0.2237548828125, -0.16363525390625, -0.103515625, -0.04339599609375, 0.0167236328125, 0.07684326171875, 0.136962890625, 0.19708251953125, 0.2572021484375, 0.31732177734375, 0.37744140625, 0.43756103515625, 0.4976806640625, 0.55780029296875, 0.617919921875, 0.67803955078125, 0.7381591796875, 0.79827880859375, 0.8583984375, 0.91851806640625, 0.9786376953125, 1.03875732421875, 1.098876953125, 1.15899658203125, 1.2191162109375, 1.27923583984375, 1.33935546875, 1.39947509765625, 1.4595947265625, 1.51971435546875, 1.579833984375, 1.63995361328125, 1.7000732421875, 1.76019287109375, 1.8203125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 2.0, 7.0, 11.0, 9.0, 20.0, 40.0, 48.0, 100.0, 149.0, 286.0, 645.0, 1539.0, 4888.0, 20452.0, 143080.0, 761612.0, 93661.0, 15606.0, 3972.0, 1281.0, 521.0, 263.0, 140.0, 83.0, 55.0, 36.0, 19.0, 11.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.175079345703125, -2.10797119140625, -2.040863037109375, -1.9737548828125, -1.906646728515625, -1.83953857421875, -1.772430419921875, -1.705322265625, -1.638214111328125, -1.57110595703125, -1.503997802734375, -1.4368896484375, -1.369781494140625, -1.30267333984375, -1.235565185546875, -1.16845703125, -1.101348876953125, -1.03424072265625, -0.967132568359375, -0.9000244140625, -0.832916259765625, -0.76580810546875, -0.698699951171875, -0.631591796875, -0.564483642578125, -0.49737548828125, -0.430267333984375, -0.3631591796875, -0.296051025390625, -0.22894287109375, -0.161834716796875, -0.0947265625, -0.027618408203125, 0.03948974609375, 0.106597900390625, 0.1737060546875, 0.240814208984375, 0.30792236328125, 0.375030517578125, 0.442138671875, 0.509246826171875, 0.57635498046875, 0.643463134765625, 0.7105712890625, 0.777679443359375, 0.84478759765625, 0.911895751953125, 0.97900390625, 1.046112060546875, 1.11322021484375, 1.180328369140625, 1.2474365234375, 1.314544677734375, 1.38165283203125, 1.448760986328125, 1.515869140625, 1.582977294921875, 1.65008544921875, 1.717193603515625, 1.7843017578125, 1.851409912109375, 1.91851806640625, 1.985626220703125, 2.052734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 17.0, 14.0, 32.0, 37.0, 71.0, 237.0, 346.0, 102.0, 53.0, 23.0, 23.0, 12.0, 8.0, 7.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006055831909179688, -0.0005901232361793518, -0.0005746632814407349, -0.0005592033267021179, -0.000543743371963501, -0.000528283417224884, -0.0005128234624862671, -0.0004973635077476501, -0.0004819035530090332, -0.00046644359827041626, -0.0004509836435317993, -0.0004355236887931824, -0.00042006373405456543, -0.0004046037793159485, -0.00038914382457733154, -0.0003736838698387146, -0.00035822391510009766, -0.0003427639603614807, -0.00032730400562286377, -0.0003118440508842468, -0.0002963840961456299, -0.00028092414140701294, -0.000265464186668396, -0.00025000423192977905, -0.0002345442771911621, -0.00021908432245254517, -0.00020362436771392822, -0.00018816441297531128, -0.00017270445823669434, -0.0001572445034980774, -0.00014178454875946045, -0.0001263245940208435, -0.00011086463928222656, -9.540468454360962e-05, -7.994472980499268e-05, -6.448477506637573e-05, -4.902482032775879e-05, -3.3564865589141846e-05, -1.8104910850524902e-05, -2.644956111907959e-06, 1.2814998626708984e-05, 2.8274953365325928e-05, 4.373490810394287e-05, 5.9194862842559814e-05, 7.465481758117676e-05, 9.01147723197937e-05, 0.00010557472705841064, 0.00012103468179702759, 0.00013649463653564453, 0.00015195459127426147, 0.00016741454601287842, 0.00018287450075149536, 0.0001983344554901123, 0.00021379441022872925, 0.0002292543649673462, 0.00024471431970596313, 0.0002601742744445801, 0.000275634229183197, 0.00029109418392181396, 0.0003065541386604309, 0.00032201409339904785, 0.0003374740481376648, 0.00035293400287628174, 0.0003683939576148987, 0.0003838539123535156]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 12.0, 13.0, 16.0, 15.0, 22.0, 35.0, 26.0, 42.0, 76.0, 100.0, 131.0, 271.0, 495.0, 996.0, 2381.0, 6156.0, 18936.0, 73313.0, 687874.0, 205020.0, 35272.0, 10403.0, 3780.0, 1463.0, 696.0, 412.0, 185.0, 121.0, 78.0, 57.0, 44.0, 30.0, 24.0, 19.0, 16.0, 7.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.734375, -1.674041748046875, -1.61370849609375, -1.553375244140625, -1.4930419921875, -1.432708740234375, -1.37237548828125, -1.312042236328125, -1.251708984375, -1.191375732421875, -1.13104248046875, -1.070709228515625, -1.0103759765625, -0.950042724609375, -0.88970947265625, -0.829376220703125, -0.76904296875, -0.708709716796875, -0.64837646484375, -0.588043212890625, -0.5277099609375, -0.467376708984375, -0.40704345703125, -0.346710205078125, -0.286376953125, -0.226043701171875, -0.16571044921875, -0.105377197265625, -0.0450439453125, 0.015289306640625, 0.07562255859375, 0.135955810546875, 0.1962890625, 0.256622314453125, 0.31695556640625, 0.377288818359375, 0.4376220703125, 0.497955322265625, 0.55828857421875, 0.618621826171875, 0.678955078125, 0.739288330078125, 0.79962158203125, 0.859954833984375, 0.9202880859375, 0.980621337890625, 1.04095458984375, 1.101287841796875, 1.16162109375, 1.221954345703125, 1.28228759765625, 1.342620849609375, 1.4029541015625, 1.463287353515625, 1.52362060546875, 1.583953857421875, 1.644287109375, 1.704620361328125, 1.76495361328125, 1.825286865234375, 1.8856201171875, 1.945953369140625, 2.00628662109375, 2.066619873046875, 2.126953125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 9.0, 4.0, 12.0, 12.0, 12.0, 21.0, 21.0, 25.0, 45.0, 68.0, 100.0, 151.0, 160.0, 110.0, 69.0, 34.0, 28.0, 20.0, 18.0, 15.0, 19.0, 18.0, 8.0, 2.0, 3.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98291015625, -0.9423751831054688, -0.9018402099609375, -0.8613052368164062, -0.820770263671875, -0.7802352905273438, -0.7397003173828125, -0.6991653442382812, -0.65863037109375, -0.6180953979492188, -0.5775604248046875, -0.5370254516601562, -0.496490478515625, -0.45595550537109375, -0.4154205322265625, -0.37488555908203125, -0.3343505859375, -0.29381561279296875, -0.2532806396484375, -0.21274566650390625, -0.172210693359375, -0.13167572021484375, -0.0911407470703125, -0.05060577392578125, -0.01007080078125, 0.03046417236328125, 0.0709991455078125, 0.11153411865234375, 0.152069091796875, 0.19260406494140625, 0.2331390380859375, 0.27367401123046875, 0.314208984375, 0.35474395751953125, 0.3952789306640625, 0.43581390380859375, 0.476348876953125, 0.5168838500976562, 0.5574188232421875, 0.5979537963867188, 0.63848876953125, 0.6790237426757812, 0.7195587158203125, 0.7600936889648438, 0.800628662109375, 0.8411636352539062, 0.8816986083984375, 0.9222335815429688, 0.9627685546875, 1.0033035278320312, 1.0438385009765625, 1.0843734741210938, 1.124908447265625, 1.1654434204101562, 1.2059783935546875, 1.2465133666992188, 1.28704833984375, 1.3275833129882812, 1.3681182861328125, 1.4086532592773438, 1.449188232421875, 1.4897232055664062, 1.5302581787109375, 1.5707931518554688, 1.611328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 12.0, 14.0, 31.0, 68.0, 127.0, 176.0, 186.0, 165.0, 115.0, 52.0, 31.0, 14.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.84744644165039, -24.052867889404297, -23.25828742980957, -22.463708877563477, -21.66912841796875, -20.874549865722656, -20.079971313476562, -19.285390853881836, -18.49081039428711, -17.696231842041016, -16.90165138244629, -16.107072830200195, -15.312492370605469, -14.517913818359375, -13.723334312438965, -12.928754806518555, -12.134176254272461, -11.33959674835205, -10.54501724243164, -9.750438690185547, -8.95585823059082, -8.161279678344727, -7.366700172424316, -6.572120666503906, -5.777541160583496, -4.982961654663086, -4.188382148742676, -3.393803119659424, -2.5992236137390137, -1.8046441078186035, -1.0100650787353516, -0.2154855728149414, 0.5790958404541016, 1.3736752271652222, 2.1682546138763428, 2.962833881378174, 3.757413387298584, 4.551992893218994, 5.346571922302246, 6.141151428222656, 6.935730934143066, 7.730310440063477, 8.524889945983887, 9.319469451904297, 10.11404800415039, 10.908628463745117, 11.703207015991211, 12.497786521911621, 13.292366027832031, 14.086945533752441, 14.881525039672852, 15.676103591918945, 16.470684051513672, 17.265262603759766, 18.05984115600586, 18.854421615600586, 19.649002075195312, 20.443580627441406, 21.238161087036133, 22.032739639282227, 22.827320098876953, 23.621898651123047, 24.41647720336914, 25.211057662963867, 26.00563621520996]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 4.0, 8.0, 9.0, 4.0, 12.0, 14.0, 9.0, 15.0, 12.0, 23.0, 23.0, 26.0, 21.0, 23.0, 35.0, 33.0, 28.0, 39.0, 36.0, 37.0, 31.0, 39.0, 34.0, 38.0, 41.0, 44.0, 40.0, 35.0, 27.0, 32.0, 29.0, 17.0, 23.0, 23.0, 27.0, 8.0, 14.0, 13.0, 12.0, 12.0, 9.0, 7.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.466588497161865, -7.238072395324707, -7.009555816650391, -6.781039714813232, -6.552523136138916, -6.324007034301758, -6.095490455627441, -5.866974353790283, -5.638458251953125, -5.409942150115967, -5.18142557144165, -4.952909469604492, -4.724392890930176, -4.495876789093018, -4.267360687255859, -4.038844108581543, -3.8103275299072266, -3.5818111896514893, -3.353294849395752, -3.1247787475585938, -2.8962621688842773, -2.667746067047119, -2.439229726791382, -2.2107133865356445, -1.9821970462799072, -1.75368070602417, -1.5251643657684326, -1.2966481447219849, -1.0681318044662476, -0.8396154642105103, -0.6110992431640625, -0.3825829029083252, -0.1540665626525879, 0.07444974780082703, 0.30296605825424194, 0.5314823389053345, 0.7599986791610718, 0.9885150194168091, 1.2170312404632568, 1.4455475807189941, 1.6740639209747314, 1.9025802612304688, 2.131096601486206, 2.3596129417419434, 2.5881290435791016, 2.816645622253418, 3.045161724090576, 3.2736780643463135, 3.502194404602051, 3.730710744857788, 3.9592270851135254, 4.187743186950684, 4.416259765625, 4.644775867462158, 4.873291969299316, 5.101808547973633, 5.330325126647949, 5.558841228485107, 5.787357807159424, 6.015873908996582, 6.244390487670898, 6.472906589508057, 6.701422691345215, 6.929939270019531, 7.1584553718566895]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 12.0, 16.0, 22.0, 27.0, 25.0, 44.0, 48.0, 71.0, 92.0, 138.0, 205.0, 284.0, 489.0, 928.0, 1726.0, 3564.0, 8578.0, 25818.0, 124598.0, 3425362.0, 521178.0, 54047.0, 14892.0, 5939.0, 2662.0, 1412.0, 810.0, 461.0, 269.0, 187.0, 107.0, 75.0, 60.0, 32.0, 19.0, 17.0, 11.0, 9.0, 9.0, 7.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-4.1796875, -4.071868896484375, -3.96405029296875, -3.856231689453125, -3.7484130859375, -3.640594482421875, -3.53277587890625, -3.424957275390625, -3.317138671875, -3.209320068359375, -3.10150146484375, -2.993682861328125, -2.8858642578125, -2.778045654296875, -2.67022705078125, -2.562408447265625, -2.45458984375, -2.346771240234375, -2.23895263671875, -2.131134033203125, -2.0233154296875, -1.915496826171875, -1.80767822265625, -1.699859619140625, -1.592041015625, -1.484222412109375, -1.37640380859375, -1.268585205078125, -1.1607666015625, -1.052947998046875, -0.94512939453125, -0.837310791015625, -0.7294921875, -0.621673583984375, -0.51385498046875, -0.406036376953125, -0.2982177734375, -0.190399169921875, -0.08258056640625, 0.025238037109375, 0.133056640625, 0.240875244140625, 0.34869384765625, 0.456512451171875, 0.5643310546875, 0.672149658203125, 0.77996826171875, 0.887786865234375, 0.99560546875, 1.103424072265625, 1.21124267578125, 1.319061279296875, 1.4268798828125, 1.534698486328125, 1.64251708984375, 1.750335693359375, 1.858154296875, 1.965972900390625, 2.07379150390625, 2.181610107421875, 2.2894287109375, 2.397247314453125, 2.50506591796875, 2.612884521484375, 2.720703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 6.0, 3.0, 9.0, 8.0, 17.0, 24.0, 24.0, 32.0, 35.0, 33.0, 43.0, 43.0, 56.0, 51.0, 64.0, 72.0, 57.0, 57.0, 50.0, 54.0, 39.0, 40.0, 34.0, 36.0, 28.0, 20.0, 14.0, 14.0, 9.0, 5.0, 10.0, 3.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.51220703125, -0.4975318908691406, -0.48285675048828125, -0.4681816101074219, -0.4535064697265625, -0.4388313293457031, -0.42415618896484375, -0.4094810485839844, -0.394805908203125, -0.3801307678222656, -0.36545562744140625, -0.3507804870605469, -0.3361053466796875, -0.3214302062988281, -0.30675506591796875, -0.2920799255371094, -0.27740478515625, -0.2627296447753906, -0.24805450439453125, -0.23337936401367188, -0.2187042236328125, -0.20402908325195312, -0.18935394287109375, -0.17467880249023438, -0.160003662109375, -0.14532852172851562, -0.13065338134765625, -0.11597824096679688, -0.1013031005859375, -0.08662796020507812, -0.07195281982421875, -0.057277679443359375, -0.0426025390625, -0.027927398681640625, -0.01325225830078125, 0.001422882080078125, 0.0160980224609375, 0.030773162841796875, 0.04544830322265625, 0.060123443603515625, 0.074798583984375, 0.08947372436523438, 0.10414886474609375, 0.11882400512695312, 0.1334991455078125, 0.14817428588867188, 0.16284942626953125, 0.17752456665039062, 0.19219970703125, 0.20687484741210938, 0.22154998779296875, 0.23622512817382812, 0.2509002685546875, 0.2655754089355469, 0.28025054931640625, 0.2949256896972656, 0.309600830078125, 0.3242759704589844, 0.33895111083984375, 0.3536262512207031, 0.3683013916015625, 0.3829765319824219, 0.39765167236328125, 0.4123268127441406, 0.427001953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 7.0, 15.0, 17.0, 15.0, 29.0, 19.0, 39.0, 50.0, 71.0, 102.0, 130.0, 222.0, 307.0, 708.0, 2132.0, 12830.0, 424871.0, 3719186.0, 27894.0, 3510.0, 935.0, 406.0, 221.0, 155.0, 81.0, 72.0, 65.0, 39.0, 38.0, 34.0, 17.0, 13.0, 10.0, 12.0, 8.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.5859375, -8.3609619140625, -8.135986328125, -7.9110107421875, -7.68603515625, -7.4610595703125, -7.236083984375, -7.0111083984375, -6.7861328125, -6.5611572265625, -6.336181640625, -6.1112060546875, -5.88623046875, -5.6612548828125, -5.436279296875, -5.2113037109375, -4.986328125, -4.7613525390625, -4.536376953125, -4.3114013671875, -4.08642578125, -3.8614501953125, -3.636474609375, -3.4114990234375, -3.1865234375, -2.9615478515625, -2.736572265625, -2.5115966796875, -2.28662109375, -2.0616455078125, -1.836669921875, -1.6116943359375, -1.38671875, -1.1617431640625, -0.936767578125, -0.7117919921875, -0.48681640625, -0.2618408203125, -0.036865234375, 0.1881103515625, 0.4130859375, 0.6380615234375, 0.863037109375, 1.0880126953125, 1.31298828125, 1.5379638671875, 1.762939453125, 1.9879150390625, 2.212890625, 2.4378662109375, 2.662841796875, 2.8878173828125, 3.11279296875, 3.3377685546875, 3.562744140625, 3.7877197265625, 4.0126953125, 4.2376708984375, 4.462646484375, 4.6876220703125, 4.91259765625, 5.1375732421875, 5.362548828125, 5.5875244140625, 5.8125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 10.0, 26.0, 48.0, 116.0, 610.0, 2649.0, 459.0, 94.0, 38.0, 14.0, 10.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.9769287109375, -3.887451171875, -3.7979736328125, -3.70849609375, -3.6190185546875, -3.529541015625, -3.4400634765625, -3.3505859375, -3.2611083984375, -3.171630859375, -3.0821533203125, -2.99267578125, -2.9031982421875, -2.813720703125, -2.7242431640625, -2.634765625, -2.5452880859375, -2.455810546875, -2.3663330078125, -2.27685546875, -2.1873779296875, -2.097900390625, -2.0084228515625, -1.9189453125, -1.8294677734375, -1.739990234375, -1.6505126953125, -1.56103515625, -1.4715576171875, -1.382080078125, -1.2926025390625, -1.203125, -1.1136474609375, -1.024169921875, -0.9346923828125, -0.84521484375, -0.7557373046875, -0.666259765625, -0.5767822265625, -0.4873046875, -0.3978271484375, -0.308349609375, -0.2188720703125, -0.12939453125, -0.0399169921875, 0.049560546875, 0.1390380859375, 0.228515625, 0.3179931640625, 0.407470703125, 0.4969482421875, 0.58642578125, 0.6759033203125, 0.765380859375, 0.8548583984375, 0.9443359375, 1.0338134765625, 1.123291015625, 1.2127685546875, 1.30224609375, 1.3917236328125, 1.481201171875, 1.5706787109375, 1.66015625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 7.0, 3.0, 9.0, 8.0, 11.0, 11.0, 42.0, 58.0, 90.0, 129.0, 169.0, 170.0, 123.0, 62.0, 50.0, 25.0, 13.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-10.343038558959961, -10.069808959960938, -9.796579360961914, -9.52334976196289, -9.25011920928955, -8.976889610290527, -8.703660011291504, -8.43043041229248, -8.157200813293457, -7.883971214294434, -7.610741138458252, -7.3375115394592285, -7.064281940460205, -6.791051864624023, -6.517822265625, -6.244592666625977, -5.971362590789795, -5.6981329917907715, -5.42490291595459, -5.151673316955566, -4.878443717956543, -4.6052141189575195, -4.331984043121338, -4.0587544441223145, -3.785524606704712, -3.5122947692871094, -3.239065170288086, -2.9658353328704834, -2.692605495452881, -2.4193758964538574, -2.146146059036255, -1.872916340827942, -1.5996861457824707, -1.3264564275741577, -1.0532267093658447, -0.7799968719482422, -0.5067671537399292, -0.2335374355316162, 0.03969240188598633, 0.3129221200942993, 0.5861518383026123, 0.8593815565109253, 1.1326112747192383, 1.4058411121368408, 1.6790708303451538, 1.9523005485534668, 2.2255303859710693, 2.498760223388672, 2.7719898223876953, 3.045219659805298, 3.3184492588043213, 3.591679096221924, 3.8649086952209473, 4.138138771057129, 4.411368370056152, 4.684597969055176, 4.957827568054199, 5.231057167053223, 5.504287242889404, 5.777516841888428, 6.050746440887451, 6.323976516723633, 6.597206115722656, 6.87043571472168, 7.143665790557861]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 13.0, 11.0, 12.0, 22.0, 26.0, 58.0, 74.0, 65.0, 95.0, 96.0, 92.0, 76.0, 80.0, 72.0, 62.0, 44.0, 31.0, 17.0, 20.0, 14.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.705615043640137, -8.498294830322266, -8.290974617004395, -8.083654403686523, -7.876333713531494, -7.669013500213623, -7.461693286895752, -7.254373073577881, -7.047052383422852, -6.8397321701049805, -6.632411956787109, -6.425091743469238, -6.217771053314209, -6.010450839996338, -5.803130626678467, -5.595810413360596, -5.388490200042725, -5.1811699867248535, -4.973849773406982, -4.766529083251953, -4.559208869934082, -4.351888656616211, -4.14456844329834, -3.9372482299804688, -3.7299277782440186, -3.5226075649261475, -3.3152871131896973, -3.107966899871826, -2.900646686553955, -2.693326234817505, -2.486006021499634, -2.2786855697631836, -2.0713658332824707, -1.86404550075531, -1.6567251682281494, -1.4494049549102783, -1.2420846223831177, -1.034764289855957, -0.8274440765380859, -0.6201237440109253, -0.41280341148376465, -0.2054831087589264, 0.0018371939659118652, 0.20915746688842773, 0.4164777994155884, 0.623798131942749, 0.8311183452606201, 1.0384386777877808, 1.2457590103149414, 1.453079342842102, 1.6603996753692627, 1.8677198886871338, 2.075040340423584, 2.282360553741455, 2.489680767059326, 2.6970009803771973, 2.9043214321136475, 3.1116416454315186, 3.3189620971679688, 3.52628231048584, 3.733602523803711, 3.940922975540161, 4.148242950439453, 4.355563640594482, 4.5628838539123535]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 6.0, 8.0, 15.0, 38.0, 55.0, 78.0, 108.0, 156.0, 277.0, 415.0, 878.0, 1891.0, 4824.0, 16099.0, 67042.0, 416978.0, 442629.0, 71200.0, 16810.0, 4984.0, 1952.0, 887.0, 443.0, 247.0, 196.0, 103.0, 69.0, 50.0, 38.0, 23.0, 15.0, 14.0, 10.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.509765625, -3.400146484375, -3.29052734375, -3.180908203125, -3.0712890625, -2.961669921875, -2.85205078125, -2.742431640625, -2.6328125, -2.523193359375, -2.41357421875, -2.303955078125, -2.1943359375, -2.084716796875, -1.97509765625, -1.865478515625, -1.755859375, -1.646240234375, -1.53662109375, -1.427001953125, -1.3173828125, -1.207763671875, -1.09814453125, -0.988525390625, -0.87890625, -0.769287109375, -0.65966796875, -0.550048828125, -0.4404296875, -0.330810546875, -0.22119140625, -0.111572265625, -0.001953125, 0.107666015625, 0.21728515625, 0.326904296875, 0.4365234375, 0.546142578125, 0.65576171875, 0.765380859375, 0.875, 0.984619140625, 1.09423828125, 1.203857421875, 1.3134765625, 1.423095703125, 1.53271484375, 1.642333984375, 1.751953125, 1.861572265625, 1.97119140625, 2.080810546875, 2.1904296875, 2.300048828125, 2.40966796875, 2.519287109375, 2.62890625, 2.738525390625, 2.84814453125, 2.957763671875, 3.0673828125, 3.177001953125, 3.28662109375, 3.396240234375, 3.505859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 14.0, 13.0, 30.0, 33.0, 38.0, 37.0, 68.0, 66.0, 65.0, 72.0, 87.0, 72.0, 72.0, 68.0, 54.0, 45.0, 42.0, 34.0, 17.0, 16.0, 14.0, 16.0, 6.0, 3.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7314453125, -0.712005615234375, -0.69256591796875, -0.673126220703125, -0.6536865234375, -0.634246826171875, -0.61480712890625, -0.595367431640625, -0.575927734375, -0.556488037109375, -0.53704833984375, -0.517608642578125, -0.4981689453125, -0.478729248046875, -0.45928955078125, -0.439849853515625, -0.42041015625, -0.400970458984375, -0.38153076171875, -0.362091064453125, -0.3426513671875, -0.323211669921875, -0.30377197265625, -0.284332275390625, -0.264892578125, -0.245452880859375, -0.22601318359375, -0.206573486328125, -0.1871337890625, -0.167694091796875, -0.14825439453125, -0.128814697265625, -0.109375, -0.089935302734375, -0.07049560546875, -0.051055908203125, -0.0316162109375, -0.012176513671875, 0.00726318359375, 0.026702880859375, 0.046142578125, 0.065582275390625, 0.08502197265625, 0.104461669921875, 0.1239013671875, 0.143341064453125, 0.16278076171875, 0.182220458984375, 0.20166015625, 0.221099853515625, 0.24053955078125, 0.259979248046875, 0.2794189453125, 0.298858642578125, 0.31829833984375, 0.337738037109375, 0.357177734375, 0.376617431640625, 0.39605712890625, 0.415496826171875, 0.4349365234375, 0.454376220703125, 0.47381591796875, 0.493255615234375, 0.5126953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 10.0, 12.0, 10.0, 22.0, 25.0, 39.0, 51.0, 76.0, 87.0, 150.0, 220.0, 343.0, 600.0, 1108.0, 2296.0, 4958.0, 10947.0, 26471.0, 68342.0, 208686.0, 425368.0, 190796.0, 63717.0, 24539.0, 10376.0, 4540.0, 2085.0, 1027.0, 587.0, 315.0, 236.0, 144.0, 106.0, 71.0, 61.0, 29.0, 22.0, 21.0, 12.0, 10.0, 8.0, 4.0, 4.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5380859375, -1.48919677734375, -1.4403076171875, -1.39141845703125, -1.342529296875, -1.29364013671875, -1.2447509765625, -1.19586181640625, -1.14697265625, -1.09808349609375, -1.0491943359375, -1.00030517578125, -0.951416015625, -0.90252685546875, -0.8536376953125, -0.80474853515625, -0.755859375, -0.70697021484375, -0.6580810546875, -0.60919189453125, -0.560302734375, -0.51141357421875, -0.4625244140625, -0.41363525390625, -0.36474609375, -0.31585693359375, -0.2669677734375, -0.21807861328125, -0.169189453125, -0.12030029296875, -0.0714111328125, -0.02252197265625, 0.0263671875, 0.07525634765625, 0.1241455078125, 0.17303466796875, 0.221923828125, 0.27081298828125, 0.3197021484375, 0.36859130859375, 0.41748046875, 0.46636962890625, 0.5152587890625, 0.56414794921875, 0.613037109375, 0.66192626953125, 0.7108154296875, 0.75970458984375, 0.80859375, 0.85748291015625, 0.9063720703125, 0.95526123046875, 1.004150390625, 1.05303955078125, 1.1019287109375, 1.15081787109375, 1.19970703125, 1.24859619140625, 1.2974853515625, 1.34637451171875, 1.395263671875, 1.44415283203125, 1.4930419921875, 1.54193115234375, 1.5908203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 4.0, 5.0, 8.0, 15.0, 11.0, 13.0, 17.0, 16.0, 14.0, 24.0, 13.0, 29.0, 26.0, 31.0, 36.0, 28.0, 39.0, 47.0, 27.0, 34.0, 51.0, 32.0, 55.0, 36.0, 39.0, 43.0, 44.0, 28.0, 28.0, 16.0, 20.0, 34.0, 23.0, 21.0, 10.0, 14.0, 18.0, 8.0, 5.0, 6.0, 11.0, 4.0, 5.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.4296875, -1.388214111328125, -1.34674072265625, -1.305267333984375, -1.2637939453125, -1.222320556640625, -1.18084716796875, -1.139373779296875, -1.097900390625, -1.056427001953125, -1.01495361328125, -0.973480224609375, -0.9320068359375, -0.890533447265625, -0.84906005859375, -0.807586669921875, -0.76611328125, -0.724639892578125, -0.68316650390625, -0.641693115234375, -0.6002197265625, -0.558746337890625, -0.51727294921875, -0.475799560546875, -0.434326171875, -0.392852783203125, -0.35137939453125, -0.309906005859375, -0.2684326171875, -0.226959228515625, -0.18548583984375, -0.144012451171875, -0.1025390625, -0.061065673828125, -0.01959228515625, 0.021881103515625, 0.0633544921875, 0.104827880859375, 0.14630126953125, 0.187774658203125, 0.229248046875, 0.270721435546875, 0.31219482421875, 0.353668212890625, 0.3951416015625, 0.436614990234375, 0.47808837890625, 0.519561767578125, 0.56103515625, 0.602508544921875, 0.64398193359375, 0.685455322265625, 0.7269287109375, 0.768402099609375, 0.80987548828125, 0.851348876953125, 0.892822265625, 0.934295654296875, 0.97576904296875, 1.017242431640625, 1.0587158203125, 1.100189208984375, 1.14166259765625, 1.183135986328125, 1.224609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 9.0, 15.0, 27.0, 39.0, 52.0, 83.0, 118.0, 170.0, 294.0, 506.0, 1049.0, 2315.0, 5887.0, 20013.0, 98126.0, 737430.0, 144588.0, 25357.0, 7203.0, 2544.0, 1225.0, 635.0, 298.0, 193.0, 108.0, 74.0, 51.0, 37.0, 29.0, 12.0, 15.0, 10.0, 5.0, 4.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2353515625, -1.1905670166015625, -1.145782470703125, -1.1009979248046875, -1.05621337890625, -1.0114288330078125, -0.966644287109375, -0.9218597412109375, -0.8770751953125, -0.8322906494140625, -0.787506103515625, -0.7427215576171875, -0.69793701171875, -0.6531524658203125, -0.608367919921875, -0.5635833740234375, -0.518798828125, -0.4740142822265625, -0.429229736328125, -0.3844451904296875, -0.33966064453125, -0.2948760986328125, -0.250091552734375, -0.2053070068359375, -0.1605224609375, -0.1157379150390625, -0.070953369140625, -0.0261688232421875, 0.01861572265625, 0.0634002685546875, 0.108184814453125, 0.1529693603515625, 0.19775390625, 0.2425384521484375, 0.287322998046875, 0.3321075439453125, 0.37689208984375, 0.4216766357421875, 0.466461181640625, 0.5112457275390625, 0.5560302734375, 0.6008148193359375, 0.645599365234375, 0.6903839111328125, 0.73516845703125, 0.7799530029296875, 0.824737548828125, 0.8695220947265625, 0.914306640625, 0.9590911865234375, 1.003875732421875, 1.0486602783203125, 1.09344482421875, 1.1382293701171875, 1.183013916015625, 1.2277984619140625, 1.2725830078125, 1.3173675537109375, 1.362152099609375, 1.4069366455078125, 1.45172119140625, 1.4965057373046875, 1.541290283203125, 1.5860748291015625, 1.630859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 7.0, 10.0, 18.0, 10.0, 11.0, 26.0, 19.0, 49.0, 139.0, 353.0, 186.0, 70.0, 41.0, 16.0, 16.0, 9.0, 7.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00025177001953125, -0.00024109333753585815, -0.0002304166555404663, -0.00021973997354507446, -0.00020906329154968262, -0.00019838660955429077, -0.00018770992755889893, -0.00017703324556350708, -0.00016635656356811523, -0.0001556798815727234, -0.00014500319957733154, -0.0001343265175819397, -0.00012364983558654785, -0.000112973153591156, -0.00010229647159576416, -9.161978960037231e-05, -8.094310760498047e-05, -7.026642560958862e-05, -5.958974361419678e-05, -4.891306161880493e-05, -3.8236379623413086e-05, -2.755969762802124e-05, -1.6883015632629395e-05, -6.206333637237549e-06, 4.470348358154297e-06, 1.5147030353546143e-05, 2.5823712348937988e-05, 3.6500394344329834e-05, 4.717707633972168e-05, 5.7853758335113525e-05, 6.853044033050537e-05, 7.920712232589722e-05, 8.988380432128906e-05, 0.00010056048631668091, 0.00011123716831207275, 0.0001219138503074646, 0.00013259053230285645, 0.0001432672142982483, 0.00015394389629364014, 0.00016462057828903198, 0.00017529726028442383, 0.00018597394227981567, 0.00019665062427520752, 0.00020732730627059937, 0.0002180039882659912, 0.00022868067026138306, 0.0002393573522567749, 0.00025003403425216675, 0.0002607107162475586, 0.00027138739824295044, 0.0002820640802383423, 0.00029274076223373413, 0.000303417444229126, 0.0003140941262245178, 0.00032477080821990967, 0.0003354474902153015, 0.00034612417221069336, 0.0003568008542060852, 0.00036747753620147705, 0.0003781542181968689, 0.00038883090019226074, 0.0003995075821876526, 0.00041018426418304443, 0.0004208609461784363, 0.0004315376281738281]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 8.0, 17.0, 21.0, 21.0, 44.0, 53.0, 123.0, 172.0, 304.0, 604.0, 1279.0, 3312.0, 9837.0, 38258.0, 388444.0, 542189.0, 45728.0, 11570.0, 3696.0, 1382.0, 661.0, 324.0, 216.0, 108.0, 67.0, 43.0, 24.0, 18.0, 12.0, 4.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.729949951171875, -1.68060302734375, -1.631256103515625, -1.5819091796875, -1.532562255859375, -1.48321533203125, -1.433868408203125, -1.384521484375, -1.335174560546875, -1.28582763671875, -1.236480712890625, -1.1871337890625, -1.137786865234375, -1.08843994140625, -1.039093017578125, -0.98974609375, -0.940399169921875, -0.89105224609375, -0.841705322265625, -0.7923583984375, -0.743011474609375, -0.69366455078125, -0.644317626953125, -0.594970703125, -0.545623779296875, -0.49627685546875, -0.446929931640625, -0.3975830078125, -0.348236083984375, -0.29888916015625, -0.249542236328125, -0.2001953125, -0.150848388671875, -0.10150146484375, -0.052154541015625, -0.0028076171875, 0.046539306640625, 0.09588623046875, 0.145233154296875, 0.194580078125, 0.243927001953125, 0.29327392578125, 0.342620849609375, 0.3919677734375, 0.441314697265625, 0.49066162109375, 0.540008544921875, 0.58935546875, 0.638702392578125, 0.68804931640625, 0.737396240234375, 0.7867431640625, 0.836090087890625, 0.88543701171875, 0.934783935546875, 0.984130859375, 1.033477783203125, 1.08282470703125, 1.132171630859375, 1.1815185546875, 1.230865478515625, 1.28021240234375, 1.329559326171875, 1.37890625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 11.0, 11.0, 11.0, 15.0, 32.0, 35.0, 57.0, 101.0, 161.0, 164.0, 140.0, 93.0, 37.0, 17.0, 17.0, 18.0, 10.0, 11.0, 13.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.4873046875, -1.4513168334960938, -1.4153289794921875, -1.3793411254882812, -1.343353271484375, -1.3073654174804688, -1.2713775634765625, -1.2353897094726562, -1.19940185546875, -1.1634140014648438, -1.1274261474609375, -1.0914382934570312, -1.055450439453125, -1.0194625854492188, -0.9834747314453125, -0.9474868774414062, -0.9114990234375, -0.8755111694335938, -0.8395233154296875, -0.8035354614257812, -0.767547607421875, -0.7315597534179688, -0.6955718994140625, -0.6595840454101562, -0.62359619140625, -0.5876083374023438, -0.5516204833984375, -0.5156326293945312, -0.479644775390625, -0.44365692138671875, -0.4076690673828125, -0.37168121337890625, -0.335693359375, -0.29970550537109375, -0.2637176513671875, -0.22772979736328125, -0.191741943359375, -0.15575408935546875, -0.1197662353515625, -0.08377838134765625, -0.04779052734375, -0.01180267333984375, 0.0241851806640625, 0.06017303466796875, 0.096160888671875, 0.13214874267578125, 0.1681365966796875, 0.20412445068359375, 0.2401123046875, 0.27610015869140625, 0.3120880126953125, 0.34807586669921875, 0.384063720703125, 0.42005157470703125, 0.4560394287109375, 0.49202728271484375, 0.52801513671875, 0.5640029907226562, 0.5999908447265625, 0.6359786987304688, 0.671966552734375, 0.7079544067382812, 0.7439422607421875, 0.7799301147460938, 0.81591796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 12.0, 24.0, 47.0, 86.0, 121.0, 149.0, 160.0, 142.0, 106.0, 72.0, 40.0, 25.0, 8.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.285001754760742, -25.67831039428711, -25.07162094116211, -24.46493148803711, -23.858240127563477, -23.251548767089844, -22.644859313964844, -22.038169860839844, -21.43147850036621, -20.824787139892578, -20.218097686767578, -19.611408233642578, -19.004716873168945, -18.398025512695312, -17.791336059570312, -17.184646606445312, -16.57795524597168, -15.971264839172363, -15.364574432373047, -14.75788402557373, -14.151193618774414, -13.544503211975098, -12.937812805175781, -12.331122398376465, -11.724431991577148, -11.117741584777832, -10.511051177978516, -9.9043607711792, -9.297670364379883, -8.690979957580566, -8.08428955078125, -7.477599143981934, -6.87091064453125, -6.264220237731934, -5.657529830932617, -5.050839424133301, -4.444149017333984, -3.837458610534668, -3.2307682037353516, -2.624077796936035, -2.0173873901367188, -1.4106969833374023, -0.8040065765380859, -0.19731616973876953, 0.4093742370605469, 1.0160646438598633, 1.6227550506591797, 2.229445457458496, 2.8361358642578125, 3.442826271057129, 4.049516677856445, 4.656207084655762, 5.262897491455078, 5.8695878982543945, 6.476278305053711, 7.082968711853027, 7.689659118652344, 8.29634952545166, 8.903039932250977, 9.509730339050293, 10.11642074584961, 10.723111152648926, 11.329801559448242, 11.936491966247559, 12.543182373046875]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 9.0, 7.0, 4.0, 8.0, 14.0, 20.0, 18.0, 19.0, 34.0, 27.0, 27.0, 23.0, 40.0, 19.0, 44.0, 38.0, 41.0, 45.0, 45.0, 36.0, 36.0, 35.0, 37.0, 36.0, 42.0, 23.0, 34.0, 28.0, 29.0, 25.0, 24.0, 11.0, 15.0, 17.0, 9.0, 15.0, 9.0, 8.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.608931064605713, -6.402459621429443, -6.195988178253174, -5.989516735076904, -5.783045291900635, -5.576573848724365, -5.370102405548096, -5.163630962371826, -4.957159519195557, -4.750688076019287, -4.544216632843018, -4.337745189666748, -4.1312737464904785, -3.924802303314209, -3.7183308601379395, -3.51185941696167, -3.3053879737854004, -3.098916530609131, -2.8924450874328613, -2.685973644256592, -2.4795022010803223, -2.2730307579040527, -2.066559314727783, -1.8600878715515137, -1.6536164283752441, -1.4471449851989746, -1.240673542022705, -1.0342020988464355, -0.827730655670166, -0.6212592124938965, -0.41478776931762695, -0.20831632614135742, -0.0018453598022460938, 0.20462608337402344, 0.41109752655029297, 0.6175689697265625, 0.824040412902832, 1.0305118560791016, 1.236983299255371, 1.4434547424316406, 1.6499261856079102, 1.8563976287841797, 2.062869071960449, 2.2693405151367188, 2.4758119583129883, 2.682283401489258, 2.8887548446655273, 3.095226287841797, 3.3016977310180664, 3.508169174194336, 3.7146406173706055, 3.921112060546875, 4.1275835037231445, 4.334054946899414, 4.540526390075684, 4.746997833251953, 4.953469276428223, 5.159940719604492, 5.366412162780762, 5.572883605957031, 5.779355049133301, 5.98582649230957, 6.19229793548584, 6.398769378662109, 6.605240821838379]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 11.0, 13.0, 17.0, 18.0, 21.0, 39.0, 64.0, 73.0, 121.0, 164.0, 270.0, 423.0, 697.0, 1373.0, 2965.0, 7949.0, 28749.0, 277955.0, 3763264.0, 84298.0, 15932.0, 5110.0, 2139.0, 1099.0, 580.0, 336.0, 193.0, 115.0, 98.0, 56.0, 38.0, 16.0, 18.0, 13.0, 14.0, 7.0, 3.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3125, -6.1385498046875, -5.964599609375, -5.7906494140625, -5.61669921875, -5.4427490234375, -5.268798828125, -5.0948486328125, -4.9208984375, -4.7469482421875, -4.572998046875, -4.3990478515625, -4.22509765625, -4.0511474609375, -3.877197265625, -3.7032470703125, -3.529296875, -3.3553466796875, -3.181396484375, -3.0074462890625, -2.83349609375, -2.6595458984375, -2.485595703125, -2.3116455078125, -2.1376953125, -1.9637451171875, -1.789794921875, -1.6158447265625, -1.44189453125, -1.2679443359375, -1.093994140625, -0.9200439453125, -0.74609375, -0.5721435546875, -0.398193359375, -0.2242431640625, -0.05029296875, 0.1236572265625, 0.297607421875, 0.4715576171875, 0.6455078125, 0.8194580078125, 0.993408203125, 1.1673583984375, 1.34130859375, 1.5152587890625, 1.689208984375, 1.8631591796875, 2.037109375, 2.2110595703125, 2.385009765625, 2.5589599609375, 2.73291015625, 2.9068603515625, 3.080810546875, 3.2547607421875, 3.4287109375, 3.6026611328125, 3.776611328125, 3.9505615234375, 4.12451171875, 4.2984619140625, 4.472412109375, 4.6463623046875, 4.8203125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 11.0, 18.0, 32.0, 31.0, 32.0, 42.0, 57.0, 61.0, 68.0, 80.0, 83.0, 76.0, 70.0, 58.0, 64.0, 50.0, 41.0, 31.0, 27.0, 21.0, 15.0, 5.0, 13.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.79345703125, -0.7735137939453125, -0.753570556640625, -0.7336273193359375, -0.71368408203125, -0.6937408447265625, -0.673797607421875, -0.6538543701171875, -0.6339111328125, -0.6139678955078125, -0.594024658203125, -0.5740814208984375, -0.55413818359375, -0.5341949462890625, -0.514251708984375, -0.4943084716796875, -0.474365234375, -0.4544219970703125, -0.434478759765625, -0.4145355224609375, -0.39459228515625, -0.3746490478515625, -0.354705810546875, -0.3347625732421875, -0.3148193359375, -0.2948760986328125, -0.274932861328125, -0.2549896240234375, -0.23504638671875, -0.2151031494140625, -0.195159912109375, -0.1752166748046875, -0.1552734375, -0.1353302001953125, -0.115386962890625, -0.0954437255859375, -0.07550048828125, -0.0555572509765625, -0.035614013671875, -0.0156707763671875, 0.0042724609375, 0.0242156982421875, 0.044158935546875, 0.0641021728515625, 0.08404541015625, 0.1039886474609375, 0.123931884765625, 0.1438751220703125, 0.163818359375, 0.1837615966796875, 0.203704833984375, 0.2236480712890625, 0.24359130859375, 0.2635345458984375, 0.283477783203125, 0.3034210205078125, 0.3233642578125, 0.3433074951171875, 0.363250732421875, 0.3831939697265625, 0.40313720703125, 0.4230804443359375, 0.443023681640625, 0.4629669189453125, 0.48291015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 10.0, 6.0, 13.0, 13.0, 12.0, 26.0, 27.0, 55.0, 61.0, 71.0, 115.0, 186.0, 236.0, 489.0, 957.0, 2785.0, 10662.0, 73824.0, 3807163.0, 268394.0, 21614.0, 4557.0, 1399.0, 612.0, 344.0, 198.0, 111.0, 92.0, 68.0, 39.0, 33.0, 35.0, 14.0, 17.0, 9.0, 6.0, 12.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.11004638671875, -5.9232177734375, -5.73638916015625, -5.549560546875, -5.36273193359375, -5.1759033203125, -4.98907470703125, -4.80224609375, -4.61541748046875, -4.4285888671875, -4.24176025390625, -4.054931640625, -3.86810302734375, -3.6812744140625, -3.49444580078125, -3.3076171875, -3.12078857421875, -2.9339599609375, -2.74713134765625, -2.560302734375, -2.37347412109375, -2.1866455078125, -1.99981689453125, -1.81298828125, -1.62615966796875, -1.4393310546875, -1.25250244140625, -1.065673828125, -0.87884521484375, -0.6920166015625, -0.50518798828125, -0.318359375, -0.13153076171875, 0.0552978515625, 0.24212646484375, 0.428955078125, 0.61578369140625, 0.8026123046875, 0.98944091796875, 1.17626953125, 1.36309814453125, 1.5499267578125, 1.73675537109375, 1.923583984375, 2.11041259765625, 2.2972412109375, 2.48406982421875, 2.6708984375, 2.85772705078125, 3.0445556640625, 3.23138427734375, 3.418212890625, 3.60504150390625, 3.7918701171875, 3.97869873046875, 4.16552734375, 4.35235595703125, 4.5391845703125, 4.72601318359375, 4.912841796875, 5.09967041015625, 5.2864990234375, 5.47332763671875, 5.66015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 7.0, 5.0, 11.0, 17.0, 24.0, 32.0, 49.0, 135.0, 271.0, 903.0, 1891.0, 350.0, 158.0, 74.0, 41.0, 26.0, 27.0, 18.0, 11.0, 10.0, 6.0, 5.0, 1.0, 4.0, 2.0], "bins": [-2.365234375, -2.3171463012695312, -2.2690582275390625, -2.2209701538085938, -2.172882080078125, -2.1247940063476562, -2.0767059326171875, -2.0286178588867188, -1.98052978515625, -1.9324417114257812, -1.8843536376953125, -1.8362655639648438, -1.788177490234375, -1.7400894165039062, -1.6920013427734375, -1.6439132690429688, -1.5958251953125, -1.5477371215820312, -1.4996490478515625, -1.4515609741210938, -1.403472900390625, -1.3553848266601562, -1.3072967529296875, -1.2592086791992188, -1.21112060546875, -1.1630325317382812, -1.1149444580078125, -1.0668563842773438, -1.018768310546875, -0.9706802368164062, -0.9225921630859375, -0.8745040893554688, -0.826416015625, -0.7783279418945312, -0.7302398681640625, -0.6821517944335938, -0.634063720703125, -0.5859756469726562, -0.5378875732421875, -0.48979949951171875, -0.44171142578125, -0.39362335205078125, -0.3455352783203125, -0.29744720458984375, -0.249359130859375, -0.20127105712890625, -0.1531829833984375, -0.10509490966796875, -0.0570068359375, -0.00891876220703125, 0.0391693115234375, 0.08725738525390625, 0.135345458984375, 0.18343353271484375, 0.2315216064453125, 0.27960968017578125, 0.32769775390625, 0.37578582763671875, 0.4238739013671875, 0.47196197509765625, 0.520050048828125, 0.5681381225585938, 0.6162261962890625, 0.6643142700195312, 0.71240234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 12.0, 16.0, 23.0, 69.0, 83.0, 164.0, 194.0, 168.0, 119.0, 63.0, 30.0, 25.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.199235916137695, -9.905003547668457, -9.610770225524902, -9.316537857055664, -9.022305488586426, -8.728072166442871, -8.433839797973633, -8.139606475830078, -7.84537410736084, -7.551141262054443, -7.256908893585205, -6.962676048278809, -6.668443202972412, -6.374210357666016, -6.079977989196777, -5.785745143890381, -5.491512775421143, -5.197279930114746, -4.903047561645508, -4.608814716339111, -4.314581871032715, -4.020349502563477, -3.72611665725708, -3.4318838119506836, -3.137651205062866, -2.843418598175049, -2.5491857528686523, -2.254953145980835, -1.960720419883728, -1.666487693786621, -1.3722550868988037, -1.0780222415924072, -0.7837896347045898, -0.4895569384098053, -0.19532424211502075, 0.0989084243774414, 0.39314115047454834, 0.6873738765716553, 0.9816064834594727, 1.2758393287658691, 1.5700719356536865, 1.8643046617507935, 2.1585373878479004, 2.4527699947357178, 2.747002601623535, 3.0412354469299316, 3.335468053817749, 3.6297008991241455, 3.923933506011963, 4.218166351318359, 4.512398719787598, 4.806631565093994, 5.100864410400391, 5.395096778869629, 5.689329624176025, 5.983562469482422, 6.27779483795166, 6.572027683258057, 6.866260051727295, 7.160492897033691, 7.454725742340088, 7.748958587646484, 8.043190956115723, 8.337423324584961, 8.631656646728516]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 6.0, 21.0, 22.0, 32.0, 32.0, 43.0, 53.0, 54.0, 57.0, 58.0, 65.0, 73.0, 67.0, 65.0, 82.0, 73.0, 38.0, 34.0, 25.0, 24.0, 24.0, 16.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.457943916320801, -5.303596019744873, -5.149248123168945, -4.994900226593018, -4.84055233001709, -4.68620491027832, -4.531857013702393, -4.377509117126465, -4.223161220550537, -4.068813323974609, -3.9144654273986816, -3.760117769241333, -3.6057698726654053, -3.4514219760894775, -3.297074317932129, -3.142726421356201, -2.9883785247802734, -2.8340306282043457, -2.679682731628418, -2.5253350734710693, -2.3709871768951416, -2.216639280319214, -2.0622916221618652, -1.9079437255859375, -1.7535958290100098, -1.599247932434082, -1.4449001550674438, -1.2905523777008057, -1.136204481124878, -0.981856644153595, -0.827508807182312, -0.6731610298156738, -0.5188136100769043, -0.36446577310562134, -0.21011793613433838, -0.05577009916305542, 0.09857773780822754, 0.2529255747795105, 0.40727341175079346, 0.5616211891174316, 0.7159690856933594, 0.8703169226646423, 1.0246647596359253, 1.1790125370025635, 1.3333604335784912, 1.487708330154419, 1.6420561075210571, 1.7964038848876953, 1.950751781463623, 2.105099678039551, 2.2594475746154785, 2.413795232772827, 2.568143129348755, 2.7224910259246826, 2.8768386840820312, 3.031186580657959, 3.1855344772338867, 3.3398823738098145, 3.494230270385742, 3.648577928543091, 3.8029258251190186, 3.9572737216949463, 4.111621379852295, 4.265969276428223, 4.42031717300415]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 3.0, 9.0, 11.0, 15.0, 20.0, 30.0, 52.0, 65.0, 84.0, 112.0, 177.0, 290.0, 420.0, 764.0, 1410.0, 2683.0, 5984.0, 16258.0, 50038.0, 174750.0, 453084.0, 237980.0, 68496.0, 20990.0, 7628.0, 3247.0, 1637.0, 872.0, 462.0, 305.0, 206.0, 122.0, 86.0, 63.0, 62.0, 30.0, 25.0, 19.0, 13.0, 11.0, 10.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.490447998046875, -2.39691162109375, -2.303375244140625, -2.2098388671875, -2.116302490234375, -2.02276611328125, -1.929229736328125, -1.835693359375, -1.742156982421875, -1.64862060546875, -1.555084228515625, -1.4615478515625, -1.368011474609375, -1.27447509765625, -1.180938720703125, -1.08740234375, -0.993865966796875, -0.90032958984375, -0.806793212890625, -0.7132568359375, -0.619720458984375, -0.52618408203125, -0.432647705078125, -0.339111328125, -0.245574951171875, -0.15203857421875, -0.058502197265625, 0.0350341796875, 0.128570556640625, 0.22210693359375, 0.315643310546875, 0.4091796875, 0.502716064453125, 0.59625244140625, 0.689788818359375, 0.7833251953125, 0.876861572265625, 0.97039794921875, 1.063934326171875, 1.157470703125, 1.251007080078125, 1.34454345703125, 1.438079833984375, 1.5316162109375, 1.625152587890625, 1.71868896484375, 1.812225341796875, 1.90576171875, 1.999298095703125, 2.09283447265625, 2.186370849609375, 2.2799072265625, 2.373443603515625, 2.46697998046875, 2.560516357421875, 2.654052734375, 2.747589111328125, 2.84112548828125, 2.934661865234375, 3.0281982421875, 3.121734619140625, 3.21527099609375, 3.308807373046875, 3.40234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 6.0, 13.0, 13.0, 23.0, 15.0, 43.0, 38.0, 59.0, 74.0, 73.0, 72.0, 63.0, 74.0, 72.0, 67.0, 55.0, 58.0, 35.0, 47.0, 24.0, 27.0, 14.0, 10.0, 13.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7669601440429688, -0.7463226318359375, -0.7256851196289062, -0.705047607421875, -0.6844100952148438, -0.6637725830078125, -0.6431350708007812, -0.62249755859375, -0.6018600463867188, -0.5812225341796875, -0.5605850219726562, -0.539947509765625, -0.5193099975585938, -0.4986724853515625, -0.47803497314453125, -0.4573974609375, -0.43675994873046875, -0.4161224365234375, -0.39548492431640625, -0.374847412109375, -0.35420989990234375, -0.3335723876953125, -0.31293487548828125, -0.29229736328125, -0.27165985107421875, -0.2510223388671875, -0.23038482666015625, -0.209747314453125, -0.18910980224609375, -0.1684722900390625, -0.14783477783203125, -0.127197265625, -0.10655975341796875, -0.0859222412109375, -0.06528472900390625, -0.044647216796875, -0.02400970458984375, -0.0033721923828125, 0.01726531982421875, 0.03790283203125, 0.05854034423828125, 0.0791778564453125, 0.09981536865234375, 0.120452880859375, 0.14109039306640625, 0.1617279052734375, 0.18236541748046875, 0.2030029296875, 0.22364044189453125, 0.2442779541015625, 0.26491546630859375, 0.285552978515625, 0.30619049072265625, 0.3268280029296875, 0.34746551513671875, 0.36810302734375, 0.38874053955078125, 0.4093780517578125, 0.43001556396484375, 0.450653076171875, 0.47129058837890625, 0.4919281005859375, 0.5125656127929688, 0.533203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 5.0, 5.0, 14.0, 13.0, 14.0, 22.0, 21.0, 40.0, 64.0, 62.0, 98.0, 150.0, 217.0, 359.0, 665.0, 1403.0, 4481.0, 19836.0, 118342.0, 555544.0, 285341.0, 48058.0, 9083.0, 2390.0, 968.0, 472.0, 240.0, 201.0, 110.0, 84.0, 66.0, 41.0, 36.0, 25.0, 16.0, 13.0, 9.0, 7.0, 11.0, 5.0, 7.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.20703125, -3.109100341796875, -3.01116943359375, -2.913238525390625, -2.8153076171875, -2.717376708984375, -2.61944580078125, -2.521514892578125, -2.423583984375, -2.325653076171875, -2.22772216796875, -2.129791259765625, -2.0318603515625, -1.933929443359375, -1.83599853515625, -1.738067626953125, -1.64013671875, -1.542205810546875, -1.44427490234375, -1.346343994140625, -1.2484130859375, -1.150482177734375, -1.05255126953125, -0.954620361328125, -0.856689453125, -0.758758544921875, -0.66082763671875, -0.562896728515625, -0.4649658203125, -0.367034912109375, -0.26910400390625, -0.171173095703125, -0.0732421875, 0.024688720703125, 0.12261962890625, 0.220550537109375, 0.3184814453125, 0.416412353515625, 0.51434326171875, 0.612274169921875, 0.710205078125, 0.808135986328125, 0.90606689453125, 1.003997802734375, 1.1019287109375, 1.199859619140625, 1.29779052734375, 1.395721435546875, 1.49365234375, 1.591583251953125, 1.68951416015625, 1.787445068359375, 1.8853759765625, 1.983306884765625, 2.08123779296875, 2.179168701171875, 2.277099609375, 2.375030517578125, 2.47296142578125, 2.570892333984375, 2.6688232421875, 2.766754150390625, 2.86468505859375, 2.962615966796875, 3.060546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 7.0, 11.0, 7.0, 11.0, 21.0, 26.0, 26.0, 40.0, 38.0, 42.0, 28.0, 55.0, 42.0, 50.0, 43.0, 46.0, 39.0, 39.0, 55.0, 50.0, 43.0, 53.0, 36.0, 27.0, 36.0, 21.0, 29.0, 12.0, 10.0, 8.0, 9.0, 9.0, 6.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8447265625, -1.7843475341796875, -1.723968505859375, -1.6635894775390625, -1.60321044921875, -1.5428314208984375, -1.482452392578125, -1.4220733642578125, -1.3616943359375, -1.3013153076171875, -1.240936279296875, -1.1805572509765625, -1.12017822265625, -1.0597991943359375, -0.999420166015625, -0.9390411376953125, -0.878662109375, -0.8182830810546875, -0.757904052734375, -0.6975250244140625, -0.63714599609375, -0.5767669677734375, -0.516387939453125, -0.4560089111328125, -0.3956298828125, -0.3352508544921875, -0.274871826171875, -0.2144927978515625, -0.15411376953125, -0.0937347412109375, -0.033355712890625, 0.0270233154296875, 0.08740234375, 0.1477813720703125, 0.208160400390625, 0.2685394287109375, 0.32891845703125, 0.3892974853515625, 0.449676513671875, 0.5100555419921875, 0.5704345703125, 0.6308135986328125, 0.691192626953125, 0.7515716552734375, 0.81195068359375, 0.8723297119140625, 0.932708740234375, 0.9930877685546875, 1.053466796875, 1.1138458251953125, 1.174224853515625, 1.2346038818359375, 1.29498291015625, 1.3553619384765625, 1.415740966796875, 1.4761199951171875, 1.5364990234375, 1.5968780517578125, 1.657257080078125, 1.7176361083984375, 1.77801513671875, 1.8383941650390625, 1.898773193359375, 1.9591522216796875, 2.01953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 10.0, 9.0, 18.0, 16.0, 22.0, 42.0, 55.0, 85.0, 159.0, 223.0, 392.0, 749.0, 1358.0, 2904.0, 6411.0, 16392.0, 49720.0, 189400.0, 582903.0, 136117.0, 37934.0, 13161.0, 5344.0, 2342.0, 1248.0, 623.0, 349.0, 202.0, 129.0, 70.0, 48.0, 35.0, 23.0, 12.0, 14.0, 9.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.599609375, -1.5556488037109375, -1.511688232421875, -1.4677276611328125, -1.42376708984375, -1.3798065185546875, -1.335845947265625, -1.2918853759765625, -1.2479248046875, -1.2039642333984375, -1.160003662109375, -1.1160430908203125, -1.07208251953125, -1.0281219482421875, -0.984161376953125, -0.9402008056640625, -0.896240234375, -0.8522796630859375, -0.808319091796875, -0.7643585205078125, -0.72039794921875, -0.6764373779296875, -0.632476806640625, -0.5885162353515625, -0.5445556640625, -0.5005950927734375, -0.456634521484375, -0.4126739501953125, -0.36871337890625, -0.3247528076171875, -0.280792236328125, -0.2368316650390625, -0.19287109375, -0.1489105224609375, -0.104949951171875, -0.0609893798828125, -0.01702880859375, 0.0269317626953125, 0.070892333984375, 0.1148529052734375, 0.1588134765625, 0.2027740478515625, 0.246734619140625, 0.2906951904296875, 0.33465576171875, 0.3786163330078125, 0.422576904296875, 0.4665374755859375, 0.510498046875, 0.5544586181640625, 0.598419189453125, 0.6423797607421875, 0.68634033203125, 0.7303009033203125, 0.774261474609375, 0.8182220458984375, 0.8621826171875, 0.9061431884765625, 0.950103759765625, 0.9940643310546875, 1.03802490234375, 1.0819854736328125, 1.125946044921875, 1.1699066162109375, 1.2138671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 1.0, 4.0, 7.0, 7.0, 8.0, 6.0, 21.0, 10.0, 32.0, 21.0, 27.0, 31.0, 43.0, 45.0, 85.0, 119.0, 141.0, 74.0, 80.0, 40.0, 34.0, 38.0, 24.0, 26.0, 20.0, 14.0, 13.0, 4.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00021791458129882812, -0.00021151266992092133, -0.00020511075854301453, -0.00019870884716510773, -0.00019230693578720093, -0.00018590502440929413, -0.00017950311303138733, -0.00017310120165348053, -0.00016669929027557373, -0.00016029737889766693, -0.00015389546751976013, -0.00014749355614185333, -0.00014109164476394653, -0.00013468973338603973, -0.00012828782200813293, -0.00012188591063022614, -0.00011548399925231934, -0.00010908208787441254, -0.00010268017649650574, -9.627826511859894e-05, -8.987635374069214e-05, -8.347444236278534e-05, -7.707253098487854e-05, -7.067061960697174e-05, -6.426870822906494e-05, -5.786679685115814e-05, -5.146488547325134e-05, -4.5062974095344543e-05, -3.8661062717437744e-05, -3.2259151339530945e-05, -2.5857239961624146e-05, -1.9455328583717346e-05, -1.3053417205810547e-05, -6.6515058279037476e-06, -2.4959444999694824e-07, 6.152316927909851e-06, 1.255422830581665e-05, 1.895613968372345e-05, 2.535805106163025e-05, 3.175996243953705e-05, 3.816187381744385e-05, 4.456378519535065e-05, 5.0965696573257446e-05, 5.7367607951164246e-05, 6.376951932907104e-05, 7.017143070697784e-05, 7.657334208488464e-05, 8.297525346279144e-05, 8.937716484069824e-05, 9.577907621860504e-05, 0.00010218098759651184, 0.00010858289897441864, 0.00011498481035232544, 0.00012138672173023224, 0.00012778863310813904, 0.00013419054448604584, 0.00014059245586395264, 0.00014699436724185944, 0.00015339627861976624, 0.00015979818999767303, 0.00016620010137557983, 0.00017260201275348663, 0.00017900392413139343, 0.00018540583550930023, 0.00019180774688720703]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 13.0, 15.0, 22.0, 51.0, 70.0, 124.0, 236.0, 376.0, 913.0, 2495.0, 10201.0, 82717.0, 820827.0, 113016.0, 12574.0, 2951.0, 935.0, 447.0, 225.0, 106.0, 67.0, 51.0, 36.0, 9.0, 16.0, 10.0, 8.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.287109375, -3.182952880859375, -3.07879638671875, -2.974639892578125, -2.8704833984375, -2.766326904296875, -2.66217041015625, -2.558013916015625, -2.453857421875, -2.349700927734375, -2.24554443359375, -2.141387939453125, -2.0372314453125, -1.933074951171875, -1.82891845703125, -1.724761962890625, -1.62060546875, -1.516448974609375, -1.41229248046875, -1.308135986328125, -1.2039794921875, -1.099822998046875, -0.99566650390625, -0.891510009765625, -0.787353515625, -0.683197021484375, -0.57904052734375, -0.474884033203125, -0.3707275390625, -0.266571044921875, -0.16241455078125, -0.058258056640625, 0.0458984375, 0.150054931640625, 0.25421142578125, 0.358367919921875, 0.4625244140625, 0.566680908203125, 0.67083740234375, 0.774993896484375, 0.879150390625, 0.983306884765625, 1.08746337890625, 1.191619873046875, 1.2957763671875, 1.399932861328125, 1.50408935546875, 1.608245849609375, 1.71240234375, 1.816558837890625, 1.92071533203125, 2.024871826171875, 2.1290283203125, 2.233184814453125, 2.33734130859375, 2.441497802734375, 2.545654296875, 2.649810791015625, 2.75396728515625, 2.858123779296875, 2.9622802734375, 3.066436767578125, 3.17059326171875, 3.274749755859375, 3.37890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 4.0, 9.0, 9.0, 12.0, 17.0, 17.0, 11.0, 39.0, 33.0, 57.0, 90.0, 168.0, 169.0, 107.0, 68.0, 51.0, 37.0, 18.0, 21.0, 15.0, 11.0, 9.0, 8.0, 3.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.5775299072265625, -2.516387939453125, -2.4552459716796875, -2.39410400390625, -2.3329620361328125, -2.271820068359375, -2.2106781005859375, -2.1495361328125, -2.0883941650390625, -2.027252197265625, -1.9661102294921875, -1.90496826171875, -1.8438262939453125, -1.782684326171875, -1.7215423583984375, -1.660400390625, -1.5992584228515625, -1.538116455078125, -1.4769744873046875, -1.41583251953125, -1.3546905517578125, -1.293548583984375, -1.2324066162109375, -1.1712646484375, -1.1101226806640625, -1.048980712890625, -0.9878387451171875, -0.92669677734375, -0.8655548095703125, -0.804412841796875, -0.7432708740234375, -0.68212890625, -0.6209869384765625, -0.559844970703125, -0.4987030029296875, -0.43756103515625, -0.3764190673828125, -0.315277099609375, -0.2541351318359375, -0.1929931640625, -0.1318511962890625, -0.070709228515625, -0.0095672607421875, 0.05157470703125, 0.1127166748046875, 0.173858642578125, 0.2350006103515625, 0.296142578125, 0.3572845458984375, 0.418426513671875, 0.4795684814453125, 0.54071044921875, 0.6018524169921875, 0.662994384765625, 0.7241363525390625, 0.7852783203125, 0.8464202880859375, 0.907562255859375, 0.9687042236328125, 1.02984619140625, 1.0909881591796875, 1.152130126953125, 1.2132720947265625, 1.2744140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 25.0, 43.0, 94.0, 203.0, 232.0, 180.0, 123.0, 59.0, 20.0, 8.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.7812557220459, -15.626142501831055, -14.471028327941895, -13.315914154052734, -12.16080093383789, -11.005687713623047, -9.850573539733887, -8.695459365844727, -7.540346145629883, -6.385232448577881, -5.230118751525879, -4.075005054473877, -2.919891357421875, -1.764777660369873, -0.6096639633178711, 0.5454502105712891, 1.7005634307861328, 2.8556771278381348, 4.010790824890137, 5.165904521942139, 6.321018218994141, 7.476131916046143, 8.631245613098145, 9.786359786987305, 10.941473007202148, 12.096586227416992, 13.251700401306152, 14.406814575195312, 15.561927795410156, 16.717041015625, 17.872154235839844, 19.02726936340332, 20.182384490966797, 21.33749771118164, 22.492610931396484, 23.64772605895996, 24.802839279174805, 25.95795249938965, 27.113067626953125, 28.26818084716797, 29.423294067382812, 30.578407287597656, 31.7335205078125, 32.888633728027344, 34.04374694824219, 35.1988639831543, 36.35397720336914, 37.509090423583984, 38.66420364379883, 39.81931686401367, 40.974430084228516, 42.12954330444336, 43.28466033935547, 44.43977355957031, 45.594886779785156, 46.75, 47.905113220214844, 49.06022644042969, 50.21533966064453, 51.370452880859375, 52.52556610107422, 53.68068313598633, 54.83579635620117, 55.990909576416016, 57.14602279663086]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 6.0, 3.0, 2.0, 6.0, 12.0, 13.0, 15.0, 16.0, 19.0, 20.0, 20.0, 31.0, 30.0, 27.0, 31.0, 41.0, 34.0, 34.0, 47.0, 47.0, 46.0, 40.0, 38.0, 40.0, 49.0, 32.0, 28.0, 41.0, 36.0, 28.0, 30.0, 20.0, 18.0, 12.0, 19.0, 16.0, 12.0, 13.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.910199165344238, -7.616495609283447, -7.322792053222656, -7.029088973999023, -6.735385417938232, -6.441681861877441, -6.147978782653809, -5.854275226593018, -5.560571670532227, -5.2668681144714355, -4.9731645584106445, -4.679461479187012, -4.385757923126221, -4.09205436706543, -3.7983510494232178, -3.504647731781006, -3.210944175720215, -2.917240619659424, -2.623537302017212, -2.329833984375, -2.036130428314209, -1.7424269914627075, -1.448723554611206, -1.1550202369689941, -0.8613166809082031, -0.5676132440567017, -0.2739098072052002, 0.01979362964630127, 0.31349706649780273, 0.6072005033493042, 0.9009039402008057, 1.1946072578430176, 1.488311767578125, 1.7820152044296265, 2.075718641281128, 2.36942195892334, 2.663125514984131, 2.956829071044922, 3.250532388687134, 3.5442357063293457, 3.8379392623901367, 4.131642818450928, 4.425346374511719, 4.719049453735352, 5.012753009796143, 5.306456565856934, 5.600159645080566, 5.893863201141357, 6.187566757202148, 6.4812703132629395, 6.7749738693237305, 7.068676948547363, 7.362380504608154, 7.656084060668945, 7.949787139892578, 8.243490219116211, 8.53719425201416, 8.830897331237793, 9.124601364135742, 9.418304443359375, 9.712007522583008, 10.005711555480957, 10.29941463470459, 10.593118667602539, 10.886821746826172]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0, 7.0, 7.0, 9.0, 4.0, 13.0, 7.0, 25.0, 15.0, 25.0, 50.0, 64.0, 86.0, 127.0, 199.0, 310.0, 558.0, 1049.0, 2350.0, 6409.0, 24992.0, 271522.0, 3765249.0, 97414.0, 15068.0, 4665.0, 1879.0, 880.0, 480.0, 287.0, 168.0, 127.0, 66.0, 40.0, 36.0, 21.0, 18.0, 18.0, 8.0, 7.0, 6.0, 0.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.390625, -6.2147216796875, -6.038818359375, -5.8629150390625, -5.68701171875, -5.5111083984375, -5.335205078125, -5.1593017578125, -4.9833984375, -4.8074951171875, -4.631591796875, -4.4556884765625, -4.27978515625, -4.1038818359375, -3.927978515625, -3.7520751953125, -3.576171875, -3.4002685546875, -3.224365234375, -3.0484619140625, -2.87255859375, -2.6966552734375, -2.520751953125, -2.3448486328125, -2.1689453125, -1.9930419921875, -1.817138671875, -1.6412353515625, -1.46533203125, -1.2894287109375, -1.113525390625, -0.9376220703125, -0.76171875, -0.5858154296875, -0.409912109375, -0.2340087890625, -0.05810546875, 0.1177978515625, 0.293701171875, 0.4696044921875, 0.6455078125, 0.8214111328125, 0.997314453125, 1.1732177734375, 1.34912109375, 1.5250244140625, 1.700927734375, 1.8768310546875, 2.052734375, 2.2286376953125, 2.404541015625, 2.5804443359375, 2.75634765625, 2.9322509765625, 3.108154296875, 3.2840576171875, 3.4599609375, 3.6358642578125, 3.811767578125, 3.9876708984375, 4.16357421875, 4.3394775390625, 4.515380859375, 4.6912841796875, 4.8671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 17.0, 14.0, 20.0, 20.0, 39.0, 36.0, 53.0, 58.0, 62.0, 63.0, 69.0, 82.0, 64.0, 69.0, 65.0, 56.0, 51.0, 29.0, 31.0, 21.0, 26.0, 14.0, 10.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.798828125, -0.7780838012695312, -0.7573394775390625, -0.7365951538085938, -0.715850830078125, -0.6951065063476562, -0.6743621826171875, -0.6536178588867188, -0.63287353515625, -0.6121292114257812, -0.5913848876953125, -0.5706405639648438, -0.549896240234375, -0.5291519165039062, -0.5084075927734375, -0.48766326904296875, -0.4669189453125, -0.44617462158203125, -0.4254302978515625, -0.40468597412109375, -0.383941650390625, -0.36319732666015625, -0.3424530029296875, -0.32170867919921875, -0.30096435546875, -0.28022003173828125, -0.2594757080078125, -0.23873138427734375, -0.217987060546875, -0.19724273681640625, -0.1764984130859375, -0.15575408935546875, -0.135009765625, -0.11426544189453125, -0.0935211181640625, -0.07277679443359375, -0.052032470703125, -0.03128814697265625, -0.0105438232421875, 0.01020050048828125, 0.03094482421875, 0.05168914794921875, 0.0724334716796875, 0.09317779541015625, 0.113922119140625, 0.13466644287109375, 0.1554107666015625, 0.17615509033203125, 0.1968994140625, 0.21764373779296875, 0.2383880615234375, 0.25913238525390625, 0.279876708984375, 0.30062103271484375, 0.3213653564453125, 0.34210968017578125, 0.36285400390625, 0.38359832763671875, 0.4043426513671875, 0.42508697509765625, 0.445831298828125, 0.46657562255859375, 0.4873199462890625, 0.5080642700195312, 0.52880859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 15.0, 20.0, 26.0, 26.0, 53.0, 70.0, 99.0, 171.0, 285.0, 413.0, 813.0, 1656.0, 3428.0, 7868.0, 20878.0, 75520.0, 702115.0, 3166686.0, 159211.0, 33724.0, 11509.0, 4817.0, 2280.0, 1086.0, 597.0, 334.0, 213.0, 119.0, 91.0, 38.0, 37.0, 25.0, 11.0, 9.0, 10.0, 4.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.142578125, -3.045013427734375, -2.94744873046875, -2.849884033203125, -2.7523193359375, -2.654754638671875, -2.55718994140625, -2.459625244140625, -2.362060546875, -2.264495849609375, -2.16693115234375, -2.069366455078125, -1.9718017578125, -1.874237060546875, -1.77667236328125, -1.679107666015625, -1.58154296875, -1.483978271484375, -1.38641357421875, -1.288848876953125, -1.1912841796875, -1.093719482421875, -0.99615478515625, -0.898590087890625, -0.801025390625, -0.703460693359375, -0.60589599609375, -0.508331298828125, -0.4107666015625, -0.313201904296875, -0.21563720703125, -0.118072509765625, -0.0205078125, 0.077056884765625, 0.17462158203125, 0.272186279296875, 0.3697509765625, 0.467315673828125, 0.56488037109375, 0.662445068359375, 0.760009765625, 0.857574462890625, 0.95513916015625, 1.052703857421875, 1.1502685546875, 1.247833251953125, 1.34539794921875, 1.442962646484375, 1.54052734375, 1.638092041015625, 1.73565673828125, 1.833221435546875, 1.9307861328125, 2.028350830078125, 2.12591552734375, 2.223480224609375, 2.321044921875, 2.418609619140625, 2.51617431640625, 2.613739013671875, 2.7113037109375, 2.808868408203125, 2.90643310546875, 3.003997802734375, 3.1015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 13.0, 9.0, 18.0, 19.0, 44.0, 43.0, 107.0, 175.0, 414.0, 1100.0, 1316.0, 350.0, 177.0, 83.0, 59.0, 38.0, 27.0, 16.0, 14.0, 5.0, 10.0, 4.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.318359375, -1.2677459716796875, -1.217132568359375, -1.1665191650390625, -1.11590576171875, -1.0652923583984375, -1.014678955078125, -0.9640655517578125, -0.9134521484375, -0.8628387451171875, -0.812225341796875, -0.7616119384765625, -0.71099853515625, -0.6603851318359375, -0.609771728515625, -0.5591583251953125, -0.508544921875, -0.4579315185546875, -0.407318115234375, -0.3567047119140625, -0.30609130859375, -0.2554779052734375, -0.204864501953125, -0.1542510986328125, -0.1036376953125, -0.0530242919921875, -0.002410888671875, 0.0482025146484375, 0.09881591796875, 0.1494293212890625, 0.200042724609375, 0.2506561279296875, 0.30126953125, 0.3518829345703125, 0.402496337890625, 0.4531097412109375, 0.50372314453125, 0.5543365478515625, 0.604949951171875, 0.6555633544921875, 0.7061767578125, 0.7567901611328125, 0.807403564453125, 0.8580169677734375, 0.90863037109375, 0.9592437744140625, 1.009857177734375, 1.0604705810546875, 1.111083984375, 1.1616973876953125, 1.212310791015625, 1.2629241943359375, 1.31353759765625, 1.3641510009765625, 1.414764404296875, 1.4653778076171875, 1.5159912109375, 1.5666046142578125, 1.617218017578125, 1.6678314208984375, 1.71844482421875, 1.7690582275390625, 1.819671630859375, 1.8702850341796875, 1.9208984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 7.0, 8.0, 18.0, 34.0, 50.0, 85.0, 147.0, 192.0, 179.0, 129.0, 75.0, 31.0, 21.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.364502906799316, -13.94583797454834, -13.527173042297363, -13.10850715637207, -12.689842224121094, -12.271177291870117, -11.85251235961914, -11.433847427368164, -11.015182495117188, -10.596517562866211, -10.177852630615234, -9.759187698364258, -9.340521812438965, -8.921856880187988, -8.503191947937012, -8.084527015686035, -7.6658616065979, -7.247196674346924, -6.828531265258789, -6.4098663330078125, -5.991201400756836, -5.572536468505859, -5.153871059417725, -4.735206127166748, -4.316540718078613, -3.8978755474090576, -3.479210615158081, -3.0605454444885254, -2.641880512237549, -2.223215341567993, -1.8045501708984375, -1.385885238647461, -0.9672203063964844, -0.5485552549362183, -0.12989014387130737, 0.2887749671936035, 0.7074400186538696, 1.1261050701141357, 1.5447702407836914, 1.963435173034668, 2.3821003437042236, 2.8007655143737793, 3.219430446624756, 3.6380956172943115, 4.056760787963867, 4.475425720214844, 4.89409065246582, 5.312755584716797, 5.731420993804932, 6.150085926055908, 6.568751335144043, 6.9874162673950195, 7.406081199645996, 7.824746131896973, 8.243412017822266, 8.662076950073242, 9.080741882324219, 9.499406814575195, 9.918071746826172, 10.336736679077148, 10.755402565002441, 11.174067497253418, 11.592732429504395, 12.011397361755371, 12.430062294006348]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 5.0, 6.0, 16.0, 13.0, 11.0, 20.0, 19.0, 35.0, 26.0, 26.0, 46.0, 43.0, 45.0, 40.0, 44.0, 57.0, 43.0, 48.0, 55.0, 47.0, 50.0, 35.0, 40.0, 27.0, 28.0, 34.0, 23.0, 20.0, 14.0, 18.0, 11.0, 10.0, 6.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.550609588623047, -4.380953311920166, -4.211296558380127, -4.041640281677246, -3.8719840049743652, -3.7023274898529053, -3.5326709747314453, -3.3630146980285645, -3.1933581829071045, -3.0237016677856445, -2.8540453910827637, -2.6843888759613037, -2.5147323608398438, -2.345076084136963, -2.175419569015503, -2.005763053894043, -1.836106777191162, -1.6664503812789917, -1.4967939853668213, -1.3271374702453613, -1.157481074333191, -0.9878246784210205, -0.8181681632995605, -0.6485117673873901, -0.4788553714752197, -0.30919894576072693, -0.13954252004623413, 0.030113935470581055, 0.19977033138275146, 0.3694267272949219, 0.5390832424163818, 0.7087396383285522, 0.8783965110778809, 1.0480529069900513, 1.2177093029022217, 1.3873658180236816, 1.557022213935852, 1.7266786098480225, 1.8963351249694824, 2.0659914016723633, 2.2356479167938232, 2.405304431915283, 2.574960708618164, 2.744617223739624, 2.914273738861084, 3.083930015563965, 3.253586530685425, 3.4232430458068848, 3.5928993225097656, 3.7625558376312256, 3.9322121143341064, 4.101868629455566, 4.271524906158447, 4.441181182861328, 4.610837936401367, 4.780494213104248, 4.950150489807129, 5.11980676651001, 5.289463520050049, 5.45911979675293, 5.6287760734558105, 5.798432350158691, 5.9680891036987305, 6.137745380401611, 6.30740213394165]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 12.0, 9.0, 13.0, 19.0, 25.0, 36.0, 61.0, 113.0, 145.0, 257.0, 427.0, 633.0, 1318.0, 2589.0, 6035.0, 15409.0, 44064.0, 134306.0, 314559.0, 318191.0, 137023.0, 45836.0, 15618.0, 6142.0, 2633.0, 1283.0, 716.0, 392.0, 236.0, 147.0, 86.0, 61.0, 46.0, 40.0, 22.0, 16.0, 11.0, 5.0, 6.0, 4.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.666015625, -2.582733154296875, -2.49945068359375, -2.416168212890625, -2.3328857421875, -2.249603271484375, -2.16632080078125, -2.083038330078125, -1.999755859375, -1.916473388671875, -1.83319091796875, -1.749908447265625, -1.6666259765625, -1.583343505859375, -1.50006103515625, -1.416778564453125, -1.33349609375, -1.250213623046875, -1.16693115234375, -1.083648681640625, -1.0003662109375, -0.917083740234375, -0.83380126953125, -0.750518798828125, -0.667236328125, -0.583953857421875, -0.50067138671875, -0.417388916015625, -0.3341064453125, -0.250823974609375, -0.16754150390625, -0.084259033203125, -0.0009765625, 0.082305908203125, 0.16558837890625, 0.248870849609375, 0.3321533203125, 0.415435791015625, 0.49871826171875, 0.582000732421875, 0.665283203125, 0.748565673828125, 0.83184814453125, 0.915130615234375, 0.9984130859375, 1.081695556640625, 1.16497802734375, 1.248260498046875, 1.33154296875, 1.414825439453125, 1.49810791015625, 1.581390380859375, 1.6646728515625, 1.747955322265625, 1.83123779296875, 1.914520263671875, 1.997802734375, 2.081085205078125, 2.16436767578125, 2.247650146484375, 2.3309326171875, 2.414215087890625, 2.49749755859375, 2.580780029296875, 2.6640625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 10.0, 17.0, 14.0, 15.0, 33.0, 42.0, 35.0, 43.0, 62.0, 66.0, 68.0, 76.0, 60.0, 67.0, 67.0, 56.0, 50.0, 48.0, 36.0, 34.0, 20.0, 16.0, 17.0, 13.0, 8.0, 9.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.900390625, -0.8780746459960938, -0.8557586669921875, -0.8334426879882812, -0.811126708984375, -0.7888107299804688, -0.7664947509765625, -0.7441787719726562, -0.72186279296875, -0.6995468139648438, -0.6772308349609375, -0.6549148559570312, -0.632598876953125, -0.6102828979492188, -0.5879669189453125, -0.5656509399414062, -0.5433349609375, -0.5210189819335938, -0.4987030029296875, -0.47638702392578125, -0.454071044921875, -0.43175506591796875, -0.4094390869140625, -0.38712310791015625, -0.36480712890625, -0.34249114990234375, -0.3201751708984375, -0.29785919189453125, -0.275543212890625, -0.25322723388671875, -0.2309112548828125, -0.20859527587890625, -0.186279296875, -0.16396331787109375, -0.1416473388671875, -0.11933135986328125, -0.097015380859375, -0.07469940185546875, -0.0523834228515625, -0.03006744384765625, -0.00775146484375, 0.01456451416015625, 0.0368804931640625, 0.05919647216796875, 0.081512451171875, 0.10382843017578125, 0.1261444091796875, 0.14846038818359375, 0.1707763671875, 0.19309234619140625, 0.2154083251953125, 0.23772430419921875, 0.260040283203125, 0.28235626220703125, 0.3046722412109375, 0.32698822021484375, 0.34930419921875, 0.37162017822265625, 0.3939361572265625, 0.41625213623046875, 0.438568115234375, 0.46088409423828125, 0.4832000732421875, 0.5055160522460938, 0.52783203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 10.0, 9.0, 7.0, 14.0, 10.0, 23.0, 34.0, 46.0, 79.0, 86.0, 111.0, 226.0, 318.0, 592.0, 1313.0, 4609.0, 29396.0, 286185.0, 621855.0, 88723.0, 10428.0, 2292.0, 865.0, 437.0, 277.0, 185.0, 122.0, 76.0, 59.0, 38.0, 27.0, 21.0, 19.0, 12.0, 11.0, 2.0, 6.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.4437255859375, -4.301513671875, -4.1593017578125, -4.01708984375, -3.8748779296875, -3.732666015625, -3.5904541015625, -3.4482421875, -3.3060302734375, -3.163818359375, -3.0216064453125, -2.87939453125, -2.7371826171875, -2.594970703125, -2.4527587890625, -2.310546875, -2.1683349609375, -2.026123046875, -1.8839111328125, -1.74169921875, -1.5994873046875, -1.457275390625, -1.3150634765625, -1.1728515625, -1.0306396484375, -0.888427734375, -0.7462158203125, -0.60400390625, -0.4617919921875, -0.319580078125, -0.1773681640625, -0.03515625, 0.1070556640625, 0.249267578125, 0.3914794921875, 0.53369140625, 0.6759033203125, 0.818115234375, 0.9603271484375, 1.1025390625, 1.2447509765625, 1.386962890625, 1.5291748046875, 1.67138671875, 1.8135986328125, 1.955810546875, 2.0980224609375, 2.240234375, 2.3824462890625, 2.524658203125, 2.6668701171875, 2.80908203125, 2.9512939453125, 3.093505859375, 3.2357177734375, 3.3779296875, 3.5201416015625, 3.662353515625, 3.8045654296875, 3.94677734375, 4.0889892578125, 4.231201171875, 4.3734130859375, 4.515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 13.0, 22.0, 14.0, 18.0, 20.0, 31.0, 26.0, 26.0, 38.0, 37.0, 33.0, 32.0, 42.0, 37.0, 46.0, 49.0, 39.0, 46.0, 39.0, 36.0, 39.0, 35.0, 28.0, 29.0, 26.0, 21.0, 14.0, 20.0, 17.0, 19.0, 10.0, 15.0, 10.0, 14.0, 3.0, 5.0, 10.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.96875, -1.906036376953125, -1.84332275390625, -1.780609130859375, -1.7178955078125, -1.655181884765625, -1.59246826171875, -1.529754638671875, -1.467041015625, -1.404327392578125, -1.34161376953125, -1.278900146484375, -1.2161865234375, -1.153472900390625, -1.09075927734375, -1.028045654296875, -0.96533203125, -0.902618408203125, -0.83990478515625, -0.777191162109375, -0.7144775390625, -0.651763916015625, -0.58905029296875, -0.526336669921875, -0.463623046875, -0.400909423828125, -0.33819580078125, -0.275482177734375, -0.2127685546875, -0.150054931640625, -0.08734130859375, -0.024627685546875, 0.0380859375, 0.100799560546875, 0.16351318359375, 0.226226806640625, 0.2889404296875, 0.351654052734375, 0.41436767578125, 0.477081298828125, 0.539794921875, 0.602508544921875, 0.66522216796875, 0.727935791015625, 0.7906494140625, 0.853363037109375, 0.91607666015625, 0.978790283203125, 1.04150390625, 1.104217529296875, 1.16693115234375, 1.229644775390625, 1.2923583984375, 1.355072021484375, 1.41778564453125, 1.480499267578125, 1.543212890625, 1.605926513671875, 1.66864013671875, 1.731353759765625, 1.7940673828125, 1.856781005859375, 1.91949462890625, 1.982208251953125, 2.044921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 6.0, 8.0, 12.0, 15.0, 12.0, 29.0, 26.0, 38.0, 59.0, 92.0, 138.0, 268.0, 475.0, 963.0, 2276.0, 6050.0, 18977.0, 81406.0, 404469.0, 418415.0, 84276.0, 19876.0, 6083.0, 2396.0, 975.0, 524.0, 272.0, 141.0, 86.0, 61.0, 40.0, 33.0, 17.0, 15.0, 12.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3740234375, -1.3143157958984375, -1.254608154296875, -1.1949005126953125, -1.13519287109375, -1.0754852294921875, -1.015777587890625, -0.9560699462890625, -0.8963623046875, -0.8366546630859375, -0.776947021484375, -0.7172393798828125, -0.65753173828125, -0.5978240966796875, -0.538116455078125, -0.4784088134765625, -0.418701171875, -0.3589935302734375, -0.299285888671875, -0.2395782470703125, -0.17987060546875, -0.1201629638671875, -0.060455322265625, -0.0007476806640625, 0.0589599609375, 0.1186676025390625, 0.178375244140625, 0.2380828857421875, 0.29779052734375, 0.3574981689453125, 0.417205810546875, 0.4769134521484375, 0.53662109375, 0.5963287353515625, 0.656036376953125, 0.7157440185546875, 0.77545166015625, 0.8351593017578125, 0.894866943359375, 0.9545745849609375, 1.0142822265625, 1.0739898681640625, 1.133697509765625, 1.1934051513671875, 1.25311279296875, 1.3128204345703125, 1.372528076171875, 1.4322357177734375, 1.491943359375, 1.5516510009765625, 1.611358642578125, 1.6710662841796875, 1.73077392578125, 1.7904815673828125, 1.850189208984375, 1.9098968505859375, 1.9696044921875, 2.0293121337890625, 2.089019775390625, 2.1487274169921875, 2.20843505859375, 2.2681427001953125, 2.327850341796875, 2.3875579833984375, 2.447265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 9.0, 14.0, 15.0, 17.0, 23.0, 26.0, 20.0, 38.0, 36.0, 58.0, 58.0, 64.0, 68.0, 66.0, 70.0, 77.0, 66.0, 63.0, 50.0, 37.0, 17.0, 29.0, 23.0, 13.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018906593322753906, -0.0001826845109462738, -0.00017630308866500854, -0.00016992166638374329, -0.00016354024410247803, -0.00015715882182121277, -0.0001507773995399475, -0.00014439597725868225, -0.000138014554977417, -0.00013163313269615173, -0.00012525171041488647, -0.00011887028813362122, -0.00011248886585235596, -0.0001061074435710907, -9.972602128982544e-05, -9.334459900856018e-05, -8.696317672729492e-05, -8.058175444602966e-05, -7.42003321647644e-05, -6.781890988349915e-05, -6.143748760223389e-05, -5.505606532096863e-05, -4.867464303970337e-05, -4.229322075843811e-05, -3.591179847717285e-05, -2.9530376195907593e-05, -2.3148953914642334e-05, -1.6767531633377075e-05, -1.0386109352111816e-05, -4.004687070846558e-06, 2.376735210418701e-06, 8.75815749168396e-06, 1.5139579772949219e-05, 2.1521002054214478e-05, 2.7902424335479736e-05, 3.4283846616744995e-05, 4.0665268898010254e-05, 4.704669117927551e-05, 5.342811346054077e-05, 5.980953574180603e-05, 6.619095802307129e-05, 7.257238030433655e-05, 7.89538025856018e-05, 8.533522486686707e-05, 9.171664714813232e-05, 9.809806942939758e-05, 0.00010447949171066284, 0.0001108609139919281, 0.00011724233627319336, 0.00012362375855445862, 0.00013000518083572388, 0.00013638660311698914, 0.0001427680253982544, 0.00014914944767951965, 0.0001555308699607849, 0.00016191229224205017, 0.00016829371452331543, 0.0001746751368045807, 0.00018105655908584595, 0.0001874379813671112, 0.00019381940364837646, 0.00020020082592964172, 0.00020658224821090698, 0.00021296367049217224, 0.0002193450927734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 16.0, 23.0, 58.0, 78.0, 111.0, 223.0, 434.0, 1060.0, 3227.0, 16296.0, 185588.0, 749278.0, 79085.0, 9173.0, 2298.0, 767.0, 377.0, 180.0, 108.0, 73.0, 27.0, 15.0, 14.0, 12.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.960113525390625, -2.85186767578125, -2.743621826171875, -2.6353759765625, -2.527130126953125, -2.41888427734375, -2.310638427734375, -2.202392578125, -2.094146728515625, -1.98590087890625, -1.877655029296875, -1.7694091796875, -1.661163330078125, -1.55291748046875, -1.444671630859375, -1.33642578125, -1.228179931640625, -1.11993408203125, -1.011688232421875, -0.9034423828125, -0.795196533203125, -0.68695068359375, -0.578704833984375, -0.470458984375, -0.362213134765625, -0.25396728515625, -0.145721435546875, -0.0374755859375, 0.070770263671875, 0.17901611328125, 0.287261962890625, 0.3955078125, 0.503753662109375, 0.61199951171875, 0.720245361328125, 0.8284912109375, 0.936737060546875, 1.04498291015625, 1.153228759765625, 1.261474609375, 1.369720458984375, 1.47796630859375, 1.586212158203125, 1.6944580078125, 1.802703857421875, 1.91094970703125, 2.019195556640625, 2.12744140625, 2.235687255859375, 2.34393310546875, 2.452178955078125, 2.5604248046875, 2.668670654296875, 2.77691650390625, 2.885162353515625, 2.993408203125, 3.101654052734375, 3.20989990234375, 3.318145751953125, 3.4263916015625, 3.534637451171875, 3.64288330078125, 3.751129150390625, 3.859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 4.0, 5.0, 8.0, 10.0, 14.0, 18.0, 19.0, 26.0, 25.0, 38.0, 46.0, 49.0, 79.0, 68.0, 90.0, 89.0, 84.0, 77.0, 50.0, 45.0, 28.0, 28.0, 18.0, 12.0, 18.0, 11.0, 12.0, 4.0, 8.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8544921875, -1.801513671875, -1.74853515625, -1.695556640625, -1.642578125, -1.589599609375, -1.53662109375, -1.483642578125, -1.4306640625, -1.377685546875, -1.32470703125, -1.271728515625, -1.21875, -1.165771484375, -1.11279296875, -1.059814453125, -1.0068359375, -0.953857421875, -0.90087890625, -0.847900390625, -0.794921875, -0.741943359375, -0.68896484375, -0.635986328125, -0.5830078125, -0.530029296875, -0.47705078125, -0.424072265625, -0.37109375, -0.318115234375, -0.26513671875, -0.212158203125, -0.1591796875, -0.106201171875, -0.05322265625, -0.000244140625, 0.052734375, 0.105712890625, 0.15869140625, 0.211669921875, 0.2646484375, 0.317626953125, 0.37060546875, 0.423583984375, 0.4765625, 0.529541015625, 0.58251953125, 0.635498046875, 0.6884765625, 0.741455078125, 0.79443359375, 0.847412109375, 0.900390625, 0.953369140625, 1.00634765625, 1.059326171875, 1.1123046875, 1.165283203125, 1.21826171875, 1.271240234375, 1.32421875, 1.377197265625, 1.43017578125, 1.483154296875, 1.5361328125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 12.0, 24.0, 50.0, 104.0, 155.0, 184.0, 172.0, 131.0, 82.0, 36.0, 25.0, 9.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.456741333007812, -21.41472053527832, -20.372697830200195, -19.330677032470703, -18.288654327392578, -17.246633529663086, -16.204612731933594, -15.162590980529785, -14.120569229125977, -13.078547477722168, -12.03652572631836, -10.994504928588867, -9.952483177185059, -8.91046142578125, -7.8684401512146, -6.826418876647949, -5.784397125244141, -4.742375373840332, -3.7003540992736816, -2.658332586288452, -1.6163110733032227, -0.5742893218994141, 0.46773195266723633, 1.5097532272338867, 2.5517749786376953, 3.593796491622925, 4.635818004608154, 5.677839279174805, 6.719861030578613, 7.761882781982422, 8.803903579711914, 9.845925331115723, 10.887947082519531, 11.92996883392334, 12.971990585327148, 14.01401138305664, 15.05603313446045, 16.098054885864258, 17.14007568359375, 18.182098388671875, 19.224119186401367, 20.26613998413086, 21.308162689208984, 22.350183486938477, 23.39220428466797, 24.434226989746094, 25.476247787475586, 26.518268585205078, 27.560291290283203, 28.602312088012695, 29.64433479309082, 30.686355590820312, 31.728378295898438, 32.77040100097656, 33.81241989135742, 34.85444259643555, 35.896461486816406, 36.93848419189453, 37.98050308227539, 39.022525787353516, 40.06454849243164, 41.1065673828125, 42.148590087890625, 43.19061279296875, 44.232635498046875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 3.0, 6.0, 8.0, 9.0, 13.0, 10.0, 15.0, 20.0, 33.0, 22.0, 25.0, 39.0, 47.0, 49.0, 43.0, 56.0, 44.0, 43.0, 39.0, 54.0, 30.0, 31.0, 43.0, 44.0, 39.0, 34.0, 29.0, 27.0, 31.0, 20.0, 24.0, 9.0, 15.0, 10.0, 5.0, 8.0, 6.0, 3.0, 9.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.737166404724121, -11.365572929382324, -10.993978500366211, -10.622385025024414, -10.250791549682617, -9.87919807434082, -9.507604598999023, -9.13601016998291, -8.764416694641113, -8.392823219299316, -8.021228790283203, -7.649635314941406, -7.278041839599609, -6.9064483642578125, -6.534854412078857, -6.163260459899902, -5.7916669845581055, -5.420073509216309, -5.0484795570373535, -4.676885604858398, -4.305292129516602, -3.9336984157562256, -3.5621047019958496, -3.1905109882354736, -2.8189172744750977, -2.4473235607147217, -2.0757298469543457, -1.7041361331939697, -1.3325424194335938, -0.9609487056732178, -0.5893549919128418, -0.21776127815246582, 0.15383148193359375, 0.5254251956939697, 0.8970189094543457, 1.2686126232147217, 1.6402063369750977, 2.0118000507354736, 2.3833937644958496, 2.7549874782562256, 3.1265811920166016, 3.4981749057769775, 3.8697686195373535, 4.241362571716309, 4.6129560470581055, 4.984549522399902, 5.356143474578857, 5.7277374267578125, 6.099330902099609, 6.470924377441406, 6.842518329620361, 7.214112281799316, 7.585705757141113, 7.95729923248291, 8.328893661499023, 8.70048713684082, 9.072080612182617, 9.443674087524414, 9.815267562866211, 10.186861991882324, 10.558455467224121, 10.930048942565918, 11.301643371582031, 11.673236846923828, 12.044830322265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 9.0, 17.0, 29.0, 36.0, 65.0, 128.0, 199.0, 391.0, 776.0, 4127.0, 3936858.0, 246800.0, 3271.0, 713.0, 327.0, 174.0, 113.0, 75.0, 41.0, 27.0, 23.0, 7.0, 7.0, 15.0, 3.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-19.3125, -18.8289794921875, -18.345458984375, -17.8619384765625, -17.37841796875, -16.8948974609375, -16.411376953125, -15.9278564453125, -15.4443359375, -14.9608154296875, -14.477294921875, -13.9937744140625, -13.51025390625, -13.0267333984375, -12.543212890625, -12.0596923828125, -11.576171875, -11.0926513671875, -10.609130859375, -10.1256103515625, -9.64208984375, -9.1585693359375, -8.675048828125, -8.1915283203125, -7.7080078125, -7.2244873046875, -6.740966796875, -6.2574462890625, -5.77392578125, -5.2904052734375, -4.806884765625, -4.3233642578125, -3.83984375, -3.3563232421875, -2.872802734375, -2.3892822265625, -1.90576171875, -1.4222412109375, -0.938720703125, -0.4552001953125, 0.0283203125, 0.5118408203125, 0.995361328125, 1.4788818359375, 1.96240234375, 2.4459228515625, 2.929443359375, 3.4129638671875, 3.896484375, 4.3800048828125, 4.863525390625, 5.3470458984375, 5.83056640625, 6.3140869140625, 6.797607421875, 7.2811279296875, 7.7646484375, 8.2481689453125, 8.731689453125, 9.2152099609375, 9.69873046875, 10.1822509765625, 10.665771484375, 11.1492919921875, 11.6328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 9.0, 13.0, 17.0, 22.0, 24.0, 34.0, 38.0, 46.0, 53.0, 53.0, 55.0, 52.0, 58.0, 57.0, 51.0, 56.0, 62.0, 61.0, 42.0, 44.0, 23.0, 40.0, 33.0, 12.0, 9.0, 6.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.9130859375, -0.8897933959960938, -0.8665008544921875, -0.8432083129882812, -0.819915771484375, -0.7966232299804688, -0.7733306884765625, -0.7500381469726562, -0.72674560546875, -0.7034530639648438, -0.6801605224609375, -0.6568679809570312, -0.633575439453125, -0.6102828979492188, -0.5869903564453125, -0.5636978149414062, -0.5404052734375, -0.5171127319335938, -0.4938201904296875, -0.47052764892578125, -0.447235107421875, -0.42394256591796875, -0.4006500244140625, -0.37735748291015625, -0.35406494140625, -0.33077239990234375, -0.3074798583984375, -0.28418731689453125, -0.260894775390625, -0.23760223388671875, -0.2143096923828125, -0.19101715087890625, -0.167724609375, -0.14443206787109375, -0.1211395263671875, -0.09784698486328125, -0.074554443359375, -0.05126190185546875, -0.0279693603515625, -0.00467681884765625, 0.01861572265625, 0.04190826416015625, 0.0652008056640625, 0.08849334716796875, 0.111785888671875, 0.13507843017578125, 0.1583709716796875, 0.18166351318359375, 0.2049560546875, 0.22824859619140625, 0.2515411376953125, 0.27483367919921875, 0.298126220703125, 0.32141876220703125, 0.3447113037109375, 0.36800384521484375, 0.39129638671875, 0.41458892822265625, 0.4378814697265625, 0.46117401123046875, 0.484466552734375, 0.5077590942382812, 0.5310516357421875, 0.5543441772460938, 0.57763671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 6.0, 12.0, 22.0, 20.0, 28.0, 38.0, 54.0, 56.0, 66.0, 96.0, 148.0, 176.0, 240.0, 324.0, 419.0, 602.0, 861.0, 1324.0, 2372.0, 4621.0, 11764.0, 48329.0, 1033662.0, 3014736.0, 50125.0, 12243.0, 4787.0, 2375.0, 1413.0, 902.0, 621.0, 463.0, 354.0, 230.0, 204.0, 123.0, 120.0, 61.0, 57.0, 55.0, 39.0, 24.0, 26.0, 15.0, 12.0, 10.0, 5.0, 7.0, 11.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.8359375, -2.747344970703125, -2.65875244140625, -2.570159912109375, -2.4815673828125, -2.392974853515625, -2.30438232421875, -2.215789794921875, -2.127197265625, -2.038604736328125, -1.95001220703125, -1.861419677734375, -1.7728271484375, -1.684234619140625, -1.59564208984375, -1.507049560546875, -1.41845703125, -1.329864501953125, -1.24127197265625, -1.152679443359375, -1.0640869140625, -0.975494384765625, -0.88690185546875, -0.798309326171875, -0.709716796875, -0.621124267578125, -0.53253173828125, -0.443939208984375, -0.3553466796875, -0.266754150390625, -0.17816162109375, -0.089569091796875, -0.0009765625, 0.087615966796875, 0.17620849609375, 0.264801025390625, 0.3533935546875, 0.441986083984375, 0.53057861328125, 0.619171142578125, 0.707763671875, 0.796356201171875, 0.88494873046875, 0.973541259765625, 1.0621337890625, 1.150726318359375, 1.23931884765625, 1.327911376953125, 1.41650390625, 1.505096435546875, 1.59368896484375, 1.682281494140625, 1.7708740234375, 1.859466552734375, 1.94805908203125, 2.036651611328125, 2.125244140625, 2.213836669921875, 2.30242919921875, 2.391021728515625, 2.4796142578125, 2.568206787109375, 2.65679931640625, 2.745391845703125, 2.833984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 9.0, 5.0, 5.0, 23.0, 26.0, 65.0, 130.0, 466.0, 2941.0, 202.0, 93.0, 44.0, 21.0, 11.0, 12.0, 7.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8349609375, -0.811920166015625, -0.78887939453125, -0.765838623046875, -0.7427978515625, -0.719757080078125, -0.69671630859375, -0.673675537109375, -0.650634765625, -0.627593994140625, -0.60455322265625, -0.581512451171875, -0.5584716796875, -0.535430908203125, -0.51239013671875, -0.489349365234375, -0.46630859375, -0.443267822265625, -0.42022705078125, -0.397186279296875, -0.3741455078125, -0.351104736328125, -0.32806396484375, -0.305023193359375, -0.281982421875, -0.258941650390625, -0.23590087890625, -0.212860107421875, -0.1898193359375, -0.166778564453125, -0.14373779296875, -0.120697021484375, -0.09765625, -0.074615478515625, -0.05157470703125, -0.028533935546875, -0.0054931640625, 0.017547607421875, 0.04058837890625, 0.063629150390625, 0.086669921875, 0.109710693359375, 0.13275146484375, 0.155792236328125, 0.1788330078125, 0.201873779296875, 0.22491455078125, 0.247955322265625, 0.27099609375, 0.294036865234375, 0.31707763671875, 0.340118408203125, 0.3631591796875, 0.386199951171875, 0.40924072265625, 0.432281494140625, 0.455322265625, 0.478363037109375, 0.50140380859375, 0.524444580078125, 0.5474853515625, 0.570526123046875, 0.59356689453125, 0.616607666015625, 0.6396484375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 17.0, 27.0, 54.0, 66.0, 95.0, 119.0, 123.0, 115.0, 110.0, 81.0, 55.0, 38.0, 31.0, 17.0, 7.0, 10.0, 11.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1890366077423096, -2.0963294506073, -2.00362229347229, -1.9109150171279907, -1.8182077407836914, -1.7255005836486816, -1.6327934265136719, -1.540086269378662, -1.4473789930343628, -1.354671835899353, -1.2619645595550537, -1.169257402420044, -1.0765502452850342, -0.9838429689407349, -0.8911358118057251, -0.7984285950660706, -0.705721378326416, -0.6130141615867615, -0.5203069448471069, -0.42759978771209717, -0.3348925709724426, -0.24218535423278809, -0.14947819709777832, -0.05677098035812378, 0.03593623638153076, 0.1286434382200241, 0.22135064005851746, 0.3140578269958496, 0.40676504373550415, 0.4994722604751587, 0.5921794176101685, 0.684886634349823, 0.7775936126708984, 0.870300829410553, 0.9630080461502075, 1.0557152032852173, 1.1484224796295166, 1.2411296367645264, 1.3338367938995361, 1.426543951034546, 1.5192512273788452, 1.611958384513855, 1.7046656608581543, 1.797372817993164, 1.8900799751281738, 1.9827872514724731, 2.0754942893981934, 2.1682016849517822, 2.260908842086792, 2.3536159992218018, 2.4463231563568115, 2.5390305519104004, 2.63173770904541, 2.72444486618042, 2.8171520233154297, 2.9098591804504395, 3.002566337585449, 3.095273494720459, 3.1879806518554688, 3.2806878089904785, 3.3733952045440674, 3.466102361679077, 3.558809518814087, 3.6515166759490967, 3.7442240715026855]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 14.0, 6.0, 11.0, 8.0, 19.0, 18.0, 25.0, 24.0, 28.0, 26.0, 38.0, 42.0, 31.0, 38.0, 38.0, 41.0, 40.0, 35.0, 34.0, 45.0, 33.0, 35.0, 49.0, 40.0, 36.0, 36.0, 25.0, 27.0, 13.0, 25.0, 18.0, 18.0, 17.0, 12.0, 11.0, 7.0, 5.0, 5.0, 4.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3123985528945923, -1.2752782106399536, -1.2381579875946045, -1.2010376453399658, -1.1639174222946167, -1.126797080039978, -1.089676856994629, -1.0525565147399902, -1.0154361724853516, -0.9783158898353577, -0.9411956071853638, -0.9040753245353699, -0.866955041885376, -0.8298346996307373, -0.7927144169807434, -0.7555941343307495, -0.7184739112854004, -0.6813536286354065, -0.6442333459854126, -0.6071130633354187, -0.5699927806854248, -0.5328724384307861, -0.49575215578079224, -0.45863187313079834, -0.42151159048080444, -0.38439130783081055, -0.34727102518081665, -0.31015071272850037, -0.27303043007850647, -0.23591014742851257, -0.19878984987735748, -0.1616695523262024, -0.12454915046691895, -0.08742886036634445, -0.05030857026576996, -0.013188280165195465, 0.02393200993537903, 0.061052292585372925, 0.09817259013652802, 0.1352928876876831, 0.172413170337677, 0.2095334529876709, 0.246653750538826, 0.2837740480899811, 0.320894330739975, 0.35801461338996887, 0.39513492584228516, 0.43225520849227905, 0.46937549114227295, 0.5064957737922668, 0.5436160564422607, 0.5807363390922546, 0.6178566217422485, 0.6549769639968872, 0.6920972466468811, 0.729217529296875, 0.7663378119468689, 0.8034580945968628, 0.8405783772468567, 0.8776986598968506, 0.9148190021514893, 0.9519392251968384, 0.989059567451477, 1.0261797904968262, 1.0633001327514648]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 16.0, 17.0, 28.0, 35.0, 47.0, 63.0, 97.0, 173.0, 254.0, 404.0, 588.0, 1136.0, 2059.0, 4168.0, 8587.0, 19632.0, 45649.0, 104759.0, 208480.0, 275655.0, 199791.0, 98548.0, 43161.0, 18219.0, 8192.0, 3919.0, 2003.0, 1069.0, 616.0, 410.0, 247.0, 157.0, 116.0, 73.0, 60.0, 37.0, 20.0, 24.0, 7.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8603515625, -1.8012237548828125, -1.742095947265625, -1.6829681396484375, -1.62384033203125, -1.5647125244140625, -1.505584716796875, -1.4464569091796875, -1.3873291015625, -1.3282012939453125, -1.269073486328125, -1.2099456787109375, -1.15081787109375, -1.0916900634765625, -1.032562255859375, -0.9734344482421875, -0.914306640625, -0.8551788330078125, -0.796051025390625, -0.7369232177734375, -0.67779541015625, -0.6186676025390625, -0.559539794921875, -0.5004119873046875, -0.4412841796875, -0.3821563720703125, -0.323028564453125, -0.2639007568359375, -0.20477294921875, -0.1456451416015625, -0.086517333984375, -0.0273895263671875, 0.03173828125, 0.0908660888671875, 0.149993896484375, 0.2091217041015625, 0.26824951171875, 0.3273773193359375, 0.386505126953125, 0.4456329345703125, 0.5047607421875, 0.5638885498046875, 0.623016357421875, 0.6821441650390625, 0.74127197265625, 0.8003997802734375, 0.859527587890625, 0.9186553955078125, 0.977783203125, 1.0369110107421875, 1.096038818359375, 1.1551666259765625, 1.21429443359375, 1.2734222412109375, 1.332550048828125, 1.3916778564453125, 1.4508056640625, 1.5099334716796875, 1.569061279296875, 1.6281890869140625, 1.68731689453125, 1.7464447021484375, 1.805572509765625, 1.8647003173828125, 1.923828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 7.0, 4.0, 3.0, 4.0, 9.0, 7.0, 13.0, 15.0, 20.0, 21.0, 33.0, 43.0, 38.0, 48.0, 58.0, 51.0, 64.0, 55.0, 54.0, 63.0, 60.0, 49.0, 42.0, 42.0, 40.0, 39.0, 31.0, 25.0, 22.0, 14.0, 9.0, 10.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.9228515625, -0.8993453979492188, -0.8758392333984375, -0.8523330688476562, -0.828826904296875, -0.8053207397460938, -0.7818145751953125, -0.7583084106445312, -0.73480224609375, -0.7112960815429688, -0.6877899169921875, -0.6642837524414062, -0.640777587890625, -0.6172714233398438, -0.5937652587890625, -0.5702590942382812, -0.5467529296875, -0.5232467651367188, -0.4997406005859375, -0.47623443603515625, -0.452728271484375, -0.42922210693359375, -0.4057159423828125, -0.38220977783203125, -0.35870361328125, -0.33519744873046875, -0.3116912841796875, -0.28818511962890625, -0.264678955078125, -0.24117279052734375, -0.2176666259765625, -0.19416046142578125, -0.170654296875, -0.14714813232421875, -0.1236419677734375, -0.10013580322265625, -0.076629638671875, -0.05312347412109375, -0.0296173095703125, -0.00611114501953125, 0.01739501953125, 0.04090118408203125, 0.0644073486328125, 0.08791351318359375, 0.111419677734375, 0.13492584228515625, 0.1584320068359375, 0.18193817138671875, 0.2054443359375, 0.22895050048828125, 0.2524566650390625, 0.27596282958984375, 0.299468994140625, 0.32297515869140625, 0.3464813232421875, 0.36998748779296875, 0.39349365234375, 0.41699981689453125, 0.4405059814453125, 0.46401214599609375, 0.487518310546875, 0.5110244750976562, 0.5345306396484375, 0.5580368041992188, 0.58154296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 6.0, 7.0, 12.0, 19.0, 25.0, 28.0, 29.0, 41.0, 61.0, 87.0, 107.0, 139.0, 223.0, 302.0, 471.0, 741.0, 1411.0, 4831.0, 39239.0, 533320.0, 428839.0, 30913.0, 4161.0, 1326.0, 692.0, 418.0, 296.0, 186.0, 177.0, 107.0, 84.0, 62.0, 38.0, 41.0, 26.0, 17.0, 14.0, 12.0, 12.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.50390625, -5.341796875, -5.1796875, -5.017578125, -4.85546875, -4.693359375, -4.53125, -4.369140625, -4.20703125, -4.044921875, -3.8828125, -3.720703125, -3.55859375, -3.396484375, -3.234375, -3.072265625, -2.91015625, -2.748046875, -2.5859375, -2.423828125, -2.26171875, -2.099609375, -1.9375, -1.775390625, -1.61328125, -1.451171875, -1.2890625, -1.126953125, -0.96484375, -0.802734375, -0.640625, -0.478515625, -0.31640625, -0.154296875, 0.0078125, 0.169921875, 0.33203125, 0.494140625, 0.65625, 0.818359375, 0.98046875, 1.142578125, 1.3046875, 1.466796875, 1.62890625, 1.791015625, 1.953125, 2.115234375, 2.27734375, 2.439453125, 2.6015625, 2.763671875, 2.92578125, 3.087890625, 3.25, 3.412109375, 3.57421875, 3.736328125, 3.8984375, 4.060546875, 4.22265625, 4.384765625, 4.546875, 4.708984375, 4.87109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 2.0, 8.0, 9.0, 5.0, 6.0, 8.0, 17.0, 19.0, 15.0, 19.0, 23.0, 26.0, 30.0, 33.0, 39.0, 40.0, 30.0, 44.0, 43.0, 48.0, 50.0, 40.0, 36.0, 34.0, 41.0, 31.0, 32.0, 29.0, 32.0, 29.0, 28.0, 29.0, 30.0, 21.0, 14.0, 10.0, 8.0, 8.0, 6.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.595703125, -2.51544189453125, -2.4351806640625, -2.35491943359375, -2.274658203125, -2.19439697265625, -2.1141357421875, -2.03387451171875, -1.95361328125, -1.87335205078125, -1.7930908203125, -1.71282958984375, -1.632568359375, -1.55230712890625, -1.4720458984375, -1.39178466796875, -1.3115234375, -1.23126220703125, -1.1510009765625, -1.07073974609375, -0.990478515625, -0.91021728515625, -0.8299560546875, -0.74969482421875, -0.66943359375, -0.58917236328125, -0.5089111328125, -0.42864990234375, -0.348388671875, -0.26812744140625, -0.1878662109375, -0.10760498046875, -0.02734375, 0.05291748046875, 0.1331787109375, 0.21343994140625, 0.293701171875, 0.37396240234375, 0.4542236328125, 0.53448486328125, 0.61474609375, 0.69500732421875, 0.7752685546875, 0.85552978515625, 0.935791015625, 1.01605224609375, 1.0963134765625, 1.17657470703125, 1.2568359375, 1.33709716796875, 1.4173583984375, 1.49761962890625, 1.577880859375, 1.65814208984375, 1.7384033203125, 1.81866455078125, 1.89892578125, 1.97918701171875, 2.0594482421875, 2.13970947265625, 2.219970703125, 2.30023193359375, 2.3804931640625, 2.46075439453125, 2.541015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 4.0, 9.0, 8.0, 9.0, 15.0, 11.0, 18.0, 34.0, 48.0, 75.0, 142.0, 292.0, 694.0, 2113.0, 9651.0, 68241.0, 593680.0, 330633.0, 34692.0, 5623.0, 1476.0, 513.0, 249.0, 118.0, 76.0, 38.0, 26.0, 19.0, 14.0, 4.0, 9.0, 3.0, 0.0, 1.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.09375, -2.029998779296875, -1.96624755859375, -1.902496337890625, -1.8387451171875, -1.774993896484375, -1.71124267578125, -1.647491455078125, -1.583740234375, -1.519989013671875, -1.45623779296875, -1.392486572265625, -1.3287353515625, -1.264984130859375, -1.20123291015625, -1.137481689453125, -1.07373046875, -1.009979248046875, -0.94622802734375, -0.882476806640625, -0.8187255859375, -0.754974365234375, -0.69122314453125, -0.627471923828125, -0.563720703125, -0.499969482421875, -0.43621826171875, -0.372467041015625, -0.3087158203125, -0.244964599609375, -0.18121337890625, -0.117462158203125, -0.0537109375, 0.010040283203125, 0.07379150390625, 0.137542724609375, 0.2012939453125, 0.265045166015625, 0.32879638671875, 0.392547607421875, 0.456298828125, 0.520050048828125, 0.58380126953125, 0.647552490234375, 0.7113037109375, 0.775054931640625, 0.83880615234375, 0.902557373046875, 0.96630859375, 1.030059814453125, 1.09381103515625, 1.157562255859375, 1.2213134765625, 1.285064697265625, 1.34881591796875, 1.412567138671875, 1.476318359375, 1.540069580078125, 1.60382080078125, 1.667572021484375, 1.7313232421875, 1.795074462890625, 1.85882568359375, 1.922576904296875, 1.986328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 6.0, 10.0, 7.0, 5.0, 13.0, 10.0, 18.0, 21.0, 21.0, 33.0, 35.0, 48.0, 70.0, 64.0, 104.0, 87.0, 82.0, 85.0, 72.0, 62.0, 39.0, 26.0, 15.0, 21.0, 17.0, 9.0, 7.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0003135204315185547, -0.0003064200282096863, -0.00029931962490081787, -0.00029221922159194946, -0.00028511881828308105, -0.00027801841497421265, -0.00027091801166534424, -0.00026381760835647583, -0.0002567172050476074, -0.000249616801738739, -0.0002425163984298706, -0.0002354159951210022, -0.0002283155918121338, -0.00022121518850326538, -0.00021411478519439697, -0.00020701438188552856, -0.00019991397857666016, -0.00019281357526779175, -0.00018571317195892334, -0.00017861276865005493, -0.00017151236534118652, -0.00016441196203231812, -0.0001573115587234497, -0.0001502111554145813, -0.0001431107521057129, -0.00013601034879684448, -0.00012890994548797607, -0.00012180954217910767, -0.00011470913887023926, -0.00010760873556137085, -0.00010050833225250244, -9.340792894363403e-05, -8.630752563476562e-05, -7.920712232589722e-05, -7.210671901702881e-05, -6.50063157081604e-05, -5.790591239929199e-05, -5.0805509090423584e-05, -4.3705105781555176e-05, -3.660470247268677e-05, -2.950429916381836e-05, -2.240389585494995e-05, -1.5303492546081543e-05, -8.203089237213135e-06, -1.1026859283447266e-06, 5.997717380523682e-06, 1.309812068939209e-05, 2.0198523998260498e-05, 2.7298927307128906e-05, 3.4399330615997314e-05, 4.149973392486572e-05, 4.860013723373413e-05, 5.570054054260254e-05, 6.280094385147095e-05, 6.990134716033936e-05, 7.700175046920776e-05, 8.410215377807617e-05, 9.120255708694458e-05, 9.830296039581299e-05, 0.0001054033637046814, 0.0001125037670135498, 0.00011960417032241821, 0.00012670457363128662, 0.00013380497694015503, 0.00014090538024902344]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 2.0, 4.0, 12.0, 9.0, 19.0, 25.0, 42.0, 59.0, 76.0, 122.0, 209.0, 413.0, 744.0, 1646.0, 4505.0, 19403.0, 160432.0, 709395.0, 127736.0, 16459.0, 4159.0, 1473.0, 662.0, 357.0, 195.0, 131.0, 83.0, 54.0, 37.0, 24.0, 21.0, 11.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.4882965087890625, -1.424835205078125, -1.3613739013671875, -1.29791259765625, -1.2344512939453125, -1.170989990234375, -1.1075286865234375, -1.0440673828125, -0.9806060791015625, -0.917144775390625, -0.8536834716796875, -0.79022216796875, -0.7267608642578125, -0.663299560546875, -0.5998382568359375, -0.536376953125, -0.4729156494140625, -0.409454345703125, -0.3459930419921875, -0.28253173828125, -0.2190704345703125, -0.155609130859375, -0.0921478271484375, -0.0286865234375, 0.0347747802734375, 0.098236083984375, 0.1616973876953125, 0.22515869140625, 0.2886199951171875, 0.352081298828125, 0.4155426025390625, 0.47900390625, 0.5424652099609375, 0.605926513671875, 0.6693878173828125, 0.73284912109375, 0.7963104248046875, 0.859771728515625, 0.9232330322265625, 0.9866943359375, 1.0501556396484375, 1.113616943359375, 1.1770782470703125, 1.24053955078125, 1.3040008544921875, 1.367462158203125, 1.4309234619140625, 1.494384765625, 1.5578460693359375, 1.621307373046875, 1.6847686767578125, 1.74822998046875, 1.8116912841796875, 1.875152587890625, 1.9386138916015625, 2.0020751953125, 2.0655364990234375, 2.128997802734375, 2.1924591064453125, 2.25592041015625, 2.3193817138671875, 2.382843017578125, 2.4463043212890625, 2.509765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 6.0, 15.0, 19.0, 40.0, 45.0, 50.0, 60.0, 90.0, 108.0, 90.0, 103.0, 68.0, 65.0, 44.0, 37.0, 25.0, 21.0, 22.0, 17.0, 14.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.6654205322265625, -1.611114501953125, -1.5568084716796875, -1.50250244140625, -1.4481964111328125, -1.393890380859375, -1.3395843505859375, -1.2852783203125, -1.2309722900390625, -1.176666259765625, -1.1223602294921875, -1.06805419921875, -1.0137481689453125, -0.959442138671875, -0.9051361083984375, -0.850830078125, -0.7965240478515625, -0.742218017578125, -0.6879119873046875, -0.63360595703125, -0.5792999267578125, -0.524993896484375, -0.4706878662109375, -0.4163818359375, -0.3620758056640625, -0.307769775390625, -0.2534637451171875, -0.19915771484375, -0.1448516845703125, -0.090545654296875, -0.0362396240234375, 0.01806640625, 0.0723724365234375, 0.126678466796875, 0.1809844970703125, 0.23529052734375, 0.2895965576171875, 0.343902587890625, 0.3982086181640625, 0.4525146484375, 0.5068206787109375, 0.561126708984375, 0.6154327392578125, 0.66973876953125, 0.7240447998046875, 0.778350830078125, 0.8326568603515625, 0.886962890625, 0.9412689208984375, 0.995574951171875, 1.0498809814453125, 1.10418701171875, 1.1584930419921875, 1.212799072265625, 1.2671051025390625, 1.3214111328125, 1.3757171630859375, 1.430023193359375, 1.4843292236328125, 1.53863525390625, 1.5929412841796875, 1.647247314453125, 1.7015533447265625, 1.755859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 15.0, 23.0, 109.0, 185.0, 262.0, 243.0, 108.0, 40.0, 4.0, 11.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03076934814453, -34.6136589050293, -33.19654846191406, -31.77943992614746, -30.36233139038086, -28.945220947265625, -27.52811050415039, -26.111000061035156, -24.693891525268555, -23.27678108215332, -21.85967254638672, -20.442562103271484, -19.02545166015625, -17.60834312438965, -16.191232681274414, -14.774123191833496, -13.357013702392578, -11.93990421295166, -10.522794723510742, -9.105684280395508, -7.68857479095459, -6.271465301513672, -4.8543548583984375, -3.4372453689575195, -2.0201358795166016, -0.6030261516571045, 0.8140835762023926, 2.2311935424804688, 3.6483030319213867, 5.065412521362305, 6.482522964477539, 7.899632453918457, 9.31673812866211, 10.733847618103027, 12.150957107543945, 13.56806755065918, 14.985177040100098, 16.402286529541016, 17.81939697265625, 19.236507415771484, 20.653615951538086, 22.07072639465332, 23.487834930419922, 24.904945373535156, 26.32205581665039, 27.739164352416992, 29.156274795532227, 30.573383331298828, 31.990493774414062, 33.4076042175293, 34.82471466064453, 36.2418212890625, 37.658931732177734, 39.07604217529297, 40.4931526184082, 41.91026306152344, 43.327369689941406, 44.74448013305664, 46.161590576171875, 47.578697204589844, 48.99580764770508, 50.41291809082031, 51.83002853393555, 53.24713897705078, 54.664249420166016]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 9.0, 4.0, 3.0, 9.0, 9.0, 8.0, 19.0, 17.0, 19.0, 17.0, 27.0, 34.0, 23.0, 38.0, 25.0, 48.0, 36.0, 53.0, 56.0, 49.0, 56.0, 47.0, 42.0, 38.0, 43.0, 44.0, 28.0, 26.0, 25.0, 24.0, 27.0, 28.0, 13.0, 8.0, 10.0, 5.0, 5.0, 11.0, 5.0, 1.0, 2.0, 6.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.027986526489258, -12.592302322387695, -12.156618118286133, -11.720934867858887, -11.285250663757324, -10.849566459655762, -10.413883209228516, -9.978199005126953, -9.54251480102539, -9.106830596923828, -8.671146392822266, -8.23546314239502, -7.799778938293457, -7.3640947341918945, -6.92841100692749, -6.492727279663086, -6.057043075561523, -5.621358871459961, -5.185675144195557, -4.749991416931152, -4.31430721282959, -3.8786232471466064, -3.442939281463623, -3.0072553157806396, -2.5715713500976562, -2.135887384414673, -1.7002034187316895, -1.264519453048706, -0.8288354873657227, -0.39315152168273926, 0.04253244400024414, 0.47821640968322754, 0.9139003753662109, 1.3495843410491943, 1.7852683067321777, 2.220952272415161, 2.6566362380981445, 3.092320203781128, 3.5280041694641113, 3.9636881351470947, 4.399372100830078, 4.835056304931641, 5.270740032196045, 5.706423759460449, 6.142107963562012, 6.577792167663574, 7.0134758949279785, 7.449159622192383, 7.884843826293945, 8.320528030395508, 8.75621223449707, 9.191895484924316, 9.627579689025879, 10.063263893127441, 10.498947143554688, 10.93463134765625, 11.370315551757812, 11.805999755859375, 12.241683959960938, 12.677367210388184, 13.113051414489746, 13.548735618591309, 13.984418869018555, 14.420103073120117, 14.85578727722168]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 9.0, 8.0, 11.0, 29.0, 38.0, 64.0, 90.0, 169.0, 367.0, 943.0, 8059.0, 4164181.0, 18082.0, 1288.0, 432.0, 204.0, 101.0, 57.0, 45.0, 24.0, 26.0, 7.0, 9.0, 5.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-16.90625, -16.4793701171875, -16.052490234375, -15.6256103515625, -15.19873046875, -14.7718505859375, -14.344970703125, -13.9180908203125, -13.4912109375, -13.0643310546875, -12.637451171875, -12.2105712890625, -11.78369140625, -11.3568115234375, -10.929931640625, -10.5030517578125, -10.076171875, -9.6492919921875, -9.222412109375, -8.7955322265625, -8.36865234375, -7.9417724609375, -7.514892578125, -7.0880126953125, -6.6611328125, -6.2342529296875, -5.807373046875, -5.3804931640625, -4.95361328125, -4.5267333984375, -4.099853515625, -3.6729736328125, -3.24609375, -2.8192138671875, -2.392333984375, -1.9654541015625, -1.53857421875, -1.1116943359375, -0.684814453125, -0.2579345703125, 0.1689453125, 0.5958251953125, 1.022705078125, 1.4495849609375, 1.87646484375, 2.3033447265625, 2.730224609375, 3.1571044921875, 3.583984375, 4.0108642578125, 4.437744140625, 4.8646240234375, 5.29150390625, 5.7183837890625, 6.145263671875, 6.5721435546875, 6.9990234375, 7.4259033203125, 7.852783203125, 8.2796630859375, 8.70654296875, 9.1334228515625, 9.560302734375, 9.9871826171875, 10.4140625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 12.0, 18.0, 10.0, 18.0, 24.0, 22.0, 45.0, 32.0, 56.0, 66.0, 53.0, 56.0, 75.0, 65.0, 42.0, 48.0, 50.0, 40.0, 49.0, 45.0, 37.0, 25.0, 29.0, 12.0, 12.0, 13.0, 2.0, 13.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8662109375, -0.8427810668945312, -0.8193511962890625, -0.7959213256835938, -0.772491455078125, -0.7490615844726562, -0.7256317138671875, -0.7022018432617188, -0.67877197265625, -0.6553421020507812, -0.6319122314453125, -0.6084823608398438, -0.585052490234375, -0.5616226196289062, -0.5381927490234375, -0.5147628784179688, -0.4913330078125, -0.46790313720703125, -0.4444732666015625, -0.42104339599609375, -0.397613525390625, -0.37418365478515625, -0.3507537841796875, -0.32732391357421875, -0.30389404296875, -0.28046417236328125, -0.2570343017578125, -0.23360443115234375, -0.210174560546875, -0.18674468994140625, -0.1633148193359375, -0.13988494873046875, -0.116455078125, -0.09302520751953125, -0.0695953369140625, -0.04616546630859375, -0.022735595703125, 0.00069427490234375, 0.0241241455078125, 0.04755401611328125, 0.07098388671875, 0.09441375732421875, 0.1178436279296875, 0.14127349853515625, 0.164703369140625, 0.18813323974609375, 0.2115631103515625, 0.23499298095703125, 0.2584228515625, 0.28185272216796875, 0.3052825927734375, 0.32871246337890625, 0.352142333984375, 0.37557220458984375, 0.3990020751953125, 0.42243194580078125, 0.44586181640625, 0.46929168701171875, 0.4927215576171875, 0.5161514282226562, 0.539581298828125, 0.5630111694335938, 0.5864410400390625, 0.6098709106445312, 0.63330078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 9.0, 21.0, 11.0, 17.0, 42.0, 47.0, 60.0, 83.0, 104.0, 190.0, 243.0, 411.0, 574.0, 933.0, 1520.0, 2750.0, 5444.0, 12905.0, 42955.0, 367419.0, 3645889.0, 77727.0, 18850.0, 7278.0, 3588.0, 1938.0, 1134.0, 680.0, 453.0, 282.0, 191.0, 155.0, 98.0, 71.0, 56.0, 44.0, 30.0, 17.0, 16.0, 2.0, 10.0, 4.0, 5.0, 3.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.091796875, -2.022491455078125, -1.95318603515625, -1.883880615234375, -1.8145751953125, -1.745269775390625, -1.67596435546875, -1.606658935546875, -1.537353515625, -1.468048095703125, -1.39874267578125, -1.329437255859375, -1.2601318359375, -1.190826416015625, -1.12152099609375, -1.052215576171875, -0.98291015625, -0.913604736328125, -0.84429931640625, -0.774993896484375, -0.7056884765625, -0.636383056640625, -0.56707763671875, -0.497772216796875, -0.428466796875, -0.359161376953125, -0.28985595703125, -0.220550537109375, -0.1512451171875, -0.081939697265625, -0.01263427734375, 0.056671142578125, 0.1259765625, 0.195281982421875, 0.26458740234375, 0.333892822265625, 0.4031982421875, 0.472503662109375, 0.54180908203125, 0.611114501953125, 0.680419921875, 0.749725341796875, 0.81903076171875, 0.888336181640625, 0.9576416015625, 1.026947021484375, 1.09625244140625, 1.165557861328125, 1.23486328125, 1.304168701171875, 1.37347412109375, 1.442779541015625, 1.5120849609375, 1.581390380859375, 1.65069580078125, 1.720001220703125, 1.789306640625, 1.858612060546875, 1.92791748046875, 1.997222900390625, 2.0665283203125, 2.135833740234375, 2.20513916015625, 2.274444580078125, 2.34375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 8.0, 9.0, 15.0, 15.0, 30.0, 73.0, 114.0, 399.0, 2989.0, 211.0, 93.0, 32.0, 24.0, 12.0, 10.0, 9.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.781951904296875, -0.75775146484375, -0.733551025390625, -0.7093505859375, -0.685150146484375, -0.66094970703125, -0.636749267578125, -0.612548828125, -0.588348388671875, -0.56414794921875, -0.539947509765625, -0.5157470703125, -0.491546630859375, -0.46734619140625, -0.443145751953125, -0.4189453125, -0.394744873046875, -0.37054443359375, -0.346343994140625, -0.3221435546875, -0.297943115234375, -0.27374267578125, -0.249542236328125, -0.225341796875, -0.201141357421875, -0.17694091796875, -0.152740478515625, -0.1285400390625, -0.104339599609375, -0.08013916015625, -0.055938720703125, -0.03173828125, -0.007537841796875, 0.01666259765625, 0.040863037109375, 0.0650634765625, 0.089263916015625, 0.11346435546875, 0.137664794921875, 0.161865234375, 0.186065673828125, 0.21026611328125, 0.234466552734375, 0.2586669921875, 0.282867431640625, 0.30706787109375, 0.331268310546875, 0.35546875, 0.379669189453125, 0.40386962890625, 0.428070068359375, 0.4522705078125, 0.476470947265625, 0.50067138671875, 0.524871826171875, 0.549072265625, 0.573272705078125, 0.59747314453125, 0.621673583984375, 0.6458740234375, 0.670074462890625, 0.69427490234375, 0.718475341796875, 0.74267578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 11.0, 16.0, 40.0, 71.0, 124.0, 184.0, 219.0, 166.0, 100.0, 41.0, 20.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.143086910247803, -5.97553014755249, -5.8079729080200195, -5.640416145324707, -5.4728593826293945, -5.305302619934082, -5.137745380401611, -4.970188617706299, -4.802631378173828, -4.635074615478516, -4.467517375946045, -4.299960613250732, -4.13240385055542, -3.9648468494415283, -3.7972898483276367, -3.629733085632324, -3.4621763229370117, -3.29461932182312, -3.1270625591278076, -2.959505558013916, -2.7919487953186035, -2.624391794204712, -2.4568347930908203, -2.289278030395508, -2.121721029281616, -1.9541641473770142, -1.786607265472412, -1.6190502643585205, -1.4514933824539185, -1.2839365005493164, -1.1163794994354248, -0.9488226175308228, -0.7812662124633789, -0.6137093305587769, -0.44615238904953003, -0.2785954475402832, -0.11103856563568115, 0.0565183162689209, 0.2240753173828125, 0.39163219928741455, 0.5591890811920166, 0.7267459630966187, 0.8943029046058655, 1.0618598461151123, 1.2294167280197144, 1.3969736099243164, 1.564530611038208, 1.73208749294281, 1.899644374847412, 2.0672013759613037, 2.234758138656616, 2.402315139770508, 2.5698719024658203, 2.737428903579712, 2.9049859046936035, 3.072542667388916, 3.2400996685028076, 3.407656669616699, 3.5752134323120117, 3.7427704334259033, 3.910327434539795, 4.077884197235107, 4.245441436767578, 4.412998199462891, 4.580554962158203]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 7.0, 7.0, 6.0, 8.0, 13.0, 17.0, 19.0, 25.0, 20.0, 35.0, 16.0, 29.0, 22.0, 43.0, 42.0, 36.0, 44.0, 34.0, 47.0, 35.0, 38.0, 40.0, 44.0, 40.0, 37.0, 34.0, 36.0, 35.0, 25.0, 22.0, 25.0, 26.0, 17.0, 15.0, 6.0, 6.0, 15.0, 7.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7347486019134521, -1.6803596019744873, -1.625970482826233, -1.571581482887268, -1.5171924829483032, -1.4628033638000488, -1.408414363861084, -1.3540253639221191, -1.2996362447738647, -1.2452472448349, -1.1908581256866455, -1.1364691257476807, -1.0820801258087158, -1.0276910066604614, -0.9733020067214966, -0.918912947177887, -0.8645239472389221, -0.8101348876953125, -0.7557458877563477, -0.701356828212738, -0.6469677686691284, -0.5925787687301636, -0.538189709186554, -0.48380064964294434, -0.4294116199016571, -0.3750225901603699, -0.32063353061676025, -0.266244500875473, -0.2118554562330246, -0.15746641159057617, -0.10307738184928894, -0.04868832230567932, 0.00570070743560791, 0.06008974835276604, 0.11447878926992416, 0.168867826461792, 0.22325687110424042, 0.27764591574668884, 0.3320349454879761, 0.3864240050315857, 0.4408130347728729, 0.49520206451416016, 0.5495911240577698, 0.6039801836013794, 0.6583691835403442, 0.7127582430839539, 0.7671473026275635, 0.8215363025665283, 0.8759253621101379, 0.9303144216537476, 0.9847034215927124, 1.0390925407409668, 1.0934815406799316, 1.1478705406188965, 1.2022595405578613, 1.2566486597061157, 1.3110376596450806, 1.3654266595840454, 1.4198157787322998, 1.4742047786712646, 1.5285937786102295, 1.5829828977584839, 1.6373718976974487, 1.6917610168457031, 1.746150016784668]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 4.0, 1.0, 3.0, 11.0, 9.0, 9.0, 13.0, 15.0, 27.0, 24.0, 40.0, 54.0, 66.0, 97.0, 173.0, 251.0, 406.0, 632.0, 1002.0, 1812.0, 3397.0, 6663.0, 13731.0, 31133.0, 73371.0, 165301.0, 273988.0, 244627.0, 129512.0, 55642.0, 23677.0, 10920.0, 5296.0, 2744.0, 1458.0, 859.0, 528.0, 338.0, 225.0, 141.0, 95.0, 68.0, 58.0, 50.0, 27.0, 17.0, 13.0, 10.0, 8.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6708984375, -1.6167144775390625, -1.562530517578125, -1.5083465576171875, -1.45416259765625, -1.3999786376953125, -1.345794677734375, -1.2916107177734375, -1.2374267578125, -1.1832427978515625, -1.129058837890625, -1.0748748779296875, -1.02069091796875, -0.9665069580078125, -0.912322998046875, -0.8581390380859375, -0.803955078125, -0.7497711181640625, -0.695587158203125, -0.6414031982421875, -0.58721923828125, -0.5330352783203125, -0.478851318359375, -0.4246673583984375, -0.3704833984375, -0.3162994384765625, -0.262115478515625, -0.2079315185546875, -0.15374755859375, -0.0995635986328125, -0.045379638671875, 0.0088043212890625, 0.06298828125, 0.1171722412109375, 0.171356201171875, 0.2255401611328125, 0.27972412109375, 0.3339080810546875, 0.388092041015625, 0.4422760009765625, 0.4964599609375, 0.5506439208984375, 0.604827880859375, 0.6590118408203125, 0.71319580078125, 0.7673797607421875, 0.821563720703125, 0.8757476806640625, 0.929931640625, 0.9841156005859375, 1.038299560546875, 1.0924835205078125, 1.14666748046875, 1.2008514404296875, 1.255035400390625, 1.3092193603515625, 1.3634033203125, 1.4175872802734375, 1.471771240234375, 1.5259552001953125, 1.58013916015625, 1.6343231201171875, 1.688507080078125, 1.7426910400390625, 1.796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 7.0, 10.0, 12.0, 22.0, 10.0, 24.0, 30.0, 30.0, 32.0, 43.0, 31.0, 50.0, 50.0, 60.0, 50.0, 55.0, 60.0, 42.0, 43.0, 45.0, 45.0, 45.0, 36.0, 35.0, 32.0, 19.0, 14.0, 12.0, 13.0, 11.0, 8.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.8251953125, -0.8025283813476562, -0.7798614501953125, -0.7571945190429688, -0.734527587890625, -0.7118606567382812, -0.6891937255859375, -0.6665267944335938, -0.64385986328125, -0.6211929321289062, -0.5985260009765625, -0.5758590698242188, -0.553192138671875, -0.5305252075195312, -0.5078582763671875, -0.48519134521484375, -0.4625244140625, -0.43985748291015625, -0.4171905517578125, -0.39452362060546875, -0.371856689453125, -0.34918975830078125, -0.3265228271484375, -0.30385589599609375, -0.28118896484375, -0.25852203369140625, -0.2358551025390625, -0.21318817138671875, -0.190521240234375, -0.16785430908203125, -0.1451873779296875, -0.12252044677734375, -0.099853515625, -0.07718658447265625, -0.0545196533203125, -0.03185272216796875, -0.009185791015625, 0.01348114013671875, 0.0361480712890625, 0.05881500244140625, 0.08148193359375, 0.10414886474609375, 0.1268157958984375, 0.14948272705078125, 0.172149658203125, 0.19481658935546875, 0.2174835205078125, 0.24015045166015625, 0.2628173828125, 0.28548431396484375, 0.3081512451171875, 0.33081817626953125, 0.353485107421875, 0.37615203857421875, 0.3988189697265625, 0.42148590087890625, 0.44415283203125, 0.46681976318359375, 0.4894866943359375, 0.5121536254882812, 0.534820556640625, 0.5574874877929688, 0.5801544189453125, 0.6028213500976562, 0.62548828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 9.0, 19.0, 23.0, 22.0, 38.0, 66.0, 100.0, 115.0, 172.0, 266.0, 365.0, 602.0, 1085.0, 3060.0, 22592.0, 625591.0, 375131.0, 14197.0, 2469.0, 1024.0, 523.0, 322.0, 207.0, 146.0, 112.0, 75.0, 54.0, 43.0, 31.0, 31.0, 16.0, 7.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.46484375, -6.2796630859375, -6.094482421875, -5.9093017578125, -5.72412109375, -5.5389404296875, -5.353759765625, -5.1685791015625, -4.9833984375, -4.7982177734375, -4.613037109375, -4.4278564453125, -4.24267578125, -4.0574951171875, -3.872314453125, -3.6871337890625, -3.501953125, -3.3167724609375, -3.131591796875, -2.9464111328125, -2.76123046875, -2.5760498046875, -2.390869140625, -2.2056884765625, -2.0205078125, -1.8353271484375, -1.650146484375, -1.4649658203125, -1.27978515625, -1.0946044921875, -0.909423828125, -0.7242431640625, -0.5390625, -0.3538818359375, -0.168701171875, 0.0164794921875, 0.20166015625, 0.3868408203125, 0.572021484375, 0.7572021484375, 0.9423828125, 1.1275634765625, 1.312744140625, 1.4979248046875, 1.68310546875, 1.8682861328125, 2.053466796875, 2.2386474609375, 2.423828125, 2.6090087890625, 2.794189453125, 2.9793701171875, 3.16455078125, 3.3497314453125, 3.534912109375, 3.7200927734375, 3.9052734375, 4.0904541015625, 4.275634765625, 4.4608154296875, 4.64599609375, 4.8311767578125, 5.016357421875, 5.2015380859375, 5.38671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 10.0, 8.0, 11.0, 15.0, 16.0, 24.0, 19.0, 20.0, 25.0, 31.0, 41.0, 37.0, 35.0, 44.0, 39.0, 30.0, 34.0, 50.0, 54.0, 44.0, 47.0, 41.0, 33.0, 41.0, 46.0, 31.0, 35.0, 20.0, 17.0, 15.0, 16.0, 14.0, 9.0, 6.0, 8.0, 6.0, 4.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.30755615234375, -2.2225341796875, -2.13751220703125, -2.052490234375, -1.96746826171875, -1.8824462890625, -1.79742431640625, -1.71240234375, -1.62738037109375, -1.5423583984375, -1.45733642578125, -1.372314453125, -1.28729248046875, -1.2022705078125, -1.11724853515625, -1.0322265625, -0.94720458984375, -0.8621826171875, -0.77716064453125, -0.692138671875, -0.60711669921875, -0.5220947265625, -0.43707275390625, -0.35205078125, -0.26702880859375, -0.1820068359375, -0.09698486328125, -0.011962890625, 0.07305908203125, 0.1580810546875, 0.24310302734375, 0.328125, 0.41314697265625, 0.4981689453125, 0.58319091796875, 0.668212890625, 0.75323486328125, 0.8382568359375, 0.92327880859375, 1.00830078125, 1.09332275390625, 1.1783447265625, 1.26336669921875, 1.348388671875, 1.43341064453125, 1.5184326171875, 1.60345458984375, 1.6884765625, 1.77349853515625, 1.8585205078125, 1.94354248046875, 2.028564453125, 2.11358642578125, 2.1986083984375, 2.28363037109375, 2.36865234375, 2.45367431640625, 2.5386962890625, 2.62371826171875, 2.708740234375, 2.79376220703125, 2.8787841796875, 2.96380615234375, 3.048828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 11.0, 10.0, 25.0, 19.0, 36.0, 44.0, 74.0, 81.0, 122.0, 204.0, 365.0, 733.0, 1829.0, 6037.0, 34443.0, 402963.0, 544851.0, 45298.0, 7429.0, 2063.0, 787.0, 415.0, 204.0, 152.0, 81.0, 76.0, 53.0, 33.0, 19.0, 20.0, 10.0, 9.0, 5.0, 8.0, 9.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.9306640625, -1.8685150146484375, -1.806365966796875, -1.7442169189453125, -1.68206787109375, -1.6199188232421875, -1.557769775390625, -1.4956207275390625, -1.4334716796875, -1.3713226318359375, -1.309173583984375, -1.2470245361328125, -1.18487548828125, -1.1227264404296875, -1.060577392578125, -0.9984283447265625, -0.936279296875, -0.8741302490234375, -0.811981201171875, -0.7498321533203125, -0.68768310546875, -0.6255340576171875, -0.563385009765625, -0.5012359619140625, -0.4390869140625, -0.3769378662109375, -0.314788818359375, -0.2526397705078125, -0.19049072265625, -0.1283416748046875, -0.066192626953125, -0.0040435791015625, 0.05810546875, 0.1202545166015625, 0.182403564453125, 0.2445526123046875, 0.30670166015625, 0.3688507080078125, 0.430999755859375, 0.4931488037109375, 0.5552978515625, 0.6174468994140625, 0.679595947265625, 0.7417449951171875, 0.80389404296875, 0.8660430908203125, 0.928192138671875, 0.9903411865234375, 1.052490234375, 1.1146392822265625, 1.176788330078125, 1.2389373779296875, 1.30108642578125, 1.3632354736328125, 1.425384521484375, 1.4875335693359375, 1.5496826171875, 1.6118316650390625, 1.673980712890625, 1.7361297607421875, 1.79827880859375, 1.8604278564453125, 1.922576904296875, 1.9847259521484375, 2.046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 10.0, 11.0, 16.0, 33.0, 38.0, 47.0, 72.0, 94.0, 98.0, 120.0, 105.0, 86.0, 74.0, 64.0, 35.0, 22.0, 11.0, 13.0, 12.0, 6.0, 9.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000186920166015625, -0.00017854943871498108, -0.00017017871141433716, -0.00016180798411369324, -0.00015343725681304932, -0.0001450665295124054, -0.00013669580221176147, -0.00012832507491111755, -0.00011995434761047363, -0.00011158362030982971, -0.00010321289300918579, -9.484216570854187e-05, -8.647143840789795e-05, -7.810071110725403e-05, -6.972998380661011e-05, -6.135925650596619e-05, -5.2988529205322266e-05, -4.4617801904678345e-05, -3.6247074604034424e-05, -2.7876347303390503e-05, -1.9505620002746582e-05, -1.1134892702102661e-05, -2.7641654014587402e-06, 5.606561899185181e-06, 1.3977289199829102e-05, 2.2348016500473022e-05, 3.071874380111694e-05, 3.9089471101760864e-05, 4.7460198402404785e-05, 5.5830925703048706e-05, 6.420165300369263e-05, 7.257238030433655e-05, 8.094310760498047e-05, 8.931383490562439e-05, 9.768456220626831e-05, 0.00010605528950691223, 0.00011442601680755615, 0.00012279674410820007, 0.000131167471408844, 0.00013953819870948792, 0.00014790892601013184, 0.00015627965331077576, 0.00016465038061141968, 0.0001730211079120636, 0.00018139183521270752, 0.00018976256251335144, 0.00019813328981399536, 0.00020650401711463928, 0.0002148747444152832, 0.00022324547171592712, 0.00023161619901657104, 0.00023998692631721497, 0.0002483576536178589, 0.0002567283809185028, 0.00026509910821914673, 0.00027346983551979065, 0.00028184056282043457, 0.0002902112901210785, 0.0002985820174217224, 0.00030695274472236633, 0.00031532347202301025, 0.0003236941993236542, 0.0003320649266242981, 0.000340435653924942, 0.00034880638122558594]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 4.0, 8.0, 7.0, 16.0, 15.0, 14.0, 32.0, 47.0, 56.0, 97.0, 141.0, 240.0, 465.0, 849.0, 2152.0, 6704.0, 34801.0, 457532.0, 497345.0, 36684.0, 7046.0, 2205.0, 872.0, 485.0, 235.0, 157.0, 102.0, 60.0, 50.0, 33.0, 24.0, 18.0, 8.0, 7.0, 4.0, 7.0, 1.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.16796875, -2.100250244140625, -2.03253173828125, -1.964813232421875, -1.8970947265625, -1.829376220703125, -1.76165771484375, -1.693939208984375, -1.626220703125, -1.558502197265625, -1.49078369140625, -1.423065185546875, -1.3553466796875, -1.287628173828125, -1.21990966796875, -1.152191162109375, -1.08447265625, -1.016754150390625, -0.94903564453125, -0.881317138671875, -0.8135986328125, -0.745880126953125, -0.67816162109375, -0.610443115234375, -0.542724609375, -0.475006103515625, -0.40728759765625, -0.339569091796875, -0.2718505859375, -0.204132080078125, -0.13641357421875, -0.068695068359375, -0.0009765625, 0.066741943359375, 0.13446044921875, 0.202178955078125, 0.2698974609375, 0.337615966796875, 0.40533447265625, 0.473052978515625, 0.540771484375, 0.608489990234375, 0.67620849609375, 0.743927001953125, 0.8116455078125, 0.879364013671875, 0.94708251953125, 1.014801025390625, 1.08251953125, 1.150238037109375, 1.21795654296875, 1.285675048828125, 1.3533935546875, 1.421112060546875, 1.48883056640625, 1.556549072265625, 1.624267578125, 1.691986083984375, 1.75970458984375, 1.827423095703125, 1.8951416015625, 1.962860107421875, 2.03057861328125, 2.098297119140625, 2.166015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 1.0, 10.0, 16.0, 24.0, 45.0, 59.0, 105.0, 102.0, 125.0, 110.0, 103.0, 74.0, 51.0, 39.0, 34.0, 20.0, 13.0, 4.0, 6.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.10009765625, -2.0361328125, -1.97216796875, -1.908203125, -1.84423828125, -1.7802734375, -1.71630859375, -1.65234375, -1.58837890625, -1.5244140625, -1.46044921875, -1.396484375, -1.33251953125, -1.2685546875, -1.20458984375, -1.140625, -1.07666015625, -1.0126953125, -0.94873046875, -0.884765625, -0.82080078125, -0.7568359375, -0.69287109375, -0.62890625, -0.56494140625, -0.5009765625, -0.43701171875, -0.373046875, -0.30908203125, -0.2451171875, -0.18115234375, -0.1171875, -0.05322265625, 0.0107421875, 0.07470703125, 0.138671875, 0.20263671875, 0.2666015625, 0.33056640625, 0.39453125, 0.45849609375, 0.5224609375, 0.58642578125, 0.650390625, 0.71435546875, 0.7783203125, 0.84228515625, 0.90625, 0.97021484375, 1.0341796875, 1.09814453125, 1.162109375, 1.22607421875, 1.2900390625, 1.35400390625, 1.41796875, 1.48193359375, 1.5458984375, 1.60986328125, 1.673828125, 1.73779296875, 1.8017578125, 1.86572265625, 1.9296875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 14.0, 15.0, 22.0, 30.0, 38.0, 55.0, 73.0, 93.0, 117.0, 116.0, 103.0, 104.0, 58.0, 44.0, 32.0, 19.0, 18.0, 10.0, 4.0, 9.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.40669059753418, -15.849669456481934, -15.292649269104004, -14.735628128051758, -14.178607940673828, -13.621586799621582, -13.064565658569336, -12.507545471191406, -11.950525283813477, -11.39350414276123, -10.8364839553833, -10.279462814331055, -9.722442626953125, -9.165421485900879, -8.608400344848633, -8.051380157470703, -7.494359016418457, -6.937338352203369, -6.380317687988281, -5.823296546936035, -5.2662763595581055, -4.709255218505859, -4.1522345542907715, -3.5952138900756836, -3.0381932258605957, -2.481172561645508, -1.9241517782211304, -1.367130994796753, -0.810110330581665, -0.25308966636657715, 0.30393123626708984, 0.8609519004821777, 1.4179725646972656, 1.9749932289123535, 2.5320138931274414, 3.0890347957611084, 3.6460554599761963, 4.203076362609863, 4.760097026824951, 5.317117691040039, 5.874138355255127, 6.431159019470215, 6.988179683685303, 7.545200347900391, 8.102221488952637, 8.659241676330566, 9.216262817382812, 9.773283004760742, 10.330304145812988, 10.887325286865234, 11.444345474243164, 12.00136661529541, 12.55838680267334, 13.115407943725586, 13.672428131103516, 14.229449272155762, 14.786470413208008, 15.343491554260254, 15.900511741638184, 16.45753288269043, 17.01455307006836, 17.57157325744629, 18.12859535217285, 18.68561553955078, 19.24263572692871]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 11.0, 11.0, 15.0, 19.0, 19.0, 15.0, 31.0, 29.0, 40.0, 42.0, 39.0, 44.0, 45.0, 50.0, 45.0, 46.0, 47.0, 49.0, 44.0, 45.0, 36.0, 40.0, 47.0, 27.0, 18.0, 23.0, 27.0, 11.0, 16.0, 13.0, 13.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.54494857788086, -14.098066329956055, -13.65118408203125, -13.204301834106445, -12.75741958618164, -12.310537338256836, -11.863655090332031, -11.416772842407227, -10.969890594482422, -10.523008346557617, -10.076126098632812, -9.629243850708008, -9.182361602783203, -8.735479354858398, -8.288597106933594, -7.841714382171631, -7.394831657409668, -6.947949409484863, -6.501067161560059, -6.054184913635254, -5.607302665710449, -5.1604204177856445, -4.713537693023682, -4.266655445098877, -3.8197731971740723, -3.3728909492492676, -2.926008701324463, -2.479126214981079, -2.0322439670562744, -1.5853617191314697, -1.138479232788086, -0.6915969848632812, -0.24471378326416016, 0.2021685242652893, 0.6490508317947388, 1.095933198928833, 1.5428154468536377, 1.9896976947784424, 2.436580181121826, 2.883462429046631, 3.3303446769714355, 3.7772269248962402, 4.224109172821045, 4.670991897583008, 5.1178741455078125, 5.564756393432617, 6.011638641357422, 6.458520889282227, 6.905403137207031, 7.352285385131836, 7.799167633056641, 8.246049880981445, 8.69293212890625, 9.139814376831055, 9.58669662475586, 10.033578872680664, 10.480461120605469, 10.927343368530273, 11.374225616455078, 11.821107864379883, 12.267990112304688, 12.714872360229492, 13.161754608154297, 13.608636856079102, 14.055520057678223]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 17.0, 22.0, 43.0, 55.0, 88.0, 134.0, 247.0, 551.0, 2223.0, 41773.0, 4139690.0, 7361.0, 1144.0, 384.0, 229.0, 99.0, 54.0, 40.0, 30.0, 13.0, 11.0, 9.0, 12.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.390625, -13.0496826171875, -12.708740234375, -12.3677978515625, -12.02685546875, -11.6859130859375, -11.344970703125, -11.0040283203125, -10.6630859375, -10.3221435546875, -9.981201171875, -9.6402587890625, -9.29931640625, -8.9583740234375, -8.617431640625, -8.2764892578125, -7.935546875, -7.5946044921875, -7.253662109375, -6.9127197265625, -6.57177734375, -6.2308349609375, -5.889892578125, -5.5489501953125, -5.2080078125, -4.8670654296875, -4.526123046875, -4.1851806640625, -3.84423828125, -3.5032958984375, -3.162353515625, -2.8214111328125, -2.48046875, -2.1395263671875, -1.798583984375, -1.4576416015625, -1.11669921875, -0.7757568359375, -0.434814453125, -0.0938720703125, 0.2470703125, 0.5880126953125, 0.928955078125, 1.2698974609375, 1.61083984375, 1.9517822265625, 2.292724609375, 2.6336669921875, 2.974609375, 3.3155517578125, 3.656494140625, 3.9974365234375, 4.33837890625, 4.6793212890625, 5.020263671875, 5.3612060546875, 5.7021484375, 6.0430908203125, 6.384033203125, 6.7249755859375, 7.06591796875, 7.4068603515625, 7.747802734375, 8.0887451171875, 8.4296875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 2.0, 8.0, 10.0, 15.0, 15.0, 30.0, 26.0, 23.0, 55.0, 42.0, 57.0, 46.0, 70.0, 62.0, 64.0, 63.0, 60.0, 50.0, 40.0, 41.0, 42.0, 34.0, 30.0, 26.0, 19.0, 14.0, 16.0, 7.0, 7.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83740234375, -0.8100433349609375, -0.782684326171875, -0.7553253173828125, -0.72796630859375, -0.7006072998046875, -0.673248291015625, -0.6458892822265625, -0.6185302734375, -0.5911712646484375, -0.563812255859375, -0.5364532470703125, -0.50909423828125, -0.4817352294921875, -0.454376220703125, -0.4270172119140625, -0.399658203125, -0.3722991943359375, -0.344940185546875, -0.3175811767578125, -0.29022216796875, -0.2628631591796875, -0.235504150390625, -0.2081451416015625, -0.1807861328125, -0.1534271240234375, -0.126068115234375, -0.0987091064453125, -0.07135009765625, -0.0439910888671875, -0.016632080078125, 0.0107269287109375, 0.0380859375, 0.0654449462890625, 0.092803955078125, 0.1201629638671875, 0.14752197265625, 0.1748809814453125, 0.202239990234375, 0.2295989990234375, 0.2569580078125, 0.2843170166015625, 0.311676025390625, 0.3390350341796875, 0.36639404296875, 0.3937530517578125, 0.421112060546875, 0.4484710693359375, 0.475830078125, 0.5031890869140625, 0.530548095703125, 0.5579071044921875, 0.58526611328125, 0.6126251220703125, 0.639984130859375, 0.6673431396484375, 0.6947021484375, 0.7220611572265625, 0.749420166015625, 0.7767791748046875, 0.80413818359375, 0.8314971923828125, 0.858856201171875, 0.8862152099609375, 0.91357421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 5.0, 3.0, 14.0, 18.0, 22.0, 31.0, 53.0, 66.0, 91.0, 115.0, 181.0, 346.0, 620.0, 1110.0, 2436.0, 6118.0, 21587.0, 257002.0, 3853134.0, 36748.0, 8336.0, 3110.0, 1360.0, 702.0, 372.0, 223.0, 161.0, 78.0, 60.0, 50.0, 40.0, 20.0, 20.0, 8.0, 13.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.4915771484375, -2.403076171875, -2.3145751953125, -2.22607421875, -2.1375732421875, -2.049072265625, -1.9605712890625, -1.8720703125, -1.7835693359375, -1.695068359375, -1.6065673828125, -1.51806640625, -1.4295654296875, -1.341064453125, -1.2525634765625, -1.1640625, -1.0755615234375, -0.987060546875, -0.8985595703125, -0.81005859375, -0.7215576171875, -0.633056640625, -0.5445556640625, -0.4560546875, -0.3675537109375, -0.279052734375, -0.1905517578125, -0.10205078125, -0.0135498046875, 0.074951171875, 0.1634521484375, 0.251953125, 0.3404541015625, 0.428955078125, 0.5174560546875, 0.60595703125, 0.6944580078125, 0.782958984375, 0.8714599609375, 0.9599609375, 1.0484619140625, 1.136962890625, 1.2254638671875, 1.31396484375, 1.4024658203125, 1.490966796875, 1.5794677734375, 1.66796875, 1.7564697265625, 1.844970703125, 1.9334716796875, 2.02197265625, 2.1104736328125, 2.198974609375, 2.2874755859375, 2.3759765625, 2.4644775390625, 2.552978515625, 2.6414794921875, 2.72998046875, 2.8184814453125, 2.906982421875, 2.9954833984375, 3.083984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 25.0, 55.0, 146.0, 3173.0, 455.0, 102.0, 36.0, 14.0, 6.0, 5.0, 7.0, 2.0, 3.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.0783615112304688, -1.0532073974609375, -1.0280532836914062, -1.002899169921875, -0.9777450561523438, -0.9525909423828125, -0.9274368286132812, -0.90228271484375, -0.8771286010742188, -0.8519744873046875, -0.8268203735351562, -0.801666259765625, -0.7765121459960938, -0.7513580322265625, -0.7262039184570312, -0.7010498046875, -0.6758956909179688, -0.6507415771484375, -0.6255874633789062, -0.600433349609375, -0.5752792358398438, -0.5501251220703125, -0.5249710083007812, -0.49981689453125, -0.47466278076171875, -0.4495086669921875, -0.42435455322265625, -0.399200439453125, -0.37404632568359375, -0.3488922119140625, -0.32373809814453125, -0.298583984375, -0.27342987060546875, -0.2482757568359375, -0.22312164306640625, -0.197967529296875, -0.17281341552734375, -0.1476593017578125, -0.12250518798828125, -0.09735107421875, -0.07219696044921875, -0.0470428466796875, -0.02188873291015625, 0.003265380859375, 0.02841949462890625, 0.0535736083984375, 0.07872772216796875, 0.1038818359375, 0.12903594970703125, 0.1541900634765625, 0.17934417724609375, 0.204498291015625, 0.22965240478515625, 0.2548065185546875, 0.27996063232421875, 0.30511474609375, 0.33026885986328125, 0.3554229736328125, 0.38057708740234375, 0.405731201171875, 0.43088531494140625, 0.4560394287109375, 0.48119354248046875, 0.50634765625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 9.0, 10.0, 20.0, 26.0, 49.0, 84.0, 118.0, 163.0, 151.0, 137.0, 111.0, 45.0, 31.0, 18.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039318323135376, -2.9488184452056885, -2.85831880569458, -2.7678189277648926, -2.677319049835205, -2.5868191719055176, -2.496319532394409, -2.4058196544647217, -2.315319776535034, -2.2248198986053467, -2.1343202590942383, -2.043820381164551, -1.9533205032348633, -1.8628207445144653, -1.7723209857940674, -1.6818211078643799, -1.591321349143982, -1.500821590423584, -1.4103217124938965, -1.3198219537734985, -1.229322075843811, -1.138822317123413, -1.0483224391937256, -0.9578226804733276, -0.8673228621482849, -0.7768230438232422, -0.6863232254981995, -0.5958234071731567, -0.5053236484527588, -0.4148238003253937, -0.32432401180267334, -0.23382419347763062, -0.1433243751525879, -0.05282456427812576, 0.037675246596336365, 0.1281750500202179, 0.21867486834526062, 0.30917468667030334, 0.3996744751930237, 0.4901742935180664, 0.5806741118431091, 0.6711739301681519, 0.7616737484931946, 0.8521735668182373, 0.9426733255386353, 1.0331732034683228, 1.1236729621887207, 1.2141728401184082, 1.3046725988388062, 1.395172357559204, 1.4856722354888916, 1.5761719942092896, 1.666671872138977, 1.757171630859375, 1.8476715087890625, 1.9381712675094604, 2.0286710262298584, 2.119170904159546, 2.2096705436706543, 2.300170421600342, 2.3906702995300293, 2.481170177459717, 2.571669816970825, 2.6621696949005127, 2.7526695728302]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 10.0, 11.0, 9.0, 14.0, 7.0, 24.0, 22.0, 32.0, 29.0, 32.0, 33.0, 40.0, 52.0, 51.0, 44.0, 64.0, 47.0, 44.0, 63.0, 46.0, 42.0, 31.0, 33.0, 28.0, 37.0, 36.0, 23.0, 32.0, 18.0, 12.0, 6.0, 4.0, 2.0, 5.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.798314094543457, -1.747164011001587, -1.6960139274597168, -1.6448638439178467, -1.5937137603759766, -1.5425636768341064, -1.4914137125015259, -1.4402636289596558, -1.3891135454177856, -1.3379634618759155, -1.2868133783340454, -1.2356632947921753, -1.1845133304595947, -1.1333632469177246, -1.0822131633758545, -1.0310630798339844, -0.9799129962921143, -0.9287629127502441, -0.877612829208374, -0.8264628052711487, -0.7753127217292786, -0.7241626381874084, -0.6730126142501831, -0.621862530708313, -0.5707124471664429, -0.5195623636245728, -0.468412309885025, -0.4172622561454773, -0.3661121726036072, -0.31496208906173706, -0.26381203532218933, -0.2126619815826416, -0.16151189804077148, -0.11036182940006256, -0.05921176075935364, -0.008061692118644714, 0.04308837652206421, 0.09423846006393433, 0.14538851380348206, 0.19653856754302979, 0.2476886510848999, 0.29883873462677, 0.34998878836631775, 0.4011388421058655, 0.4522889256477356, 0.5034390091896057, 0.554589033126831, 0.6057391166687012, 0.6568892002105713, 0.7080392837524414, 0.7591893672943115, 0.8103393912315369, 0.861489474773407, 0.9126395583152771, 0.9637895822525024, 1.0149396657943726, 1.0660897493362427, 1.1172398328781128, 1.168389916419983, 1.219539999961853, 1.2706899642944336, 1.3218400478363037, 1.3729901313781738, 1.424140214920044, 1.475290298461914]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 8.0, 5.0, 13.0, 19.0, 31.0, 55.0, 69.0, 139.0, 266.0, 561.0, 1141.0, 2871.0, 9184.0, 37109.0, 178648.0, 513278.0, 238060.0, 49100.0, 11849.0, 3618.0, 1334.0, 553.0, 269.0, 132.0, 91.0, 49.0, 30.0, 22.0, 10.0, 11.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.498046875, -3.404998779296875, -3.31195068359375, -3.218902587890625, -3.1258544921875, -3.032806396484375, -2.93975830078125, -2.846710205078125, -2.753662109375, -2.660614013671875, -2.56756591796875, -2.474517822265625, -2.3814697265625, -2.288421630859375, -2.19537353515625, -2.102325439453125, -2.00927734375, -1.916229248046875, -1.82318115234375, -1.730133056640625, -1.6370849609375, -1.544036865234375, -1.45098876953125, -1.357940673828125, -1.264892578125, -1.171844482421875, -1.07879638671875, -0.985748291015625, -0.8927001953125, -0.799652099609375, -0.70660400390625, -0.613555908203125, -0.5205078125, -0.427459716796875, -0.33441162109375, -0.241363525390625, -0.1483154296875, -0.055267333984375, 0.03778076171875, 0.130828857421875, 0.223876953125, 0.316925048828125, 0.40997314453125, 0.503021240234375, 0.5960693359375, 0.689117431640625, 0.78216552734375, 0.875213623046875, 0.96826171875, 1.061309814453125, 1.15435791015625, 1.247406005859375, 1.3404541015625, 1.433502197265625, 1.52655029296875, 1.619598388671875, 1.712646484375, 1.805694580078125, 1.89874267578125, 1.991790771484375, 2.0848388671875, 2.177886962890625, 2.27093505859375, 2.363983154296875, 2.45703125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 10.0, 11.0, 12.0, 19.0, 19.0, 32.0, 36.0, 32.0, 56.0, 63.0, 56.0, 58.0, 65.0, 67.0, 73.0, 57.0, 51.0, 48.0, 43.0, 37.0, 37.0, 23.0, 21.0, 14.0, 16.0, 10.0, 12.0, 9.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.826171875, -0.7950592041015625, -0.763946533203125, -0.7328338623046875, -0.70172119140625, -0.6706085205078125, -0.639495849609375, -0.6083831787109375, -0.5772705078125, -0.5461578369140625, -0.515045166015625, -0.4839324951171875, -0.45281982421875, -0.4217071533203125, -0.390594482421875, -0.3594818115234375, -0.328369140625, -0.2972564697265625, -0.266143798828125, -0.2350311279296875, -0.20391845703125, -0.1728057861328125, -0.141693115234375, -0.1105804443359375, -0.0794677734375, -0.0483551025390625, -0.017242431640625, 0.0138702392578125, 0.04498291015625, 0.0760955810546875, 0.107208251953125, 0.1383209228515625, 0.16943359375, 0.2005462646484375, 0.231658935546875, 0.2627716064453125, 0.29388427734375, 0.3249969482421875, 0.356109619140625, 0.3872222900390625, 0.4183349609375, 0.4494476318359375, 0.480560302734375, 0.5116729736328125, 0.54278564453125, 0.5738983154296875, 0.605010986328125, 0.6361236572265625, 0.667236328125, 0.6983489990234375, 0.729461669921875, 0.7605743408203125, 0.79168701171875, 0.8227996826171875, 0.853912353515625, 0.8850250244140625, 0.9161376953125, 0.9472503662109375, 0.978363037109375, 1.0094757080078125, 1.04058837890625, 1.0717010498046875, 1.102813720703125, 1.1339263916015625, 1.1650390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 11.0, 8.0, 9.0, 10.0, 30.0, 46.0, 81.0, 84.0, 114.0, 210.0, 328.0, 601.0, 1155.0, 2887.0, 25646.0, 858131.0, 149706.0, 6021.0, 1577.0, 766.0, 429.0, 257.0, 164.0, 93.0, 70.0, 49.0, 20.0, 21.0, 12.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18359375, -6.9705810546875, -6.757568359375, -6.5445556640625, -6.33154296875, -6.1185302734375, -5.905517578125, -5.6925048828125, -5.4794921875, -5.2664794921875, -5.053466796875, -4.8404541015625, -4.62744140625, -4.4144287109375, -4.201416015625, -3.9884033203125, -3.775390625, -3.5623779296875, -3.349365234375, -3.1363525390625, -2.92333984375, -2.7103271484375, -2.497314453125, -2.2843017578125, -2.0712890625, -1.8582763671875, -1.645263671875, -1.4322509765625, -1.21923828125, -1.0062255859375, -0.793212890625, -0.5802001953125, -0.3671875, -0.1541748046875, 0.058837890625, 0.2718505859375, 0.48486328125, 0.6978759765625, 0.910888671875, 1.1239013671875, 1.3369140625, 1.5499267578125, 1.762939453125, 1.9759521484375, 2.18896484375, 2.4019775390625, 2.614990234375, 2.8280029296875, 3.041015625, 3.2540283203125, 3.467041015625, 3.6800537109375, 3.89306640625, 4.1060791015625, 4.319091796875, 4.5321044921875, 4.7451171875, 4.9581298828125, 5.171142578125, 5.3841552734375, 5.59716796875, 5.8101806640625, 6.023193359375, 6.2362060546875, 6.44921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 0.0, 7.0, 7.0, 9.0, 10.0, 18.0, 25.0, 28.0, 23.0, 38.0, 46.0, 58.0, 53.0, 48.0, 89.0, 66.0, 58.0, 72.0, 60.0, 47.0, 46.0, 47.0, 38.0, 26.0, 21.0, 19.0, 14.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.11285400390625, -3.9522705078125, -3.79168701171875, -3.631103515625, -3.47052001953125, -3.3099365234375, -3.14935302734375, -2.98876953125, -2.82818603515625, -2.6676025390625, -2.50701904296875, -2.346435546875, -2.18585205078125, -2.0252685546875, -1.86468505859375, -1.7041015625, -1.54351806640625, -1.3829345703125, -1.22235107421875, -1.061767578125, -0.90118408203125, -0.7406005859375, -0.58001708984375, -0.41943359375, -0.25885009765625, -0.0982666015625, 0.06231689453125, 0.222900390625, 0.38348388671875, 0.5440673828125, 0.70465087890625, 0.865234375, 1.02581787109375, 1.1864013671875, 1.34698486328125, 1.507568359375, 1.66815185546875, 1.8287353515625, 1.98931884765625, 2.14990234375, 2.31048583984375, 2.4710693359375, 2.63165283203125, 2.792236328125, 2.95281982421875, 3.1134033203125, 3.27398681640625, 3.4345703125, 3.59515380859375, 3.7557373046875, 3.91632080078125, 4.076904296875, 4.23748779296875, 4.3980712890625, 4.55865478515625, 4.71923828125, 4.87982177734375, 5.0404052734375, 5.20098876953125, 5.361572265625, 5.52215576171875, 5.6827392578125, 5.84332275390625, 6.00390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 7.0, 19.0, 15.0, 35.0, 50.0, 57.0, 127.0, 182.0, 374.0, 1031.0, 10553.0, 974315.0, 58658.0, 1952.0, 545.0, 228.0, 130.0, 82.0, 59.0, 34.0, 22.0, 11.0, 13.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.64227294921875, -5.4642333984375, -5.28619384765625, -5.108154296875, -4.93011474609375, -4.7520751953125, -4.57403564453125, -4.39599609375, -4.21795654296875, -4.0399169921875, -3.86187744140625, -3.683837890625, -3.50579833984375, -3.3277587890625, -3.14971923828125, -2.9716796875, -2.79364013671875, -2.6156005859375, -2.43756103515625, -2.259521484375, -2.08148193359375, -1.9034423828125, -1.72540283203125, -1.54736328125, -1.36932373046875, -1.1912841796875, -1.01324462890625, -0.835205078125, -0.65716552734375, -0.4791259765625, -0.30108642578125, -0.123046875, 0.05499267578125, 0.2330322265625, 0.41107177734375, 0.589111328125, 0.76715087890625, 0.9451904296875, 1.12322998046875, 1.30126953125, 1.47930908203125, 1.6573486328125, 1.83538818359375, 2.013427734375, 2.19146728515625, 2.3695068359375, 2.54754638671875, 2.7255859375, 2.90362548828125, 3.0816650390625, 3.25970458984375, 3.437744140625, 3.61578369140625, 3.7938232421875, 3.97186279296875, 4.14990234375, 4.32794189453125, 4.5059814453125, 4.68402099609375, 4.862060546875, 5.04010009765625, 5.2181396484375, 5.39617919921875, 5.57421875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 6.0, 3.0, 11.0, 5.0, 11.0, 16.0, 20.0, 23.0, 36.0, 31.0, 58.0, 73.0, 98.0, 103.0, 115.0, 84.0, 59.0, 55.0, 39.0, 37.0, 25.0, 20.0, 10.0, 9.0, 11.0, 8.0, 4.0, 4.0, 3.0, 4.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022470951080322266, -0.0002178587019443512, -0.00021100789308547974, -0.00020415708422660828, -0.00019730627536773682, -0.00019045546650886536, -0.0001836046576499939, -0.00017675384879112244, -0.00016990303993225098, -0.00016305223107337952, -0.00015620142221450806, -0.0001493506133556366, -0.00014249980449676514, -0.00013564899563789368, -0.00012879818677902222, -0.00012194737792015076, -0.0001150965690612793, -0.00010824576020240784, -0.00010139495134353638, -9.454414248466492e-05, -8.769333362579346e-05, -8.0842524766922e-05, -7.399171590805054e-05, -6.714090704917908e-05, -6.029009819030762e-05, -5.343928933143616e-05, -4.65884804725647e-05, -3.973767161369324e-05, -3.288686275482178e-05, -2.6036053895950317e-05, -1.9185245037078857e-05, -1.2334436178207397e-05, -5.4836273193359375e-06, 1.3671815395355225e-06, 8.217990398406982e-06, 1.5068799257278442e-05, 2.1919608116149902e-05, 2.8770416975021362e-05, 3.562122583389282e-05, 4.247203469276428e-05, 4.932284355163574e-05, 5.61736524105072e-05, 6.302446126937866e-05, 6.987527012825012e-05, 7.672607898712158e-05, 8.357688784599304e-05, 9.04276967048645e-05, 9.727850556373596e-05, 0.00010412931442260742, 0.00011098012328147888, 0.00011783093214035034, 0.0001246817409992218, 0.00013153254985809326, 0.00013838335871696472, 0.00014523416757583618, 0.00015208497643470764, 0.0001589357852935791, 0.00016578659415245056, 0.00017263740301132202, 0.00017948821187019348, 0.00018633902072906494, 0.0001931898295879364, 0.00020004063844680786, 0.00020689144730567932, 0.00021374225616455078]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 12.0, 4.0, 11.0, 7.0, 20.0, 25.0, 40.0, 41.0, 72.0, 118.0, 180.0, 322.0, 794.0, 2212.0, 10675.0, 251798.0, 757432.0, 19608.0, 3113.0, 987.0, 449.0, 237.0, 140.0, 78.0, 48.0, 41.0, 25.0, 17.0, 10.0, 10.0, 9.0, 2.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.442413330078125, -3.32818603515625, -3.213958740234375, -3.0997314453125, -2.985504150390625, -2.87127685546875, -2.757049560546875, -2.642822265625, -2.528594970703125, -2.41436767578125, -2.300140380859375, -2.1859130859375, -2.071685791015625, -1.95745849609375, -1.843231201171875, -1.72900390625, -1.614776611328125, -1.50054931640625, -1.386322021484375, -1.2720947265625, -1.157867431640625, -1.04364013671875, -0.929412841796875, -0.815185546875, -0.700958251953125, -0.58673095703125, -0.472503662109375, -0.3582763671875, -0.244049072265625, -0.12982177734375, -0.015594482421875, 0.0986328125, 0.212860107421875, 0.32708740234375, 0.441314697265625, 0.5555419921875, 0.669769287109375, 0.78399658203125, 0.898223876953125, 1.012451171875, 1.126678466796875, 1.24090576171875, 1.355133056640625, 1.4693603515625, 1.583587646484375, 1.69781494140625, 1.812042236328125, 1.92626953125, 2.040496826171875, 2.15472412109375, 2.268951416015625, 2.3831787109375, 2.497406005859375, 2.61163330078125, 2.725860595703125, 2.840087890625, 2.954315185546875, 3.06854248046875, 3.182769775390625, 3.2969970703125, 3.411224365234375, 3.52545166015625, 3.639678955078125, 3.75390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 7.0, 8.0, 10.0, 28.0, 39.0, 51.0, 53.0, 94.0, 132.0, 134.0, 129.0, 71.0, 72.0, 59.0, 28.0, 20.0, 11.0, 10.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.59381103515625, -2.5079345703125, -2.42205810546875, -2.336181640625, -2.25030517578125, -2.1644287109375, -2.07855224609375, -1.99267578125, -1.90679931640625, -1.8209228515625, -1.73504638671875, -1.649169921875, -1.56329345703125, -1.4774169921875, -1.39154052734375, -1.3056640625, -1.21978759765625, -1.1339111328125, -1.04803466796875, -0.962158203125, -0.87628173828125, -0.7904052734375, -0.70452880859375, -0.61865234375, -0.53277587890625, -0.4468994140625, -0.36102294921875, -0.275146484375, -0.18927001953125, -0.1033935546875, -0.01751708984375, 0.068359375, 0.15423583984375, 0.2401123046875, 0.32598876953125, 0.411865234375, 0.49774169921875, 0.5836181640625, 0.66949462890625, 0.75537109375, 0.84124755859375, 0.9271240234375, 1.01300048828125, 1.098876953125, 1.18475341796875, 1.2706298828125, 1.35650634765625, 1.4423828125, 1.52825927734375, 1.6141357421875, 1.70001220703125, 1.785888671875, 1.87176513671875, 1.9576416015625, 2.04351806640625, 2.12939453125, 2.21527099609375, 2.3011474609375, 2.38702392578125, 2.472900390625, 2.55877685546875, 2.6446533203125, 2.73052978515625, 2.81640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 28.0, 142.0, 433.0, 325.0, 60.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.46310424804688, -102.12818908691406, -99.79326629638672, -97.45834350585938, -95.12342834472656, -92.78851318359375, -90.4535903930664, -88.11866760253906, -85.78375244140625, -83.44883728027344, -81.1139144897461, -78.77899169921875, -76.44407653808594, -74.10916137695312, -71.77423858642578, -69.43931579589844, -67.10440063476562, -64.76948547363281, -62.43456268310547, -60.09964370727539, -57.76472473144531, -55.429805755615234, -53.094886779785156, -50.75996780395508, -48.425048828125, -46.09012985229492, -43.755210876464844, -41.420291900634766, -39.08537292480469, -36.75045394897461, -34.41553497314453, -32.08061599731445, -29.745704650878906, -27.410785675048828, -25.07586669921875, -22.740947723388672, -20.406028747558594, -18.071109771728516, -15.736190795898438, -13.40127182006836, -11.066352844238281, -8.731433868408203, -6.396514892578125, -4.061595916748047, -1.7266769409179688, 0.6082420349121094, 2.9431610107421875, 5.278079986572266, 7.612998962402344, 9.947917938232422, 12.2828369140625, 14.617755889892578, 16.952674865722656, 19.287593841552734, 21.622512817382812, 23.95743179321289, 26.29235076904297, 28.627269744873047, 30.962188720703125, 33.2971076965332, 35.63202667236328, 37.96694564819336, 40.30186462402344, 42.636783599853516, 44.971702575683594]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 6.0, 4.0, 12.0, 7.0, 9.0, 11.0, 18.0, 17.0, 17.0, 21.0, 25.0, 30.0, 32.0, 35.0, 34.0, 34.0, 38.0, 43.0, 53.0, 34.0, 47.0, 45.0, 50.0, 41.0, 40.0, 38.0, 27.0, 28.0, 21.0, 25.0, 32.0, 24.0, 19.0, 9.0, 7.0, 5.0, 13.0, 11.0, 9.0, 4.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.858171463012695, -15.4027681350708, -14.947365760803223, -14.491962432861328, -14.03656005859375, -13.581156730651855, -13.125754356384277, -12.670351028442383, -12.214948654174805, -11.75954532623291, -11.304142951965332, -10.848739624023438, -10.39333724975586, -9.937933921813965, -9.482531547546387, -9.027128219604492, -8.571725845336914, -8.11632251739502, -7.660920143127441, -7.205517292022705, -6.750114440917969, -6.294711112976074, -5.839308738708496, -5.383905410766602, -4.928502082824707, -4.473099231719971, -4.017696380615234, -3.562293529510498, -3.1068906784057617, -2.6514875888824463, -2.19608473777771, -1.7406818866729736, -1.2852792739868164, -0.8298764228820801, -0.374473512172699, 0.08092939853668213, 0.5363322496414185, 0.9917352199554443, 1.4471380710601807, 1.902540922164917, 2.3579437732696533, 2.8133466243743896, 3.268749475479126, 3.7241525650024414, 4.179555416107178, 4.634958267211914, 5.09036111831665, 5.545763969421387, 6.001166820526123, 6.456569671630859, 6.911972522735596, 7.367375373840332, 7.822778224945068, 8.278181076049805, 8.7335844039917, 9.188986778259277, 9.644390106201172, 10.099793434143066, 10.555195808410645, 11.010599136352539, 11.466001510620117, 11.921404838562012, 12.37680721282959, 12.832210540771484, 13.287612915039062]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 12.0, 16.0, 24.0, 42.0, 66.0, 113.0, 169.0, 261.0, 529.0, 1086.0, 3374.0, 24605.0, 4050376.0, 103531.0, 6759.0, 1683.0, 723.0, 373.0, 191.0, 123.0, 64.0, 43.0, 27.0, 15.0, 12.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0], "bins": [-6.80859375, -6.63714599609375, -6.4656982421875, -6.29425048828125, -6.122802734375, -5.95135498046875, -5.7799072265625, -5.60845947265625, -5.43701171875, -5.26556396484375, -5.0941162109375, -4.92266845703125, -4.751220703125, -4.57977294921875, -4.4083251953125, -4.23687744140625, -4.0654296875, -3.89398193359375, -3.7225341796875, -3.55108642578125, -3.379638671875, -3.20819091796875, -3.0367431640625, -2.86529541015625, -2.69384765625, -2.52239990234375, -2.3509521484375, -2.17950439453125, -2.008056640625, -1.83660888671875, -1.6651611328125, -1.49371337890625, -1.322265625, -1.15081787109375, -0.9793701171875, -0.80792236328125, -0.636474609375, -0.46502685546875, -0.2935791015625, -0.12213134765625, 0.04931640625, 0.22076416015625, 0.3922119140625, 0.56365966796875, 0.735107421875, 0.90655517578125, 1.0780029296875, 1.24945068359375, 1.4208984375, 1.59234619140625, 1.7637939453125, 1.93524169921875, 2.106689453125, 2.27813720703125, 2.4495849609375, 2.62103271484375, 2.79248046875, 2.96392822265625, 3.1353759765625, 3.30682373046875, 3.478271484375, 3.64971923828125, 3.8211669921875, 3.99261474609375, 4.1640625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 6.0, 2.0, 6.0, 9.0, 9.0, 10.0, 17.0, 17.0, 12.0, 26.0, 37.0, 36.0, 41.0, 46.0, 51.0, 62.0, 61.0, 52.0, 41.0, 51.0, 45.0, 47.0, 61.0, 35.0, 31.0, 34.0, 36.0, 21.0, 15.0, 14.0, 16.0, 13.0, 7.0, 6.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.9150390625, -0.889007568359375, -0.86297607421875, -0.836944580078125, -0.8109130859375, -0.784881591796875, -0.75885009765625, -0.732818603515625, -0.706787109375, -0.680755615234375, -0.65472412109375, -0.628692626953125, -0.6026611328125, -0.576629638671875, -0.55059814453125, -0.524566650390625, -0.49853515625, -0.472503662109375, -0.44647216796875, -0.420440673828125, -0.3944091796875, -0.368377685546875, -0.34234619140625, -0.316314697265625, -0.290283203125, -0.264251708984375, -0.23822021484375, -0.212188720703125, -0.1861572265625, -0.160125732421875, -0.13409423828125, -0.108062744140625, -0.08203125, -0.055999755859375, -0.02996826171875, -0.003936767578125, 0.0220947265625, 0.048126220703125, 0.07415771484375, 0.100189208984375, 0.126220703125, 0.152252197265625, 0.17828369140625, 0.204315185546875, 0.2303466796875, 0.256378173828125, 0.28240966796875, 0.308441162109375, 0.33447265625, 0.360504150390625, 0.38653564453125, 0.412567138671875, 0.4385986328125, 0.464630126953125, 0.49066162109375, 0.516693115234375, 0.542724609375, 0.568756103515625, 0.59478759765625, 0.620819091796875, 0.6468505859375, 0.672882080078125, 0.69891357421875, 0.724945068359375, 0.7509765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 10.0, 7.0, 19.0, 11.0, 22.0, 28.0, 36.0, 41.0, 50.0, 79.0, 105.0, 172.0, 268.0, 416.0, 663.0, 1235.0, 2625.0, 6999.0, 27291.0, 336434.0, 3752924.0, 47351.0, 10187.0, 3471.0, 1607.0, 814.0, 456.0, 285.0, 209.0, 130.0, 88.0, 60.0, 60.0, 26.0, 18.0, 22.0, 16.0, 13.0, 7.0, 6.0, 8.0, 3.0, 6.0, 1.0, 6.0, 0.0, 1.0, 3.0], "bins": [-3.119140625, -3.032867431640625, -2.94659423828125, -2.860321044921875, -2.7740478515625, -2.687774658203125, -2.60150146484375, -2.515228271484375, -2.428955078125, -2.342681884765625, -2.25640869140625, -2.170135498046875, -2.0838623046875, -1.997589111328125, -1.91131591796875, -1.825042724609375, -1.73876953125, -1.652496337890625, -1.56622314453125, -1.479949951171875, -1.3936767578125, -1.307403564453125, -1.22113037109375, -1.134857177734375, -1.048583984375, -0.962310791015625, -0.87603759765625, -0.789764404296875, -0.7034912109375, -0.617218017578125, -0.53094482421875, -0.444671630859375, -0.3583984375, -0.272125244140625, -0.18585205078125, -0.099578857421875, -0.0133056640625, 0.072967529296875, 0.15924072265625, 0.245513916015625, 0.331787109375, 0.418060302734375, 0.50433349609375, 0.590606689453125, 0.6768798828125, 0.763153076171875, 0.84942626953125, 0.935699462890625, 1.02197265625, 1.108245849609375, 1.19451904296875, 1.280792236328125, 1.3670654296875, 1.453338623046875, 1.53961181640625, 1.625885009765625, 1.712158203125, 1.798431396484375, 1.88470458984375, 1.970977783203125, 2.0572509765625, 2.143524169921875, 2.22979736328125, 2.316070556640625, 2.40234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 18.0, 19.0, 49.0, 83.0, 417.0, 3124.0, 209.0, 58.0, 31.0, 22.0, 15.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.26971435546875, -1.2152099609375, -1.16070556640625, -1.106201171875, -1.05169677734375, -0.9971923828125, -0.94268798828125, -0.88818359375, -0.83367919921875, -0.7791748046875, -0.72467041015625, -0.670166015625, -0.61566162109375, -0.5611572265625, -0.50665283203125, -0.4521484375, -0.39764404296875, -0.3431396484375, -0.28863525390625, -0.234130859375, -0.17962646484375, -0.1251220703125, -0.07061767578125, -0.01611328125, 0.03839111328125, 0.0928955078125, 0.14739990234375, 0.201904296875, 0.25640869140625, 0.3109130859375, 0.36541748046875, 0.419921875, 0.47442626953125, 0.5289306640625, 0.58343505859375, 0.637939453125, 0.69244384765625, 0.7469482421875, 0.80145263671875, 0.85595703125, 0.91046142578125, 0.9649658203125, 1.01947021484375, 1.073974609375, 1.12847900390625, 1.1829833984375, 1.23748779296875, 1.2919921875, 1.34649658203125, 1.4010009765625, 1.45550537109375, 1.510009765625, 1.56451416015625, 1.6190185546875, 1.67352294921875, 1.72802734375, 1.78253173828125, 1.8370361328125, 1.89154052734375, 1.946044921875, 2.00054931640625, 2.0550537109375, 2.10955810546875, 2.1640625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 14.0, 32.0, 64.0, 136.0, 208.0, 234.0, 148.0, 81.0, 39.0, 17.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1591782569885254, -2.898341178894043, -2.6375041007995605, -2.376666784286499, -2.1158297061920166, -1.8549926280975342, -1.5941554307937622, -1.3333182334899902, -1.0724811553955078, -0.8116440176963806, -0.5508068799972534, -0.2899697422981262, -0.029132604598999023, 0.2317044734954834, 0.49254167079925537, 0.7533788681030273, 1.0142159461975098, 1.2750530242919922, 1.5358902215957642, 1.7967274188995361, 2.0575644969940186, 2.318401575088501, 2.5792388916015625, 2.840075969696045, 3.1009130477905273, 3.3617501258850098, 3.622587203979492, 3.8834245204925537, 4.144261360168457, 4.405098915100098, 4.66593599319458, 4.9267730712890625, 5.187610626220703, 5.4484477043151855, 5.709284782409668, 5.97012186050415, 6.230958938598633, 6.491796493530273, 6.752633571624756, 7.013470649719238, 7.274307727813721, 7.535144805908203, 7.7959818840026855, 8.056818962097168, 8.317656517028809, 8.578493118286133, 8.839330673217773, 9.100168228149414, 9.361004829406738, 9.621842384338379, 9.882678985595703, 10.143516540527344, 10.404353141784668, 10.665190696716309, 10.926027297973633, 11.186864852905273, 11.447702407836914, 11.708539962768555, 11.969376564025879, 12.23021411895752, 12.491050720214844, 12.751888275146484, 13.012724876403809, 13.27356243133545, 13.534399032592773]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 6.0, 12.0, 11.0, 14.0, 18.0, 20.0, 35.0, 36.0, 28.0, 41.0, 45.0, 53.0, 64.0, 59.0, 55.0, 67.0, 52.0, 58.0, 57.0, 46.0, 38.0, 35.0, 21.0, 28.0, 21.0, 18.0, 10.0, 10.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.197094440460205, -4.079265117645264, -3.961435317993164, -3.8436059951782227, -3.725776433944702, -3.6079468727111816, -3.490117311477661, -3.3722877502441406, -3.254458427429199, -3.1366288661956787, -3.018799304962158, -2.900969982147217, -2.7831404209136963, -2.665310859680176, -2.5474812984466553, -2.4296517372131348, -2.3118221759796143, -2.1939926147460938, -2.0761630535125732, -1.9583336114883423, -1.8405041694641113, -1.7226746082305908, -1.6048450469970703, -1.4870154857635498, -1.3691860437393188, -1.2513564825057983, -1.1335270404815674, -1.0156974792480469, -0.8978679776191711, -0.7800384759902954, -0.6622089147567749, -0.5443794131278992, -0.42654991149902344, -0.3087204098701477, -0.19089087843894958, -0.07306134700775146, 0.04476815462112427, 0.16259765625, 0.2804272174835205, 0.39825671911239624, 0.516086220741272, 0.6339157223701477, 0.7517452239990234, 0.869574785232544, 0.9874042868614197, 1.1052337884902954, 1.223063349723816, 1.3408927917480469, 1.4587223529815674, 1.576551914215088, 1.6943813562393188, 1.8122109174728394, 1.9300403594970703, 2.047869920730591, 2.1656994819641113, 2.283529043197632, 2.4013586044311523, 2.519188165664673, 2.6370177268981934, 2.7548470497131348, 2.8726766109466553, 2.990506172180176, 3.1083357334136963, 3.226165294647217, 3.343994617462158]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 5.0, 9.0, 18.0, 36.0, 46.0, 62.0, 118.0, 201.0, 419.0, 857.0, 1965.0, 5700.0, 21539.0, 117615.0, 546344.0, 289656.0, 47702.0, 10467.0, 3337.0, 1241.0, 561.0, 265.0, 158.0, 72.0, 45.0, 39.0, 21.0, 16.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.046875, -2.940887451171875, -2.83489990234375, -2.728912353515625, -2.6229248046875, -2.516937255859375, -2.41094970703125, -2.304962158203125, -2.198974609375, -2.092987060546875, -1.98699951171875, -1.881011962890625, -1.7750244140625, -1.669036865234375, -1.56304931640625, -1.457061767578125, -1.35107421875, -1.245086669921875, -1.13909912109375, -1.033111572265625, -0.9271240234375, -0.821136474609375, -0.71514892578125, -0.609161376953125, -0.503173828125, -0.397186279296875, -0.29119873046875, -0.185211181640625, -0.0792236328125, 0.026763916015625, 0.13275146484375, 0.238739013671875, 0.3447265625, 0.450714111328125, 0.55670166015625, 0.662689208984375, 0.7686767578125, 0.874664306640625, 0.98065185546875, 1.086639404296875, 1.192626953125, 1.298614501953125, 1.40460205078125, 1.510589599609375, 1.6165771484375, 1.722564697265625, 1.82855224609375, 1.934539794921875, 2.04052734375, 2.146514892578125, 2.25250244140625, 2.358489990234375, 2.4644775390625, 2.570465087890625, 2.67645263671875, 2.782440185546875, 2.888427734375, 2.994415283203125, 3.10040283203125, 3.206390380859375, 3.3123779296875, 3.418365478515625, 3.52435302734375, 3.630340576171875, 3.736328125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 5.0, 7.0, 3.0, 12.0, 13.0, 24.0, 30.0, 37.0, 28.0, 41.0, 44.0, 42.0, 48.0, 51.0, 51.0, 48.0, 74.0, 54.0, 56.0, 39.0, 33.0, 43.0, 30.0, 35.0, 28.0, 20.0, 9.0, 12.0, 15.0, 10.0, 8.0, 7.0, 11.0, 6.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.92724609375, -0.8998947143554688, -0.8725433349609375, -0.8451919555664062, -0.817840576171875, -0.7904891967773438, -0.7631378173828125, -0.7357864379882812, -0.70843505859375, -0.6810836791992188, -0.6537322998046875, -0.6263809204101562, -0.599029541015625, -0.5716781616210938, -0.5443267822265625, -0.5169754028320312, -0.4896240234375, -0.46227264404296875, -0.4349212646484375, -0.40756988525390625, -0.380218505859375, -0.35286712646484375, -0.3255157470703125, -0.29816436767578125, -0.27081298828125, -0.24346160888671875, -0.2161102294921875, -0.18875885009765625, -0.161407470703125, -0.13405609130859375, -0.1067047119140625, -0.07935333251953125, -0.052001953125, -0.02465057373046875, 0.0027008056640625, 0.03005218505859375, 0.057403564453125, 0.08475494384765625, 0.1121063232421875, 0.13945770263671875, 0.16680908203125, 0.19416046142578125, 0.2215118408203125, 0.24886322021484375, 0.276214599609375, 0.30356597900390625, 0.3309173583984375, 0.35826873779296875, 0.3856201171875, 0.41297149658203125, 0.4403228759765625, 0.46767425537109375, 0.495025634765625, 0.5223770141601562, 0.5497283935546875, 0.5770797729492188, 0.60443115234375, 0.6317825317382812, 0.6591339111328125, 0.6864852905273438, 0.713836669921875, 0.7411880493164062, 0.7685394287109375, 0.7958908081054688, 0.8232421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 4.0, 7.0, 7.0, 10.0, 23.0, 27.0, 30.0, 45.0, 74.0, 91.0, 118.0, 193.0, 305.0, 489.0, 947.0, 2328.0, 8413.0, 90980.0, 856468.0, 75862.0, 7517.0, 2204.0, 987.0, 521.0, 318.0, 167.0, 125.0, 81.0, 52.0, 41.0, 37.0, 23.0, 16.0, 12.0, 7.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.59185791015625, -5.4141845703125, -5.23651123046875, -5.058837890625, -4.88116455078125, -4.7034912109375, -4.52581787109375, -4.34814453125, -4.17047119140625, -3.9927978515625, -3.81512451171875, -3.637451171875, -3.45977783203125, -3.2821044921875, -3.10443115234375, -2.9267578125, -2.74908447265625, -2.5714111328125, -2.39373779296875, -2.216064453125, -2.03839111328125, -1.8607177734375, -1.68304443359375, -1.50537109375, -1.32769775390625, -1.1500244140625, -0.97235107421875, -0.794677734375, -0.61700439453125, -0.4393310546875, -0.26165771484375, -0.083984375, 0.09368896484375, 0.2713623046875, 0.44903564453125, 0.626708984375, 0.80438232421875, 0.9820556640625, 1.15972900390625, 1.33740234375, 1.51507568359375, 1.6927490234375, 1.87042236328125, 2.048095703125, 2.22576904296875, 2.4034423828125, 2.58111572265625, 2.7587890625, 2.93646240234375, 3.1141357421875, 3.29180908203125, 3.469482421875, 3.64715576171875, 3.8248291015625, 4.00250244140625, 4.18017578125, 4.35784912109375, 4.5355224609375, 4.71319580078125, 4.890869140625, 5.06854248046875, 5.2462158203125, 5.42388916015625, 5.6015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 12.0, 8.0, 17.0, 28.0, 29.0, 41.0, 44.0, 60.0, 59.0, 61.0, 73.0, 84.0, 76.0, 77.0, 74.0, 46.0, 42.0, 31.0, 32.0, 29.0, 16.0, 15.0, 9.0, 9.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.109375, -5.93841552734375, -5.7674560546875, -5.59649658203125, -5.425537109375, -5.25457763671875, -5.0836181640625, -4.91265869140625, -4.74169921875, -4.57073974609375, -4.3997802734375, -4.22882080078125, -4.057861328125, -3.88690185546875, -3.7159423828125, -3.54498291015625, -3.3740234375, -3.20306396484375, -3.0321044921875, -2.86114501953125, -2.690185546875, -2.51922607421875, -2.3482666015625, -2.17730712890625, -2.00634765625, -1.83538818359375, -1.6644287109375, -1.49346923828125, -1.322509765625, -1.15155029296875, -0.9805908203125, -0.80963134765625, -0.638671875, -0.46771240234375, -0.2967529296875, -0.12579345703125, 0.045166015625, 0.21612548828125, 0.3870849609375, 0.55804443359375, 0.72900390625, 0.89996337890625, 1.0709228515625, 1.24188232421875, 1.412841796875, 1.58380126953125, 1.7547607421875, 1.92572021484375, 2.0966796875, 2.26763916015625, 2.4385986328125, 2.60955810546875, 2.780517578125, 2.95147705078125, 3.1224365234375, 3.29339599609375, 3.46435546875, 3.63531494140625, 3.8062744140625, 3.97723388671875, 4.148193359375, 4.31915283203125, 4.4901123046875, 4.66107177734375, 4.83203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 12.0, 8.0, 8.0, 18.0, 36.0, 30.0, 42.0, 71.0, 96.0, 120.0, 197.0, 317.0, 611.0, 1416.0, 4467.0, 21928.0, 183337.0, 717859.0, 98693.0, 13602.0, 3213.0, 1140.0, 522.0, 267.0, 170.0, 119.0, 66.0, 61.0, 47.0, 24.0, 30.0, 11.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9580078125, -0.9202423095703125, -0.882476806640625, -0.8447113037109375, -0.80694580078125, -0.7691802978515625, -0.731414794921875, -0.6936492919921875, -0.6558837890625, -0.6181182861328125, -0.580352783203125, -0.5425872802734375, -0.50482177734375, -0.4670562744140625, -0.429290771484375, -0.3915252685546875, -0.353759765625, -0.3159942626953125, -0.278228759765625, -0.2404632568359375, -0.20269775390625, -0.1649322509765625, -0.127166748046875, -0.0894012451171875, -0.0516357421875, -0.0138702392578125, 0.023895263671875, 0.0616607666015625, 0.09942626953125, 0.1371917724609375, 0.174957275390625, 0.2127227783203125, 0.25048828125, 0.2882537841796875, 0.326019287109375, 0.3637847900390625, 0.40155029296875, 0.4393157958984375, 0.477081298828125, 0.5148468017578125, 0.5526123046875, 0.5903778076171875, 0.628143310546875, 0.6659088134765625, 0.70367431640625, 0.7414398193359375, 0.779205322265625, 0.8169708251953125, 0.854736328125, 0.8925018310546875, 0.930267333984375, 0.9680328369140625, 1.00579833984375, 1.0435638427734375, 1.081329345703125, 1.1190948486328125, 1.1568603515625, 1.1946258544921875, 1.232391357421875, 1.2701568603515625, 1.30792236328125, 1.3456878662109375, 1.383453369140625, 1.4212188720703125, 1.458984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 5.0, 12.0, 28.0, 33.0, 37.0, 38.0, 75.0, 115.0, 150.0, 161.0, 104.0, 76.0, 44.0, 34.0, 21.0, 21.0, 13.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003228187561035156, -0.00031472742557525635, -0.00030663609504699707, -0.0002985447645187378, -0.0002904534339904785, -0.00028236210346221924, -0.00027427077293395996, -0.0002661794424057007, -0.0002580881118774414, -0.00024999678134918213, -0.00024190545082092285, -0.00023381412029266357, -0.0002257227897644043, -0.00021763145923614502, -0.00020954012870788574, -0.00020144879817962646, -0.0001933574676513672, -0.0001852661371231079, -0.00017717480659484863, -0.00016908347606658936, -0.00016099214553833008, -0.0001529008150100708, -0.00014480948448181152, -0.00013671815395355225, -0.00012862682342529297, -0.00012053549289703369, -0.00011244416236877441, -0.00010435283184051514, -9.626150131225586e-05, -8.817017078399658e-05, -8.00788402557373e-05, -7.198750972747803e-05, -6.389617919921875e-05, -5.580484867095947e-05, -4.7713518142700195e-05, -3.962218761444092e-05, -3.153085708618164e-05, -2.3439526557922363e-05, -1.5348196029663086e-05, -7.256865501403809e-06, 8.344650268554688e-07, 8.925795555114746e-06, 1.7017126083374023e-05, 2.51084566116333e-05, 3.319978713989258e-05, 4.1291117668151855e-05, 4.938244819641113e-05, 5.747377872467041e-05, 6.556510925292969e-05, 7.365643978118896e-05, 8.174777030944824e-05, 8.983910083770752e-05, 9.79304313659668e-05, 0.00010602176189422607, 0.00011411309242248535, 0.00012220442295074463, 0.0001302957534790039, 0.00013838708400726318, 0.00014647841453552246, 0.00015456974506378174, 0.00016266107559204102, 0.0001707524061203003, 0.00017884373664855957, 0.00018693506717681885, 0.00019502639770507812]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 15.0, 19.0, 22.0, 41.0, 65.0, 75.0, 106.0, 198.0, 324.0, 533.0, 1019.0, 2423.0, 8085.0, 44455.0, 525835.0, 416608.0, 37077.0, 7196.0, 2229.0, 948.0, 495.0, 278.0, 157.0, 111.0, 70.0, 57.0, 23.0, 18.0, 18.0, 13.0, 12.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0693359375, -1.0296630859375, -0.989990234375, -0.9503173828125, -0.91064453125, -0.8709716796875, -0.831298828125, -0.7916259765625, -0.751953125, -0.7122802734375, -0.672607421875, -0.6329345703125, -0.59326171875, -0.5535888671875, -0.513916015625, -0.4742431640625, -0.4345703125, -0.3948974609375, -0.355224609375, -0.3155517578125, -0.27587890625, -0.2362060546875, -0.196533203125, -0.1568603515625, -0.1171875, -0.0775146484375, -0.037841796875, 0.0018310546875, 0.04150390625, 0.0811767578125, 0.120849609375, 0.1605224609375, 0.2001953125, 0.2398681640625, 0.279541015625, 0.3192138671875, 0.35888671875, 0.3985595703125, 0.438232421875, 0.4779052734375, 0.517578125, 0.5572509765625, 0.596923828125, 0.6365966796875, 0.67626953125, 0.7159423828125, 0.755615234375, 0.7952880859375, 0.8349609375, 0.8746337890625, 0.914306640625, 0.9539794921875, 0.99365234375, 1.0333251953125, 1.072998046875, 1.1126708984375, 1.15234375, 1.1920166015625, 1.231689453125, 1.2713623046875, 1.31103515625, 1.3507080078125, 1.390380859375, 1.4300537109375, 1.4697265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 6.0, 15.0, 15.0, 27.0, 32.0, 46.0, 58.0, 59.0, 89.0, 113.0, 101.0, 106.0, 69.0, 67.0, 56.0, 28.0, 20.0, 17.0, 13.0, 7.0, 7.0, 3.0, 7.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1303253173828125, -1.091705322265625, -1.0530853271484375, -1.01446533203125, -0.9758453369140625, -0.937225341796875, -0.8986053466796875, -0.8599853515625, -0.8213653564453125, -0.782745361328125, -0.7441253662109375, -0.70550537109375, -0.6668853759765625, -0.628265380859375, -0.5896453857421875, -0.551025390625, -0.5124053955078125, -0.473785400390625, -0.4351654052734375, -0.39654541015625, -0.3579254150390625, -0.319305419921875, -0.2806854248046875, -0.2420654296875, -0.2034454345703125, -0.164825439453125, -0.1262054443359375, -0.08758544921875, -0.0489654541015625, -0.010345458984375, 0.0282745361328125, 0.06689453125, 0.1055145263671875, 0.144134521484375, 0.1827545166015625, 0.22137451171875, 0.2599945068359375, 0.298614501953125, 0.3372344970703125, 0.3758544921875, 0.4144744873046875, 0.453094482421875, 0.4917144775390625, 0.53033447265625, 0.5689544677734375, 0.607574462890625, 0.6461944580078125, 0.684814453125, 0.7234344482421875, 0.762054443359375, 0.8006744384765625, 0.83929443359375, 0.8779144287109375, 0.916534423828125, 0.9551544189453125, 0.9937744140625, 1.0323944091796875, 1.071014404296875, 1.1096343994140625, 1.14825439453125, 1.1868743896484375, 1.225494384765625, 1.2641143798828125, 1.302734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 16.0, 24.0, 47.0, 86.0, 136.0, 174.0, 176.0, 154.0, 84.0, 46.0, 17.0, 13.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.5147705078125, -33.63487243652344, -32.754974365234375, -31.875076293945312, -30.99517822265625, -30.115280151367188, -29.235383987426758, -28.355485916137695, -27.475587844848633, -26.59568977355957, -25.715791702270508, -24.835893630981445, -23.955997467041016, -23.076099395751953, -22.19620132446289, -21.316303253173828, -20.436405181884766, -19.556507110595703, -18.67660903930664, -17.796710968017578, -16.916812896728516, -16.036914825439453, -15.157018661499023, -14.277120590209961, -13.397222518920898, -12.517324447631836, -11.637426376342773, -10.757529258728027, -9.877631187438965, -8.997733116149902, -8.117835998535156, -7.237937927246094, -6.358037948608398, -5.478139877319336, -4.598242282867432, -3.7183444499969482, -2.838446617126465, -1.9585485458374023, -1.078650951385498, -0.19875335693359375, 0.6811447143554688, 1.5610425472259521, 2.4409403800964355, 3.320838212966919, 4.200736045837402, 5.080634117126465, 5.960531711578369, 6.840429306030273, 7.720327377319336, 8.600225448608398, 9.480123519897461, 10.360020637512207, 11.23991870880127, 12.119816780090332, 12.999713897705078, 13.87961196899414, 14.759510040283203, 15.639408111572266, 16.519306182861328, 17.39920425415039, 18.279102325439453, 19.159000396728516, 20.038896560668945, 20.918794631958008, 21.79869270324707]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 8.0, 16.0, 11.0, 19.0, 9.0, 32.0, 28.0, 32.0, 44.0, 25.0, 54.0, 37.0, 51.0, 46.0, 43.0, 57.0, 56.0, 39.0, 43.0, 34.0, 42.0, 25.0, 38.0, 28.0, 30.0, 22.0, 16.0, 19.0, 15.0, 10.0, 8.0, 9.0, 7.0, 6.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-17.00653839111328, -16.527070999145508, -16.047605514526367, -15.568138122558594, -15.088671684265137, -14.60920524597168, -14.129738807678223, -13.650272369384766, -13.170804977416992, -12.691338539123535, -12.211872100830078, -11.732404708862305, -11.252938270568848, -10.77347183227539, -10.294005393981934, -9.814538955688477, -9.33507251739502, -8.855606079101562, -8.376139640808105, -7.89667272567749, -7.417205810546875, -6.937739372253418, -6.458272933959961, -5.978806495666504, -5.499339580535889, -5.019873142242432, -4.540406227111816, -4.060939788818359, -3.5814731121063232, -3.102006435394287, -2.62253999710083, -2.143073320388794, -1.6636066436767578, -1.1841399669647217, -0.7046734094619751, -0.22520685195922852, 0.2542598247528076, 0.7337265014648438, 1.2131929397583008, 1.692659616470337, 2.172126293182373, 2.651592969894409, 3.1310596466064453, 3.6105260848999023, 4.089992523193359, 4.569459438323975, 5.048925876617432, 5.528392791748047, 6.007859230041504, 6.487325668334961, 6.966792583465576, 7.446259021759033, 7.925725936889648, 8.405192375183105, 8.884658813476562, 9.36412525177002, 9.843591690063477, 10.323058128356934, 10.80252456665039, 11.281991958618164, 11.761458396911621, 12.240924835205078, 12.720391273498535, 13.199857711791992, 13.679325103759766]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 6.0, 3.0, 6.0, 9.0, 11.0, 16.0, 16.0, 30.0, 32.0, 54.0, 86.0, 104.0, 153.0, 244.0, 331.0, 596.0, 1001.0, 1813.0, 3490.0, 7249.0, 16282.0, 45543.0, 235943.0, 3310723.0, 468714.0, 62339.0, 20470.0, 8891.0, 4293.0, 2345.0, 1376.0, 784.0, 456.0, 291.0, 199.0, 124.0, 75.0, 55.0, 43.0, 45.0, 17.0, 5.0, 6.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.415130615234375, -1.36737060546875, -1.319610595703125, -1.2718505859375, -1.224090576171875, -1.17633056640625, -1.128570556640625, -1.080810546875, -1.033050537109375, -0.98529052734375, -0.937530517578125, -0.8897705078125, -0.842010498046875, -0.79425048828125, -0.746490478515625, -0.69873046875, -0.650970458984375, -0.60321044921875, -0.555450439453125, -0.5076904296875, -0.459930419921875, -0.41217041015625, -0.364410400390625, -0.316650390625, -0.268890380859375, -0.22113037109375, -0.173370361328125, -0.1256103515625, -0.077850341796875, -0.03009033203125, 0.017669677734375, 0.0654296875, 0.113189697265625, 0.16094970703125, 0.208709716796875, 0.2564697265625, 0.304229736328125, 0.35198974609375, 0.399749755859375, 0.447509765625, 0.495269775390625, 0.54302978515625, 0.590789794921875, 0.6385498046875, 0.686309814453125, 0.73406982421875, 0.781829833984375, 0.82958984375, 0.877349853515625, 0.92510986328125, 0.972869873046875, 1.0206298828125, 1.068389892578125, 1.11614990234375, 1.163909912109375, 1.211669921875, 1.259429931640625, 1.30718994140625, 1.354949951171875, 1.4027099609375, 1.450469970703125, 1.49822998046875, 1.545989990234375, 1.59375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 3.0, 10.0, 12.0, 18.0, 25.0, 22.0, 33.0, 42.0, 53.0, 52.0, 72.0, 83.0, 76.0, 81.0, 76.0, 59.0, 38.0, 44.0, 31.0, 36.0, 33.0, 18.0, 19.0, 20.0, 11.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.1289825439453125, -1.094879150390625, -1.0607757568359375, -1.02667236328125, -0.9925689697265625, -0.958465576171875, -0.9243621826171875, -0.8902587890625, -0.8561553955078125, -0.822052001953125, -0.7879486083984375, -0.75384521484375, -0.7197418212890625, -0.685638427734375, -0.6515350341796875, -0.617431640625, -0.5833282470703125, -0.549224853515625, -0.5151214599609375, -0.48101806640625, -0.4469146728515625, -0.412811279296875, -0.3787078857421875, -0.3446044921875, -0.3105010986328125, -0.276397705078125, -0.2422943115234375, -0.20819091796875, -0.1740875244140625, -0.139984130859375, -0.1058807373046875, -0.07177734375, -0.0376739501953125, -0.003570556640625, 0.0305328369140625, 0.06463623046875, 0.0987396240234375, 0.132843017578125, 0.1669464111328125, 0.2010498046875, 0.2351531982421875, 0.269256591796875, 0.3033599853515625, 0.33746337890625, 0.3715667724609375, 0.405670166015625, 0.4397735595703125, 0.473876953125, 0.5079803466796875, 0.542083740234375, 0.5761871337890625, 0.61029052734375, 0.6443939208984375, 0.678497314453125, 0.7126007080078125, 0.7467041015625, 0.7808074951171875, 0.814910888671875, 0.8490142822265625, 0.88311767578125, 0.9172210693359375, 0.951324462890625, 0.9854278564453125, 1.01953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 10.0, 12.0, 16.0, 31.0, 30.0, 63.0, 88.0, 165.0, 444.0, 1306.0, 5923.0, 43659.0, 3505316.0, 606915.0, 24805.0, 3875.0, 911.0, 350.0, 157.0, 75.0, 43.0, 25.0, 18.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.15234375, -4.03326416015625, -3.9141845703125, -3.79510498046875, -3.676025390625, -3.55694580078125, -3.4378662109375, -3.31878662109375, -3.19970703125, -3.08062744140625, -2.9615478515625, -2.84246826171875, -2.723388671875, -2.60430908203125, -2.4852294921875, -2.36614990234375, -2.2470703125, -2.12799072265625, -2.0089111328125, -1.88983154296875, -1.770751953125, -1.65167236328125, -1.5325927734375, -1.41351318359375, -1.29443359375, -1.17535400390625, -1.0562744140625, -0.93719482421875, -0.818115234375, -0.69903564453125, -0.5799560546875, -0.46087646484375, -0.341796875, -0.22271728515625, -0.1036376953125, 0.01544189453125, 0.134521484375, 0.25360107421875, 0.3726806640625, 0.49176025390625, 0.61083984375, 0.72991943359375, 0.8489990234375, 0.96807861328125, 1.087158203125, 1.20623779296875, 1.3253173828125, 1.44439697265625, 1.5634765625, 1.68255615234375, 1.8016357421875, 1.92071533203125, 2.039794921875, 2.15887451171875, 2.2779541015625, 2.39703369140625, 2.51611328125, 2.63519287109375, 2.7542724609375, 2.87335205078125, 2.992431640625, 3.11151123046875, 3.2305908203125, 3.34967041015625, 3.46875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 6.0, 5.0, 6.0, 15.0, 16.0, 21.0, 30.0, 58.0, 112.0, 299.0, 1048.0, 1620.0, 470.0, 145.0, 86.0, 42.0, 31.0, 18.0, 11.0, 11.0, 15.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.296875, -4.2018585205078125, -4.106842041015625, -4.0118255615234375, -3.91680908203125, -3.8217926025390625, -3.726776123046875, -3.6317596435546875, -3.5367431640625, -3.4417266845703125, -3.346710205078125, -3.2516937255859375, -3.15667724609375, -3.0616607666015625, -2.966644287109375, -2.8716278076171875, -2.776611328125, -2.6815948486328125, -2.586578369140625, -2.4915618896484375, -2.39654541015625, -2.3015289306640625, -2.206512451171875, -2.1114959716796875, -2.0164794921875, -1.9214630126953125, -1.826446533203125, -1.7314300537109375, -1.63641357421875, -1.5413970947265625, -1.446380615234375, -1.3513641357421875, -1.25634765625, -1.1613311767578125, -1.066314697265625, -0.9712982177734375, -0.87628173828125, -0.7812652587890625, -0.686248779296875, -0.5912322998046875, -0.4962158203125, -0.4011993408203125, -0.306182861328125, -0.2111663818359375, -0.11614990234375, -0.0211334228515625, 0.073883056640625, 0.1688995361328125, 0.263916015625, 0.3589324951171875, 0.453948974609375, 0.5489654541015625, 0.64398193359375, 0.7389984130859375, 0.834014892578125, 0.9290313720703125, 1.0240478515625, 1.1190643310546875, 1.214080810546875, 1.3090972900390625, 1.40411376953125, 1.4991302490234375, 1.594146728515625, 1.6891632080078125, 1.7841796875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 20.0, 22.0, 86.0, 161.0, 165.0, 178.0, 142.0, 86.0, 52.0, 26.0, 15.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.77971076965332, -13.158794403076172, -12.537877082824707, -11.916959762573242, -11.296043395996094, -10.675127029418945, -10.05420970916748, -9.433292388916016, -8.812376022338867, -8.191459655761719, -7.570542335510254, -6.949625492095947, -6.328708648681641, -5.707791805267334, -5.086874961853027, -4.465958118438721, -3.845041275024414, -3.2241244316101074, -2.603207588195801, -1.9822907447814941, -1.3613739013671875, -0.7404570579528809, -0.11954021453857422, 0.5013766288757324, 1.122293472290039, 1.7432103157043457, 2.3641271591186523, 2.985044002532959, 3.6059608459472656, 4.226877689361572, 4.847794532775879, 5.4687113761901855, 6.089630126953125, 6.710546970367432, 7.331463813781738, 7.952380657196045, 8.573297500610352, 9.1942138671875, 9.815131187438965, 10.43604850769043, 11.056964874267578, 11.677881240844727, 12.298798561096191, 12.919715881347656, 13.540632247924805, 14.161548614501953, 14.782465934753418, 15.403383255004883, 16.02429962158203, 16.64521598815918, 17.266132354736328, 17.88705062866211, 18.507966995239258, 19.128883361816406, 19.749801635742188, 20.370718002319336, 20.991634368896484, 21.612550735473633, 22.23346710205078, 22.854385375976562, 23.47530174255371, 24.09621810913086, 24.71713638305664, 25.33805274963379, 25.958969116210938]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 7.0, 14.0, 6.0, 8.0, 16.0, 15.0, 23.0, 23.0, 26.0, 32.0, 36.0, 34.0, 32.0, 34.0, 47.0, 43.0, 38.0, 38.0, 41.0, 44.0, 55.0, 48.0, 34.0, 39.0, 29.0, 30.0, 35.0, 37.0, 24.0, 23.0, 21.0, 18.0, 11.0, 6.0, 11.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.446706295013428, -7.216037750244141, -6.985368728637695, -6.754700183868408, -6.524031639099121, -6.293362617492676, -6.062694072723389, -5.832025527954102, -5.601356506347656, -5.370687961578369, -5.140018939971924, -4.909350395202637, -4.678681373596191, -4.448012828826904, -4.217344284057617, -3.986675500869751, -3.7560067176818848, -3.5253379344940186, -3.2946691513061523, -3.0640006065368652, -2.833331823348999, -2.602663040161133, -2.3719944953918457, -2.1413257122039795, -1.9106569290161133, -1.679988145828247, -1.4493194818496704, -1.2186508178710938, -0.9879820346832275, -0.7573132514953613, -0.5266445875167847, -0.295975923538208, -0.0653076171875, 0.16536110639572144, 0.39602982997894287, 0.6266985535621643, 0.8573672771453857, 1.088036060333252, 1.3187047243118286, 1.5493733882904053, 1.7800421714782715, 2.0107109546661377, 2.241379737854004, 2.472048282623291, 2.7027170658111572, 2.9333858489990234, 3.1640543937683105, 3.3947231769561768, 3.625391960144043, 3.856060743331909, 4.086729526519775, 4.3173980712890625, 4.548067092895508, 4.778735637664795, 5.009404182434082, 5.240073204040527, 5.4707417488098145, 5.701410293579102, 5.932079315185547, 6.162747859954834, 6.393416404724121, 6.624085426330566, 6.8547539710998535, 7.085422515869141, 7.316091537475586]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 10.0, 7.0, 20.0, 33.0, 25.0, 38.0, 73.0, 129.0, 206.0, 397.0, 738.0, 1296.0, 2970.0, 7433.0, 20242.0, 61442.0, 215915.0, 482460.0, 175197.0, 51256.0, 17022.0, 6286.0, 2611.0, 1301.0, 620.0, 317.0, 190.0, 94.0, 74.0, 46.0, 33.0, 23.0, 11.0, 9.0, 6.0, 4.0, 6.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.2578125, -2.18817138671875, -2.1185302734375, -2.04888916015625, -1.979248046875, -1.90960693359375, -1.8399658203125, -1.77032470703125, -1.70068359375, -1.63104248046875, -1.5614013671875, -1.49176025390625, -1.422119140625, -1.35247802734375, -1.2828369140625, -1.21319580078125, -1.1435546875, -1.07391357421875, -1.0042724609375, -0.93463134765625, -0.864990234375, -0.79534912109375, -0.7257080078125, -0.65606689453125, -0.58642578125, -0.51678466796875, -0.4471435546875, -0.37750244140625, -0.307861328125, -0.23822021484375, -0.1685791015625, -0.09893798828125, -0.029296875, 0.04034423828125, 0.1099853515625, 0.17962646484375, 0.249267578125, 0.31890869140625, 0.3885498046875, 0.45819091796875, 0.52783203125, 0.59747314453125, 0.6671142578125, 0.73675537109375, 0.806396484375, 0.87603759765625, 0.9456787109375, 1.01531982421875, 1.0849609375, 1.15460205078125, 1.2242431640625, 1.29388427734375, 1.363525390625, 1.43316650390625, 1.5028076171875, 1.57244873046875, 1.64208984375, 1.71173095703125, 1.7813720703125, 1.85101318359375, 1.920654296875, 1.99029541015625, 2.0599365234375, 2.12957763671875, 2.19921875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 5.0, 5.0, 21.0, 15.0, 20.0, 36.0, 56.0, 46.0, 61.0, 66.0, 75.0, 69.0, 78.0, 69.0, 63.0, 44.0, 58.0, 27.0, 34.0, 21.0, 28.0, 19.0, 14.0, 13.0, 3.0, 13.0, 9.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.1727523803710938, -1.1404266357421875, -1.1081008911132812, -1.075775146484375, -1.0434494018554688, -1.0111236572265625, -0.9787979125976562, -0.94647216796875, -0.9141464233398438, -0.8818206787109375, -0.8494949340820312, -0.817169189453125, -0.7848434448242188, -0.7525177001953125, -0.7201919555664062, -0.6878662109375, -0.6555404663085938, -0.6232147216796875, -0.5908889770507812, -0.558563232421875, -0.5262374877929688, -0.4939117431640625, -0.46158599853515625, -0.42926025390625, -0.39693450927734375, -0.3646087646484375, -0.33228302001953125, -0.299957275390625, -0.26763153076171875, -0.2353057861328125, -0.20298004150390625, -0.170654296875, -0.13832855224609375, -0.1060028076171875, -0.07367706298828125, -0.041351318359375, -0.00902557373046875, 0.0233001708984375, 0.05562591552734375, 0.08795166015625, 0.12027740478515625, 0.1526031494140625, 0.18492889404296875, 0.217254638671875, 0.24958038330078125, 0.2819061279296875, 0.31423187255859375, 0.3465576171875, 0.37888336181640625, 0.4112091064453125, 0.44353485107421875, 0.475860595703125, 0.5081863403320312, 0.5405120849609375, 0.5728378295898438, 0.60516357421875, 0.6374893188476562, 0.6698150634765625, 0.7021408081054688, 0.734466552734375, 0.7667922973632812, 0.7991180419921875, 0.8314437866210938, 0.86376953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 12.0, 20.0, 26.0, 30.0, 38.0, 56.0, 76.0, 90.0, 124.0, 192.0, 350.0, 566.0, 1187.0, 3115.0, 11280.0, 116772.0, 845896.0, 56048.0, 7760.0, 2451.0, 1008.0, 528.0, 295.0, 169.0, 146.0, 71.0, 54.0, 44.0, 35.0, 15.0, 20.0, 15.0, 6.0, 10.0, 4.0, 7.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.04296875, -4.876953125, -4.7109375, -4.544921875, -4.37890625, -4.212890625, -4.046875, -3.880859375, -3.71484375, -3.548828125, -3.3828125, -3.216796875, -3.05078125, -2.884765625, -2.71875, -2.552734375, -2.38671875, -2.220703125, -2.0546875, -1.888671875, -1.72265625, -1.556640625, -1.390625, -1.224609375, -1.05859375, -0.892578125, -0.7265625, -0.560546875, -0.39453125, -0.228515625, -0.0625, 0.103515625, 0.26953125, 0.435546875, 0.6015625, 0.767578125, 0.93359375, 1.099609375, 1.265625, 1.431640625, 1.59765625, 1.763671875, 1.9296875, 2.095703125, 2.26171875, 2.427734375, 2.59375, 2.759765625, 2.92578125, 3.091796875, 3.2578125, 3.423828125, 3.58984375, 3.755859375, 3.921875, 4.087890625, 4.25390625, 4.419921875, 4.5859375, 4.751953125, 4.91796875, 5.083984375, 5.25, 5.416015625, 5.58203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 10.0, 9.0, 11.0, 15.0, 17.0, 22.0, 33.0, 43.0, 40.0, 52.0, 55.0, 72.0, 72.0, 75.0, 80.0, 79.0, 50.0, 60.0, 48.0, 29.0, 31.0, 18.0, 17.0, 13.0, 9.0, 3.0, 5.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.78717041015625, -4.6251220703125, -4.46307373046875, -4.301025390625, -4.13897705078125, -3.9769287109375, -3.81488037109375, -3.65283203125, -3.49078369140625, -3.3287353515625, -3.16668701171875, -3.004638671875, -2.84259033203125, -2.6805419921875, -2.51849365234375, -2.3564453125, -2.19439697265625, -2.0323486328125, -1.87030029296875, -1.708251953125, -1.54620361328125, -1.3841552734375, -1.22210693359375, -1.06005859375, -0.89801025390625, -0.7359619140625, -0.57391357421875, -0.411865234375, -0.24981689453125, -0.0877685546875, 0.07427978515625, 0.236328125, 0.39837646484375, 0.5604248046875, 0.72247314453125, 0.884521484375, 1.04656982421875, 1.2086181640625, 1.37066650390625, 1.53271484375, 1.69476318359375, 1.8568115234375, 2.01885986328125, 2.180908203125, 2.34295654296875, 2.5050048828125, 2.66705322265625, 2.8291015625, 2.99114990234375, 3.1531982421875, 3.31524658203125, 3.477294921875, 3.63934326171875, 3.8013916015625, 3.96343994140625, 4.12548828125, 4.28753662109375, 4.4495849609375, 4.61163330078125, 4.773681640625, 4.93572998046875, 5.0977783203125, 5.25982666015625, 5.421875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 12.0, 26.0, 20.0, 28.0, 35.0, 61.0, 84.0, 159.0, 290.0, 749.0, 2303.0, 12662.0, 347521.0, 663224.0, 16948.0, 2700.0, 848.0, 350.0, 171.0, 92.0, 76.0, 48.0, 29.0, 27.0, 21.0, 9.0, 8.0, 10.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.64453125, -2.571197509765625, -2.49786376953125, -2.424530029296875, -2.3511962890625, -2.277862548828125, -2.20452880859375, -2.131195068359375, -2.057861328125, -1.984527587890625, -1.91119384765625, -1.837860107421875, -1.7645263671875, -1.691192626953125, -1.61785888671875, -1.544525146484375, -1.47119140625, -1.397857666015625, -1.32452392578125, -1.251190185546875, -1.1778564453125, -1.104522705078125, -1.03118896484375, -0.957855224609375, -0.884521484375, -0.811187744140625, -0.73785400390625, -0.664520263671875, -0.5911865234375, -0.517852783203125, -0.44451904296875, -0.371185302734375, -0.2978515625, -0.224517822265625, -0.15118408203125, -0.077850341796875, -0.0045166015625, 0.068817138671875, 0.14215087890625, 0.215484619140625, 0.288818359375, 0.362152099609375, 0.43548583984375, 0.508819580078125, 0.5821533203125, 0.655487060546875, 0.72882080078125, 0.802154541015625, 0.87548828125, 0.948822021484375, 1.02215576171875, 1.095489501953125, 1.1688232421875, 1.242156982421875, 1.31549072265625, 1.388824462890625, 1.462158203125, 1.535491943359375, 1.60882568359375, 1.682159423828125, 1.7554931640625, 1.828826904296875, 1.90216064453125, 1.975494384765625, 2.048828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 11.0, 17.0, 27.0, 32.0, 51.0, 75.0, 114.0, 170.0, 180.0, 95.0, 62.0, 36.0, 35.0, 22.0, 15.0, 18.0, 16.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003750324249267578, -0.0003658607602119446, -0.00035668909549713135, -0.0003475174307823181, -0.0003383457660675049, -0.00032917410135269165, -0.0003200024366378784, -0.0003108307719230652, -0.00030165910720825195, -0.0002924874424934387, -0.0002833157777786255, -0.00027414411306381226, -0.000264972448348999, -0.0002558007836341858, -0.00024662911891937256, -0.00023745745420455933, -0.0002282857894897461, -0.00021911412477493286, -0.00020994246006011963, -0.0002007707953453064, -0.00019159913063049316, -0.00018242746591567993, -0.0001732558012008667, -0.00016408413648605347, -0.00015491247177124023, -0.000145740807056427, -0.00013656914234161377, -0.00012739747762680054, -0.0001182258129119873, -0.00010905414819717407, -9.988248348236084e-05, -9.071081876754761e-05, -8.153915405273438e-05, -7.236748933792114e-05, -6.319582462310791e-05, -5.402415990829468e-05, -4.4852495193481445e-05, -3.568083047866821e-05, -2.650916576385498e-05, -1.7337501049041748e-05, -8.165836334228516e-06, 1.0058283805847168e-06, 1.017749309539795e-05, 1.934915781021118e-05, 2.8520822525024414e-05, 3.7692487239837646e-05, 4.686415195465088e-05, 5.603581666946411e-05, 6.520748138427734e-05, 7.437914609909058e-05, 8.355081081390381e-05, 9.272247552871704e-05, 0.00010189414024353027, 0.0001110658049583435, 0.00012023746967315674, 0.00012940913438796997, 0.0001385807991027832, 0.00014775246381759644, 0.00015692412853240967, 0.0001660957932472229, 0.00017526745796203613, 0.00018443912267684937, 0.0001936107873916626, 0.00020278245210647583, 0.00021195411682128906]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 12.0, 10.0, 21.0, 26.0, 33.0, 29.0, 42.0, 91.0, 138.0, 196.0, 347.0, 679.0, 1461.0, 4322.0, 20215.0, 296792.0, 679992.0, 34251.0, 6027.0, 1996.0, 849.0, 385.0, 239.0, 127.0, 76.0, 69.0, 34.0, 22.0, 21.0, 14.0, 9.0, 4.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.7691497802734375, -1.714080810546875, -1.6590118408203125, -1.60394287109375, -1.5488739013671875, -1.493804931640625, -1.4387359619140625, -1.3836669921875, -1.3285980224609375, -1.273529052734375, -1.2184600830078125, -1.16339111328125, -1.1083221435546875, -1.053253173828125, -0.9981842041015625, -0.943115234375, -0.8880462646484375, -0.832977294921875, -0.7779083251953125, -0.72283935546875, -0.6677703857421875, -0.612701416015625, -0.5576324462890625, -0.5025634765625, -0.4474945068359375, -0.392425537109375, -0.3373565673828125, -0.28228759765625, -0.2272186279296875, -0.172149658203125, -0.1170806884765625, -0.06201171875, -0.0069427490234375, 0.048126220703125, 0.1031951904296875, 0.15826416015625, 0.2133331298828125, 0.268402099609375, 0.3234710693359375, 0.3785400390625, 0.4336090087890625, 0.488677978515625, 0.5437469482421875, 0.59881591796875, 0.6538848876953125, 0.708953857421875, 0.7640228271484375, 0.819091796875, 0.8741607666015625, 0.929229736328125, 0.9842987060546875, 1.03936767578125, 1.0944366455078125, 1.149505615234375, 1.2045745849609375, 1.2596435546875, 1.3147125244140625, 1.369781494140625, 1.4248504638671875, 1.47991943359375, 1.5349884033203125, 1.590057373046875, 1.6451263427734375, 1.7001953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 8.0, 8.0, 26.0, 16.0, 28.0, 28.0, 33.0, 55.0, 74.0, 82.0, 80.0, 101.0, 108.0, 74.0, 52.0, 41.0, 44.0, 27.0, 16.0, 25.0, 13.0, 7.0, 8.0, 8.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.328125, -1.2902984619140625, -1.252471923828125, -1.2146453857421875, -1.17681884765625, -1.1389923095703125, -1.101165771484375, -1.0633392333984375, -1.0255126953125, -0.9876861572265625, -0.949859619140625, -0.9120330810546875, -0.87420654296875, -0.8363800048828125, -0.798553466796875, -0.7607269287109375, -0.722900390625, -0.6850738525390625, -0.647247314453125, -0.6094207763671875, -0.57159423828125, -0.5337677001953125, -0.495941162109375, -0.4581146240234375, -0.4202880859375, -0.3824615478515625, -0.344635009765625, -0.3068084716796875, -0.26898193359375, -0.2311553955078125, -0.193328857421875, -0.1555023193359375, -0.11767578125, -0.0798492431640625, -0.042022705078125, -0.0041961669921875, 0.03363037109375, 0.0714569091796875, 0.109283447265625, 0.1471099853515625, 0.1849365234375, 0.2227630615234375, 0.260589599609375, 0.2984161376953125, 0.33624267578125, 0.3740692138671875, 0.411895751953125, 0.4497222900390625, 0.487548828125, 0.5253753662109375, 0.563201904296875, 0.6010284423828125, 0.63885498046875, 0.6766815185546875, 0.714508056640625, 0.7523345947265625, 0.7901611328125, 0.8279876708984375, 0.865814208984375, 0.9036407470703125, 0.94146728515625, 0.9792938232421875, 1.017120361328125, 1.0549468994140625, 1.0927734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 10.0, 23.0, 41.0, 118.0, 207.0, 258.0, 213.0, 65.0, 28.0, 16.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.58578872680664, -46.51209259033203, -45.43840026855469, -44.36470413208008, -43.29100799560547, -42.217315673828125, -41.143619537353516, -40.069923400878906, -38.99623107910156, -37.92253494262695, -36.84884262084961, -35.775146484375, -34.70145034790039, -33.62775421142578, -32.55406188964844, -31.480365753173828, -30.40666961669922, -29.332975387573242, -28.259279251098633, -27.185585021972656, -26.111888885498047, -25.03819465637207, -23.964500427246094, -22.890804290771484, -21.817110061645508, -20.74341583251953, -19.669719696044922, -18.596025466918945, -17.52233123779297, -16.44863510131836, -15.374940872192383, -14.30124568939209, -13.227546691894531, -12.153851509094238, -11.080156326293945, -10.006462097167969, -8.932766914367676, -7.859071731567383, -6.785377025604248, -5.711682319641113, -4.63798713684082, -3.5642921924591064, -2.4905972480773926, -1.4169023036956787, -0.34320735931396484, 0.7304878234863281, 1.804182529449463, 2.8778772354125977, 3.9515724182128906, 5.025267601013184, 6.098962306976318, 7.172657012939453, 8.246352195739746, 9.320047378540039, 10.393741607666016, 11.467436790466309, 12.541131973266602, 13.614827156066895, 14.688522338867188, 15.762216567993164, 16.83591079711914, 17.90960693359375, 18.983301162719727, 20.056995391845703, 21.130691528320312]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 2.0, 8.0, 7.0, 5.0, 11.0, 8.0, 9.0, 13.0, 12.0, 21.0, 19.0, 19.0, 19.0, 24.0, 36.0, 43.0, 41.0, 46.0, 56.0, 55.0, 58.0, 55.0, 44.0, 53.0, 43.0, 43.0, 26.0, 26.0, 25.0, 34.0, 26.0, 26.0, 23.0, 6.0, 9.0, 4.0, 6.0, 13.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-12.86214828491211, -12.477662086486816, -12.093174934387207, -11.708688735961914, -11.324201583862305, -10.939715385437012, -10.555229187011719, -10.17074203491211, -9.7862548828125, -9.401768684387207, -9.017281532287598, -8.632795333862305, -8.248308181762695, -7.863821983337402, -7.479335308074951, -7.0948486328125, -6.710362434387207, -6.325875759124756, -5.941389083862305, -5.556902885437012, -5.172415733337402, -4.787929534912109, -4.403442859649658, -4.018956184387207, -3.634469509124756, -3.2499828338623047, -2.8654961585998535, -2.4810097217559814, -2.0965230464935303, -1.712036371231079, -1.327549934387207, -0.9430632591247559, -0.5585775375366211, -0.1740909218788147, 0.2103956937789917, 0.5948822498321533, 0.9793689250946045, 1.3638556003570557, 1.7483420372009277, 2.132828712463379, 2.51731538772583, 2.9018020629882812, 3.2862887382507324, 3.6707751750946045, 4.055261611938477, 4.439748764038086, 4.824234962463379, 5.20872163772583, 5.593208312988281, 5.977694988250732, 6.362181663513184, 6.746667861938477, 7.131155014038086, 7.515641212463379, 7.90012788772583, 8.284614562988281, 8.66910171508789, 9.053587913513184, 9.438075065612793, 9.822561264038086, 10.207048416137695, 10.591534614562988, 10.976020812988281, 11.36050796508789, 11.744994163513184]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 7.0, 7.0, 14.0, 16.0, 28.0, 36.0, 46.0, 55.0, 87.0, 163.0, 220.0, 381.0, 782.0, 1599.0, 3453.0, 8557.0, 27591.0, 179509.0, 3462499.0, 445291.0, 42894.0, 11866.0, 4681.0, 2134.0, 1068.0, 550.0, 289.0, 177.0, 101.0, 62.0, 35.0, 21.0, 18.0, 12.0, 9.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.076171875, -2.0162506103515625, -1.956329345703125, -1.8964080810546875, -1.83648681640625, -1.7765655517578125, -1.716644287109375, -1.6567230224609375, -1.5968017578125, -1.5368804931640625, -1.476959228515625, -1.4170379638671875, -1.35711669921875, -1.2971954345703125, -1.237274169921875, -1.1773529052734375, -1.117431640625, -1.0575103759765625, -0.997589111328125, -0.9376678466796875, -0.87774658203125, -0.8178253173828125, -0.757904052734375, -0.6979827880859375, -0.6380615234375, -0.5781402587890625, -0.518218994140625, -0.4582977294921875, -0.39837646484375, -0.3384552001953125, -0.278533935546875, -0.2186126708984375, -0.15869140625, -0.0987701416015625, -0.038848876953125, 0.0210723876953125, 0.08099365234375, 0.1409149169921875, 0.200836181640625, 0.2607574462890625, 0.3206787109375, 0.3805999755859375, 0.440521240234375, 0.5004425048828125, 0.56036376953125, 0.6202850341796875, 0.680206298828125, 0.7401275634765625, 0.800048828125, 0.8599700927734375, 0.919891357421875, 0.9798126220703125, 1.03973388671875, 1.0996551513671875, 1.159576416015625, 1.2194976806640625, 1.2794189453125, 1.3393402099609375, 1.399261474609375, 1.4591827392578125, 1.51910400390625, 1.5790252685546875, 1.638946533203125, 1.6988677978515625, 1.7587890625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 7.0, 15.0, 15.0, 15.0, 25.0, 21.0, 35.0, 33.0, 50.0, 58.0, 62.0, 52.0, 49.0, 65.0, 62.0, 45.0, 61.0, 51.0, 41.0, 51.0, 32.0, 28.0, 18.0, 21.0, 16.0, 18.0, 9.0, 8.0, 7.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-1.107421875, -1.0788955688476562, -1.0503692626953125, -1.0218429565429688, -0.993316650390625, -0.9647903442382812, -0.9362640380859375, -0.9077377319335938, -0.87921142578125, -0.8506851196289062, -0.8221588134765625, -0.7936325073242188, -0.765106201171875, -0.7365798950195312, -0.7080535888671875, -0.6795272827148438, -0.6510009765625, -0.6224746704101562, -0.5939483642578125, -0.5654220581054688, -0.536895751953125, -0.5083694458007812, -0.4798431396484375, -0.45131683349609375, -0.42279052734375, -0.39426422119140625, -0.3657379150390625, -0.33721160888671875, -0.308685302734375, -0.28015899658203125, -0.2516326904296875, -0.22310638427734375, -0.194580078125, -0.16605377197265625, -0.1375274658203125, -0.10900115966796875, -0.080474853515625, -0.05194854736328125, -0.0234222412109375, 0.00510406494140625, 0.03363037109375, 0.06215667724609375, 0.0906829833984375, 0.11920928955078125, 0.147735595703125, 0.17626190185546875, 0.2047882080078125, 0.23331451416015625, 0.2618408203125, 0.29036712646484375, 0.3188934326171875, 0.34741973876953125, 0.375946044921875, 0.40447235107421875, 0.4329986572265625, 0.46152496337890625, 0.49005126953125, 0.5185775756835938, 0.5471038818359375, 0.5756301879882812, 0.604156494140625, 0.6326828002929688, 0.6612091064453125, 0.6897354125976562, 0.71826171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 10.0, 22.0, 50.0, 69.0, 172.0, 254.0, 489.0, 1170.0, 3757.0, 16002.0, 142813.0, 3830704.0, 176338.0, 16954.0, 3523.0, 1105.0, 451.0, 204.0, 100.0, 40.0, 25.0, 12.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.132232666015625, -3.03594970703125, -2.939666748046875, -2.8433837890625, -2.747100830078125, -2.65081787109375, -2.554534912109375, -2.458251953125, -2.361968994140625, -2.26568603515625, -2.169403076171875, -2.0731201171875, -1.976837158203125, -1.88055419921875, -1.784271240234375, -1.68798828125, -1.591705322265625, -1.49542236328125, -1.399139404296875, -1.3028564453125, -1.206573486328125, -1.11029052734375, -1.014007568359375, -0.917724609375, -0.821441650390625, -0.72515869140625, -0.628875732421875, -0.5325927734375, -0.436309814453125, -0.34002685546875, -0.243743896484375, -0.1474609375, -0.051177978515625, 0.04510498046875, 0.141387939453125, 0.2376708984375, 0.333953857421875, 0.43023681640625, 0.526519775390625, 0.622802734375, 0.719085693359375, 0.81536865234375, 0.911651611328125, 1.0079345703125, 1.104217529296875, 1.20050048828125, 1.296783447265625, 1.39306640625, 1.489349365234375, 1.58563232421875, 1.681915283203125, 1.7781982421875, 1.874481201171875, 1.97076416015625, 2.067047119140625, 2.163330078125, 2.259613037109375, 2.35589599609375, 2.452178955078125, 2.5484619140625, 2.644744873046875, 2.74102783203125, 2.837310791015625, 2.93359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 7.0, 10.0, 14.0, 11.0, 30.0, 54.0, 81.0, 172.0, 468.0, 1135.0, 1205.0, 480.0, 209.0, 75.0, 57.0, 19.0, 16.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.171875, -3.090606689453125, -3.00933837890625, -2.928070068359375, -2.8468017578125, -2.765533447265625, -2.68426513671875, -2.602996826171875, -2.521728515625, -2.440460205078125, -2.35919189453125, -2.277923583984375, -2.1966552734375, -2.115386962890625, -2.03411865234375, -1.952850341796875, -1.87158203125, -1.790313720703125, -1.70904541015625, -1.627777099609375, -1.5465087890625, -1.465240478515625, -1.38397216796875, -1.302703857421875, -1.221435546875, -1.140167236328125, -1.05889892578125, -0.977630615234375, -0.8963623046875, -0.815093994140625, -0.73382568359375, -0.652557373046875, -0.5712890625, -0.490020751953125, -0.40875244140625, -0.327484130859375, -0.2462158203125, -0.164947509765625, -0.08367919921875, -0.002410888671875, 0.078857421875, 0.160125732421875, 0.24139404296875, 0.322662353515625, 0.4039306640625, 0.485198974609375, 0.56646728515625, 0.647735595703125, 0.72900390625, 0.810272216796875, 0.89154052734375, 0.972808837890625, 1.0540771484375, 1.135345458984375, 1.21661376953125, 1.297882080078125, 1.379150390625, 1.460418701171875, 1.54168701171875, 1.622955322265625, 1.7042236328125, 1.785491943359375, 1.86676025390625, 1.948028564453125, 2.029296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 15.0, 58.0, 253.0, 387.0, 203.0, 47.0, 16.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.369407653808594, -18.183977127075195, -16.99854850769043, -15.813117980957031, -14.627687454223633, -13.44225788116455, -12.256828308105469, -11.07139778137207, -9.885968208312988, -8.700538635253906, -7.515108108520508, -6.329678535461426, -5.1442484855651855, -3.9588184356689453, -2.7733888626098633, -1.5879583358764648, -0.4025287628173828, 0.7829011678695679, 1.9683310985565186, 3.1537609100341797, 4.33919095993042, 5.52462100982666, 6.710050582885742, 7.895481109619141, 9.080910682678223, 10.266340255737305, 11.451770782470703, 12.637200355529785, 13.822629928588867, 15.008060455322266, 16.19348907470703, 17.378921508789062, 18.564350128173828, 19.749780654907227, 20.935209274291992, 22.12063980102539, 23.30607032775879, 24.491500854492188, 25.676929473876953, 26.86236000061035, 28.04779052734375, 29.23322105407715, 30.418649673461914, 31.604080200195312, 32.78950881958008, 33.97494125366211, 35.160369873046875, 36.345802307128906, 37.531227111816406, 38.71665573120117, 39.9020881652832, 41.08751678466797, 42.272945404052734, 43.458377838134766, 44.64380645751953, 45.82923889160156, 47.01466751098633, 48.200096130371094, 49.385528564453125, 50.57095718383789, 51.756385803222656, 52.94181823730469, 54.12724685668945, 55.31267547607422, 56.49810791015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 12.0, 11.0, 10.0, 23.0, 23.0, 32.0, 34.0, 39.0, 53.0, 48.0, 45.0, 49.0, 49.0, 59.0, 42.0, 50.0, 61.0, 54.0, 43.0, 37.0, 53.0, 32.0, 22.0, 22.0, 24.0, 15.0, 13.0, 7.0, 4.0, 7.0, 0.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.749755382537842, -7.472809791564941, -7.195863723754883, -6.918918132781982, -6.641972064971924, -6.365026473999023, -6.088080406188965, -5.8111348152160645, -5.534189224243164, -5.257243633270264, -4.980297565460205, -4.703351974487305, -4.426405906677246, -4.149460315704346, -3.872514486312866, -3.5955686569213867, -3.318622589111328, -3.0416767597198486, -2.764730930328369, -2.4877853393554688, -2.21083927154541, -1.9338935613632202, -1.6569478511810303, -1.3800020217895508, -1.1030561923980713, -0.8261103630065918, -0.5491645932197571, -0.27221882343292236, 0.004727005958557129, 0.2816728353500366, 0.5586185455322266, 0.835564374923706, 1.1125097274780273, 1.3894555568695068, 1.6664013862609863, 1.9433470964431763, 2.2202930450439453, 2.4972386360168457, 2.774184465408325, 3.0511302947998047, 3.328076124191284, 3.6050219535827637, 3.881967782974243, 4.158913612365723, 4.435859203338623, 4.712805271148682, 4.989750862121582, 5.266696929931641, 5.543642520904541, 5.820588111877441, 6.0975341796875, 6.3744797706604, 6.651425838470459, 6.928371429443359, 7.205317497253418, 7.482263088226318, 7.759208679199219, 8.036154747009277, 8.31309986114502, 8.590045928955078, 8.866991996765137, 9.143938064575195, 9.420883178710938, 9.697829246520996, 9.974775314331055]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 12.0, 12.0, 24.0, 27.0, 34.0, 62.0, 106.0, 145.0, 248.0, 504.0, 833.0, 1511.0, 3229.0, 7003.0, 16738.0, 45458.0, 136654.0, 401281.0, 290985.0, 89678.0, 31264.0, 12339.0, 5235.0, 2393.0, 1205.0, 636.0, 343.0, 213.0, 132.0, 73.0, 49.0, 38.0, 26.0, 9.0, 10.0, 11.0, 10.0, 10.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9460601806640625, -1.890167236328125, -1.8342742919921875, -1.77838134765625, -1.7224884033203125, -1.666595458984375, -1.6107025146484375, -1.5548095703125, -1.4989166259765625, -1.443023681640625, -1.3871307373046875, -1.33123779296875, -1.2753448486328125, -1.219451904296875, -1.1635589599609375, -1.107666015625, -1.0517730712890625, -0.995880126953125, -0.9399871826171875, -0.88409423828125, -0.8282012939453125, -0.772308349609375, -0.7164154052734375, -0.6605224609375, -0.6046295166015625, -0.548736572265625, -0.4928436279296875, -0.43695068359375, -0.3810577392578125, -0.325164794921875, -0.2692718505859375, -0.21337890625, -0.1574859619140625, -0.101593017578125, -0.0457000732421875, 0.01019287109375, 0.0660858154296875, 0.121978759765625, 0.1778717041015625, 0.2337646484375, 0.2896575927734375, 0.345550537109375, 0.4014434814453125, 0.45733642578125, 0.5132293701171875, 0.569122314453125, 0.6250152587890625, 0.680908203125, 0.7368011474609375, 0.792694091796875, 0.8485870361328125, 0.90447998046875, 0.9603729248046875, 1.016265869140625, 1.0721588134765625, 1.1280517578125, 1.1839447021484375, 1.239837646484375, 1.2957305908203125, 1.35162353515625, 1.4075164794921875, 1.463409423828125, 1.5193023681640625, 1.5751953125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 8.0, 15.0, 8.0, 21.0, 19.0, 19.0, 29.0, 44.0, 39.0, 39.0, 59.0, 46.0, 51.0, 50.0, 58.0, 54.0, 54.0, 34.0, 39.0, 59.0, 32.0, 42.0, 29.0, 33.0, 20.0, 11.0, 15.0, 9.0, 9.0, 12.0, 8.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.98291015625, -0.9573593139648438, -0.9318084716796875, -0.9062576293945312, -0.880706787109375, -0.8551559448242188, -0.8296051025390625, -0.8040542602539062, -0.77850341796875, -0.7529525756835938, -0.7274017333984375, -0.7018508911132812, -0.676300048828125, -0.6507492065429688, -0.6251983642578125, -0.5996475219726562, -0.5740966796875, -0.5485458374023438, -0.5229949951171875, -0.49744415283203125, -0.471893310546875, -0.44634246826171875, -0.4207916259765625, -0.39524078369140625, -0.36968994140625, -0.34413909912109375, -0.3185882568359375, -0.29303741455078125, -0.267486572265625, -0.24193572998046875, -0.2163848876953125, -0.19083404541015625, -0.165283203125, -0.13973236083984375, -0.1141815185546875, -0.08863067626953125, -0.063079833984375, -0.03752899169921875, -0.0119781494140625, 0.01357269287109375, 0.03912353515625, 0.06467437744140625, 0.0902252197265625, 0.11577606201171875, 0.141326904296875, 0.16687774658203125, 0.1924285888671875, 0.21797943115234375, 0.2435302734375, 0.26908111572265625, 0.2946319580078125, 0.32018280029296875, 0.345733642578125, 0.37128448486328125, 0.3968353271484375, 0.42238616943359375, 0.44793701171875, 0.47348785400390625, 0.4990386962890625, 0.5245895385742188, 0.550140380859375, 0.5756912231445312, 0.6012420654296875, 0.6267929077148438, 0.65234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 9.0, 10.0, 10.0, 10.0, 8.0, 36.0, 43.0, 49.0, 83.0, 128.0, 242.0, 391.0, 736.0, 1552.0, 4132.0, 18365.0, 135598.0, 740389.0, 122342.0, 17160.0, 4166.0, 1465.0, 678.0, 332.0, 201.0, 134.0, 90.0, 54.0, 48.0, 26.0, 15.0, 13.0, 6.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.734375, -2.631103515625, -2.52783203125, -2.424560546875, -2.3212890625, -2.218017578125, -2.11474609375, -2.011474609375, -1.908203125, -1.804931640625, -1.70166015625, -1.598388671875, -1.4951171875, -1.391845703125, -1.28857421875, -1.185302734375, -1.08203125, -0.978759765625, -0.87548828125, -0.772216796875, -0.6689453125, -0.565673828125, -0.46240234375, -0.359130859375, -0.255859375, -0.152587890625, -0.04931640625, 0.053955078125, 0.1572265625, 0.260498046875, 0.36376953125, 0.467041015625, 0.5703125, 0.673583984375, 0.77685546875, 0.880126953125, 0.9833984375, 1.086669921875, 1.18994140625, 1.293212890625, 1.396484375, 1.499755859375, 1.60302734375, 1.706298828125, 1.8095703125, 1.912841796875, 2.01611328125, 2.119384765625, 2.22265625, 2.325927734375, 2.42919921875, 2.532470703125, 2.6357421875, 2.739013671875, 2.84228515625, 2.945556640625, 3.048828125, 3.152099609375, 3.25537109375, 3.358642578125, 3.4619140625, 3.565185546875, 3.66845703125, 3.771728515625, 3.875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 11.0, 8.0, 12.0, 11.0, 14.0, 18.0, 19.0, 22.0, 23.0, 30.0, 36.0, 36.0, 37.0, 39.0, 45.0, 45.0, 49.0, 39.0, 46.0, 58.0, 53.0, 37.0, 37.0, 49.0, 32.0, 25.0, 30.0, 16.0, 15.0, 14.0, 13.0, 13.0, 8.0, 10.0, 12.0, 9.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.78515625, -2.70001220703125, -2.6148681640625, -2.52972412109375, -2.444580078125, -2.35943603515625, -2.2742919921875, -2.18914794921875, -2.10400390625, -2.01885986328125, -1.9337158203125, -1.84857177734375, -1.763427734375, -1.67828369140625, -1.5931396484375, -1.50799560546875, -1.4228515625, -1.33770751953125, -1.2525634765625, -1.16741943359375, -1.082275390625, -0.99713134765625, -0.9119873046875, -0.82684326171875, -0.74169921875, -0.65655517578125, -0.5714111328125, -0.48626708984375, -0.401123046875, -0.31597900390625, -0.2308349609375, -0.14569091796875, -0.060546875, 0.02459716796875, 0.1097412109375, 0.19488525390625, 0.280029296875, 0.36517333984375, 0.4503173828125, 0.53546142578125, 0.62060546875, 0.70574951171875, 0.7908935546875, 0.87603759765625, 0.961181640625, 1.04632568359375, 1.1314697265625, 1.21661376953125, 1.3017578125, 1.38690185546875, 1.4720458984375, 1.55718994140625, 1.642333984375, 1.72747802734375, 1.8126220703125, 1.89776611328125, 1.98291015625, 2.06805419921875, 2.1531982421875, 2.23834228515625, 2.323486328125, 2.40863037109375, 2.4937744140625, 2.57891845703125, 2.6640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 11.0, 7.0, 12.0, 29.0, 47.0, 108.0, 345.0, 2171.0, 256132.0, 786085.0, 2970.0, 422.0, 122.0, 52.0, 15.0, 14.0, 7.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.935546875, -3.790130615234375, -3.64471435546875, -3.499298095703125, -3.3538818359375, -3.208465576171875, -3.06304931640625, -2.917633056640625, -2.772216796875, -2.626800537109375, -2.48138427734375, -2.335968017578125, -2.1905517578125, -2.045135498046875, -1.89971923828125, -1.754302978515625, -1.60888671875, -1.463470458984375, -1.31805419921875, -1.172637939453125, -1.0272216796875, -0.881805419921875, -0.73638916015625, -0.590972900390625, -0.445556640625, -0.300140380859375, -0.15472412109375, -0.009307861328125, 0.1361083984375, 0.281524658203125, 0.42694091796875, 0.572357177734375, 0.7177734375, 0.863189697265625, 1.00860595703125, 1.154022216796875, 1.2994384765625, 1.444854736328125, 1.59027099609375, 1.735687255859375, 1.881103515625, 2.026519775390625, 2.17193603515625, 2.317352294921875, 2.4627685546875, 2.608184814453125, 2.75360107421875, 2.899017333984375, 3.04443359375, 3.189849853515625, 3.33526611328125, 3.480682373046875, 3.6260986328125, 3.771514892578125, 3.91693115234375, 4.062347412109375, 4.207763671875, 4.353179931640625, 4.49859619140625, 4.644012451171875, 4.7894287109375, 4.934844970703125, 5.08026123046875, 5.225677490234375, 5.37109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 10.0, 8.0, 5.0, 8.0, 11.0, 20.0, 16.0, 34.0, 40.0, 63.0, 74.0, 108.0, 143.0, 130.0, 85.0, 66.0, 43.0, 34.0, 16.0, 24.0, 6.0, 13.0, 16.0, 4.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016164779663085938, -0.00015586242079734802, -0.00015007704496383667, -0.00014429166913032532, -0.00013850629329681396, -0.0001327209174633026, -0.00012693554162979126, -0.00012115016579627991, -0.00011536478996276855, -0.0001095794141292572, -0.00010379403829574585, -9.80086624622345e-05, -9.222328662872314e-05, -8.643791079521179e-05, -8.065253496170044e-05, -7.486715912818909e-05, -6.908178329467773e-05, -6.329640746116638e-05, -5.751103162765503e-05, -5.172565579414368e-05, -4.5940279960632324e-05, -4.015490412712097e-05, -3.436952829360962e-05, -2.8584152460098267e-05, -2.2798776626586914e-05, -1.701340079307556e-05, -1.1228024959564209e-05, -5.4426491260528564e-06, 3.427267074584961e-07, 6.128102540969849e-06, 1.1913478374481201e-05, 1.7698854207992554e-05, 2.3484230041503906e-05, 2.926960587501526e-05, 3.505498170852661e-05, 4.0840357542037964e-05, 4.6625733375549316e-05, 5.241110920906067e-05, 5.819648504257202e-05, 6.398186087608337e-05, 6.976723670959473e-05, 7.555261254310608e-05, 8.133798837661743e-05, 8.712336421012878e-05, 9.290874004364014e-05, 9.869411587715149e-05, 0.00010447949171066284, 0.0001102648675441742, 0.00011605024337768555, 0.0001218356192111969, 0.00012762099504470825, 0.0001334063708782196, 0.00013919174671173096, 0.0001449771225452423, 0.00015076249837875366, 0.00015654787421226501, 0.00016233325004577637, 0.00016811862587928772, 0.00017390400171279907, 0.00017968937754631042, 0.00018547475337982178, 0.00019126012921333313, 0.00019704550504684448, 0.00020283088088035583, 0.0002086162567138672]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 7.0, 10.0, 11.0, 15.0, 26.0, 40.0, 66.0, 114.0, 222.0, 477.0, 1117.0, 3599.0, 18200.0, 275592.0, 704149.0, 36440.0, 5583.0, 1672.0, 584.0, 264.0, 141.0, 74.0, 55.0, 29.0, 27.0, 13.0, 3.0, 3.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.975067138671875, -0.92669677734375, -0.878326416015625, -0.8299560546875, -0.781585693359375, -0.73321533203125, -0.684844970703125, -0.636474609375, -0.588104248046875, -0.53973388671875, -0.491363525390625, -0.4429931640625, -0.394622802734375, -0.34625244140625, -0.297882080078125, -0.24951171875, -0.201141357421875, -0.15277099609375, -0.104400634765625, -0.0560302734375, -0.007659912109375, 0.04071044921875, 0.089080810546875, 0.137451171875, 0.185821533203125, 0.23419189453125, 0.282562255859375, 0.3309326171875, 0.379302978515625, 0.42767333984375, 0.476043701171875, 0.5244140625, 0.572784423828125, 0.62115478515625, 0.669525146484375, 0.7178955078125, 0.766265869140625, 0.81463623046875, 0.863006591796875, 0.911376953125, 0.959747314453125, 1.00811767578125, 1.056488037109375, 1.1048583984375, 1.153228759765625, 1.20159912109375, 1.249969482421875, 1.29833984375, 1.346710205078125, 1.39508056640625, 1.443450927734375, 1.4918212890625, 1.540191650390625, 1.58856201171875, 1.636932373046875, 1.685302734375, 1.733673095703125, 1.78204345703125, 1.830413818359375, 1.8787841796875, 1.927154541015625, 1.97552490234375, 2.023895263671875, 2.072265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 12.0, 10.0, 22.0, 36.0, 43.0, 65.0, 87.0, 107.0, 128.0, 121.0, 93.0, 73.0, 50.0, 49.0, 36.0, 17.0, 13.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0185546875, -0.980621337890625, -0.94268798828125, -0.904754638671875, -0.8668212890625, -0.828887939453125, -0.79095458984375, -0.753021240234375, -0.715087890625, -0.677154541015625, -0.63922119140625, -0.601287841796875, -0.5633544921875, -0.525421142578125, -0.48748779296875, -0.449554443359375, -0.41162109375, -0.373687744140625, -0.33575439453125, -0.297821044921875, -0.2598876953125, -0.221954345703125, -0.18402099609375, -0.146087646484375, -0.108154296875, -0.070220947265625, -0.03228759765625, 0.005645751953125, 0.0435791015625, 0.081512451171875, 0.11944580078125, 0.157379150390625, 0.1953125, 0.233245849609375, 0.27117919921875, 0.309112548828125, 0.3470458984375, 0.384979248046875, 0.42291259765625, 0.460845947265625, 0.498779296875, 0.536712646484375, 0.57464599609375, 0.612579345703125, 0.6505126953125, 0.688446044921875, 0.72637939453125, 0.764312744140625, 0.80224609375, 0.840179443359375, 0.87811279296875, 0.916046142578125, 0.9539794921875, 0.991912841796875, 1.02984619140625, 1.067779541015625, 1.105712890625, 1.143646240234375, 1.18157958984375, 1.219512939453125, 1.2574462890625, 1.295379638671875, 1.33331298828125, 1.371246337890625, 1.4091796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 21.0, 69.0, 183.0, 351.0, 229.0, 71.0, 31.0, 10.0, 10.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.86699676513672, -38.75015640258789, -37.63331604003906, -36.516475677490234, -35.399635314941406, -34.28279495239258, -33.16595458984375, -32.04911804199219, -30.932275772094727, -29.8154354095459, -28.69859504699707, -27.581754684448242, -26.464916229248047, -25.34807586669922, -24.23123550415039, -23.114395141601562, -21.997554779052734, -20.880714416503906, -19.763874053955078, -18.64703369140625, -17.530193328857422, -16.413352966308594, -15.296514511108398, -14.17967414855957, -13.062833786010742, -11.945993423461914, -10.829153060913086, -9.712313652038574, -8.595473289489746, -7.478632926940918, -6.361793041229248, -5.244953155517578, -4.12811279296875, -3.011272668838501, -1.894432544708252, -0.7775924205780029, 0.3392477035522461, 1.4560880661010742, 2.572927951812744, 3.689767837524414, 4.806608200073242, 5.92344856262207, 7.04028844833374, 8.15712833404541, 9.273968696594238, 10.390809059143066, 11.507648468017578, 12.624488830566406, 13.741329193115234, 14.858169555664062, 15.97500991821289, 17.09185028076172, 18.208690643310547, 19.325531005859375, 20.44236946105957, 21.5592098236084, 22.676050186157227, 23.792890548706055, 24.909730911254883, 26.02657127380371, 27.143409729003906, 28.260250091552734, 29.377090454101562, 30.49393081665039, 31.61077117919922]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 5.0, 8.0, 9.0, 10.0, 15.0, 11.0, 23.0, 19.0, 29.0, 29.0, 34.0, 40.0, 37.0, 45.0, 55.0, 45.0, 55.0, 51.0, 52.0, 52.0, 49.0, 43.0, 31.0, 34.0, 25.0, 19.0, 25.0, 24.0, 21.0, 19.0, 16.0, 13.0, 7.0, 13.0, 3.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.482670783996582, -9.140835762023926, -8.79900074005127, -8.457165718078613, -8.115331649780273, -7.773496150970459, -7.431661605834961, -7.089826583862305, -6.747991561889648, -6.406156539916992, -6.064321517944336, -5.722486972808838, -5.380651950836182, -5.038816928863525, -4.696982383728027, -4.355147361755371, -4.013312339782715, -3.6714773178100586, -3.3296425342559814, -2.9878077507019043, -2.645972728729248, -2.304137706756592, -1.9623029232025146, -1.6204681396484375, -1.2786331176757812, -0.9367982149124146, -0.5949633121490479, -0.25312840938568115, 0.08870649337768555, 0.43054139614105225, 0.772376298904419, 1.114211082458496, 1.456045150756836, 1.7978800535202026, 2.1397149562835693, 2.4815497398376465, 2.8233847618103027, 3.165219783782959, 3.507054567337036, 3.8488893508911133, 4.1907243728637695, 4.532559394836426, 4.874394416809082, 5.21622896194458, 5.558063983917236, 5.899899005889893, 6.241733551025391, 6.583568572998047, 6.925403594970703, 7.267238616943359, 7.609073638916016, 7.950908184051514, 8.292743682861328, 8.634577751159668, 8.976412773132324, 9.31824779510498, 9.660082817077637, 10.001917839050293, 10.34375286102295, 10.685587882995605, 11.027421951293945, 11.369256973266602, 11.711091995239258, 12.052927017211914, 12.39476203918457]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 14.0, 4.0, 9.0, 23.0, 26.0, 34.0, 38.0, 59.0, 86.0, 121.0, 178.0, 294.0, 444.0, 804.0, 1394.0, 2636.0, 5661.0, 13338.0, 37410.0, 147057.0, 1218279.0, 2385928.0, 287098.0, 58793.0, 19009.0, 7535.0, 3557.0, 1805.0, 973.0, 558.0, 370.0, 233.0, 156.0, 98.0, 61.0, 57.0, 38.0, 26.0, 20.0, 12.0, 11.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.306640625, -1.2684173583984375, -1.230194091796875, -1.1919708251953125, -1.15374755859375, -1.1155242919921875, -1.077301025390625, -1.0390777587890625, -1.0008544921875, -0.9626312255859375, -0.924407958984375, -0.8861846923828125, -0.84796142578125, -0.8097381591796875, -0.771514892578125, -0.7332916259765625, -0.695068359375, -0.6568450927734375, -0.618621826171875, -0.5803985595703125, -0.54217529296875, -0.5039520263671875, -0.465728759765625, -0.4275054931640625, -0.3892822265625, -0.3510589599609375, -0.312835693359375, -0.2746124267578125, -0.23638916015625, -0.1981658935546875, -0.159942626953125, -0.1217193603515625, -0.08349609375, -0.0452728271484375, -0.007049560546875, 0.0311737060546875, 0.06939697265625, 0.1076202392578125, 0.145843505859375, 0.1840667724609375, 0.2222900390625, 0.2605133056640625, 0.298736572265625, 0.3369598388671875, 0.37518310546875, 0.4134063720703125, 0.451629638671875, 0.4898529052734375, 0.528076171875, 0.5662994384765625, 0.604522705078125, 0.6427459716796875, 0.68096923828125, 0.7191925048828125, 0.757415771484375, 0.7956390380859375, 0.8338623046875, 0.8720855712890625, 0.910308837890625, 0.9485321044921875, 0.98675537109375, 1.0249786376953125, 1.063201904296875, 1.1014251708984375, 1.1396484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 12.0, 20.0, 21.0, 30.0, 43.0, 49.0, 60.0, 67.0, 81.0, 81.0, 81.0, 69.0, 72.0, 68.0, 51.0, 57.0, 42.0, 26.0, 14.0, 19.0, 8.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.1061859130859375, -1.070770263671875, -1.0353546142578125, -0.99993896484375, -0.9645233154296875, -0.929107666015625, -0.8936920166015625, -0.8582763671875, -0.8228607177734375, -0.787445068359375, -0.7520294189453125, -0.71661376953125, -0.6811981201171875, -0.645782470703125, -0.6103668212890625, -0.574951171875, -0.5395355224609375, -0.504119873046875, -0.4687042236328125, -0.43328857421875, -0.3978729248046875, -0.362457275390625, -0.3270416259765625, -0.2916259765625, -0.2562103271484375, -0.220794677734375, -0.1853790283203125, -0.14996337890625, -0.1145477294921875, -0.079132080078125, -0.0437164306640625, -0.00830078125, 0.0271148681640625, 0.062530517578125, 0.0979461669921875, 0.13336181640625, 0.1687774658203125, 0.204193115234375, 0.2396087646484375, 0.2750244140625, 0.3104400634765625, 0.345855712890625, 0.3812713623046875, 0.41668701171875, 0.4521026611328125, 0.487518310546875, 0.5229339599609375, 0.558349609375, 0.5937652587890625, 0.629180908203125, 0.6645965576171875, 0.70001220703125, 0.7354278564453125, 0.770843505859375, 0.8062591552734375, 0.8416748046875, 0.8770904541015625, 0.912506103515625, 0.9479217529296875, 0.98333740234375, 1.0187530517578125, 1.054168701171875, 1.0895843505859375, 1.125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 9.0, 12.0, 27.0, 23.0, 35.0, 51.0, 74.0, 137.0, 212.0, 415.0, 847.0, 2156.0, 6016.0, 20020.0, 86916.0, 983631.0, 2865149.0, 180300.0, 33731.0, 9169.0, 2966.0, 1187.0, 523.0, 276.0, 145.0, 79.0, 48.0, 36.0, 23.0, 22.0, 11.0, 10.0, 3.0, 7.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.763671875, -1.707122802734375, -1.65057373046875, -1.594024658203125, -1.5374755859375, -1.480926513671875, -1.42437744140625, -1.367828369140625, -1.311279296875, -1.254730224609375, -1.19818115234375, -1.141632080078125, -1.0850830078125, -1.028533935546875, -0.97198486328125, -0.915435791015625, -0.85888671875, -0.802337646484375, -0.74578857421875, -0.689239501953125, -0.6326904296875, -0.576141357421875, -0.51959228515625, -0.463043212890625, -0.406494140625, -0.349945068359375, -0.29339599609375, -0.236846923828125, -0.1802978515625, -0.123748779296875, -0.06719970703125, -0.010650634765625, 0.0458984375, 0.102447509765625, 0.15899658203125, 0.215545654296875, 0.2720947265625, 0.328643798828125, 0.38519287109375, 0.441741943359375, 0.498291015625, 0.554840087890625, 0.61138916015625, 0.667938232421875, 0.7244873046875, 0.781036376953125, 0.83758544921875, 0.894134521484375, 0.95068359375, 1.007232666015625, 1.06378173828125, 1.120330810546875, 1.1768798828125, 1.233428955078125, 1.28997802734375, 1.346527099609375, 1.403076171875, 1.459625244140625, 1.51617431640625, 1.572723388671875, 1.6292724609375, 1.685821533203125, 1.74237060546875, 1.798919677734375, 1.85546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 5.0, 10.0, 11.0, 21.0, 16.0, 27.0, 28.0, 43.0, 40.0, 63.0, 111.0, 138.0, 210.0, 330.0, 494.0, 553.0, 584.0, 395.0, 275.0, 186.0, 120.0, 89.0, 62.0, 53.0, 39.0, 29.0, 18.0, 17.0, 12.0, 17.0, 14.0, 7.0, 3.0, 6.0, 7.0, 7.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.494140625, -1.4512481689453125, -1.408355712890625, -1.3654632568359375, -1.32257080078125, -1.2796783447265625, -1.236785888671875, -1.1938934326171875, -1.1510009765625, -1.1081085205078125, -1.065216064453125, -1.0223236083984375, -0.97943115234375, -0.9365386962890625, -0.893646240234375, -0.8507537841796875, -0.807861328125, -0.7649688720703125, -0.722076416015625, -0.6791839599609375, -0.63629150390625, -0.5933990478515625, -0.550506591796875, -0.5076141357421875, -0.4647216796875, -0.4218292236328125, -0.378936767578125, -0.3360443115234375, -0.29315185546875, -0.2502593994140625, -0.207366943359375, -0.1644744873046875, -0.12158203125, -0.0786895751953125, -0.035797119140625, 0.0070953369140625, 0.04998779296875, 0.0928802490234375, 0.135772705078125, 0.1786651611328125, 0.2215576171875, 0.2644500732421875, 0.307342529296875, 0.3502349853515625, 0.39312744140625, 0.4360198974609375, 0.478912353515625, 0.5218048095703125, 0.564697265625, 0.6075897216796875, 0.650482177734375, 0.6933746337890625, 0.73626708984375, 0.7791595458984375, 0.822052001953125, 0.8649444580078125, 0.9078369140625, 0.9507293701171875, 0.993621826171875, 1.0365142822265625, 1.07940673828125, 1.1222991943359375, 1.165191650390625, 1.2080841064453125, 1.2509765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 3.0, 9.0, 13.0, 26.0, 64.0, 107.0, 164.0, 192.0, 161.0, 116.0, 62.0, 38.0, 15.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.264766693115234, -22.661638259887695, -22.058509826660156, -21.45538330078125, -20.85225486755371, -20.249126434326172, -19.645998001098633, -19.042869567871094, -18.439743041992188, -17.83661460876465, -17.23348617553711, -16.630359649658203, -16.027231216430664, -15.424102783203125, -14.820974349975586, -14.217846870422363, -13.614718437194824, -13.011590003967285, -12.408462524414062, -11.805334091186523, -11.2022066116333, -10.599078178405762, -9.995950698852539, -9.392822265625, -8.789693832397461, -8.186565399169922, -7.583437919616699, -6.98030948638916, -6.3771820068359375, -5.774053573608398, -5.170925617218018, -4.567797660827637, -3.9646692276000977, -3.361541271209717, -2.758413314819336, -2.155285120010376, -1.5521571636199951, -0.9490292072296143, -0.3459010124206543, 0.25722694396972656, 0.8603549003601074, 1.4634828567504883, 2.066610813140869, 2.669739007949829, 3.27286696434021, 3.875994920730591, 4.479123115539551, 5.082251071929932, 5.6853790283203125, 6.288506984710693, 6.891634941101074, 7.494763374328613, 8.097890853881836, 8.701019287109375, 9.304147720336914, 9.907275199890137, 10.51040267944336, 11.113531112670898, 11.716658592224121, 12.31978702545166, 12.922914505004883, 13.526042938232422, 14.129171371459961, 14.732298851013184, 15.335427284240723]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 2.0, 5.0, 12.0, 15.0, 15.0, 17.0, 24.0, 14.0, 34.0, 36.0, 45.0, 55.0, 42.0, 72.0, 56.0, 63.0, 66.0, 65.0, 33.0, 49.0, 42.0, 42.0, 32.0, 20.0, 22.0, 33.0, 20.0, 25.0, 13.0, 6.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.27517318725586, -9.972159385681152, -9.669144630432129, -9.366130828857422, -9.063117027282715, -8.760102272033691, -8.457088470458984, -8.154073715209961, -7.851059913635254, -7.548045635223389, -7.245031833648682, -6.942017555236816, -6.639003276824951, -6.335988998413086, -6.032975196838379, -5.729960918426514, -5.426947116851807, -5.123932838439941, -4.820919036865234, -4.517904758453369, -4.214890480041504, -3.9118764400482178, -3.6088624000549316, -3.3058481216430664, -3.0028340816497803, -2.699820041656494, -2.396805763244629, -2.0937917232513428, -1.790777564048767, -1.4877634048461914, -1.1847493648529053, -0.88173508644104, -0.5787210464477539, -0.2757069170475006, 0.027307212352752686, 0.3303213119506836, 0.6333354711532593, 0.936349630355835, 1.239363670349121, 1.5423779487609863, 1.8453919887542725, 2.1484060287475586, 2.451420307159424, 2.75443434715271, 3.057448387145996, 3.3604626655578613, 3.6634767055511475, 3.9664909839630127, 4.269505023956299, 4.572519302368164, 4.875533103942871, 5.178547382354736, 5.481561660766602, 5.784575462341309, 6.087589740753174, 6.390604019165039, 6.693617820739746, 6.996632099151611, 7.299645900726318, 7.602660179138184, 7.905674457550049, 8.208688735961914, 8.511702537536621, 8.814716339111328, 9.117731094360352]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 5.0, 8.0, 21.0, 20.0, 25.0, 28.0, 52.0, 73.0, 115.0, 147.0, 241.0, 341.0, 552.0, 1085.0, 1862.0, 3515.0, 7308.0, 16444.0, 38229.0, 93208.0, 225661.0, 352007.0, 177667.0, 73458.0, 30568.0, 13069.0, 5974.0, 2937.0, 1592.0, 847.0, 477.0, 308.0, 216.0, 148.0, 81.0, 68.0, 61.0, 27.0, 31.0, 17.0, 10.0, 7.0, 11.0, 9.0, 4.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.546875, -1.501861572265625, -1.45684814453125, -1.411834716796875, -1.3668212890625, -1.321807861328125, -1.27679443359375, -1.231781005859375, -1.186767578125, -1.141754150390625, -1.09674072265625, -1.051727294921875, -1.0067138671875, -0.961700439453125, -0.91668701171875, -0.871673583984375, -0.82666015625, -0.781646728515625, -0.73663330078125, -0.691619873046875, -0.6466064453125, -0.601593017578125, -0.55657958984375, -0.511566162109375, -0.466552734375, -0.421539306640625, -0.37652587890625, -0.331512451171875, -0.2864990234375, -0.241485595703125, -0.19647216796875, -0.151458740234375, -0.1064453125, -0.061431884765625, -0.01641845703125, 0.028594970703125, 0.0736083984375, 0.118621826171875, 0.16363525390625, 0.208648681640625, 0.253662109375, 0.298675537109375, 0.34368896484375, 0.388702392578125, 0.4337158203125, 0.478729248046875, 0.52374267578125, 0.568756103515625, 0.61376953125, 0.658782958984375, 0.70379638671875, 0.748809814453125, 0.7938232421875, 0.838836669921875, 0.88385009765625, 0.928863525390625, 0.973876953125, 1.018890380859375, 1.06390380859375, 1.108917236328125, 1.1539306640625, 1.198944091796875, 1.24395751953125, 1.288970947265625, 1.333984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 17.0, 26.0, 32.0, 50.0, 54.0, 53.0, 59.0, 72.0, 91.0, 81.0, 80.0, 81.0, 66.0, 60.0, 47.0, 27.0, 26.0, 20.0, 10.0, 12.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.11456298828125, -1.0787353515625, -1.04290771484375, -1.007080078125, -0.97125244140625, -0.9354248046875, -0.89959716796875, -0.86376953125, -0.82794189453125, -0.7921142578125, -0.75628662109375, -0.720458984375, -0.68463134765625, -0.6488037109375, -0.61297607421875, -0.5771484375, -0.54132080078125, -0.5054931640625, -0.46966552734375, -0.433837890625, -0.39801025390625, -0.3621826171875, -0.32635498046875, -0.29052734375, -0.25469970703125, -0.2188720703125, -0.18304443359375, -0.147216796875, -0.11138916015625, -0.0755615234375, -0.03973388671875, -0.00390625, 0.03192138671875, 0.0677490234375, 0.10357666015625, 0.139404296875, 0.17523193359375, 0.2110595703125, 0.24688720703125, 0.28271484375, 0.31854248046875, 0.3543701171875, 0.39019775390625, 0.426025390625, 0.46185302734375, 0.4976806640625, 0.53350830078125, 0.5693359375, 0.60516357421875, 0.6409912109375, 0.67681884765625, 0.712646484375, 0.74847412109375, 0.7843017578125, 0.82012939453125, 0.85595703125, 0.89178466796875, 0.9276123046875, 0.96343994140625, 0.999267578125, 1.03509521484375, 1.0709228515625, 1.10675048828125, 1.142578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 6.0, 9.0, 15.0, 22.0, 30.0, 47.0, 64.0, 125.0, 187.0, 346.0, 573.0, 1054.0, 2592.0, 9851.0, 116116.0, 847104.0, 59169.0, 6880.0, 2130.0, 939.0, 508.0, 289.0, 173.0, 117.0, 61.0, 50.0, 29.0, 22.0, 13.0, 8.0, 12.0, 3.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.56463623046875, -4.4144287109375, -4.26422119140625, -4.114013671875, -3.96380615234375, -3.8135986328125, -3.66339111328125, -3.51318359375, -3.36297607421875, -3.2127685546875, -3.06256103515625, -2.912353515625, -2.76214599609375, -2.6119384765625, -2.46173095703125, -2.3115234375, -2.16131591796875, -2.0111083984375, -1.86090087890625, -1.710693359375, -1.56048583984375, -1.4102783203125, -1.26007080078125, -1.10986328125, -0.95965576171875, -0.8094482421875, -0.65924072265625, -0.509033203125, -0.35882568359375, -0.2086181640625, -0.05841064453125, 0.091796875, 0.24200439453125, 0.3922119140625, 0.54241943359375, 0.692626953125, 0.84283447265625, 0.9930419921875, 1.14324951171875, 1.29345703125, 1.44366455078125, 1.5938720703125, 1.74407958984375, 1.894287109375, 2.04449462890625, 2.1947021484375, 2.34490966796875, 2.4951171875, 2.64532470703125, 2.7955322265625, 2.94573974609375, 3.095947265625, 3.24615478515625, 3.3963623046875, 3.54656982421875, 3.69677734375, 3.84698486328125, 3.9971923828125, 4.14739990234375, 4.297607421875, 4.44781494140625, 4.5980224609375, 4.74822998046875, 4.8984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 2.0, 10.0, 10.0, 12.0, 14.0, 22.0, 17.0, 24.0, 24.0, 37.0, 44.0, 43.0, 43.0, 56.0, 58.0, 59.0, 50.0, 79.0, 63.0, 43.0, 42.0, 39.0, 42.0, 28.0, 20.0, 22.0, 20.0, 7.0, 9.0, 8.0, 7.0, 4.0, 6.0, 4.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.6328125, -3.51812744140625, -3.4034423828125, -3.28875732421875, -3.174072265625, -3.05938720703125, -2.9447021484375, -2.83001708984375, -2.71533203125, -2.60064697265625, -2.4859619140625, -2.37127685546875, -2.256591796875, -2.14190673828125, -2.0272216796875, -1.91253662109375, -1.7978515625, -1.68316650390625, -1.5684814453125, -1.45379638671875, -1.339111328125, -1.22442626953125, -1.1097412109375, -0.99505615234375, -0.88037109375, -0.76568603515625, -0.6510009765625, -0.53631591796875, -0.421630859375, -0.30694580078125, -0.1922607421875, -0.07757568359375, 0.037109375, 0.15179443359375, 0.2664794921875, 0.38116455078125, 0.495849609375, 0.61053466796875, 0.7252197265625, 0.83990478515625, 0.95458984375, 1.06927490234375, 1.1839599609375, 1.29864501953125, 1.413330078125, 1.52801513671875, 1.6427001953125, 1.75738525390625, 1.8720703125, 1.98675537109375, 2.1014404296875, 2.21612548828125, 2.330810546875, 2.44549560546875, 2.5601806640625, 2.67486572265625, 2.78955078125, 2.90423583984375, 3.0189208984375, 3.13360595703125, 3.248291015625, 3.36297607421875, 3.4776611328125, 3.59234619140625, 3.70703125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 5.0, 7.0, 13.0, 14.0, 17.0, 13.0, 21.0, 36.0, 42.0, 69.0, 114.0, 155.0, 219.0, 419.0, 985.0, 2986.0, 14526.0, 168576.0, 792568.0, 57215.0, 7121.0, 1733.0, 697.0, 351.0, 186.0, 145.0, 70.0, 60.0, 41.0, 23.0, 29.0, 18.0, 13.0, 12.0, 9.0, 7.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2494049072265625, -1.210723876953125, -1.1720428466796875, -1.13336181640625, -1.0946807861328125, -1.055999755859375, -1.0173187255859375, -0.9786376953125, -0.9399566650390625, -0.901275634765625, -0.8625946044921875, -0.82391357421875, -0.7852325439453125, -0.746551513671875, -0.7078704833984375, -0.669189453125, -0.6305084228515625, -0.591827392578125, -0.5531463623046875, -0.51446533203125, -0.4757843017578125, -0.437103271484375, -0.3984222412109375, -0.3597412109375, -0.3210601806640625, -0.282379150390625, -0.2436981201171875, -0.20501708984375, -0.1663360595703125, -0.127655029296875, -0.0889739990234375, -0.05029296875, -0.0116119384765625, 0.027069091796875, 0.0657501220703125, 0.10443115234375, 0.1431121826171875, 0.181793212890625, 0.2204742431640625, 0.2591552734375, 0.2978363037109375, 0.336517333984375, 0.3751983642578125, 0.41387939453125, 0.4525604248046875, 0.491241455078125, 0.5299224853515625, 0.568603515625, 0.6072845458984375, 0.645965576171875, 0.6846466064453125, 0.72332763671875, 0.7620086669921875, 0.800689697265625, 0.8393707275390625, 0.8780517578125, 0.9167327880859375, 0.955413818359375, 0.9940948486328125, 1.03277587890625, 1.0714569091796875, 1.110137939453125, 1.1488189697265625, 1.1875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 3.0, 3.0, 5.0, 6.0, 16.0, 11.0, 11.0, 16.0, 12.0, 18.0, 25.0, 34.0, 45.0, 55.0, 69.0, 90.0, 106.0, 79.0, 71.0, 65.0, 45.0, 28.0, 28.0, 24.0, 27.0, 13.0, 14.0, 21.0, 7.0, 10.0, 7.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013649463653564453, -0.00013159587979316711, -0.0001266971230506897, -0.00012179836630821228, -0.00011689960956573486, -0.00011200085282325745, -0.00010710209608078003, -0.00010220333933830261, -9.73045825958252e-05, -9.240582585334778e-05, -8.750706911087036e-05, -8.260831236839294e-05, -7.770955562591553e-05, -7.281079888343811e-05, -6.79120421409607e-05, -6.301328539848328e-05, -5.811452865600586e-05, -5.321577191352844e-05, -4.8317015171051025e-05, -4.341825842857361e-05, -3.851950168609619e-05, -3.3620744943618774e-05, -2.8721988201141357e-05, -2.382323145866394e-05, -1.8924474716186523e-05, -1.4025717973709106e-05, -9.12696123123169e-06, -4.2282044887542725e-06, 6.705522537231445e-07, 5.5693089962005615e-06, 1.0468065738677979e-05, 1.5366822481155396e-05, 2.0265579223632812e-05, 2.516433596611023e-05, 3.0063092708587646e-05, 3.4961849451065063e-05, 3.986060619354248e-05, 4.47593629360199e-05, 4.9658119678497314e-05, 5.455687642097473e-05, 5.945563316345215e-05, 6.435438990592957e-05, 6.925314664840698e-05, 7.41519033908844e-05, 7.905066013336182e-05, 8.394941687583923e-05, 8.884817361831665e-05, 9.374693036079407e-05, 9.864568710327148e-05, 0.0001035444438457489, 0.00010844320058822632, 0.00011334195733070374, 0.00011824071407318115, 0.00012313947081565857, 0.00012803822755813599, 0.0001329369843006134, 0.00013783574104309082, 0.00014273449778556824, 0.00014763325452804565, 0.00015253201127052307, 0.0001574307680130005, 0.0001623295247554779, 0.00016722828149795532, 0.00017212703824043274, 0.00017702579498291016]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 17.0, 14.0, 16.0, 17.0, 33.0, 46.0, 63.0, 84.0, 126.0, 195.0, 317.0, 629.0, 1329.0, 3839.0, 13773.0, 112238.0, 826733.0, 72269.0, 10952.0, 3202.0, 1243.0, 558.0, 300.0, 156.0, 112.0, 56.0, 55.0, 46.0, 32.0, 24.0, 14.0, 15.0, 10.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.2555999755859375, -1.214324951171875, -1.1730499267578125, -1.13177490234375, -1.0904998779296875, -1.049224853515625, -1.0079498291015625, -0.9666748046875, -0.9253997802734375, -0.884124755859375, -0.8428497314453125, -0.80157470703125, -0.7602996826171875, -0.719024658203125, -0.6777496337890625, -0.636474609375, -0.5951995849609375, -0.553924560546875, -0.5126495361328125, -0.47137451171875, -0.4300994873046875, -0.388824462890625, -0.3475494384765625, -0.3062744140625, -0.2649993896484375, -0.223724365234375, -0.1824493408203125, -0.14117431640625, -0.0998992919921875, -0.058624267578125, -0.0173492431640625, 0.02392578125, 0.0652008056640625, 0.106475830078125, 0.1477508544921875, 0.18902587890625, 0.2303009033203125, 0.271575927734375, 0.3128509521484375, 0.3541259765625, 0.3954010009765625, 0.436676025390625, 0.4779510498046875, 0.51922607421875, 0.5605010986328125, 0.601776123046875, 0.6430511474609375, 0.684326171875, 0.7256011962890625, 0.766876220703125, 0.8081512451171875, 0.84942626953125, 0.8907012939453125, 0.931976318359375, 0.9732513427734375, 1.0145263671875, 1.0558013916015625, 1.097076416015625, 1.1383514404296875, 1.17962646484375, 1.2209014892578125, 1.262176513671875, 1.3034515380859375, 1.3447265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 6.0, 8.0, 10.0, 17.0, 23.0, 40.0, 37.0, 45.0, 63.0, 81.0, 93.0, 109.0, 112.0, 84.0, 76.0, 46.0, 33.0, 19.0, 18.0, 14.0, 8.0, 10.0, 4.0, 4.0, 7.0, 0.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.92626953125, -0.8948593139648438, -0.8634490966796875, -0.8320388793945312, -0.800628662109375, -0.7692184448242188, -0.7378082275390625, -0.7063980102539062, -0.67498779296875, -0.6435775756835938, -0.6121673583984375, -0.5807571411132812, -0.549346923828125, -0.5179367065429688, -0.4865264892578125, -0.45511627197265625, -0.4237060546875, -0.39229583740234375, -0.3608856201171875, -0.32947540283203125, -0.298065185546875, -0.26665496826171875, -0.2352447509765625, -0.20383453369140625, -0.17242431640625, -0.14101409912109375, -0.1096038818359375, -0.07819366455078125, -0.046783447265625, -0.01537322998046875, 0.0160369873046875, 0.04744720458984375, 0.078857421875, 0.11026763916015625, 0.1416778564453125, 0.17308807373046875, 0.204498291015625, 0.23590850830078125, 0.2673187255859375, 0.29872894287109375, 0.33013916015625, 0.36154937744140625, 0.3929595947265625, 0.42436981201171875, 0.455780029296875, 0.48719024658203125, 0.5186004638671875, 0.5500106811523438, 0.5814208984375, 0.6128311157226562, 0.6442413330078125, 0.6756515502929688, 0.707061767578125, 0.7384719848632812, 0.7698822021484375, 0.8012924194335938, 0.83270263671875, 0.8641128540039062, 0.8955230712890625, 0.9269332885742188, 0.958343505859375, 0.9897537231445312, 1.0211639404296875, 1.0525741577148438, 1.083984375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 5.0, 16.0, 21.0, 48.0, 47.0, 102.0, 112.0, 178.0, 166.0, 105.0, 68.0, 51.0, 23.0, 11.0, 7.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.943916320800781, -15.443807601928711, -14.94369888305664, -14.44359016418457, -13.943480491638184, -13.443371772766113, -12.943263053894043, -12.443154335021973, -11.943044662475586, -11.442935943603516, -10.942827224731445, -10.442718505859375, -9.942608833312988, -9.442500114440918, -8.942391395568848, -8.442282676696777, -7.942173957824707, -7.442065238952637, -6.941956043243408, -6.441847324371338, -5.941738128662109, -5.441629409790039, -4.941520690917969, -4.441411972045898, -3.94130277633667, -3.4411938190460205, -2.941084861755371, -2.440976142883301, -1.9408671855926514, -1.440758228302002, -0.9406495094299316, -0.4405405521392822, 0.05956840515136719, 0.5596773028373718, 1.0597862005233765, 1.5598950386047363, 2.0600039958953857, 2.560112953186035, 3.0602216720581055, 3.560330629348755, 4.060439586639404, 4.560548305511475, 5.060657501220703, 5.560766220092773, 6.060874938964844, 6.560984134674072, 7.061092853546143, 7.561202049255371, 8.061310768127441, 8.561419486999512, 9.061528205871582, 9.561637878417969, 10.061746597290039, 10.56185531616211, 11.06196403503418, 11.56207275390625, 12.06218147277832, 12.56229019165039, 13.062398910522461, 13.562507629394531, 14.062617301940918, 14.562726020812988, 15.062834739685059, 15.562943458557129, 16.063053131103516]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 4.0, 10.0, 9.0, 19.0, 15.0, 22.0, 20.0, 34.0, 21.0, 35.0, 40.0, 38.0, 30.0, 70.0, 86.0, 80.0, 72.0, 53.0, 49.0, 45.0, 37.0, 16.0, 28.0, 24.0, 25.0, 26.0, 11.0, 25.0, 18.0, 14.0, 3.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.230524063110352, -14.78946304321289, -14.348401069641113, -13.907340049743652, -13.466278076171875, -13.025217056274414, -12.584156036376953, -12.143094062805176, -11.702033042907715, -11.260972023010254, -10.819910049438477, -10.378849029541016, -9.937787055969238, -9.496726036071777, -9.0556640625, -8.614603042602539, -8.173542022705078, -7.732480525970459, -7.29141902923584, -6.850358009338379, -6.40929651260376, -5.968235015869141, -5.5271735191345215, -5.086112022399902, -4.645050048828125, -4.203988552093506, -3.762927293777466, -3.3218657970428467, -2.8808045387268066, -2.4397430419921875, -1.9986815452575684, -1.5576202869415283, -1.1165590286254883, -0.6754976511001587, -0.23443621397018433, 0.20662522315979004, 0.6476866006851196, 1.0887479782104492, 1.5298094749450684, 1.9708707332611084, 2.4119322299957275, 2.8529937267303467, 3.2940549850463867, 3.735116481781006, 4.176177978515625, 4.617238998413086, 5.058300971984863, 5.499361991882324, 5.940423488616943, 6.3814849853515625, 6.822546482086182, 7.263607978820801, 7.704668998718262, 8.145730972290039, 8.5867919921875, 9.027853012084961, 9.468914985656738, 9.9099760055542, 10.351037979125977, 10.792098999023438, 11.233160972595215, 11.674221992492676, 12.115283966064453, 12.556344985961914, 12.997406005859375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 15.0, 20.0, 28.0, 38.0, 58.0, 100.0, 173.0, 324.0, 687.0, 1637.0, 4340.0, 15467.0, 83652.0, 1501718.0, 2434640.0, 122639.0, 19689.0, 5362.0, 1985.0, 803.0, 384.0, 241.0, 122.0, 51.0, 45.0, 23.0, 17.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.05059814453125, -1.9937744140625, -1.93695068359375, -1.880126953125, -1.82330322265625, -1.7664794921875, -1.70965576171875, -1.65283203125, -1.59600830078125, -1.5391845703125, -1.48236083984375, -1.425537109375, -1.36871337890625, -1.3118896484375, -1.25506591796875, -1.1982421875, -1.14141845703125, -1.0845947265625, -1.02777099609375, -0.970947265625, -0.91412353515625, -0.8572998046875, -0.80047607421875, -0.74365234375, -0.68682861328125, -0.6300048828125, -0.57318115234375, -0.516357421875, -0.45953369140625, -0.4027099609375, -0.34588623046875, -0.2890625, -0.23223876953125, -0.1754150390625, -0.11859130859375, -0.061767578125, -0.00494384765625, 0.0518798828125, 0.10870361328125, 0.16552734375, 0.22235107421875, 0.2791748046875, 0.33599853515625, 0.392822265625, 0.44964599609375, 0.5064697265625, 0.56329345703125, 0.6201171875, 0.67694091796875, 0.7337646484375, 0.79058837890625, 0.847412109375, 0.90423583984375, 0.9610595703125, 1.01788330078125, 1.07470703125, 1.13153076171875, 1.1883544921875, 1.24517822265625, 1.302001953125, 1.35882568359375, 1.4156494140625, 1.47247314453125, 1.529296875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 9.0, 6.0, 9.0, 11.0, 7.0, 11.0, 16.0, 16.0, 24.0, 25.0, 25.0, 37.0, 26.0, 49.0, 50.0, 59.0, 56.0, 57.0, 54.0, 63.0, 50.0, 50.0, 52.0, 45.0, 48.0, 27.0, 26.0, 25.0, 13.0, 13.0, 15.0, 5.0, 7.0, 5.0, 5.0, 6.0, 0.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.613189697265625, -0.58868408203125, -0.564178466796875, -0.5396728515625, -0.515167236328125, -0.49066162109375, -0.466156005859375, -0.441650390625, -0.417144775390625, -0.39263916015625, -0.368133544921875, -0.3436279296875, -0.319122314453125, -0.29461669921875, -0.270111083984375, -0.24560546875, -0.221099853515625, -0.19659423828125, -0.172088623046875, -0.1475830078125, -0.123077392578125, -0.09857177734375, -0.074066162109375, -0.049560546875, -0.025054931640625, -0.00054931640625, 0.023956298828125, 0.0484619140625, 0.072967529296875, 0.09747314453125, 0.121978759765625, 0.146484375, 0.170989990234375, 0.19549560546875, 0.220001220703125, 0.2445068359375, 0.269012451171875, 0.29351806640625, 0.318023681640625, 0.342529296875, 0.367034912109375, 0.39154052734375, 0.416046142578125, 0.4405517578125, 0.465057373046875, 0.48956298828125, 0.514068603515625, 0.53857421875, 0.563079833984375, 0.58758544921875, 0.612091064453125, 0.6365966796875, 0.661102294921875, 0.68560791015625, 0.710113525390625, 0.734619140625, 0.759124755859375, 0.78363037109375, 0.808135986328125, 0.8326416015625, 0.857147216796875, 0.88165283203125, 0.906158447265625, 0.9306640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 10.0, 8.0, 11.0, 23.0, 25.0, 49.0, 77.0, 109.0, 159.0, 272.0, 485.0, 915.0, 2233.0, 7710.0, 38747.0, 514684.0, 3425594.0, 170953.0, 23130.0, 5449.0, 1862.0, 752.0, 430.0, 249.0, 142.0, 79.0, 62.0, 23.0, 16.0, 7.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.552734375, -2.4843292236328125, -2.415924072265625, -2.3475189208984375, -2.27911376953125, -2.2107086181640625, -2.142303466796875, -2.0738983154296875, -2.0054931640625, -1.9370880126953125, -1.868682861328125, -1.8002777099609375, -1.73187255859375, -1.6634674072265625, -1.595062255859375, -1.5266571044921875, -1.458251953125, -1.3898468017578125, -1.321441650390625, -1.2530364990234375, -1.18463134765625, -1.1162261962890625, -1.047821044921875, -0.9794158935546875, -0.9110107421875, -0.8426055908203125, -0.774200439453125, -0.7057952880859375, -0.63739013671875, -0.5689849853515625, -0.500579833984375, -0.4321746826171875, -0.36376953125, -0.2953643798828125, -0.226959228515625, -0.1585540771484375, -0.09014892578125, -0.0217437744140625, 0.046661376953125, 0.1150665283203125, 0.1834716796875, 0.2518768310546875, 0.320281982421875, 0.3886871337890625, 0.45709228515625, 0.5254974365234375, 0.593902587890625, 0.6623077392578125, 0.730712890625, 0.7991180419921875, 0.867523193359375, 0.9359283447265625, 1.00433349609375, 1.0727386474609375, 1.141143798828125, 1.2095489501953125, 1.2779541015625, 1.3463592529296875, 1.414764404296875, 1.4831695556640625, 1.55157470703125, 1.6199798583984375, 1.688385009765625, 1.7567901611328125, 1.8251953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 11.0, 12.0, 9.0, 31.0, 75.0, 165.0, 483.0, 1339.0, 1154.0, 429.0, 182.0, 77.0, 40.0, 30.0, 18.0, 11.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.1341552734375, -4.022216796875, -3.9102783203125, -3.79833984375, -3.6864013671875, -3.574462890625, -3.4625244140625, -3.3505859375, -3.2386474609375, -3.126708984375, -3.0147705078125, -2.90283203125, -2.7908935546875, -2.678955078125, -2.5670166015625, -2.455078125, -2.3431396484375, -2.231201171875, -2.1192626953125, -2.00732421875, -1.8953857421875, -1.783447265625, -1.6715087890625, -1.5595703125, -1.4476318359375, -1.335693359375, -1.2237548828125, -1.11181640625, -0.9998779296875, -0.887939453125, -0.7760009765625, -0.6640625, -0.5521240234375, -0.440185546875, -0.3282470703125, -0.21630859375, -0.1043701171875, 0.007568359375, 0.1195068359375, 0.2314453125, 0.3433837890625, 0.455322265625, 0.5672607421875, 0.67919921875, 0.7911376953125, 0.903076171875, 1.0150146484375, 1.126953125, 1.2388916015625, 1.350830078125, 1.4627685546875, 1.57470703125, 1.6866455078125, 1.798583984375, 1.9105224609375, 2.0224609375, 2.1343994140625, 2.246337890625, 2.3582763671875, 2.47021484375, 2.5821533203125, 2.694091796875, 2.8060302734375, 2.91796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 4.0, 7.0, 13.0, 34.0, 104.0, 207.0, 309.0, 192.0, 67.0, 25.0, 14.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.147830963134766, -20.235191345214844, -19.322551727294922, -18.409912109375, -17.497272491455078, -16.584632873535156, -15.671993255615234, -14.759353637695312, -13.84671401977539, -12.934074401855469, -12.021434783935547, -11.108795166015625, -10.196155548095703, -9.283515930175781, -8.37087631225586, -7.458237171173096, -6.545598030090332, -5.63295841217041, -4.720318794250488, -3.8076794147491455, -2.8950397968292236, -1.9824004173278809, -1.069760799407959, -0.1571211814880371, 0.7555184364318848, 1.6681580543518066, 2.5807976722717285, 3.4934370517730713, 4.406076431274414, 5.318716049194336, 6.231355667114258, 7.14399528503418, 8.056634902954102, 8.969274520874023, 9.881914138793945, 10.794553756713867, 11.707193374633789, 12.619832992553711, 13.532472610473633, 14.445112228393555, 15.357751846313477, 16.2703914642334, 17.18303108215332, 18.095670700073242, 19.008310317993164, 19.920949935913086, 20.833589553833008, 21.74622917175293, 22.65886688232422, 23.57150650024414, 24.484146118164062, 25.396785736083984, 26.309425354003906, 27.222064971923828, 28.13470458984375, 29.047344207763672, 29.959983825683594, 30.872623443603516, 31.785263061523438, 32.69790267944336, 33.61054229736328, 34.5231819152832, 35.435821533203125, 36.34846115112305, 37.26110076904297]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 13.0, 27.0, 37.0, 62.0, 81.0, 88.0, 105.0, 114.0, 94.0, 106.0, 75.0, 55.0, 53.0, 42.0, 22.0, 5.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.85193634033203, -26.208160400390625, -25.564382553100586, -24.920604705810547, -24.27682876586914, -23.633052825927734, -22.989274978637695, -22.345497131347656, -21.70172119140625, -21.057945251464844, -20.414167404174805, -19.770389556884766, -19.12661361694336, -18.482837677001953, -17.839059829711914, -17.195281982421875, -16.55150604248047, -15.907729148864746, -15.263952255249023, -14.6201753616333, -13.976398468017578, -13.332621574401855, -12.688844680786133, -12.04506778717041, -11.401290893554688, -10.757513999938965, -10.113737106323242, -9.46996021270752, -8.826183319091797, -8.182406425476074, -7.538629531860352, -6.894852638244629, -6.251073837280273, -5.607296943664551, -4.963520050048828, -4.3197431564331055, -3.675966262817383, -3.03218936920166, -2.3884124755859375, -1.7446355819702148, -1.1008586883544922, -0.45708179473876953, 0.18669509887695312, 0.8304719924926758, 1.4742488861083984, 2.118025779724121, 2.7618026733398438, 3.4055795669555664, 4.049356460571289, 4.693133354187012, 5.336910247802734, 5.980687141418457, 6.62446403503418, 7.268240928649902, 7.912017822265625, 8.555794715881348, 9.19957160949707, 9.843348503112793, 10.487125396728516, 11.130902290344238, 11.774679183959961, 12.418456077575684, 13.062232971191406, 13.706009864807129, 14.349786758422852]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 4.0, 11.0, 13.0, 11.0, 29.0, 24.0, 44.0, 46.0, 68.0, 101.0, 162.0, 277.0, 394.0, 772.0, 1319.0, 2748.0, 5870.0, 14332.0, 39033.0, 116296.0, 370094.0, 335377.0, 102836.0, 34694.0, 12976.0, 5452.0, 2527.0, 1322.0, 699.0, 328.0, 203.0, 143.0, 94.0, 59.0, 56.0, 31.0, 20.0, 17.0, 15.0, 13.0, 11.0, 10.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7041015625, -1.6507568359375, -1.597412109375, -1.5440673828125, -1.49072265625, -1.4373779296875, -1.384033203125, -1.3306884765625, -1.27734375, -1.2239990234375, -1.170654296875, -1.1173095703125, -1.06396484375, -1.0106201171875, -0.957275390625, -0.9039306640625, -0.8505859375, -0.7972412109375, -0.743896484375, -0.6905517578125, -0.63720703125, -0.5838623046875, -0.530517578125, -0.4771728515625, -0.423828125, -0.3704833984375, -0.317138671875, -0.2637939453125, -0.21044921875, -0.1571044921875, -0.103759765625, -0.0504150390625, 0.0029296875, 0.0562744140625, 0.109619140625, 0.1629638671875, 0.21630859375, 0.2696533203125, 0.322998046875, 0.3763427734375, 0.4296875, 0.4830322265625, 0.536376953125, 0.5897216796875, 0.64306640625, 0.6964111328125, 0.749755859375, 0.8031005859375, 0.8564453125, 0.9097900390625, 0.963134765625, 1.0164794921875, 1.06982421875, 1.1231689453125, 1.176513671875, 1.2298583984375, 1.283203125, 1.3365478515625, 1.389892578125, 1.4432373046875, 1.49658203125, 1.5499267578125, 1.603271484375, 1.6566162109375, 1.7099609375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 7.0, 7.0, 4.0, 12.0, 7.0, 5.0, 16.0, 13.0, 22.0, 24.0, 25.0, 34.0, 21.0, 32.0, 38.0, 49.0, 44.0, 45.0, 45.0, 47.0, 38.0, 43.0, 45.0, 53.0, 42.0, 27.0, 43.0, 27.0, 34.0, 30.0, 24.0, 21.0, 15.0, 16.0, 10.0, 13.0, 5.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6650390625, -0.6449203491210938, -0.6248016357421875, -0.6046829223632812, -0.584564208984375, -0.5644454956054688, -0.5443267822265625, -0.5242080688476562, -0.50408935546875, -0.48397064208984375, -0.4638519287109375, -0.44373321533203125, -0.423614501953125, -0.40349578857421875, -0.3833770751953125, -0.36325836181640625, -0.3431396484375, -0.32302093505859375, -0.3029022216796875, -0.28278350830078125, -0.262664794921875, -0.24254608154296875, -0.2224273681640625, -0.20230865478515625, -0.18218994140625, -0.16207122802734375, -0.1419525146484375, -0.12183380126953125, -0.101715087890625, -0.08159637451171875, -0.0614776611328125, -0.04135894775390625, -0.021240234375, -0.00112152099609375, 0.0189971923828125, 0.03911590576171875, 0.059234619140625, 0.07935333251953125, 0.0994720458984375, 0.11959075927734375, 0.13970947265625, 0.15982818603515625, 0.1799468994140625, 0.20006561279296875, 0.220184326171875, 0.24030303955078125, 0.2604217529296875, 0.28054046630859375, 0.3006591796875, 0.32077789306640625, 0.3408966064453125, 0.36101531982421875, 0.381134033203125, 0.40125274658203125, 0.4213714599609375, 0.44149017333984375, 0.46160888671875, 0.48172760009765625, 0.5018463134765625, 0.5219650268554688, 0.542083740234375, 0.5622024536132812, 0.5823211669921875, 0.6024398803710938, 0.62255859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 5.0, 8.0, 12.0, 23.0, 21.0, 63.0, 109.0, 248.0, 523.0, 1531.0, 6490.0, 171642.0, 847223.0, 16910.0, 2284.0, 759.0, 352.0, 151.0, 72.0, 44.0, 34.0, 14.0, 15.0, 6.0, 7.0, 2.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.8812255859375, -5.672607421875, -5.4639892578125, -5.25537109375, -5.0467529296875, -4.838134765625, -4.6295166015625, -4.4208984375, -4.2122802734375, -4.003662109375, -3.7950439453125, -3.58642578125, -3.3778076171875, -3.169189453125, -2.9605712890625, -2.751953125, -2.5433349609375, -2.334716796875, -2.1260986328125, -1.91748046875, -1.7088623046875, -1.500244140625, -1.2916259765625, -1.0830078125, -0.8743896484375, -0.665771484375, -0.4571533203125, -0.24853515625, -0.0399169921875, 0.168701171875, 0.3773193359375, 0.5859375, 0.7945556640625, 1.003173828125, 1.2117919921875, 1.42041015625, 1.6290283203125, 1.837646484375, 2.0462646484375, 2.2548828125, 2.4635009765625, 2.672119140625, 2.8807373046875, 3.08935546875, 3.2979736328125, 3.506591796875, 3.7152099609375, 3.923828125, 4.1324462890625, 4.341064453125, 4.5496826171875, 4.75830078125, 4.9669189453125, 5.175537109375, 5.3841552734375, 5.5927734375, 5.8013916015625, 6.010009765625, 6.2186279296875, 6.42724609375, 6.6358642578125, 6.844482421875, 7.0531005859375, 7.26171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 7.0, 9.0, 9.0, 13.0, 11.0, 15.0, 16.0, 21.0, 20.0, 31.0, 30.0, 31.0, 44.0, 49.0, 59.0, 41.0, 48.0, 53.0, 43.0, 50.0, 42.0, 53.0, 37.0, 39.0, 40.0, 24.0, 31.0, 22.0, 20.0, 9.0, 11.0, 7.0, 16.0, 10.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.6015625, -2.52288818359375, -2.4442138671875, -2.36553955078125, -2.286865234375, -2.20819091796875, -2.1295166015625, -2.05084228515625, -1.97216796875, -1.89349365234375, -1.8148193359375, -1.73614501953125, -1.657470703125, -1.57879638671875, -1.5001220703125, -1.42144775390625, -1.3427734375, -1.26409912109375, -1.1854248046875, -1.10675048828125, -1.028076171875, -0.94940185546875, -0.8707275390625, -0.79205322265625, -0.71337890625, -0.63470458984375, -0.5560302734375, -0.47735595703125, -0.398681640625, -0.32000732421875, -0.2413330078125, -0.16265869140625, -0.083984375, -0.00531005859375, 0.0733642578125, 0.15203857421875, 0.230712890625, 0.30938720703125, 0.3880615234375, 0.46673583984375, 0.54541015625, 0.62408447265625, 0.7027587890625, 0.78143310546875, 0.860107421875, 0.93878173828125, 1.0174560546875, 1.09613037109375, 1.1748046875, 1.25347900390625, 1.3321533203125, 1.41082763671875, 1.489501953125, 1.56817626953125, 1.6468505859375, 1.72552490234375, 1.80419921875, 1.88287353515625, 1.9615478515625, 2.04022216796875, 2.118896484375, 2.19757080078125, 2.2762451171875, 2.35491943359375, 2.43359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 6.0, 11.0, 11.0, 9.0, 22.0, 25.0, 37.0, 57.0, 88.0, 158.0, 455.0, 1713.0, 17066.0, 877163.0, 144508.0, 5616.0, 874.0, 281.0, 143.0, 74.0, 50.0, 35.0, 28.0, 22.0, 10.0, 18.0, 9.0, 8.0, 8.0, 4.0, 7.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.34375, -2.274383544921875, -2.20501708984375, -2.135650634765625, -2.0662841796875, -1.996917724609375, -1.92755126953125, -1.858184814453125, -1.788818359375, -1.719451904296875, -1.65008544921875, -1.580718994140625, -1.5113525390625, -1.441986083984375, -1.37261962890625, -1.303253173828125, -1.23388671875, -1.164520263671875, -1.09515380859375, -1.025787353515625, -0.9564208984375, -0.887054443359375, -0.81768798828125, -0.748321533203125, -0.678955078125, -0.609588623046875, -0.54022216796875, -0.470855712890625, -0.4014892578125, -0.332122802734375, -0.26275634765625, -0.193389892578125, -0.1240234375, -0.054656982421875, 0.01470947265625, 0.084075927734375, 0.1534423828125, 0.222808837890625, 0.29217529296875, 0.361541748046875, 0.430908203125, 0.500274658203125, 0.56964111328125, 0.639007568359375, 0.7083740234375, 0.777740478515625, 0.84710693359375, 0.916473388671875, 0.98583984375, 1.055206298828125, 1.12457275390625, 1.193939208984375, 1.2633056640625, 1.332672119140625, 1.40203857421875, 1.471405029296875, 1.540771484375, 1.610137939453125, 1.67950439453125, 1.748870849609375, 1.8182373046875, 1.887603759765625, 1.95697021484375, 2.026336669921875, 2.095703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 2.0, 9.0, 5.0, 2.0, 9.0, 7.0, 10.0, 9.0, 19.0, 30.0, 29.0, 34.0, 51.0, 66.0, 89.0, 109.0, 117.0, 109.0, 72.0, 40.0, 29.0, 30.0, 14.0, 20.0, 14.0, 17.0, 15.0, 11.0, 9.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016951560974121094, -0.00016369298100471497, -0.000157870352268219, -0.00015204772353172302, -0.00014622509479522705, -0.00014040246605873108, -0.0001345798373222351, -0.00012875720858573914, -0.00012293457984924316, -0.00011711195111274719, -0.00011128932237625122, -0.00010546669363975525, -9.964406490325928e-05, -9.38214361667633e-05, -8.799880743026733e-05, -8.217617869377136e-05, -7.635354995727539e-05, -7.053092122077942e-05, -6.470829248428345e-05, -5.8885663747787476e-05, -5.3063035011291504e-05, -4.724040627479553e-05, -4.141777753829956e-05, -3.559514880180359e-05, -2.9772520065307617e-05, -2.3949891328811646e-05, -1.8127262592315674e-05, -1.2304633855819702e-05, -6.4820051193237305e-06, -6.593763828277588e-07, 5.163252353668213e-06, 1.0985881090164185e-05, 1.6808509826660156e-05, 2.2631138563156128e-05, 2.84537672996521e-05, 3.427639603614807e-05, 4.009902477264404e-05, 4.5921653509140015e-05, 5.1744282245635986e-05, 5.756691098213196e-05, 6.338953971862793e-05, 6.92121684551239e-05, 7.503479719161987e-05, 8.085742592811584e-05, 8.668005466461182e-05, 9.250268340110779e-05, 9.832531213760376e-05, 0.00010414794087409973, 0.0001099705696105957, 0.00011579319834709167, 0.00012161582708358765, 0.00012743845582008362, 0.0001332610845565796, 0.00013908371329307556, 0.00014490634202957153, 0.0001507289707660675, 0.00015655159950256348, 0.00016237422823905945, 0.00016819685697555542, 0.0001740194857120514, 0.00017984211444854736, 0.00018566474318504333, 0.0001914873719215393, 0.00019731000065803528, 0.00020313262939453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 10.0, 11.0, 9.0, 12.0, 15.0, 34.0, 41.0, 52.0, 101.0, 146.0, 217.0, 401.0, 732.0, 1939.0, 6212.0, 33971.0, 589893.0, 376174.0, 29410.0, 5667.0, 1790.0, 741.0, 384.0, 215.0, 99.0, 88.0, 61.0, 45.0, 22.0, 13.0, 20.0, 13.0, 8.0, 2.0, 4.0, 4.0, 2.0, 5.0], "bins": [-1.546875, -1.5108718872070312, -1.4748687744140625, -1.4388656616210938, -1.402862548828125, -1.3668594360351562, -1.3308563232421875, -1.2948532104492188, -1.25885009765625, -1.2228469848632812, -1.1868438720703125, -1.1508407592773438, -1.114837646484375, -1.0788345336914062, -1.0428314208984375, -1.0068283081054688, -0.9708251953125, -0.9348220825195312, -0.8988189697265625, -0.8628158569335938, -0.826812744140625, -0.7908096313476562, -0.7548065185546875, -0.7188034057617188, -0.68280029296875, -0.6467971801757812, -0.6107940673828125, -0.5747909545898438, -0.538787841796875, -0.5027847290039062, -0.4667816162109375, -0.43077850341796875, -0.394775390625, -0.35877227783203125, -0.3227691650390625, -0.28676605224609375, -0.250762939453125, -0.21475982666015625, -0.1787567138671875, -0.14275360107421875, -0.10675048828125, -0.07074737548828125, -0.0347442626953125, 0.00125885009765625, 0.037261962890625, 0.07326507568359375, 0.1092681884765625, 0.14527130126953125, 0.1812744140625, 0.21727752685546875, 0.2532806396484375, 0.28928375244140625, 0.325286865234375, 0.36128997802734375, 0.3972930908203125, 0.43329620361328125, 0.46929931640625, 0.5053024291992188, 0.5413055419921875, 0.5773086547851562, 0.613311767578125, 0.6493148803710938, 0.6853179931640625, 0.7213211059570312, 0.75732421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 5.0, 7.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 13.0, 19.0, 28.0, 30.0, 32.0, 65.0, 108.0, 125.0, 127.0, 127.0, 70.0, 59.0, 43.0, 24.0, 21.0, 16.0, 10.0, 6.0, 16.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8955078125, -0.865814208984375, -0.83612060546875, -0.806427001953125, -0.7767333984375, -0.747039794921875, -0.71734619140625, -0.687652587890625, -0.657958984375, -0.628265380859375, -0.59857177734375, -0.568878173828125, -0.5391845703125, -0.509490966796875, -0.47979736328125, -0.450103759765625, -0.42041015625, -0.390716552734375, -0.36102294921875, -0.331329345703125, -0.3016357421875, -0.271942138671875, -0.24224853515625, -0.212554931640625, -0.182861328125, -0.153167724609375, -0.12347412109375, -0.093780517578125, -0.0640869140625, -0.034393310546875, -0.00469970703125, 0.024993896484375, 0.0546875, 0.084381103515625, 0.11407470703125, 0.143768310546875, 0.1734619140625, 0.203155517578125, 0.23284912109375, 0.262542724609375, 0.292236328125, 0.321929931640625, 0.35162353515625, 0.381317138671875, 0.4110107421875, 0.440704345703125, 0.47039794921875, 0.500091552734375, 0.52978515625, 0.559478759765625, 0.58917236328125, 0.618865966796875, 0.6485595703125, 0.678253173828125, 0.70794677734375, 0.737640380859375, 0.767333984375, 0.797027587890625, 0.82672119140625, 0.856414794921875, 0.8861083984375, 0.915802001953125, 0.94549560546875, 0.975189208984375, 1.0048828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 24.0, 37.0, 140.0, 422.0, 234.0, 88.0, 28.0, 12.0, 8.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.05577850341797, -51.840389251708984, -50.624996185302734, -49.40960693359375, -48.194217681884766, -46.97882843017578, -45.76343536376953, -44.54804611206055, -43.33265686035156, -42.11726760864258, -40.90187454223633, -39.686485290527344, -38.47109603881836, -37.255706787109375, -36.040313720703125, -34.82492446899414, -33.60953140258789, -32.394142150878906, -31.17875099182129, -29.963359832763672, -28.747970581054688, -27.53257942199707, -26.317188262939453, -25.10179901123047, -23.88640785217285, -22.671016693115234, -21.45562744140625, -20.240236282348633, -19.024845123291016, -17.80945587158203, -16.594064712524414, -15.378674507141113, -14.163284301757812, -12.947894096374512, -11.732503890991211, -10.517112731933594, -9.301722526550293, -8.086332321166992, -6.870941638946533, -5.655550956726074, -4.440160751342773, -3.2247703075408936, -2.0093798637390137, -0.7939894199371338, 0.4214010238647461, 1.6367912292480469, 2.852181911468506, 4.067572593688965, 5.282962799072266, 6.498353004455566, 7.713743686676025, 8.929134368896484, 10.144524574279785, 11.359914779663086, 12.575305938720703, 13.790696144104004, 15.006086349487305, 16.221477508544922, 17.436866760253906, 18.652257919311523, 19.86764907836914, 21.083038330078125, 22.298429489135742, 23.51382064819336, 24.729209899902344]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 7.0, 12.0, 23.0, 13.0, 15.0, 18.0, 28.0, 26.0, 31.0, 35.0, 37.0, 36.0, 44.0, 62.0, 81.0, 80.0, 56.0, 43.0, 49.0, 43.0, 26.0, 46.0, 25.0, 21.0, 14.0, 26.0, 14.0, 19.0, 8.0, 10.0, 7.0, 7.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.179211616516113, -9.824738502502441, -9.470264434814453, -9.115791320800781, -8.76131820678711, -8.406845092773438, -8.052371978759766, -7.697897911071777, -7.3434247970581055, -6.988951683044434, -6.6344780921936035, -6.280004501342773, -5.925531387329102, -5.57105827331543, -5.2165846824646, -4.8621110916137695, -4.507637977600098, -4.153164863586426, -3.7986912727355957, -3.4442179203033447, -3.0897445678710938, -2.7352712154388428, -2.380797863006592, -2.026324510574341, -1.6718511581420898, -1.3173778057098389, -0.9629044532775879, -0.6084311008453369, -0.25395774841308594, 0.10051560401916504, 0.454988956451416, 0.809462308883667, 1.1639366149902344, 1.5184099674224854, 1.8728833198547363, 2.2273566722869873, 2.5818300247192383, 2.9363033771514893, 3.2907767295837402, 3.645250082015991, 3.999723434448242, 4.354196548461914, 4.708670139312744, 5.063143730163574, 5.417616844177246, 5.772089958190918, 6.126563549041748, 6.481037139892578, 6.83551025390625, 7.189983367919922, 7.544456958770752, 7.898930549621582, 8.253403663635254, 8.607876777648926, 8.962350845336914, 9.316823959350586, 9.671297073364258, 10.02577018737793, 10.380243301391602, 10.73471736907959, 11.089190483093262, 11.443663597106934, 11.798137664794922, 12.152610778808594, 12.507083892822266]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 9.0, 5.0, 19.0, 27.0, 39.0, 84.0, 145.0, 294.0, 683.0, 1966.0, 7566.0, 53210.0, 2759006.0, 1327172.0, 35197.0, 6028.0, 1722.0, 587.0, 229.0, 117.0, 60.0, 43.0, 24.0, 17.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.056640625, -2.98370361328125, -2.9107666015625, -2.83782958984375, -2.764892578125, -2.69195556640625, -2.6190185546875, -2.54608154296875, -2.47314453125, -2.40020751953125, -2.3272705078125, -2.25433349609375, -2.181396484375, -2.10845947265625, -2.0355224609375, -1.96258544921875, -1.8896484375, -1.81671142578125, -1.7437744140625, -1.67083740234375, -1.597900390625, -1.52496337890625, -1.4520263671875, -1.37908935546875, -1.30615234375, -1.23321533203125, -1.1602783203125, -1.08734130859375, -1.014404296875, -0.94146728515625, -0.8685302734375, -0.79559326171875, -0.72265625, -0.64971923828125, -0.5767822265625, -0.50384521484375, -0.430908203125, -0.35797119140625, -0.2850341796875, -0.21209716796875, -0.13916015625, -0.06622314453125, 0.0067138671875, 0.07965087890625, 0.152587890625, 0.22552490234375, 0.2984619140625, 0.37139892578125, 0.4443359375, 0.51727294921875, 0.5902099609375, 0.66314697265625, 0.736083984375, 0.80902099609375, 0.8819580078125, 0.95489501953125, 1.02783203125, 1.10076904296875, 1.1737060546875, 1.24664306640625, 1.319580078125, 1.39251708984375, 1.4654541015625, 1.53839111328125, 1.611328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 13.0, 18.0, 20.0, 21.0, 26.0, 35.0, 51.0, 52.0, 62.0, 65.0, 65.0, 72.0, 62.0, 76.0, 70.0, 63.0, 50.0, 40.0, 39.0, 30.0, 19.0, 15.0, 17.0, 4.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9130859375, -0.8834609985351562, -0.8538360595703125, -0.8242111206054688, -0.794586181640625, -0.7649612426757812, -0.7353363037109375, -0.7057113647460938, -0.67608642578125, -0.6464614868164062, -0.6168365478515625, -0.5872116088867188, -0.557586669921875, -0.5279617309570312, -0.4983367919921875, -0.46871185302734375, -0.4390869140625, -0.40946197509765625, -0.3798370361328125, -0.35021209716796875, -0.320587158203125, -0.29096221923828125, -0.2613372802734375, -0.23171234130859375, -0.20208740234375, -0.17246246337890625, -0.1428375244140625, -0.11321258544921875, -0.083587646484375, -0.05396270751953125, -0.0243377685546875, 0.00528717041015625, 0.034912109375, 0.06453704833984375, 0.0941619873046875, 0.12378692626953125, 0.153411865234375, 0.18303680419921875, 0.2126617431640625, 0.24228668212890625, 0.27191162109375, 0.30153656005859375, 0.3311614990234375, 0.36078643798828125, 0.390411376953125, 0.42003631591796875, 0.4496612548828125, 0.47928619384765625, 0.5089111328125, 0.5385360717773438, 0.5681610107421875, 0.5977859497070312, 0.627410888671875, 0.6570358276367188, 0.6866607666015625, 0.7162857055664062, 0.74591064453125, 0.7755355834960938, 0.8051605224609375, 0.8347854614257812, 0.864410400390625, 0.8940353393554688, 0.9236602783203125, 0.9532852172851562, 0.98291015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 6.0, 13.0, 31.0, 50.0, 72.0, 123.0, 187.0, 394.0, 944.0, 2475.0, 10631.0, 128377.0, 3910957.0, 125088.0, 10239.0, 2599.0, 1032.0, 498.0, 248.0, 120.0, 76.0, 34.0, 28.0, 15.0, 12.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1953125, -3.09698486328125, -2.9986572265625, -2.90032958984375, -2.802001953125, -2.70367431640625, -2.6053466796875, -2.50701904296875, -2.40869140625, -2.31036376953125, -2.2120361328125, -2.11370849609375, -2.015380859375, -1.91705322265625, -1.8187255859375, -1.72039794921875, -1.6220703125, -1.52374267578125, -1.4254150390625, -1.32708740234375, -1.228759765625, -1.13043212890625, -1.0321044921875, -0.93377685546875, -0.83544921875, -0.73712158203125, -0.6387939453125, -0.54046630859375, -0.442138671875, -0.34381103515625, -0.2454833984375, -0.14715576171875, -0.048828125, 0.04949951171875, 0.1478271484375, 0.24615478515625, 0.344482421875, 0.44281005859375, 0.5411376953125, 0.63946533203125, 0.73779296875, 0.83612060546875, 0.9344482421875, 1.03277587890625, 1.131103515625, 1.22943115234375, 1.3277587890625, 1.42608642578125, 1.5244140625, 1.62274169921875, 1.7210693359375, 1.81939697265625, 1.917724609375, 2.01605224609375, 2.1143798828125, 2.21270751953125, 2.31103515625, 2.40936279296875, 2.5076904296875, 2.60601806640625, 2.704345703125, 2.80267333984375, 2.9010009765625, 2.99932861328125, 3.09765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 3.0, 17.0, 26.0, 40.0, 132.0, 447.0, 1507.0, 1384.0, 315.0, 110.0, 42.0, 27.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.033721923828125, -3.90728759765625, -3.780853271484375, -3.6544189453125, -3.527984619140625, -3.40155029296875, -3.275115966796875, -3.148681640625, -3.022247314453125, -2.89581298828125, -2.769378662109375, -2.6429443359375, -2.516510009765625, -2.39007568359375, -2.263641357421875, -2.13720703125, -2.010772705078125, -1.88433837890625, -1.757904052734375, -1.6314697265625, -1.505035400390625, -1.37860107421875, -1.252166748046875, -1.125732421875, -0.999298095703125, -0.87286376953125, -0.746429443359375, -0.6199951171875, -0.493560791015625, -0.36712646484375, -0.240692138671875, -0.1142578125, 0.012176513671875, 0.13861083984375, 0.265045166015625, 0.3914794921875, 0.517913818359375, 0.64434814453125, 0.770782470703125, 0.897216796875, 1.023651123046875, 1.15008544921875, 1.276519775390625, 1.4029541015625, 1.529388427734375, 1.65582275390625, 1.782257080078125, 1.90869140625, 2.035125732421875, 2.16156005859375, 2.287994384765625, 2.4144287109375, 2.540863037109375, 2.66729736328125, 2.793731689453125, 2.920166015625, 3.046600341796875, 3.17303466796875, 3.299468994140625, 3.4259033203125, 3.552337646484375, 3.67877197265625, 3.805206298828125, 3.931640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 10.0, 10.0, 20.0, 59.0, 162.0, 261.0, 221.0, 148.0, 54.0, 25.0, 5.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.847034454345703, -21.13936996459961, -20.431703567504883, -19.72403907775879, -19.016374588012695, -18.30870819091797, -17.601043701171875, -16.89337921142578, -16.185712814331055, -15.478047370910645, -14.77038288116455, -14.06271743774414, -13.35505199432373, -12.64738655090332, -11.939722061157227, -11.232056617736816, -10.524392127990723, -9.816726684570312, -9.109062194824219, -8.401396751403809, -7.693731307983398, -6.9860663414001465, -6.2784013748168945, -5.570735931396484, -4.863070964813232, -4.1554059982299805, -3.4477405548095703, -2.7400755882263184, -2.0324103832244873, -1.3247451782226562, -0.6170802116394043, 0.09058523178100586, 0.7982501983642578, 1.5059154033660889, 2.21358060836792, 2.921245574951172, 3.628910779953003, 4.336575984954834, 5.044240951538086, 5.751906394958496, 6.459571361541748, 7.167236328125, 7.87490177154541, 8.58256721496582, 9.290231704711914, 9.997897148132324, 10.705562591552734, 11.413227081298828, 12.120892524719238, 12.828557968139648, 13.536222457885742, 14.243887901306152, 14.951553344726562, 15.659217834472656, 16.36688232421875, 17.074548721313477, 17.78221321105957, 18.489877700805664, 19.19754409790039, 19.905208587646484, 20.612873077392578, 21.320539474487305, 22.0282039642334, 22.735870361328125, 23.44353485107422]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 10.0, 25.0, 57.0, 99.0, 156.0, 211.0, 195.0, 121.0, 83.0, 27.0, 11.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.64105796813965, -24.809375762939453, -23.977691650390625, -23.146007537841797, -22.3143253326416, -21.482643127441406, -20.650959014892578, -19.81927490234375, -18.987592697143555, -18.15591049194336, -17.32422637939453, -16.492542266845703, -15.660860061645508, -14.829176902770996, -13.997493743896484, -13.165810585021973, -12.334127426147461, -11.50244426727295, -10.670761108398438, -9.839077949523926, -9.007394790649414, -8.175711631774902, -7.344028472900391, -6.512345314025879, -5.680662155151367, -4.8489789962768555, -4.017295837402344, -3.185612678527832, -2.3539295196533203, -1.5222463607788086, -0.6905632019042969, 0.14111995697021484, 0.9728012084960938, 1.8044843673706055, 2.636167526245117, 3.467850685119629, 4.299533843994141, 5.131217002868652, 5.962900161743164, 6.794583320617676, 7.6262664794921875, 8.4579496383667, 9.289632797241211, 10.121315956115723, 10.952999114990234, 11.784682273864746, 12.616365432739258, 13.44804859161377, 14.279731750488281, 15.111414909362793, 15.943098068237305, 16.7747802734375, 17.606464385986328, 18.438148498535156, 19.26983070373535, 20.101512908935547, 20.933197021484375, 21.764881134033203, 22.5965633392334, 23.428245544433594, 24.259929656982422, 25.09161376953125, 25.923295974731445, 26.75497817993164, 27.58666229248047]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 5.0, 8.0, 12.0, 12.0, 16.0, 23.0, 57.0, 90.0, 151.0, 249.0, 504.0, 1005.0, 2275.0, 6082.0, 20531.0, 95198.0, 439937.0, 379991.0, 75918.0, 17344.0, 5256.0, 2009.0, 866.0, 424.0, 218.0, 125.0, 84.0, 43.0, 30.0, 20.0, 24.0, 14.0, 12.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7566680908203125, -1.695953369140625, -1.6352386474609375, -1.57452392578125, -1.5138092041015625, -1.453094482421875, -1.3923797607421875, -1.3316650390625, -1.2709503173828125, -1.210235595703125, -1.1495208740234375, -1.08880615234375, -1.0280914306640625, -0.967376708984375, -0.9066619873046875, -0.845947265625, -0.7852325439453125, -0.724517822265625, -0.6638031005859375, -0.60308837890625, -0.5423736572265625, -0.481658935546875, -0.4209442138671875, -0.3602294921875, -0.2995147705078125, -0.238800048828125, -0.1780853271484375, -0.11737060546875, -0.0566558837890625, 0.004058837890625, 0.0647735595703125, 0.12548828125, 0.1862030029296875, 0.246917724609375, 0.3076324462890625, 0.36834716796875, 0.4290618896484375, 0.489776611328125, 0.5504913330078125, 0.6112060546875, 0.6719207763671875, 0.732635498046875, 0.7933502197265625, 0.85406494140625, 0.9147796630859375, 0.975494384765625, 1.0362091064453125, 1.096923828125, 1.1576385498046875, 1.218353271484375, 1.2790679931640625, 1.33978271484375, 1.4004974365234375, 1.461212158203125, 1.5219268798828125, 1.5826416015625, 1.6433563232421875, 1.704071044921875, 1.7647857666015625, 1.82550048828125, 1.8862152099609375, 1.946929931640625, 2.0076446533203125, 2.068359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 6.0, 9.0, 11.0, 15.0, 19.0, 28.0, 32.0, 52.0, 40.0, 66.0, 83.0, 62.0, 71.0, 66.0, 68.0, 73.0, 61.0, 47.0, 46.0, 35.0, 37.0, 25.0, 14.0, 10.0, 11.0, 7.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8736343383789062, -0.8424835205078125, -0.8113327026367188, -0.780181884765625, -0.7490310668945312, -0.7178802490234375, -0.6867294311523438, -0.65557861328125, -0.6244277954101562, -0.5932769775390625, -0.5621261596679688, -0.530975341796875, -0.49982452392578125, -0.4686737060546875, -0.43752288818359375, -0.4063720703125, -0.37522125244140625, -0.3440704345703125, -0.31291961669921875, -0.281768798828125, -0.25061798095703125, -0.2194671630859375, -0.18831634521484375, -0.15716552734375, -0.12601470947265625, -0.0948638916015625, -0.06371307373046875, -0.032562255859375, -0.00141143798828125, 0.0297393798828125, 0.06089019775390625, 0.092041015625, 0.12319183349609375, 0.1543426513671875, 0.18549346923828125, 0.216644287109375, 0.24779510498046875, 0.2789459228515625, 0.31009674072265625, 0.34124755859375, 0.37239837646484375, 0.4035491943359375, 0.43470001220703125, 0.465850830078125, 0.49700164794921875, 0.5281524658203125, 0.5593032836914062, 0.5904541015625, 0.6216049194335938, 0.6527557373046875, 0.6839065551757812, 0.715057373046875, 0.7462081909179688, 0.7773590087890625, 0.8085098266601562, 0.83966064453125, 0.8708114624023438, 0.9019622802734375, 0.9331130981445312, 0.964263916015625, 0.9954147338867188, 1.0265655517578125, 1.0577163696289062, 1.0888671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 11.0, 21.0, 35.0, 56.0, 77.0, 158.0, 250.0, 525.0, 1400.0, 4369.0, 18172.0, 115158.0, 696503.0, 177232.0, 25714.0, 5752.0, 1759.0, 646.0, 321.0, 158.0, 72.0, 55.0, 30.0, 24.0, 15.0, 11.0, 8.0, 6.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.3481597900390625, -2.280303955078125, -2.2124481201171875, -2.14459228515625, -2.0767364501953125, -2.008880615234375, -1.9410247802734375, -1.8731689453125, -1.8053131103515625, -1.737457275390625, -1.6696014404296875, -1.60174560546875, -1.5338897705078125, -1.466033935546875, -1.3981781005859375, -1.330322265625, -1.2624664306640625, -1.194610595703125, -1.1267547607421875, -1.05889892578125, -0.9910430908203125, -0.923187255859375, -0.8553314208984375, -0.7874755859375, -0.7196197509765625, -0.651763916015625, -0.5839080810546875, -0.51605224609375, -0.4481964111328125, -0.380340576171875, -0.3124847412109375, -0.24462890625, -0.1767730712890625, -0.108917236328125, -0.0410614013671875, 0.02679443359375, 0.0946502685546875, 0.162506103515625, 0.2303619384765625, 0.2982177734375, 0.3660736083984375, 0.433929443359375, 0.5017852783203125, 0.56964111328125, 0.6374969482421875, 0.705352783203125, 0.7732086181640625, 0.841064453125, 0.9089202880859375, 0.976776123046875, 1.0446319580078125, 1.11248779296875, 1.1803436279296875, 1.248199462890625, 1.3160552978515625, 1.3839111328125, 1.4517669677734375, 1.519622802734375, 1.5874786376953125, 1.65533447265625, 1.7231903076171875, 1.791046142578125, 1.8589019775390625, 1.9267578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 4.0, 4.0, 5.0, 15.0, 11.0, 16.0, 13.0, 24.0, 20.0, 21.0, 38.0, 26.0, 39.0, 38.0, 40.0, 45.0, 54.0, 46.0, 31.0, 59.0, 46.0, 40.0, 31.0, 34.0, 34.0, 41.0, 27.0, 34.0, 25.0, 18.0, 27.0, 18.0, 12.0, 12.0, 10.0, 8.0, 7.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8134765625, -1.7483673095703125, -1.683258056640625, -1.6181488037109375, -1.55303955078125, -1.4879302978515625, -1.422821044921875, -1.3577117919921875, -1.2926025390625, -1.2274932861328125, -1.162384033203125, -1.0972747802734375, -1.03216552734375, -0.9670562744140625, -0.901947021484375, -0.8368377685546875, -0.771728515625, -0.7066192626953125, -0.641510009765625, -0.5764007568359375, -0.51129150390625, -0.4461822509765625, -0.381072998046875, -0.3159637451171875, -0.2508544921875, -0.1857452392578125, -0.120635986328125, -0.0555267333984375, 0.00958251953125, 0.0746917724609375, 0.139801025390625, 0.2049102783203125, 0.27001953125, 0.3351287841796875, 0.400238037109375, 0.4653472900390625, 0.53045654296875, 0.5955657958984375, 0.660675048828125, 0.7257843017578125, 0.7908935546875, 0.8560028076171875, 0.921112060546875, 0.9862213134765625, 1.05133056640625, 1.1164398193359375, 1.181549072265625, 1.2466583251953125, 1.311767578125, 1.3768768310546875, 1.441986083984375, 1.5070953369140625, 1.57220458984375, 1.6373138427734375, 1.702423095703125, 1.7675323486328125, 1.8326416015625, 1.8977508544921875, 1.962860107421875, 2.0279693603515625, 2.09307861328125, 2.1581878662109375, 2.223297119140625, 2.2884063720703125, 2.353515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 14.0, 26.0, 41.0, 81.0, 172.0, 412.0, 1257.0, 4931.0, 25772.0, 209615.0, 722728.0, 68804.0, 10936.0, 2438.0, 765.0, 289.0, 127.0, 51.0, 32.0, 19.0, 17.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.048828125, -1.0227737426757812, -0.9967193603515625, -0.9706649780273438, -0.944610595703125, -0.9185562133789062, -0.8925018310546875, -0.8664474487304688, -0.84039306640625, -0.8143386840820312, -0.7882843017578125, -0.7622299194335938, -0.736175537109375, -0.7101211547851562, -0.6840667724609375, -0.6580123901367188, -0.6319580078125, -0.6059036254882812, -0.5798492431640625, -0.5537948608398438, -0.527740478515625, -0.5016860961914062, -0.4756317138671875, -0.44957733154296875, -0.42352294921875, -0.39746856689453125, -0.3714141845703125, -0.34535980224609375, -0.319305419921875, -0.29325103759765625, -0.2671966552734375, -0.24114227294921875, -0.215087890625, -0.18903350830078125, -0.1629791259765625, -0.13692474365234375, -0.110870361328125, -0.08481597900390625, -0.0587615966796875, -0.03270721435546875, -0.00665283203125, 0.01940155029296875, 0.0454559326171875, 0.07151031494140625, 0.097564697265625, 0.12361907958984375, 0.1496734619140625, 0.17572784423828125, 0.2017822265625, 0.22783660888671875, 0.2538909912109375, 0.27994537353515625, 0.305999755859375, 0.33205413818359375, 0.3581085205078125, 0.38416290283203125, 0.41021728515625, 0.43627166748046875, 0.4623260498046875, 0.48838043212890625, 0.514434814453125, 0.5404891967773438, 0.5665435791015625, 0.5925979614257812, 0.61865234375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 8.0, 4.0, 11.0, 14.0, 21.0, 22.0, 28.0, 32.0, 44.0, 53.0, 73.0, 82.0, 101.0, 101.0, 67.0, 70.0, 67.0, 44.0, 33.0, 24.0, 21.0, 11.0, 5.0, 15.0, 3.0, 9.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011515617370605469, -0.00011120177805423737, -0.00010724738240242004, -0.00010329298675060272, -9.93385910987854e-05, -9.538419544696808e-05, -9.142979979515076e-05, -8.747540414333344e-05, -8.352100849151611e-05, -7.956661283969879e-05, -7.561221718788147e-05, -7.165782153606415e-05, -6.770342588424683e-05, -6.37490302324295e-05, -5.979463458061218e-05, -5.584023892879486e-05, -5.188584327697754e-05, -4.793144762516022e-05, -4.3977051973342896e-05, -4.0022656321525574e-05, -3.606826066970825e-05, -3.211386501789093e-05, -2.815946936607361e-05, -2.4205073714256287e-05, -2.0250678062438965e-05, -1.6296282410621643e-05, -1.2341886758804321e-05, -8.387491106987e-06, -4.433095455169678e-06, -4.78699803352356e-07, 3.475695848464966e-06, 7.430091500282288e-06, 1.138448715209961e-05, 1.533888280391693e-05, 1.9293278455734253e-05, 2.3247674107551575e-05, 2.7202069759368896e-05, 3.115646541118622e-05, 3.511086106300354e-05, 3.906525671482086e-05, 4.3019652366638184e-05, 4.6974048018455505e-05, 5.092844367027283e-05, 5.488283932209015e-05, 5.883723497390747e-05, 6.279163062572479e-05, 6.674602627754211e-05, 7.070042192935944e-05, 7.465481758117676e-05, 7.860921323299408e-05, 8.25636088848114e-05, 8.651800453662872e-05, 9.047240018844604e-05, 9.442679584026337e-05, 9.838119149208069e-05, 0.00010233558714389801, 0.00010628998279571533, 0.00011024437844753265, 0.00011419877409934998, 0.0001181531697511673, 0.00012210756540298462, 0.00012606196105480194, 0.00013001635670661926, 0.00013397075235843658, 0.0001379251480102539]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 9.0, 15.0, 14.0, 16.0, 24.0, 38.0, 61.0, 90.0, 133.0, 239.0, 402.0, 733.0, 1448.0, 3095.0, 7525.0, 21106.0, 71115.0, 273733.0, 525002.0, 98457.0, 28197.0, 9531.0, 3818.0, 1710.0, 838.0, 461.0, 247.0, 185.0, 100.0, 49.0, 40.0, 26.0, 27.0, 19.0, 8.0, 14.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.47021484375, -0.4546051025390625, -0.438995361328125, -0.4233856201171875, -0.40777587890625, -0.3921661376953125, -0.376556396484375, -0.3609466552734375, -0.3453369140625, -0.3297271728515625, -0.314117431640625, -0.2985076904296875, -0.28289794921875, -0.2672882080078125, -0.251678466796875, -0.2360687255859375, -0.220458984375, -0.2048492431640625, -0.189239501953125, -0.1736297607421875, -0.15802001953125, -0.1424102783203125, -0.126800537109375, -0.1111907958984375, -0.0955810546875, -0.0799713134765625, -0.064361572265625, -0.0487518310546875, -0.03314208984375, -0.0175323486328125, -0.001922607421875, 0.0136871337890625, 0.029296875, 0.0449066162109375, 0.060516357421875, 0.0761260986328125, 0.09173583984375, 0.1073455810546875, 0.122955322265625, 0.1385650634765625, 0.1541748046875, 0.1697845458984375, 0.185394287109375, 0.2010040283203125, 0.21661376953125, 0.2322235107421875, 0.247833251953125, 0.2634429931640625, 0.279052734375, 0.2946624755859375, 0.310272216796875, 0.3258819580078125, 0.34149169921875, 0.3571014404296875, 0.372711181640625, 0.3883209228515625, 0.4039306640625, 0.4195404052734375, 0.435150146484375, 0.4507598876953125, 0.46636962890625, 0.4819793701171875, 0.497589111328125, 0.5131988525390625, 0.52880859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 0.0, 8.0, 1.0, 6.0, 9.0, 16.0, 9.0, 20.0, 16.0, 21.0, 26.0, 42.0, 43.0, 45.0, 67.0, 66.0, 80.0, 75.0, 84.0, 57.0, 55.0, 44.0, 48.0, 29.0, 31.0, 27.0, 14.0, 10.0, 13.0, 9.0, 2.0, 6.0, 6.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.4137077331542969, -0.39894866943359375, -0.3841896057128906, -0.3694305419921875, -0.3546714782714844, -0.33991241455078125, -0.3251533508300781, -0.310394287109375, -0.2956352233886719, -0.28087615966796875, -0.2661170959472656, -0.2513580322265625, -0.23659896850585938, -0.22183990478515625, -0.20708084106445312, -0.19232177734375, -0.17756271362304688, -0.16280364990234375, -0.14804458618164062, -0.1332855224609375, -0.11852645874023438, -0.10376739501953125, -0.08900833129882812, -0.074249267578125, -0.059490203857421875, -0.04473114013671875, -0.029972076416015625, -0.0152130126953125, -0.000453948974609375, 0.01430511474609375, 0.029064178466796875, 0.0438232421875, 0.058582305908203125, 0.07334136962890625, 0.08810043334960938, 0.1028594970703125, 0.11761856079101562, 0.13237762451171875, 0.14713668823242188, 0.161895751953125, 0.17665481567382812, 0.19141387939453125, 0.20617294311523438, 0.2209320068359375, 0.23569107055664062, 0.25045013427734375, 0.2652091979980469, 0.27996826171875, 0.2947273254394531, 0.30948638916015625, 0.3242454528808594, 0.3390045166015625, 0.3537635803222656, 0.36852264404296875, 0.3832817077636719, 0.398040771484375, 0.4127998352050781, 0.42755889892578125, 0.4423179626464844, 0.4570770263671875, 0.4718360900878906, 0.48659515380859375, 0.5013542175292969, 0.51611328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 1.0, 15.0, 43.0, 90.0, 159.0, 347.0, 179.0, 89.0, 31.0, 20.0, 5.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.13393783569336, -22.502058029174805, -21.870176315307617, -21.238296508789062, -20.606414794921875, -19.97453498840332, -19.342655181884766, -18.710773468017578, -18.078893661499023, -17.44701385498047, -16.81513214111328, -16.183252334594727, -15.551371574401855, -14.919490814208984, -14.287610054016113, -13.655729293823242, -13.023848533630371, -12.3919677734375, -11.760087013244629, -11.128206253051758, -10.496326446533203, -9.864445686340332, -9.232564926147461, -8.600685119628906, -7.968803882598877, -7.336923122406006, -6.705042839050293, -6.073162078857422, -5.441281318664551, -4.809401035308838, -4.177520275115967, -3.545639991760254, -2.913759231567383, -2.281878709793091, -1.6499980688095093, -1.0181174278259277, -0.38623690605163574, 0.24564361572265625, 0.8775243759155273, 1.5094046592712402, 2.1412854194641113, 2.7731659412384033, 3.4050464630126953, 4.036927223205566, 4.6688079833984375, 5.30068826675415, 5.9325690269470215, 6.564449310302734, 7.1963300704956055, 7.828210830688477, 8.460091590881348, 9.091972351074219, 9.723852157592773, 10.355732917785645, 10.987613677978516, 11.61949348449707, 12.251375198364258, 12.883255958557129, 13.51513671875, 14.147016525268555, 14.778897285461426, 15.410778045654297, 16.042659759521484, 16.67453956604004, 17.306419372558594]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 14.0, 19.0, 16.0, 14.0, 24.0, 26.0, 44.0, 39.0, 42.0, 48.0, 61.0, 95.0, 99.0, 82.0, 42.0, 43.0, 33.0, 40.0, 30.0, 38.0, 22.0, 20.0, 20.0, 6.0, 10.0, 9.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.887272834777832, -7.574706554412842, -7.262140274047852, -6.949573993682861, -6.637007713317871, -6.324440956115723, -6.011874675750732, -5.699308395385742, -5.386742115020752, -5.074175834655762, -4.7616095542907715, -4.449043273925781, -4.136476516723633, -3.8239104747772217, -3.5113439559936523, -3.198777675628662, -2.886211395263672, -2.5736451148986816, -2.2610788345336914, -1.948512315750122, -1.6359460353851318, -1.3233797550201416, -1.0108133554458618, -0.698246955871582, -0.3856806755065918, -0.07311433553695679, 0.23945200443267822, 0.5520183444023132, 0.8645846843719482, 1.1771509647369385, 1.4897173643112183, 1.802283763885498, 2.114849090576172, 2.427415370941162, 2.7399816513061523, 3.0525481700897217, 3.365114450454712, 3.677680730819702, 3.9902472496032715, 4.302813529968262, 4.615379810333252, 4.927946090698242, 5.240512371063232, 5.553078651428223, 5.865645408630371, 6.178211212158203, 6.490777969360352, 6.803344249725342, 7.115910530090332, 7.428476810455322, 7.7410430908203125, 8.053609848022461, 8.366175651550293, 8.678742408752441, 8.991308212280273, 9.303874969482422, 9.61644172668457, 9.929008483886719, 10.24157428741455, 10.5541410446167, 10.866706848144531, 11.17927360534668, 11.491839408874512, 11.80440616607666, 12.116971969604492]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 14.0, 13.0, 16.0, 15.0, 29.0, 47.0, 68.0, 93.0, 167.0, 282.0, 524.0, 1003.0, 2080.0, 4828.0, 12791.0, 49607.0, 419744.0, 2971520.0, 640138.0, 65310.0, 15569.0, 5594.0, 2427.0, 1076.0, 537.0, 307.0, 169.0, 77.0, 70.0, 48.0, 39.0, 17.0, 18.0, 12.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0], "bins": [-1.451171875, -1.4145050048828125, -1.377838134765625, -1.3411712646484375, -1.30450439453125, -1.2678375244140625, -1.231170654296875, -1.1945037841796875, -1.1578369140625, -1.1211700439453125, -1.084503173828125, -1.0478363037109375, -1.01116943359375, -0.9745025634765625, -0.937835693359375, -0.9011688232421875, -0.864501953125, -0.8278350830078125, -0.791168212890625, -0.7545013427734375, -0.71783447265625, -0.6811676025390625, -0.644500732421875, -0.6078338623046875, -0.5711669921875, -0.5345001220703125, -0.497833251953125, -0.4611663818359375, -0.42449951171875, -0.3878326416015625, -0.351165771484375, -0.3144989013671875, -0.27783203125, -0.2411651611328125, -0.204498291015625, -0.1678314208984375, -0.13116455078125, -0.0944976806640625, -0.057830810546875, -0.0211639404296875, 0.0155029296875, 0.0521697998046875, 0.088836669921875, 0.1255035400390625, 0.16217041015625, 0.1988372802734375, 0.235504150390625, 0.2721710205078125, 0.308837890625, 0.3455047607421875, 0.382171630859375, 0.4188385009765625, 0.45550537109375, 0.4921722412109375, 0.528839111328125, 0.5655059814453125, 0.6021728515625, 0.6388397216796875, 0.675506591796875, 0.7121734619140625, 0.74884033203125, 0.7855072021484375, 0.822174072265625, 0.8588409423828125, 0.8955078125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 12.0, 15.0, 9.0, 26.0, 37.0, 46.0, 38.0, 42.0, 54.0, 56.0, 70.0, 78.0, 84.0, 69.0, 55.0, 61.0, 43.0, 50.0, 37.0, 25.0, 32.0, 15.0, 10.0, 6.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66552734375, -0.6387405395507812, -0.6119537353515625, -0.5851669311523438, -0.558380126953125, -0.5315933227539062, -0.5048065185546875, -0.47801971435546875, -0.45123291015625, -0.42444610595703125, -0.3976593017578125, -0.37087249755859375, -0.344085693359375, -0.31729888916015625, -0.2905120849609375, -0.26372528076171875, -0.2369384765625, -0.21015167236328125, -0.1833648681640625, -0.15657806396484375, -0.129791259765625, -0.10300445556640625, -0.0762176513671875, -0.04943084716796875, -0.02264404296875, 0.00414276123046875, 0.0309295654296875, 0.05771636962890625, 0.084503173828125, 0.11128997802734375, 0.1380767822265625, 0.16486358642578125, 0.191650390625, 0.21843719482421875, 0.2452239990234375, 0.27201080322265625, 0.298797607421875, 0.32558441162109375, 0.3523712158203125, 0.37915802001953125, 0.40594482421875, 0.43273162841796875, 0.4595184326171875, 0.48630523681640625, 0.513092041015625, 0.5398788452148438, 0.5666656494140625, 0.5934524536132812, 0.6202392578125, 0.6470260620117188, 0.6738128662109375, 0.7005996704101562, 0.727386474609375, 0.7541732788085938, 0.7809600830078125, 0.8077468872070312, 0.83453369140625, 0.8613204956054688, 0.8881072998046875, 0.9148941040039062, 0.941680908203125, 0.9684677124023438, 0.9952545166015625, 1.0220413208007812, 1.048828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 5.0, 7.0, 12.0, 12.0, 26.0, 32.0, 58.0, 87.0, 152.0, 276.0, 639.0, 1455.0, 4727.0, 18066.0, 126112.0, 2971672.0, 997993.0, 56643.0, 10937.0, 3187.0, 1156.0, 455.0, 212.0, 134.0, 82.0, 35.0, 34.0, 11.0, 15.0, 11.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3974609375, -1.34722900390625, -1.2969970703125, -1.24676513671875, -1.196533203125, -1.14630126953125, -1.0960693359375, -1.04583740234375, -0.99560546875, -0.94537353515625, -0.8951416015625, -0.84490966796875, -0.794677734375, -0.74444580078125, -0.6942138671875, -0.64398193359375, -0.59375, -0.54351806640625, -0.4932861328125, -0.44305419921875, -0.392822265625, -0.34259033203125, -0.2923583984375, -0.24212646484375, -0.19189453125, -0.14166259765625, -0.0914306640625, -0.04119873046875, 0.009033203125, 0.05926513671875, 0.1094970703125, 0.15972900390625, 0.2099609375, 0.26019287109375, 0.3104248046875, 0.36065673828125, 0.410888671875, 0.46112060546875, 0.5113525390625, 0.56158447265625, 0.61181640625, 0.66204833984375, 0.7122802734375, 0.76251220703125, 0.812744140625, 0.86297607421875, 0.9132080078125, 0.96343994140625, 1.013671875, 1.06390380859375, 1.1141357421875, 1.16436767578125, 1.214599609375, 1.26483154296875, 1.3150634765625, 1.36529541015625, 1.41552734375, 1.46575927734375, 1.5159912109375, 1.56622314453125, 1.616455078125, 1.66668701171875, 1.7169189453125, 1.76715087890625, 1.8173828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 7.0, 18.0, 18.0, 26.0, 50.0, 72.0, 113.0, 169.0, 305.0, 504.0, 738.0, 671.0, 499.0, 317.0, 173.0, 109.0, 79.0, 40.0, 48.0, 26.0, 20.0, 6.0, 10.0, 6.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4109954833984375, -1.366912841796875, -1.3228302001953125, -1.27874755859375, -1.2346649169921875, -1.190582275390625, -1.1464996337890625, -1.1024169921875, -1.0583343505859375, -1.014251708984375, -0.9701690673828125, -0.92608642578125, -0.8820037841796875, -0.837921142578125, -0.7938385009765625, -0.749755859375, -0.7056732177734375, -0.661590576171875, -0.6175079345703125, -0.57342529296875, -0.5293426513671875, -0.485260009765625, -0.4411773681640625, -0.3970947265625, -0.3530120849609375, -0.308929443359375, -0.2648468017578125, -0.22076416015625, -0.1766815185546875, -0.132598876953125, -0.0885162353515625, -0.04443359375, -0.0003509521484375, 0.043731689453125, 0.0878143310546875, 0.13189697265625, 0.1759796142578125, 0.220062255859375, 0.2641448974609375, 0.3082275390625, 0.3523101806640625, 0.396392822265625, 0.4404754638671875, 0.48455810546875, 0.5286407470703125, 0.572723388671875, 0.6168060302734375, 0.660888671875, 0.7049713134765625, 0.749053955078125, 0.7931365966796875, 0.83721923828125, 0.8813018798828125, 0.925384521484375, 0.9694671630859375, 1.0135498046875, 1.0576324462890625, 1.101715087890625, 1.1457977294921875, 1.18988037109375, 1.2339630126953125, 1.278045654296875, 1.3221282958984375, 1.3662109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 10.0, 8.0, 10.0, 22.0, 25.0, 51.0, 66.0, 106.0, 150.0, 151.0, 141.0, 102.0, 59.0, 43.0, 22.0, 19.0, 8.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.021146774291992, -4.669943332672119, -4.318739414215088, -3.967535972595215, -3.616332530975342, -3.2651288509368896, -2.9139251708984375, -2.5627217292785645, -2.2115180492401123, -1.8603144884109497, -1.509110927581787, -1.157907247543335, -0.8067036867141724, -0.45550012588500977, -0.10429644584655762, 0.24690699577331543, 0.5981106758117676, 0.9493142366409302, 1.3005177974700928, 1.651721477508545, 2.002924919128418, 2.35412859916687, 2.7053322792053223, 3.0565357208251953, 3.4077394008636475, 3.7589430809020996, 4.110146522521973, 4.461350440979004, 4.812553882598877, 5.16375732421875, 5.514961242675781, 5.866164207458496, 6.217368125915527, 6.5685715675354, 6.919775485992432, 7.270978927612305, 7.622182369232178, 7.973385810852051, 8.324589729309082, 8.675792694091797, 9.026996612548828, 9.37820053100586, 9.729403495788574, 10.080607414245605, 10.431811332702637, 10.783014297485352, 11.134218215942383, 11.485422134399414, 11.836626052856445, 12.187829971313477, 12.539032936096191, 12.890236854553223, 13.241440773010254, 13.592643737792969, 13.94384765625, 14.295051574707031, 14.646254539489746, 14.997458457946777, 15.348661422729492, 15.699865341186523, 16.051069259643555, 16.402273178100586, 16.753475189208984, 17.104679107666016, 17.455883026123047]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 18.0, 13.0, 20.0, 28.0, 20.0, 31.0, 29.0, 37.0, 34.0, 36.0, 52.0, 35.0, 49.0, 45.0, 33.0, 49.0, 47.0, 34.0, 51.0, 38.0, 34.0, 27.0, 28.0, 30.0, 23.0, 17.0, 19.0, 28.0, 11.0, 10.0, 8.0, 11.0, 5.0, 8.0, 3.0, 4.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.5354461669921875, -5.352889060974121, -5.170332431793213, -4.9877753257751465, -4.805218696594238, -4.622661590576172, -4.440104961395264, -4.257547855377197, -4.074991226196289, -3.8924343585968018, -3.7098774909973145, -3.527320623397827, -3.34476375579834, -3.1622068881988525, -2.9796500205993652, -2.797092914581299, -2.6145360469818115, -2.431979179382324, -2.249422311782837, -2.0668654441833496, -1.8843085765838623, -1.701751708984375, -1.5191947221755981, -1.3366378545761108, -1.1540809869766235, -0.9715241193771362, -0.7889672517776489, -0.6064103245735168, -0.42385345697402954, -0.24129658937454224, -0.058739662170410156, 0.12381720542907715, 0.30637407302856445, 0.48893094062805176, 0.6714878082275391, 0.8540447354316711, 1.0366015434265137, 1.219158411026001, 1.4017153978347778, 1.5842722654342651, 1.7668291330337524, 1.9493860006332397, 2.1319429874420166, 2.314499855041504, 2.497056722640991, 2.6796135902404785, 2.862170457839966, 3.044727325439453, 3.2272841930389404, 3.4098410606384277, 3.592397928237915, 3.7749547958374023, 3.9575116634368896, 4.140068531036377, 4.322625637054443, 4.505182266235352, 4.687739372253418, 4.870296478271484, 5.052853107452393, 5.235410213470459, 5.417966842651367, 5.600523948669434, 5.783080577850342, 5.965637683868408, 6.148194313049316]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 8.0, 2.0, 7.0, 7.0, 12.0, 19.0, 36.0, 37.0, 76.0, 89.0, 168.0, 238.0, 384.0, 811.0, 1595.0, 3775.0, 9919.0, 29689.0, 104195.0, 374157.0, 372939.0, 103676.0, 29636.0, 9834.0, 3716.0, 1636.0, 770.0, 413.0, 268.0, 162.0, 86.0, 54.0, 56.0, 20.0, 21.0, 15.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.470703125, -1.428680419921875, -1.38665771484375, -1.344635009765625, -1.3026123046875, -1.260589599609375, -1.21856689453125, -1.176544189453125, -1.134521484375, -1.092498779296875, -1.05047607421875, -1.008453369140625, -0.9664306640625, -0.924407958984375, -0.88238525390625, -0.840362548828125, -0.79833984375, -0.756317138671875, -0.71429443359375, -0.672271728515625, -0.6302490234375, -0.588226318359375, -0.54620361328125, -0.504180908203125, -0.462158203125, -0.420135498046875, -0.37811279296875, -0.336090087890625, -0.2940673828125, -0.252044677734375, -0.21002197265625, -0.167999267578125, -0.1259765625, -0.083953857421875, -0.04193115234375, 9.1552734375e-05, 0.0421142578125, 0.084136962890625, 0.12615966796875, 0.168182373046875, 0.210205078125, 0.252227783203125, 0.29425048828125, 0.336273193359375, 0.3782958984375, 0.420318603515625, 0.46234130859375, 0.504364013671875, 0.54638671875, 0.588409423828125, 0.63043212890625, 0.672454833984375, 0.7144775390625, 0.756500244140625, 0.79852294921875, 0.840545654296875, 0.882568359375, 0.924591064453125, 0.96661376953125, 1.008636474609375, 1.0506591796875, 1.092681884765625, 1.13470458984375, 1.176727294921875, 1.21875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 11.0, 9.0, 13.0, 24.0, 23.0, 31.0, 39.0, 42.0, 43.0, 46.0, 55.0, 52.0, 70.0, 66.0, 76.0, 58.0, 56.0, 46.0, 56.0, 38.0, 39.0, 42.0, 16.0, 16.0, 9.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.635040283203125, -0.60797119140625, -0.580902099609375, -0.5538330078125, -0.526763916015625, -0.49969482421875, -0.472625732421875, -0.445556640625, -0.418487548828125, -0.39141845703125, -0.364349365234375, -0.3372802734375, -0.310211181640625, -0.28314208984375, -0.256072998046875, -0.22900390625, -0.201934814453125, -0.17486572265625, -0.147796630859375, -0.1207275390625, -0.093658447265625, -0.06658935546875, -0.039520263671875, -0.012451171875, 0.014617919921875, 0.04168701171875, 0.068756103515625, 0.0958251953125, 0.122894287109375, 0.14996337890625, 0.177032470703125, 0.2041015625, 0.231170654296875, 0.25823974609375, 0.285308837890625, 0.3123779296875, 0.339447021484375, 0.36651611328125, 0.393585205078125, 0.420654296875, 0.447723388671875, 0.47479248046875, 0.501861572265625, 0.5289306640625, 0.555999755859375, 0.58306884765625, 0.610137939453125, 0.63720703125, 0.664276123046875, 0.69134521484375, 0.718414306640625, 0.7454833984375, 0.772552490234375, 0.79962158203125, 0.826690673828125, 0.853759765625, 0.880828857421875, 0.90789794921875, 0.934967041015625, 0.9620361328125, 0.989105224609375, 1.01617431640625, 1.043243408203125, 1.0703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 10.0, 10.0, 11.0, 13.0, 33.0, 45.0, 47.0, 56.0, 85.0, 134.0, 243.0, 339.0, 701.0, 1339.0, 3667.0, 15877.0, 123012.0, 779121.0, 103363.0, 14015.0, 3479.0, 1282.0, 621.0, 352.0, 217.0, 148.0, 102.0, 65.0, 36.0, 31.0, 31.0, 15.0, 9.0, 12.0, 7.0, 7.0, 2.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.490234375, -2.420013427734375, -2.34979248046875, -2.279571533203125, -2.2093505859375, -2.139129638671875, -2.06890869140625, -1.998687744140625, -1.928466796875, -1.858245849609375, -1.78802490234375, -1.717803955078125, -1.6475830078125, -1.577362060546875, -1.50714111328125, -1.436920166015625, -1.36669921875, -1.296478271484375, -1.22625732421875, -1.156036376953125, -1.0858154296875, -1.015594482421875, -0.94537353515625, -0.875152587890625, -0.804931640625, -0.734710693359375, -0.66448974609375, -0.594268798828125, -0.5240478515625, -0.453826904296875, -0.38360595703125, -0.313385009765625, -0.2431640625, -0.172943115234375, -0.10272216796875, -0.032501220703125, 0.0377197265625, 0.107940673828125, 0.17816162109375, 0.248382568359375, 0.318603515625, 0.388824462890625, 0.45904541015625, 0.529266357421875, 0.5994873046875, 0.669708251953125, 0.73992919921875, 0.810150146484375, 0.88037109375, 0.950592041015625, 1.02081298828125, 1.091033935546875, 1.1612548828125, 1.231475830078125, 1.30169677734375, 1.371917724609375, 1.442138671875, 1.512359619140625, 1.58258056640625, 1.652801513671875, 1.7230224609375, 1.793243408203125, 1.86346435546875, 1.933685302734375, 2.00390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 8.0, 6.0, 17.0, 16.0, 10.0, 22.0, 30.0, 23.0, 44.0, 50.0, 51.0, 58.0, 44.0, 44.0, 65.0, 41.0, 46.0, 54.0, 39.0, 53.0, 39.0, 40.0, 42.0, 35.0, 19.0, 16.0, 12.0, 14.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.073699951171875, -1.99700927734375, -1.920318603515625, -1.8436279296875, -1.766937255859375, -1.69024658203125, -1.613555908203125, -1.536865234375, -1.460174560546875, -1.38348388671875, -1.306793212890625, -1.2301025390625, -1.153411865234375, -1.07672119140625, -1.000030517578125, -0.92333984375, -0.846649169921875, -0.76995849609375, -0.693267822265625, -0.6165771484375, -0.539886474609375, -0.46319580078125, -0.386505126953125, -0.309814453125, -0.233123779296875, -0.15643310546875, -0.079742431640625, -0.0030517578125, 0.073638916015625, 0.15032958984375, 0.227020263671875, 0.3037109375, 0.380401611328125, 0.45709228515625, 0.533782958984375, 0.6104736328125, 0.687164306640625, 0.76385498046875, 0.840545654296875, 0.917236328125, 0.993927001953125, 1.07061767578125, 1.147308349609375, 1.2239990234375, 1.300689697265625, 1.37738037109375, 1.454071044921875, 1.53076171875, 1.607452392578125, 1.68414306640625, 1.760833740234375, 1.8375244140625, 1.914215087890625, 1.99090576171875, 2.067596435546875, 2.144287109375, 2.220977783203125, 2.29766845703125, 2.374359130859375, 2.4510498046875, 2.527740478515625, 2.60443115234375, 2.681121826171875, 2.7578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 8.0, 5.0, 6.0, 15.0, 19.0, 37.0, 43.0, 70.0, 81.0, 177.0, 287.0, 608.0, 1373.0, 3649.0, 11727.0, 48927.0, 636260.0, 291193.0, 38495.0, 9940.0, 3062.0, 1280.0, 549.0, 293.0, 172.0, 85.0, 62.0, 39.0, 25.0, 19.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5810546875, -0.5616378784179688, -0.5422210693359375, -0.5228042602539062, -0.503387451171875, -0.48397064208984375, -0.4645538330078125, -0.44513702392578125, -0.42572021484375, -0.40630340576171875, -0.3868865966796875, -0.36746978759765625, -0.348052978515625, -0.32863616943359375, -0.3092193603515625, -0.28980255126953125, -0.2703857421875, -0.25096893310546875, -0.2315521240234375, -0.21213531494140625, -0.192718505859375, -0.17330169677734375, -0.1538848876953125, -0.13446807861328125, -0.11505126953125, -0.09563446044921875, -0.0762176513671875, -0.05680084228515625, -0.037384033203125, -0.01796722412109375, 0.0014495849609375, 0.02086639404296875, 0.040283203125, 0.05970001220703125, 0.0791168212890625, 0.09853363037109375, 0.117950439453125, 0.13736724853515625, 0.1567840576171875, 0.17620086669921875, 0.19561767578125, 0.21503448486328125, 0.2344512939453125, 0.25386810302734375, 0.273284912109375, 0.29270172119140625, 0.3121185302734375, 0.33153533935546875, 0.3509521484375, 0.37036895751953125, 0.3897857666015625, 0.40920257568359375, 0.428619384765625, 0.44803619384765625, 0.4674530029296875, 0.48686981201171875, 0.50628662109375, 0.5257034301757812, 0.5451202392578125, 0.5645370483398438, 0.583953857421875, 0.6033706665039062, 0.6227874755859375, 0.6422042846679688, 0.66162109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 12.0, 15.0, 7.0, 9.0, 19.0, 18.0, 22.0, 34.0, 48.0, 54.0, 97.0, 98.0, 116.0, 103.0, 64.0, 51.0, 51.0, 27.0, 15.0, 26.0, 17.0, 15.0, 10.0, 10.0, 10.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00010734796524047852, -0.00010401848703622818, -0.00010068900883197784, -9.735953062772751e-05, -9.403005242347717e-05, -9.070057421922684e-05, -8.73710960149765e-05, -8.404161781072617e-05, -8.071213960647583e-05, -7.73826614022255e-05, -7.405318319797516e-05, -7.072370499372482e-05, -6.739422678947449e-05, -6.406474858522415e-05, -6.0735270380973816e-05, -5.740579217672348e-05, -5.4076313972473145e-05, -5.074683576822281e-05, -4.741735756397247e-05, -4.408787935972214e-05, -4.07584011554718e-05, -3.7428922951221466e-05, -3.409944474697113e-05, -3.0769966542720795e-05, -2.744048833847046e-05, -2.4111010134220123e-05, -2.0781531929969788e-05, -1.7452053725719452e-05, -1.4122575521469116e-05, -1.079309731721878e-05, -7.463619112968445e-06, -4.134140908718109e-06, -8.046627044677734e-07, 2.5248154997825623e-06, 5.854293704032898e-06, 9.183771908283234e-06, 1.251325011253357e-05, 1.5842728316783905e-05, 1.917220652103424e-05, 2.2501684725284576e-05, 2.5831162929534912e-05, 2.9160641133785248e-05, 3.2490119338035583e-05, 3.581959754228592e-05, 3.9149075746536255e-05, 4.247855395078659e-05, 4.5808032155036926e-05, 4.913751035928726e-05, 5.24669885635376e-05, 5.579646676778793e-05, 5.912594497203827e-05, 6.24554231762886e-05, 6.578490138053894e-05, 6.911437958478928e-05, 7.244385778903961e-05, 7.577333599328995e-05, 7.910281419754028e-05, 8.243229240179062e-05, 8.576177060604095e-05, 8.909124881029129e-05, 9.242072701454163e-05, 9.575020521879196e-05, 9.90796834230423e-05, 0.00010240916162729263, 0.00010573863983154297]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 16.0, 14.0, 38.0, 44.0, 55.0, 95.0, 170.0, 302.0, 524.0, 1305.0, 3948.0, 15899.0, 97910.0, 799065.0, 105554.0, 16860.0, 4104.0, 1360.0, 555.0, 297.0, 151.0, 94.0, 56.0, 45.0, 20.0, 19.0, 10.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.544708251953125, -0.52154541015625, -0.498382568359375, -0.4752197265625, -0.452056884765625, -0.42889404296875, -0.405731201171875, -0.382568359375, -0.359405517578125, -0.33624267578125, -0.313079833984375, -0.2899169921875, -0.266754150390625, -0.24359130859375, -0.220428466796875, -0.197265625, -0.174102783203125, -0.15093994140625, -0.127777099609375, -0.1046142578125, -0.081451416015625, -0.05828857421875, -0.035125732421875, -0.011962890625, 0.011199951171875, 0.03436279296875, 0.057525634765625, 0.0806884765625, 0.103851318359375, 0.12701416015625, 0.150177001953125, 0.17333984375, 0.196502685546875, 0.21966552734375, 0.242828369140625, 0.2659912109375, 0.289154052734375, 0.31231689453125, 0.335479736328125, 0.358642578125, 0.381805419921875, 0.40496826171875, 0.428131103515625, 0.4512939453125, 0.474456787109375, 0.49761962890625, 0.520782470703125, 0.5439453125, 0.567108154296875, 0.59027099609375, 0.613433837890625, 0.6365966796875, 0.659759521484375, 0.68292236328125, 0.706085205078125, 0.729248046875, 0.752410888671875, 0.77557373046875, 0.798736572265625, 0.8218994140625, 0.845062255859375, 0.86822509765625, 0.891387939453125, 0.91455078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 8.0, 4.0, 7.0, 7.0, 13.0, 15.0, 16.0, 28.0, 23.0, 27.0, 39.0, 50.0, 69.0, 95.0, 102.0, 109.0, 87.0, 54.0, 39.0, 40.0, 32.0, 19.0, 21.0, 14.0, 14.0, 7.0, 12.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5390625, -0.5232086181640625, -0.507354736328125, -0.4915008544921875, -0.47564697265625, -0.4597930908203125, -0.443939208984375, -0.4280853271484375, -0.4122314453125, -0.3963775634765625, -0.380523681640625, -0.3646697998046875, -0.34881591796875, -0.3329620361328125, -0.317108154296875, -0.3012542724609375, -0.285400390625, -0.2695465087890625, -0.253692626953125, -0.2378387451171875, -0.22198486328125, -0.2061309814453125, -0.190277099609375, -0.1744232177734375, -0.1585693359375, -0.1427154541015625, -0.126861572265625, -0.1110076904296875, -0.09515380859375, -0.0792999267578125, -0.063446044921875, -0.0475921630859375, -0.03173828125, -0.0158843994140625, -3.0517578125e-05, 0.0158233642578125, 0.03167724609375, 0.0475311279296875, 0.063385009765625, 0.0792388916015625, 0.0950927734375, 0.1109466552734375, 0.126800537109375, 0.1426544189453125, 0.15850830078125, 0.1743621826171875, 0.190216064453125, 0.2060699462890625, 0.221923828125, 0.2377777099609375, 0.253631591796875, 0.2694854736328125, 0.28533935546875, 0.3011932373046875, 0.317047119140625, 0.3329010009765625, 0.3487548828125, 0.3646087646484375, 0.380462646484375, 0.3963165283203125, 0.41217041015625, 0.4280242919921875, 0.443878173828125, 0.4597320556640625, 0.4755859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 6.0, 5.0, 8.0, 18.0, 45.0, 117.0, 365.0, 285.0, 102.0, 26.0, 12.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.106849670410156, -33.36344909667969, -32.62004852294922, -31.876649856567383, -31.133251190185547, -30.389850616455078, -29.646451950073242, -28.903051376342773, -28.159652709960938, -27.41625213623047, -26.672853469848633, -25.929452896118164, -25.186054229736328, -24.44265365600586, -23.699254989624023, -22.955854415893555, -22.21245574951172, -21.46905517578125, -20.725656509399414, -19.982255935668945, -19.23885726928711, -18.49545669555664, -17.752058029174805, -17.008657455444336, -16.265256881713867, -15.521857261657715, -14.778457641601562, -14.03505802154541, -13.291658401489258, -12.548258781433105, -11.804859161376953, -11.061458587646484, -10.318059921264648, -9.574660301208496, -8.831260681152344, -8.087861061096191, -7.344461441040039, -6.601061820983887, -5.857661724090576, -5.114262104034424, -4.3708624839782715, -3.627462863922119, -2.884063243865967, -2.1406633853912354, -1.397263765335083, -0.6538641452789307, 0.08953571319580078, 0.8329353332519531, 1.5763349533081055, 2.319734573364258, 3.06313419342041, 3.8065340518951416, 4.549933433532715, 5.293333053588867, 6.036733150482178, 6.78013277053833, 7.523532390594482, 8.266932487487793, 9.010332107543945, 9.753731727600098, 10.49713134765625, 11.240530967712402, 11.983930587768555, 12.727330207824707, 13.47072982788086]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 11.0, 10.0, 2.0, 10.0, 16.0, 7.0, 12.0, 19.0, 28.0, 16.0, 33.0, 23.0, 26.0, 42.0, 41.0, 58.0, 75.0, 106.0, 90.0, 55.0, 37.0, 49.0, 20.0, 38.0, 31.0, 30.0, 14.0, 19.0, 14.0, 19.0, 4.0, 6.0, 6.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-10.810636520385742, -10.506580352783203, -10.202524185180664, -9.898468017578125, -9.594411849975586, -9.290355682373047, -8.986299514770508, -8.682243347167969, -8.37818717956543, -8.07413101196289, -7.770074844360352, -7.4660186767578125, -7.161962509155273, -6.857906341552734, -6.553850173950195, -6.249794006347656, -5.945737361907959, -5.64168119430542, -5.337625026702881, -5.033568859100342, -4.729512691497803, -4.425456523895264, -4.121399879455566, -3.8173439502716064, -3.5132877826690674, -3.2092316150665283, -2.9051754474639893, -2.601119041442871, -2.297062873840332, -1.9930068254470825, -1.688950538635254, -1.3848943710327148, -1.0808382034301758, -0.7767820358276367, -0.4727258086204529, -0.16866958141326904, 0.13538658618927002, 0.4394427537918091, 0.7434990406036377, 1.0475552082061768, 1.3516113758087158, 1.6556675434112549, 1.959723711013794, 2.263780117034912, 2.567836284637451, 2.8718924522399902, 3.1759486198425293, 3.4800047874450684, 3.7840609550476074, 4.0881171226501465, 4.3921732902526855, 4.696229457855225, 5.000285625457764, 5.304341793060303, 5.6083984375, 5.912454605102539, 6.216510772705078, 6.520566940307617, 6.824623107910156, 7.128679275512695, 7.432735443115234, 7.736791610717773, 8.040847778320312, 8.344903945922852, 8.64896011352539]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 2.0, 12.0, 13.0, 18.0, 25.0, 47.0, 68.0, 97.0, 168.0, 346.0, 665.0, 1339.0, 3310.0, 9568.0, 40378.0, 309086.0, 2618778.0, 1081913.0, 100136.0, 18555.0, 5539.0, 2137.0, 941.0, 488.0, 236.0, 142.0, 95.0, 59.0, 40.0, 19.0, 16.0, 14.0, 5.0, 2.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2607421875, -1.223388671875, -1.18603515625, -1.148681640625, -1.111328125, -1.073974609375, -1.03662109375, -0.999267578125, -0.9619140625, -0.924560546875, -0.88720703125, -0.849853515625, -0.8125, -0.775146484375, -0.73779296875, -0.700439453125, -0.6630859375, -0.625732421875, -0.58837890625, -0.551025390625, -0.513671875, -0.476318359375, -0.43896484375, -0.401611328125, -0.3642578125, -0.326904296875, -0.28955078125, -0.252197265625, -0.21484375, -0.177490234375, -0.14013671875, -0.102783203125, -0.0654296875, -0.028076171875, 0.00927734375, 0.046630859375, 0.083984375, 0.121337890625, 0.15869140625, 0.196044921875, 0.2333984375, 0.270751953125, 0.30810546875, 0.345458984375, 0.3828125, 0.420166015625, 0.45751953125, 0.494873046875, 0.5322265625, 0.569580078125, 0.60693359375, 0.644287109375, 0.681640625, 0.718994140625, 0.75634765625, 0.793701171875, 0.8310546875, 0.868408203125, 0.90576171875, 0.943115234375, 0.98046875, 1.017822265625, 1.05517578125, 1.092529296875, 1.1298828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 12.0, 14.0, 16.0, 16.0, 24.0, 30.0, 41.0, 50.0, 27.0, 51.0, 48.0, 46.0, 60.0, 54.0, 65.0, 59.0, 41.0, 51.0, 48.0, 44.0, 43.0, 29.0, 34.0, 20.0, 11.0, 17.0, 9.0, 5.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6767578125, -0.6533203125, -0.6298828125, -0.6064453125, -0.5830078125, -0.5595703125, -0.5361328125, -0.5126953125, -0.4892578125, -0.4658203125, -0.4423828125, -0.4189453125, -0.3955078125, -0.3720703125, -0.3486328125, -0.3251953125, -0.3017578125, -0.2783203125, -0.2548828125, -0.2314453125, -0.2080078125, -0.1845703125, -0.1611328125, -0.1376953125, -0.1142578125, -0.0908203125, -0.0673828125, -0.0439453125, -0.0205078125, 0.0029296875, 0.0263671875, 0.0498046875, 0.0732421875, 0.0966796875, 0.1201171875, 0.1435546875, 0.1669921875, 0.1904296875, 0.2138671875, 0.2373046875, 0.2607421875, 0.2841796875, 0.3076171875, 0.3310546875, 0.3544921875, 0.3779296875, 0.4013671875, 0.4248046875, 0.4482421875, 0.4716796875, 0.4951171875, 0.5185546875, 0.5419921875, 0.5654296875, 0.5888671875, 0.6123046875, 0.6357421875, 0.6591796875, 0.6826171875, 0.7060546875, 0.7294921875, 0.7529296875, 0.7763671875, 0.7998046875, 0.8232421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 4.0, 5.0, 9.0, 13.0, 9.0, 13.0, 24.0, 58.0, 76.0, 115.0, 156.0, 334.0, 803.0, 2116.0, 7418.0, 40789.0, 659587.0, 3289378.0, 167564.0, 18813.0, 4460.0, 1315.0, 559.0, 284.0, 151.0, 74.0, 41.0, 36.0, 24.0, 9.0, 13.0, 6.0, 3.0, 4.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.8123626708984375, -1.762420654296875, -1.7124786376953125, -1.66253662109375, -1.6125946044921875, -1.562652587890625, -1.5127105712890625, -1.4627685546875, -1.4128265380859375, -1.362884521484375, -1.3129425048828125, -1.26300048828125, -1.2130584716796875, -1.163116455078125, -1.1131744384765625, -1.063232421875, -1.0132904052734375, -0.963348388671875, -0.9134063720703125, -0.86346435546875, -0.8135223388671875, -0.763580322265625, -0.7136383056640625, -0.6636962890625, -0.6137542724609375, -0.563812255859375, -0.5138702392578125, -0.46392822265625, -0.4139862060546875, -0.364044189453125, -0.3141021728515625, -0.26416015625, -0.2142181396484375, -0.164276123046875, -0.1143341064453125, -0.06439208984375, -0.0144500732421875, 0.035491943359375, 0.0854339599609375, 0.1353759765625, 0.1853179931640625, 0.235260009765625, 0.2852020263671875, 0.33514404296875, 0.3850860595703125, 0.435028076171875, 0.4849700927734375, 0.534912109375, 0.5848541259765625, 0.634796142578125, 0.6847381591796875, 0.73468017578125, 0.7846221923828125, 0.834564208984375, 0.8845062255859375, 0.9344482421875, 0.9843902587890625, 1.034332275390625, 1.0842742919921875, 1.13421630859375, 1.1841583251953125, 1.234100341796875, 1.2840423583984375, 1.333984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 4.0, 5.0, 12.0, 26.0, 41.0, 37.0, 83.0, 93.0, 129.0, 203.0, 296.0, 394.0, 526.0, 556.0, 469.0, 347.0, 251.0, 150.0, 115.0, 69.0, 66.0, 38.0, 46.0, 19.0, 18.0, 13.0, 9.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.0298614501953125, -0.993316650390625, -0.9567718505859375, -0.92022705078125, -0.8836822509765625, -0.847137451171875, -0.8105926513671875, -0.7740478515625, -0.7375030517578125, -0.700958251953125, -0.6644134521484375, -0.62786865234375, -0.5913238525390625, -0.554779052734375, -0.5182342529296875, -0.481689453125, -0.4451446533203125, -0.408599853515625, -0.3720550537109375, -0.33551025390625, -0.2989654541015625, -0.262420654296875, -0.2258758544921875, -0.1893310546875, -0.1527862548828125, -0.116241455078125, -0.0796966552734375, -0.04315185546875, -0.0066070556640625, 0.029937744140625, 0.0664825439453125, 0.10302734375, 0.1395721435546875, 0.176116943359375, 0.2126617431640625, 0.24920654296875, 0.2857513427734375, 0.322296142578125, 0.3588409423828125, 0.3953857421875, 0.4319305419921875, 0.468475341796875, 0.5050201416015625, 0.54156494140625, 0.5781097412109375, 0.614654541015625, 0.6511993408203125, 0.687744140625, 0.7242889404296875, 0.760833740234375, 0.7973785400390625, 0.83392333984375, 0.8704681396484375, 0.907012939453125, 0.9435577392578125, 0.9801025390625, 1.0166473388671875, 1.053192138671875, 1.0897369384765625, 1.12628173828125, 1.1628265380859375, 1.199371337890625, 1.2359161376953125, 1.2724609375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 13.0, 29.0, 49.0, 94.0, 145.0, 181.0, 176.0, 125.0, 61.0, 49.0, 24.0, 12.0, 9.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.183838844299316, -7.769847869873047, -7.355856895446777, -6.941866397857666, -6.5278754234313965, -6.113884449005127, -5.699893951416016, -5.285902976989746, -4.871912002563477, -4.457921028137207, -4.0439300537109375, -3.629939556121826, -3.2159485816955566, -2.801957607269287, -2.3879668712615967, -1.9739761352539062, -1.5599851608276367, -1.1459943056106567, -0.7320034503936768, -0.3180125951766968, 0.0959782600402832, 0.5099692344665527, 0.9239599704742432, 1.3379507064819336, 1.7519416809082031, 2.1659326553344727, 2.579923391342163, 2.9939141273498535, 3.407905101776123, 3.8218960762023926, 4.235886573791504, 4.649877548217773, 5.063869476318359, 5.477860450744629, 5.891851425170898, 6.30584192276001, 6.719832897186279, 7.133823871612549, 7.54781436920166, 7.96180534362793, 8.3757963180542, 8.789787292480469, 9.203778266906738, 9.617769241333008, 10.031759262084961, 10.445751190185547, 10.8597412109375, 11.27373218536377, 11.687723159790039, 12.101714134216309, 12.515705108642578, 12.929696083068848, 13.343687057495117, 13.75767707824707, 14.17166805267334, 14.58565902709961, 14.999650001525879, 15.413640975952148, 15.827631950378418, 16.241622924804688, 16.65561294555664, 17.069604873657227, 17.48359489440918, 17.897586822509766, 18.31157684326172]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 10.0, 10.0, 15.0, 12.0, 8.0, 19.0, 23.0, 23.0, 19.0, 33.0, 37.0, 38.0, 31.0, 51.0, 37.0, 41.0, 52.0, 43.0, 48.0, 44.0, 45.0, 32.0, 30.0, 47.0, 32.0, 39.0, 27.0, 24.0, 22.0, 23.0, 10.0, 12.0, 15.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0], "bins": [-6.707261085510254, -6.5287370681762695, -6.350213050842285, -6.171689033508301, -5.993165493011475, -5.81464147567749, -5.636117458343506, -5.4575934410095215, -5.279069423675537, -5.100545406341553, -4.922021389007568, -4.743497848510742, -4.564973831176758, -4.386449813842773, -4.207925796508789, -4.029401779174805, -3.8508780002593994, -3.672353982925415, -3.4938302040100098, -3.3153061866760254, -3.136782169342041, -2.9582581520080566, -2.7797343730926514, -2.601210355758667, -2.4226865768432617, -2.2441625595092773, -2.065638780593872, -1.8871147632598877, -1.7085907459259033, -1.5300668478012085, -1.3515429496765137, -1.1730189323425293, -0.9944949150085449, -0.8159709572792053, -0.6374469995498657, -0.4589231014251709, -0.2803991436958313, -0.1018751859664917, 0.07664871215820312, 0.2551727294921875, 0.4336966276168823, 0.6122205853462219, 0.7907445430755615, 0.9692684412002563, 1.1477923393249512, 1.3263163566589355, 1.5048402547836304, 1.6833642721176147, 1.8618881702423096, 2.040412187576294, 2.218935966491699, 2.3974599838256836, 2.575984001159668, 2.7545080184936523, 2.9330317974090576, 3.111555814743042, 3.2900795936584473, 3.4686036109924316, 3.647127389907837, 3.8256514072418213, 4.004175186157227, 4.182699203491211, 4.361223220825195, 4.53974723815918, 4.718271255493164]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 10.0, 7.0, 9.0, 11.0, 26.0, 40.0, 51.0, 92.0, 183.0, 334.0, 630.0, 1302.0, 2813.0, 6863.0, 17919.0, 54502.0, 206201.0, 492176.0, 186938.0, 50212.0, 16634.0, 6308.0, 2722.0, 1220.0, 603.0, 296.0, 186.0, 101.0, 70.0, 33.0, 21.0, 16.0, 6.0, 11.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1298828125, -1.087188720703125, -1.04449462890625, -1.001800537109375, -0.9591064453125, -0.916412353515625, -0.87371826171875, -0.831024169921875, -0.788330078125, -0.745635986328125, -0.70294189453125, -0.660247802734375, -0.6175537109375, -0.574859619140625, -0.53216552734375, -0.489471435546875, -0.44677734375, -0.404083251953125, -0.36138916015625, -0.318695068359375, -0.2760009765625, -0.233306884765625, -0.19061279296875, -0.147918701171875, -0.105224609375, -0.062530517578125, -0.01983642578125, 0.022857666015625, 0.0655517578125, 0.108245849609375, 0.15093994140625, 0.193634033203125, 0.236328125, 0.279022216796875, 0.32171630859375, 0.364410400390625, 0.4071044921875, 0.449798583984375, 0.49249267578125, 0.535186767578125, 0.577880859375, 0.620574951171875, 0.66326904296875, 0.705963134765625, 0.7486572265625, 0.791351318359375, 0.83404541015625, 0.876739501953125, 0.91943359375, 0.962127685546875, 1.00482177734375, 1.047515869140625, 1.0902099609375, 1.132904052734375, 1.17559814453125, 1.218292236328125, 1.260986328125, 1.303680419921875, 1.34637451171875, 1.389068603515625, 1.4317626953125, 1.474456787109375, 1.51715087890625, 1.559844970703125, 1.6025390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 11.0, 11.0, 13.0, 11.0, 21.0, 22.0, 27.0, 32.0, 27.0, 48.0, 43.0, 39.0, 44.0, 56.0, 65.0, 55.0, 46.0, 59.0, 44.0, 54.0, 27.0, 53.0, 32.0, 30.0, 34.0, 18.0, 11.0, 12.0, 14.0, 8.0, 10.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65869140625, -0.6354446411132812, -0.6121978759765625, -0.5889511108398438, -0.565704345703125, -0.5424575805664062, -0.5192108154296875, -0.49596405029296875, -0.47271728515625, -0.44947052001953125, -0.4262237548828125, -0.40297698974609375, -0.379730224609375, -0.35648345947265625, -0.3332366943359375, -0.30998992919921875, -0.2867431640625, -0.26349639892578125, -0.2402496337890625, -0.21700286865234375, -0.193756103515625, -0.17050933837890625, -0.1472625732421875, -0.12401580810546875, -0.10076904296875, -0.07752227783203125, -0.0542755126953125, -0.03102874755859375, -0.007781982421875, 0.01546478271484375, 0.0387115478515625, 0.06195831298828125, 0.085205078125, 0.10845184326171875, 0.1316986083984375, 0.15494537353515625, 0.178192138671875, 0.20143890380859375, 0.2246856689453125, 0.24793243408203125, 0.27117919921875, 0.29442596435546875, 0.3176727294921875, 0.34091949462890625, 0.364166259765625, 0.38741302490234375, 0.4106597900390625, 0.43390655517578125, 0.4571533203125, 0.48040008544921875, 0.5036468505859375, 0.5268936157226562, 0.550140380859375, 0.5733871459960938, 0.5966339111328125, 0.6198806762695312, 0.64312744140625, 0.6663742065429688, 0.6896209716796875, 0.7128677368164062, 0.736114501953125, 0.7593612670898438, 0.7826080322265625, 0.8058547973632812, 0.8291015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 8.0, 21.0, 18.0, 15.0, 31.0, 33.0, 46.0, 74.0, 95.0, 148.0, 218.0, 344.0, 507.0, 892.0, 1696.0, 4239.0, 17860.0, 171297.0, 785405.0, 51473.0, 8394.0, 2592.0, 1156.0, 669.0, 412.0, 266.0, 182.0, 138.0, 92.0, 60.0, 45.0, 42.0, 29.0, 17.0, 15.0, 2.0, 6.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.00390625, -1.9354248046875, -1.866943359375, -1.7984619140625, -1.72998046875, -1.6614990234375, -1.593017578125, -1.5245361328125, -1.4560546875, -1.3875732421875, -1.319091796875, -1.2506103515625, -1.18212890625, -1.1136474609375, -1.045166015625, -0.9766845703125, -0.908203125, -0.8397216796875, -0.771240234375, -0.7027587890625, -0.63427734375, -0.5657958984375, -0.497314453125, -0.4288330078125, -0.3603515625, -0.2918701171875, -0.223388671875, -0.1549072265625, -0.08642578125, -0.0179443359375, 0.050537109375, 0.1190185546875, 0.1875, 0.2559814453125, 0.324462890625, 0.3929443359375, 0.46142578125, 0.5299072265625, 0.598388671875, 0.6668701171875, 0.7353515625, 0.8038330078125, 0.872314453125, 0.9407958984375, 1.00927734375, 1.0777587890625, 1.146240234375, 1.2147216796875, 1.283203125, 1.3516845703125, 1.420166015625, 1.4886474609375, 1.55712890625, 1.6256103515625, 1.694091796875, 1.7625732421875, 1.8310546875, 1.8995361328125, 1.968017578125, 2.0364990234375, 2.10498046875, 2.1734619140625, 2.241943359375, 2.3104248046875, 2.37890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 4.0, 3.0, 9.0, 9.0, 9.0, 13.0, 16.0, 21.0, 15.0, 31.0, 33.0, 31.0, 41.0, 47.0, 44.0, 61.0, 46.0, 55.0, 71.0, 58.0, 49.0, 61.0, 41.0, 28.0, 37.0, 33.0, 20.0, 16.0, 13.0, 13.0, 14.0, 12.0, 9.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.050048828125, -1.97314453125, -1.896240234375, -1.8193359375, -1.742431640625, -1.66552734375, -1.588623046875, -1.51171875, -1.434814453125, -1.35791015625, -1.281005859375, -1.2041015625, -1.127197265625, -1.05029296875, -0.973388671875, -0.896484375, -0.819580078125, -0.74267578125, -0.665771484375, -0.5888671875, -0.511962890625, -0.43505859375, -0.358154296875, -0.28125, -0.204345703125, -0.12744140625, -0.050537109375, 0.0263671875, 0.103271484375, 0.18017578125, 0.257080078125, 0.333984375, 0.410888671875, 0.48779296875, 0.564697265625, 0.6416015625, 0.718505859375, 0.79541015625, 0.872314453125, 0.94921875, 1.026123046875, 1.10302734375, 1.179931640625, 1.2568359375, 1.333740234375, 1.41064453125, 1.487548828125, 1.564453125, 1.641357421875, 1.71826171875, 1.795166015625, 1.8720703125, 1.948974609375, 2.02587890625, 2.102783203125, 2.1796875, 2.256591796875, 2.33349609375, 2.410400390625, 2.4873046875, 2.564208984375, 2.64111328125, 2.718017578125, 2.794921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 11.0, 6.0, 6.0, 9.0, 22.0, 35.0, 65.0, 103.0, 163.0, 299.0, 695.0, 1749.0, 6163.0, 41817.0, 875283.0, 107005.0, 10750.0, 2565.0, 929.0, 369.0, 210.0, 112.0, 54.0, 39.0, 30.0, 20.0, 14.0, 9.0, 4.0, 7.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8466796875, -0.821533203125, -0.79638671875, -0.771240234375, -0.74609375, -0.720947265625, -0.69580078125, -0.670654296875, -0.6455078125, -0.620361328125, -0.59521484375, -0.570068359375, -0.544921875, -0.519775390625, -0.49462890625, -0.469482421875, -0.4443359375, -0.419189453125, -0.39404296875, -0.368896484375, -0.34375, -0.318603515625, -0.29345703125, -0.268310546875, -0.2431640625, -0.218017578125, -0.19287109375, -0.167724609375, -0.142578125, -0.117431640625, -0.09228515625, -0.067138671875, -0.0419921875, -0.016845703125, 0.00830078125, 0.033447265625, 0.05859375, 0.083740234375, 0.10888671875, 0.134033203125, 0.1591796875, 0.184326171875, 0.20947265625, 0.234619140625, 0.259765625, 0.284912109375, 0.31005859375, 0.335205078125, 0.3603515625, 0.385498046875, 0.41064453125, 0.435791015625, 0.4609375, 0.486083984375, 0.51123046875, 0.536376953125, 0.5615234375, 0.586669921875, 0.61181640625, 0.636962890625, 0.662109375, 0.687255859375, 0.71240234375, 0.737548828125, 0.7626953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 15.0, 5.0, 11.0, 28.0, 30.0, 29.0, 39.0, 68.0, 102.0, 181.0, 153.0, 101.0, 63.0, 46.0, 24.0, 26.0, 15.0, 17.0, 9.0, 8.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013506412506103516, -0.00013003312051296234, -0.00012500211596488953, -0.00011997111141681671, -0.0001149401068687439, -0.00010990910232067108, -0.00010487809777259827, -9.984709322452545e-05, -9.481608867645264e-05, -8.978508412837982e-05, -8.475407958030701e-05, -7.972307503223419e-05, -7.469207048416138e-05, -6.966106593608856e-05, -6.463006138801575e-05, -5.959905683994293e-05, -5.456805229187012e-05, -4.95370477437973e-05, -4.450604319572449e-05, -3.947503864765167e-05, -3.444403409957886e-05, -2.9413029551506042e-05, -2.4382025003433228e-05, -1.9351020455360413e-05, -1.4320015907287598e-05, -9.289011359214783e-06, -4.258006811141968e-06, 7.729977369308472e-07, 5.804002285003662e-06, 1.0835006833076477e-05, 1.5866011381149292e-05, 2.0897015929222107e-05, 2.5928020477294922e-05, 3.095902502536774e-05, 3.599002957344055e-05, 4.102103412151337e-05, 4.605203866958618e-05, 5.1083043217658997e-05, 5.611404776573181e-05, 6.114505231380463e-05, 6.617605686187744e-05, 7.120706140995026e-05, 7.623806595802307e-05, 8.126907050609589e-05, 8.63000750541687e-05, 9.133107960224152e-05, 9.636208415031433e-05, 0.00010139308869838715, 0.00010642409324645996, 0.00011145509779453278, 0.00011648610234260559, 0.0001215171068906784, 0.00012654811143875122, 0.00013157911598682404, 0.00013661012053489685, 0.00014164112508296967, 0.00014667212963104248, 0.0001517031341791153, 0.0001567341387271881, 0.00016176514327526093, 0.00016679614782333374, 0.00017182715237140656, 0.00017685815691947937, 0.00018188916146755219, 0.000186920166015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 11.0, 7.0, 18.0, 19.0, 36.0, 48.0, 59.0, 81.0, 126.0, 203.0, 386.0, 732.0, 1499.0, 3406.0, 9508.0, 38936.0, 295212.0, 633376.0, 46993.0, 10678.0, 3712.0, 1560.0, 789.0, 461.0, 237.0, 132.0, 92.0, 63.0, 45.0, 35.0, 25.0, 17.0, 9.0, 10.0, 8.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.404052734375, -0.3885459899902344, -0.37303924560546875, -0.3575325012207031, -0.3420257568359375, -0.3265190124511719, -0.31101226806640625, -0.2955055236816406, -0.279998779296875, -0.2644920349121094, -0.24898529052734375, -0.23347854614257812, -0.2179718017578125, -0.20246505737304688, -0.18695831298828125, -0.17145156860351562, -0.15594482421875, -0.14043807983398438, -0.12493133544921875, -0.10942459106445312, -0.0939178466796875, -0.07841110229492188, -0.06290435791015625, -0.047397613525390625, -0.031890869140625, -0.016384124755859375, -0.00087738037109375, 0.014629364013671875, 0.0301361083984375, 0.045642852783203125, 0.06114959716796875, 0.07665634155273438, 0.0921630859375, 0.10766983032226562, 0.12317657470703125, 0.13868331909179688, 0.1541900634765625, 0.16969680786132812, 0.18520355224609375, 0.20071029663085938, 0.216217041015625, 0.23172378540039062, 0.24723052978515625, 0.2627372741699219, 0.2782440185546875, 0.2937507629394531, 0.30925750732421875, 0.3247642517089844, 0.34027099609375, 0.3557777404785156, 0.37128448486328125, 0.3867912292480469, 0.4022979736328125, 0.4178047180175781, 0.43331146240234375, 0.4488182067871094, 0.464324951171875, 0.4798316955566406, 0.49533843994140625, 0.5108451843261719, 0.5263519287109375, 0.5418586730957031, 0.5573654174804688, 0.5728721618652344, 0.58837890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 6.0, 2.0, 4.0, 11.0, 9.0, 18.0, 14.0, 14.0, 29.0, 29.0, 35.0, 55.0, 56.0, 67.0, 111.0, 121.0, 98.0, 73.0, 63.0, 36.0, 34.0, 24.0, 20.0, 17.0, 14.0, 7.0, 5.0, 8.0, 3.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3922462463378906, -0.37799835205078125, -0.3637504577636719, -0.3495025634765625, -0.3352546691894531, -0.32100677490234375, -0.3067588806152344, -0.292510986328125, -0.2782630920410156, -0.26401519775390625, -0.24976730346679688, -0.2355194091796875, -0.22127151489257812, -0.20702362060546875, -0.19277572631835938, -0.17852783203125, -0.16427993774414062, -0.15003204345703125, -0.13578414916992188, -0.1215362548828125, -0.10728836059570312, -0.09304046630859375, -0.07879257202148438, -0.064544677734375, -0.050296783447265625, -0.03604888916015625, -0.021800994873046875, -0.0075531005859375, 0.006694793701171875, 0.02094268798828125, 0.035190582275390625, 0.0494384765625, 0.06368637084960938, 0.07793426513671875, 0.09218215942382812, 0.1064300537109375, 0.12067794799804688, 0.13492584228515625, 0.14917373657226562, 0.163421630859375, 0.17766952514648438, 0.19191741943359375, 0.20616531372070312, 0.2204132080078125, 0.23466110229492188, 0.24890899658203125, 0.2631568908691406, 0.27740478515625, 0.2916526794433594, 0.30590057373046875, 0.3201484680175781, 0.3343963623046875, 0.3486442565917969, 0.36289215087890625, 0.3771400451660156, 0.391387939453125, 0.4056358337402344, 0.41988372802734375, 0.4341316223144531, 0.4483795166015625, 0.4626274108886719, 0.47687530517578125, 0.4911231994628906, 0.50537109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 14.0, 31.0, 114.0, 513.0, 235.0, 63.0, 19.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.60491180419922, -33.66425323486328, -32.72359085083008, -31.78293228149414, -30.84227180480957, -29.901611328125, -28.960952758789062, -28.020292282104492, -27.079631805419922, -26.13897132873535, -25.198312759399414, -24.257652282714844, -23.316991806030273, -22.376331329345703, -21.435672760009766, -20.495012283325195, -19.554351806640625, -18.613691329956055, -17.673032760620117, -16.732372283935547, -15.791711807250977, -14.851052284240723, -13.910392761230469, -12.969732284545898, -12.029073715209961, -11.088414192199707, -10.147753715515137, -9.207094192504883, -8.266433715820312, -7.325774192810059, -6.3851141929626465, -5.444454193115234, -4.503793716430664, -3.563133716583252, -2.62247371673584, -1.6818139553070068, -0.7411539554595947, 0.19950580596923828, 1.1401658058166504, 2.0808258056640625, 3.0214858055114746, 3.9621458053588867, 4.902805805206299, 5.843465805053711, 6.784125328063965, 7.724785327911377, 8.665445327758789, 9.60610580444336, 10.546765327453613, 11.487424850463867, 12.428085327148438, 13.368744850158691, 14.309405326843262, 15.250064849853516, 16.190725326538086, 17.131385803222656, 18.072044372558594, 19.012704849243164, 19.9533634185791, 20.894023895263672, 21.834684371948242, 22.775344848632812, 23.71600341796875, 24.65666389465332, 25.59732437133789]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 3.0, 9.0, 7.0, 10.0, 13.0, 18.0, 15.0, 12.0, 14.0, 14.0, 30.0, 30.0, 34.0, 39.0, 47.0, 90.0, 140.0, 90.0, 58.0, 42.0, 32.0, 39.0, 23.0, 25.0, 11.0, 21.0, 16.0, 17.0, 14.0, 6.0, 9.0, 7.0, 10.0, 10.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-8.924737930297852, -8.6578950881958, -8.39105224609375, -8.1242094039917, -7.857367038726807, -7.590524196624756, -7.323681354522705, -7.056838512420654, -6.789996147155762, -6.523153305053711, -6.25631046295166, -5.989467620849609, -5.722625255584717, -5.455782413482666, -5.188939571380615, -4.9220967292785645, -4.655253887176514, -4.388411045074463, -4.121568202972412, -3.8547255992889404, -3.5878829956054688, -3.321040153503418, -3.054197311401367, -2.7873544692993164, -2.5205118656158447, -2.253669023513794, -1.9868264198303223, -1.7199835777282715, -1.4531408548355103, -1.186298131942749, -0.9194552898406982, -0.652612566947937, -0.3857698440551758, -0.11892709136009216, 0.14791566133499146, 0.41475844383239746, 0.6816011667251587, 0.9484438896179199, 1.2152867317199707, 1.482129454612732, 1.7489721775054932, 2.015815019607544, 2.2826576232910156, 2.5495004653930664, 2.816343307495117, 3.083185911178589, 3.3500287532806396, 3.6168713569641113, 3.883714199066162, 4.150557041168213, 4.417399883270264, 4.684242248535156, 4.951085090637207, 5.217927932739258, 5.484770774841309, 5.751613616943359, 6.01845645904541, 6.285299301147461, 6.552142143249512, 6.8189849853515625, 7.085827350616455, 7.352670192718506, 7.619513034820557, 7.886355876922607, 8.1531982421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 6.0, 11.0, 12.0, 12.0, 29.0, 27.0, 30.0, 70.0, 134.0, 234.0, 406.0, 887.0, 2009.0, 5197.0, 17682.0, 97352.0, 955745.0, 2592758.0, 452376.0, 51312.0, 11485.0, 3669.0, 1398.0, 662.0, 331.0, 170.0, 98.0, 60.0, 48.0, 26.0, 11.0, 13.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.650390625, -1.602325439453125, -1.55426025390625, -1.506195068359375, -1.4581298828125, -1.410064697265625, -1.36199951171875, -1.313934326171875, -1.265869140625, -1.217803955078125, -1.16973876953125, -1.121673583984375, -1.0736083984375, -1.025543212890625, -0.97747802734375, -0.929412841796875, -0.88134765625, -0.833282470703125, -0.78521728515625, -0.737152099609375, -0.6890869140625, -0.641021728515625, -0.59295654296875, -0.544891357421875, -0.496826171875, -0.448760986328125, -0.40069580078125, -0.352630615234375, -0.3045654296875, -0.256500244140625, -0.20843505859375, -0.160369873046875, -0.1123046875, -0.064239501953125, -0.01617431640625, 0.031890869140625, 0.0799560546875, 0.128021240234375, 0.17608642578125, 0.224151611328125, 0.272216796875, 0.320281982421875, 0.36834716796875, 0.416412353515625, 0.4644775390625, 0.512542724609375, 0.56060791015625, 0.608673095703125, 0.65673828125, 0.704803466796875, 0.75286865234375, 0.800933837890625, 0.8489990234375, 0.897064208984375, 0.94512939453125, 0.993194580078125, 1.041259765625, 1.089324951171875, 1.13739013671875, 1.185455322265625, 1.2335205078125, 1.281585693359375, 1.32965087890625, 1.377716064453125, 1.42578125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 6.0, 6.0, 6.0, 5.0, 12.0, 14.0, 15.0, 13.0, 40.0, 24.0, 26.0, 32.0, 30.0, 33.0, 43.0, 42.0, 37.0, 47.0, 49.0, 49.0, 52.0, 40.0, 40.0, 44.0, 52.0, 29.0, 35.0, 25.0, 24.0, 27.0, 21.0, 17.0, 11.0, 14.0, 7.0, 5.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.490966796875, -0.4728431701660156, -0.45471954345703125, -0.4365959167480469, -0.4184722900390625, -0.4003486633300781, -0.38222503662109375, -0.3641014099121094, -0.345977783203125, -0.3278541564941406, -0.30973052978515625, -0.2916069030761719, -0.2734832763671875, -0.2553596496582031, -0.23723602294921875, -0.21911239624023438, -0.20098876953125, -0.18286514282226562, -0.16474151611328125, -0.14661788940429688, -0.1284942626953125, -0.11037063598632812, -0.09224700927734375, -0.07412338256835938, -0.055999755859375, -0.037876129150390625, -0.01975250244140625, -0.001628875732421875, 0.0164947509765625, 0.034618377685546875, 0.05274200439453125, 0.07086563110351562, 0.0889892578125, 0.10711288452148438, 0.12523651123046875, 0.14336013793945312, 0.1614837646484375, 0.17960739135742188, 0.19773101806640625, 0.21585464477539062, 0.233978271484375, 0.2521018981933594, 0.27022552490234375, 0.2883491516113281, 0.3064727783203125, 0.3245964050292969, 0.34272003173828125, 0.3608436584472656, 0.37896728515625, 0.3970909118652344, 0.41521453857421875, 0.4333381652832031, 0.4514617919921875, 0.4695854187011719, 0.48770904541015625, 0.5058326721191406, 0.523956298828125, 0.5420799255371094, 0.5602035522460938, 0.5783271789550781, 0.5964508056640625, 0.6145744323730469, 0.6326980590820312, 0.6508216857910156, 0.6689453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 2.0, 7.0, 7.0, 10.0, 13.0, 15.0, 14.0, 36.0, 41.0, 44.0, 53.0, 110.0, 159.0, 229.0, 416.0, 749.0, 1570.0, 3829.0, 13870.0, 140130.0, 3774932.0, 231894.0, 17804.0, 4503.0, 1788.0, 835.0, 459.0, 269.0, 157.0, 99.0, 55.0, 49.0, 31.0, 34.0, 10.0, 19.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.626800537109375, -2.53485107421875, -2.442901611328125, -2.3509521484375, -2.259002685546875, -2.16705322265625, -2.075103759765625, -1.983154296875, -1.891204833984375, -1.79925537109375, -1.707305908203125, -1.6153564453125, -1.523406982421875, -1.43145751953125, -1.339508056640625, -1.24755859375, -1.155609130859375, -1.06365966796875, -0.971710205078125, -0.8797607421875, -0.787811279296875, -0.69586181640625, -0.603912353515625, -0.511962890625, -0.420013427734375, -0.32806396484375, -0.236114501953125, -0.1441650390625, -0.052215576171875, 0.03973388671875, 0.131683349609375, 0.2236328125, 0.315582275390625, 0.40753173828125, 0.499481201171875, 0.5914306640625, 0.683380126953125, 0.77532958984375, 0.867279052734375, 0.959228515625, 1.051177978515625, 1.14312744140625, 1.235076904296875, 1.3270263671875, 1.418975830078125, 1.51092529296875, 1.602874755859375, 1.69482421875, 1.786773681640625, 1.87872314453125, 1.970672607421875, 2.0626220703125, 2.154571533203125, 2.24652099609375, 2.338470458984375, 2.430419921875, 2.522369384765625, 2.61431884765625, 2.706268310546875, 2.7982177734375, 2.890167236328125, 2.98211669921875, 3.074066162109375, 3.166015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 6.0, 7.0, 13.0, 10.0, 23.0, 29.0, 32.0, 40.0, 70.0, 100.0, 114.0, 192.0, 248.0, 433.0, 536.0, 587.0, 455.0, 311.0, 259.0, 166.0, 129.0, 85.0, 56.0, 41.0, 29.0, 27.0, 21.0, 11.0, 6.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.177734375, -2.112213134765625, -2.04669189453125, -1.981170654296875, -1.9156494140625, -1.850128173828125, -1.78460693359375, -1.719085693359375, -1.653564453125, -1.588043212890625, -1.52252197265625, -1.457000732421875, -1.3914794921875, -1.325958251953125, -1.26043701171875, -1.194915771484375, -1.12939453125, -1.063873291015625, -0.99835205078125, -0.932830810546875, -0.8673095703125, -0.801788330078125, -0.73626708984375, -0.670745849609375, -0.605224609375, -0.539703369140625, -0.47418212890625, -0.408660888671875, -0.3431396484375, -0.277618408203125, -0.21209716796875, -0.146575927734375, -0.0810546875, -0.015533447265625, 0.04998779296875, 0.115509033203125, 0.1810302734375, 0.246551513671875, 0.31207275390625, 0.377593994140625, 0.443115234375, 0.508636474609375, 0.57415771484375, 0.639678955078125, 0.7052001953125, 0.770721435546875, 0.83624267578125, 0.901763916015625, 0.96728515625, 1.032806396484375, 1.09832763671875, 1.163848876953125, 1.2293701171875, 1.294891357421875, 1.36041259765625, 1.425933837890625, 1.491455078125, 1.556976318359375, 1.62249755859375, 1.688018798828125, 1.7535400390625, 1.819061279296875, 1.88458251953125, 1.950103759765625, 2.015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 4.0, 5.0, 14.0, 11.0, 23.0, 36.0, 114.0, 199.0, 250.0, 173.0, 83.0, 45.0, 17.0, 11.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.30022430419922, -42.137691497802734, -40.97515869140625, -39.8126220703125, -38.650089263916016, -37.48755645751953, -36.32502365112305, -35.16249084472656, -33.99995422363281, -32.83742141723633, -31.67488670349121, -30.512353897094727, -29.34981918334961, -28.187286376953125, -27.02475357055664, -25.862220764160156, -24.699687957763672, -23.537155151367188, -22.37462043762207, -21.212087631225586, -20.04955291748047, -18.887020111083984, -17.7244873046875, -16.561954498291016, -15.399419784545898, -14.236886024475098, -13.074352264404297, -11.911819458007812, -10.749285697937012, -9.586751937866211, -8.424219131469727, -7.261685371398926, -6.099153518676758, -4.936619758605957, -3.7740864753723145, -2.6115529537200928, -1.449019432067871, -0.2864856719970703, 0.8760476112365723, 2.038580894470215, 3.2011146545410156, 4.363648414611816, 5.526181697845459, 6.688714981079102, 7.851248741149902, 9.013782501220703, 10.176315307617188, 11.338849067687988, 12.501382827758789, 13.66391658782959, 14.82645034790039, 15.988983154296875, 17.15151596069336, 18.314050674438477, 19.47658348083496, 20.639118194580078, 21.801651000976562, 22.964183807373047, 24.126718521118164, 25.28925132751465, 26.451786041259766, 27.61431884765625, 28.776851654052734, 29.93938446044922, 31.101919174194336]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 10.0, 11.0, 22.0, 15.0, 17.0, 30.0, 26.0, 29.0, 36.0, 44.0, 38.0, 53.0, 61.0, 57.0, 72.0, 65.0, 47.0, 47.0, 40.0, 42.0, 28.0, 39.0, 35.0, 26.0, 20.0, 15.0, 10.0, 13.0, 5.0, 6.0, 6.0, 11.0, 5.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.77409839630127, -12.343695640563965, -11.91329288482666, -11.482890129089355, -11.05248737335205, -10.622084617614746, -10.191682815551758, -9.761280059814453, -9.330877304077148, -8.900474548339844, -8.470071792602539, -8.039669036865234, -7.60926628112793, -7.178863525390625, -6.7484612464904785, -6.318058490753174, -5.887655258178711, -5.457252502441406, -5.026849746704102, -4.596446990966797, -4.166044235229492, -3.7356417179107666, -3.305239200592041, -2.8748364448547363, -2.4444336891174316, -2.014030933380127, -1.5836282968521118, -1.1532256603240967, -0.722822904586792, -0.2924201488494873, 0.13798236846923828, 0.568385124206543, 0.9987869262695312, 1.429189682006836, 1.859592318534851, 2.289994955062866, 2.720397710800171, 3.1508004665374756, 3.581202983856201, 4.011605739593506, 4.4420084953308105, 4.872411251068115, 5.30281400680542, 5.733216285705566, 6.163619041442871, 6.594021797180176, 7.0244245529174805, 7.454827308654785, 7.88523006439209, 8.315632820129395, 8.7460355758667, 9.176438331604004, 9.606841087341309, 10.037243843078613, 10.467645645141602, 10.898048400878906, 11.328451156616211, 11.758853912353516, 12.18925666809082, 12.619659423828125, 13.05006217956543, 13.480464935302734, 13.910867691040039, 14.341270446777344, 14.771673202514648]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 16.0, 23.0, 25.0, 30.0, 59.0, 76.0, 100.0, 185.0, 321.0, 569.0, 1166.0, 2374.0, 5474.0, 15660.0, 52034.0, 274125.0, 571678.0, 87291.0, 23000.0, 7988.0, 3136.0, 1485.0, 746.0, 332.0, 217.0, 131.0, 76.0, 76.0, 48.0, 34.0, 13.0, 8.0, 11.0, 6.0, 3.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-1.240234375, -1.201690673828125, -1.16314697265625, -1.124603271484375, -1.0860595703125, -1.047515869140625, -1.00897216796875, -0.970428466796875, -0.931884765625, -0.893341064453125, -0.85479736328125, -0.816253662109375, -0.7777099609375, -0.739166259765625, -0.70062255859375, -0.662078857421875, -0.62353515625, -0.584991455078125, -0.54644775390625, -0.507904052734375, -0.4693603515625, -0.430816650390625, -0.39227294921875, -0.353729248046875, -0.315185546875, -0.276641845703125, -0.23809814453125, -0.199554443359375, -0.1610107421875, -0.122467041015625, -0.08392333984375, -0.045379638671875, -0.0068359375, 0.031707763671875, 0.07025146484375, 0.108795166015625, 0.1473388671875, 0.185882568359375, 0.22442626953125, 0.262969970703125, 0.301513671875, 0.340057373046875, 0.37860107421875, 0.417144775390625, 0.4556884765625, 0.494232177734375, 0.53277587890625, 0.571319580078125, 0.60986328125, 0.648406982421875, 0.68695068359375, 0.725494384765625, 0.7640380859375, 0.802581787109375, 0.84112548828125, 0.879669189453125, 0.918212890625, 0.956756591796875, 0.99530029296875, 1.033843994140625, 1.0723876953125, 1.110931396484375, 1.14947509765625, 1.188018798828125, 1.2265625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 10.0, 15.0, 15.0, 29.0, 33.0, 47.0, 42.0, 60.0, 44.0, 80.0, 68.0, 78.0, 71.0, 69.0, 74.0, 48.0, 44.0, 35.0, 34.0, 31.0, 22.0, 17.0, 12.0, 11.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7919921875, -0.7572479248046875, -0.722503662109375, -0.6877593994140625, -0.65301513671875, -0.6182708740234375, -0.583526611328125, -0.5487823486328125, -0.5140380859375, -0.4792938232421875, -0.444549560546875, -0.4098052978515625, -0.37506103515625, -0.3403167724609375, -0.305572509765625, -0.2708282470703125, -0.236083984375, -0.2013397216796875, -0.166595458984375, -0.1318511962890625, -0.09710693359375, -0.0623626708984375, -0.027618408203125, 0.0071258544921875, 0.0418701171875, 0.0766143798828125, 0.111358642578125, 0.1461029052734375, 0.18084716796875, 0.2155914306640625, 0.250335693359375, 0.2850799560546875, 0.31982421875, 0.3545684814453125, 0.389312744140625, 0.4240570068359375, 0.45880126953125, 0.4935455322265625, 0.528289794921875, 0.5630340576171875, 0.5977783203125, 0.6325225830078125, 0.667266845703125, 0.7020111083984375, 0.73675537109375, 0.7714996337890625, 0.806243896484375, 0.8409881591796875, 0.875732421875, 0.9104766845703125, 0.945220947265625, 0.9799652099609375, 1.01470947265625, 1.0494537353515625, 1.084197998046875, 1.1189422607421875, 1.1536865234375, 1.1884307861328125, 1.223175048828125, 1.2579193115234375, 1.29266357421875, 1.3274078369140625, 1.362152099609375, 1.3968963623046875, 1.431640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 8.0, 8.0, 10.0, 14.0, 23.0, 23.0, 36.0, 52.0, 86.0, 122.0, 156.0, 265.0, 373.0, 771.0, 1859.0, 6833.0, 49896.0, 891703.0, 82467.0, 9460.0, 2259.0, 862.0, 450.0, 269.0, 178.0, 106.0, 68.0, 48.0, 36.0, 32.0, 15.0, 15.0, 5.0, 12.0, 5.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5478515625, -1.5017852783203125, -1.455718994140625, -1.4096527099609375, -1.36358642578125, -1.3175201416015625, -1.271453857421875, -1.2253875732421875, -1.1793212890625, -1.1332550048828125, -1.087188720703125, -1.0411224365234375, -0.99505615234375, -0.9489898681640625, -0.902923583984375, -0.8568572998046875, -0.810791015625, -0.7647247314453125, -0.718658447265625, -0.6725921630859375, -0.62652587890625, -0.5804595947265625, -0.534393310546875, -0.4883270263671875, -0.4422607421875, -0.3961944580078125, -0.350128173828125, -0.3040618896484375, -0.25799560546875, -0.2119293212890625, -0.165863037109375, -0.1197967529296875, -0.07373046875, -0.0276641845703125, 0.018402099609375, 0.0644683837890625, 0.11053466796875, 0.1566009521484375, 0.202667236328125, 0.2487335205078125, 0.2947998046875, 0.3408660888671875, 0.386932373046875, 0.4329986572265625, 0.47906494140625, 0.5251312255859375, 0.571197509765625, 0.6172637939453125, 0.663330078125, 0.7093963623046875, 0.755462646484375, 0.8015289306640625, 0.84759521484375, 0.8936614990234375, 0.939727783203125, 0.9857940673828125, 1.0318603515625, 1.0779266357421875, 1.123992919921875, 1.1700592041015625, 1.21612548828125, 1.2621917724609375, 1.308258056640625, 1.3543243408203125, 1.400390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 10.0, 5.0, 4.0, 5.0, 11.0, 14.0, 20.0, 15.0, 19.0, 21.0, 29.0, 28.0, 56.0, 54.0, 58.0, 62.0, 80.0, 59.0, 68.0, 64.0, 52.0, 40.0, 33.0, 34.0, 12.0, 21.0, 20.0, 19.0, 20.0, 8.0, 10.0, 9.0, 6.0, 4.0, 9.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.49609375, -2.41912841796875, -2.3421630859375, -2.26519775390625, -2.188232421875, -2.11126708984375, -2.0343017578125, -1.95733642578125, -1.88037109375, -1.80340576171875, -1.7264404296875, -1.64947509765625, -1.572509765625, -1.49554443359375, -1.4185791015625, -1.34161376953125, -1.2646484375, -1.18768310546875, -1.1107177734375, -1.03375244140625, -0.956787109375, -0.87982177734375, -0.8028564453125, -0.72589111328125, -0.64892578125, -0.57196044921875, -0.4949951171875, -0.41802978515625, -0.341064453125, -0.26409912109375, -0.1871337890625, -0.11016845703125, -0.033203125, 0.04376220703125, 0.1207275390625, 0.19769287109375, 0.274658203125, 0.35162353515625, 0.4285888671875, 0.50555419921875, 0.58251953125, 0.65948486328125, 0.7364501953125, 0.81341552734375, 0.890380859375, 0.96734619140625, 1.0443115234375, 1.12127685546875, 1.1982421875, 1.27520751953125, 1.3521728515625, 1.42913818359375, 1.506103515625, 1.58306884765625, 1.6600341796875, 1.73699951171875, 1.81396484375, 1.89093017578125, 1.9678955078125, 2.04486083984375, 2.121826171875, 2.19879150390625, 2.2757568359375, 2.35272216796875, 2.4296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 5.0, 9.0, 11.0, 19.0, 29.0, 38.0, 53.0, 92.0, 157.0, 268.0, 520.0, 1216.0, 3597.0, 14236.0, 183021.0, 817976.0, 19849.0, 4517.0, 1501.0, 653.0, 308.0, 171.0, 89.0, 66.0, 37.0, 31.0, 25.0, 16.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3857421875, -0.37534332275390625, -0.3649444580078125, -0.35454559326171875, -0.344146728515625, -0.33374786376953125, -0.3233489990234375, -0.31295013427734375, -0.30255126953125, -0.29215240478515625, -0.2817535400390625, -0.27135467529296875, -0.260955810546875, -0.25055694580078125, -0.2401580810546875, -0.22975921630859375, -0.2193603515625, -0.20896148681640625, -0.1985626220703125, -0.18816375732421875, -0.177764892578125, -0.16736602783203125, -0.1569671630859375, -0.14656829833984375, -0.13616943359375, -0.12577056884765625, -0.1153717041015625, -0.10497283935546875, -0.094573974609375, -0.08417510986328125, -0.0737762451171875, -0.06337738037109375, -0.052978515625, -0.04257965087890625, -0.0321807861328125, -0.02178192138671875, -0.011383056640625, -0.00098419189453125, 0.0094146728515625, 0.01981353759765625, 0.03021240234375, 0.04061126708984375, 0.0510101318359375, 0.06140899658203125, 0.071807861328125, 0.08220672607421875, 0.0926055908203125, 0.10300445556640625, 0.1134033203125, 0.12380218505859375, 0.1342010498046875, 0.14459991455078125, 0.154998779296875, 0.16539764404296875, 0.1757965087890625, 0.18619537353515625, 0.19659423828125, 0.20699310302734375, 0.2173919677734375, 0.22779083251953125, 0.238189697265625, 0.24858856201171875, 0.2589874267578125, 0.26938629150390625, 0.27978515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 7.0, 7.0, 10.0, 13.0, 13.0, 26.0, 36.0, 60.0, 110.0, 146.0, 154.0, 155.0, 67.0, 39.0, 37.0, 24.0, 19.0, 10.0, 10.0, 9.0, 4.0, 7.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.636713027954102e-05, -8.399225771427155e-05, -8.161738514900208e-05, -7.92425125837326e-05, -7.686764001846313e-05, -7.449276745319366e-05, -7.21178948879242e-05, -6.974302232265472e-05, -6.736814975738525e-05, -6.499327719211578e-05, -6.261840462684631e-05, -6.024353206157684e-05, -5.786865949630737e-05, -5.54937869310379e-05, -5.311891436576843e-05, -5.074404180049896e-05, -4.836916923522949e-05, -4.599429666996002e-05, -4.361942410469055e-05, -4.124455153942108e-05, -3.886967897415161e-05, -3.649480640888214e-05, -3.411993384361267e-05, -3.17450612783432e-05, -2.937018871307373e-05, -2.699531614780426e-05, -2.462044358253479e-05, -2.224557101726532e-05, -1.987069845199585e-05, -1.749582588672638e-05, -1.512095332145691e-05, -1.2746080756187439e-05, -1.0371208190917969e-05, -7.996335625648499e-06, -5.621463060379028e-06, -3.246590495109558e-06, -8.717179298400879e-07, 1.5031546354293823e-06, 3.8780272006988525e-06, 6.252899765968323e-06, 8.627772331237793e-06, 1.1002644896507263e-05, 1.3377517461776733e-05, 1.5752390027046204e-05, 1.8127262592315674e-05, 2.0502135157585144e-05, 2.2877007722854614e-05, 2.5251880288124084e-05, 2.7626752853393555e-05, 3.0001625418663025e-05, 3.2376497983932495e-05, 3.4751370549201965e-05, 3.7126243114471436e-05, 3.9501115679740906e-05, 4.1875988245010376e-05, 4.4250860810279846e-05, 4.6625733375549316e-05, 4.900060594081879e-05, 5.137547850608826e-05, 5.375035107135773e-05, 5.61252236366272e-05, 5.850009620189667e-05, 6.087496876716614e-05, 6.324984133243561e-05, 6.562471389770508e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 21.0, 26.0, 23.0, 47.0, 67.0, 101.0, 157.0, 264.0, 418.0, 764.0, 1378.0, 2775.0, 6157.0, 16501.0, 63245.0, 809634.0, 108661.0, 22977.0, 7930.0, 3522.0, 1631.0, 885.0, 500.0, 282.0, 162.0, 114.0, 77.0, 62.0, 49.0, 32.0, 21.0, 13.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.205810546875, -0.19930648803710938, -0.19280242919921875, -0.18629837036132812, -0.1797943115234375, -0.17329025268554688, -0.16678619384765625, -0.16028213500976562, -0.153778076171875, -0.14727401733398438, -0.14076995849609375, -0.13426589965820312, -0.1277618408203125, -0.12125778198242188, -0.11475372314453125, -0.10824966430664062, -0.10174560546875, -0.09524154663085938, -0.08873748779296875, -0.08223342895507812, -0.0757293701171875, -0.06922531127929688, -0.06272125244140625, -0.056217193603515625, -0.049713134765625, -0.043209075927734375, -0.03670501708984375, -0.030200958251953125, -0.0236968994140625, -0.017192840576171875, -0.01068878173828125, -0.004184722900390625, 0.0023193359375, 0.008823394775390625, 0.01532745361328125, 0.021831512451171875, 0.0283355712890625, 0.034839630126953125, 0.04134368896484375, 0.047847747802734375, 0.054351806640625, 0.060855865478515625, 0.06735992431640625, 0.07386398315429688, 0.0803680419921875, 0.08687210083007812, 0.09337615966796875, 0.09988021850585938, 0.10638427734375, 0.11288833618164062, 0.11939239501953125, 0.12589645385742188, 0.1324005126953125, 0.13890457153320312, 0.14540863037109375, 0.15191268920898438, 0.158416748046875, 0.16492080688476562, 0.17142486572265625, 0.17792892456054688, 0.1844329833984375, 0.19093704223632812, 0.19744110107421875, 0.20394515991210938, 0.21044921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 8.0, 2.0, 5.0, 7.0, 6.0, 14.0, 25.0, 11.0, 18.0, 27.0, 50.0, 76.0, 140.0, 156.0, 141.0, 86.0, 57.0, 40.0, 20.0, 20.0, 16.0, 23.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.339599609375, -0.33008575439453125, -0.3205718994140625, -0.31105804443359375, -0.301544189453125, -0.29203033447265625, -0.2825164794921875, -0.27300262451171875, -0.26348876953125, -0.25397491455078125, -0.2444610595703125, -0.23494720458984375, -0.225433349609375, -0.21591949462890625, -0.2064056396484375, -0.19689178466796875, -0.1873779296875, -0.17786407470703125, -0.1683502197265625, -0.15883636474609375, -0.149322509765625, -0.13980865478515625, -0.1302947998046875, -0.12078094482421875, -0.11126708984375, -0.10175323486328125, -0.0922393798828125, -0.08272552490234375, -0.073211669921875, -0.06369781494140625, -0.0541839599609375, -0.04467010498046875, -0.03515625, -0.02564239501953125, -0.0161285400390625, -0.00661468505859375, 0.002899169921875, 0.01241302490234375, 0.0219268798828125, 0.03144073486328125, 0.04095458984375, 0.05046844482421875, 0.0599822998046875, 0.06949615478515625, 0.079010009765625, 0.08852386474609375, 0.0980377197265625, 0.10755157470703125, 0.1170654296875, 0.12657928466796875, 0.1360931396484375, 0.14560699462890625, 0.155120849609375, 0.16463470458984375, 0.1741485595703125, 0.18366241455078125, 0.19317626953125, 0.20269012451171875, 0.2122039794921875, 0.22171783447265625, 0.231231689453125, 0.24074554443359375, 0.2502593994140625, 0.25977325439453125, 0.269287109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 8.0, 11.0, 20.0, 23.0, 43.0, 64.0, 129.0, 482.0, 103.0, 50.0, 18.0, 14.0, 8.0, 10.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.590933799743652, -12.262884140014648, -11.934834480285645, -11.606783866882324, -11.27873420715332, -10.950684547424316, -10.622634887695312, -10.294585227966309, -9.966535568237305, -9.6384859085083, -9.310436248779297, -8.982385635375977, -8.654335975646973, -8.326286315917969, -7.998236656188965, -7.670186996459961, -7.342136383056641, -7.014086723327637, -6.686036586761475, -6.357986927032471, -6.029936790466309, -5.701887130737305, -5.373837471008301, -5.045787811279297, -4.717737674713135, -4.389688014984131, -4.061637878417969, -3.733588218688965, -3.405538320541382, -3.077488422393799, -2.749438762664795, -2.421388864517212, -2.0933399200439453, -1.7652900218963623, -1.4372402429580688, -1.1091904640197754, -0.7811405658721924, -0.4530906677246094, -0.12504088878631592, 0.20300889015197754, 0.5310587882995605, 0.8591086268424988, 1.187158465385437, 1.5152082443237305, 1.8432581424713135, 2.1713080406188965, 2.4993577003479004, 2.8274075984954834, 3.1554574966430664, 3.4835073947906494, 3.8115572929382324, 4.139606952667236, 4.467657089233398, 4.795706748962402, 5.123756408691406, 5.45180606842041, 5.779856204986572, 6.107905864715576, 6.435956001281738, 6.764005661010742, 7.092055320739746, 7.420105457305908, 7.748155117034912, 8.076205253601074, 8.404254913330078]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 12.0, 12.0, 13.0, 16.0, 16.0, 21.0, 15.0, 27.0, 24.0, 24.0, 43.0, 185.0, 256.0, 54.0, 34.0, 19.0, 34.0, 25.0, 21.0, 18.0, 12.0, 13.0, 11.0, 8.0, 10.0, 9.0, 2.0, 6.0, 6.0, 3.0, 6.0, 3.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.607936859130859, -7.3912434577941895, -7.1745500564575195, -6.95785665512085, -6.74116325378418, -6.52446985244751, -6.30777645111084, -6.091082572937012, -5.8743896484375, -5.65769624710083, -5.44100284576416, -5.22430944442749, -5.00761604309082, -4.79092264175415, -4.5742292404174805, -4.357535362243652, -4.140841960906982, -3.9241485595703125, -3.7074551582336426, -3.4907617568969727, -3.2740683555603027, -3.057374954223633, -2.840681314468384, -2.623987913131714, -2.407294511795044, -2.190601110458374, -1.973907709121704, -1.7572141885757446, -1.5405207872390747, -1.3238273859024048, -1.1071338653564453, -0.8904404640197754, -0.6737470626831055, -0.45705363154411316, -0.24036020040512085, -0.023666739463806152, 0.19302666187286377, 0.4097200632095337, 0.6264135837554932, 0.8431069850921631, 1.059800386428833, 1.276493787765503, 1.4931871891021729, 1.7098807096481323, 1.9265741109848022, 2.1432676315307617, 2.3599610328674316, 2.5766544342041016, 2.7933478355407715, 3.0100412368774414, 3.2267346382141113, 3.4434280395507812, 3.660121440887451, 3.876814842224121, 4.093508720397949, 4.310201644897461, 4.526895523071289, 4.743588924407959, 4.960282325744629, 5.176975727081299, 5.393669128417969, 5.610362529754639, 5.827055931091309, 6.043749809265137, 6.260442733764648]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 9.0, 10.0, 6.0, 8.0, 17.0, 19.0, 32.0, 38.0, 42.0, 43.0, 55.0, 139.0, 254.0, 67.0, 46.0, 43.0, 28.0, 24.0, 22.0, 25.0, 17.0, 17.0, 9.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.891357421875, -0.86279296875, -0.834228515625, -0.8056640625, -0.777099609375, -0.74853515625, -0.719970703125, -0.69140625, -0.662841796875, -0.63427734375, -0.605712890625, -0.5771484375, -0.548583984375, -0.52001953125, -0.491455078125, -0.462890625, -0.434326171875, -0.40576171875, -0.377197265625, -0.3486328125, -0.320068359375, -0.29150390625, -0.262939453125, -0.234375, -0.205810546875, -0.17724609375, -0.148681640625, -0.1201171875, -0.091552734375, -0.06298828125, -0.034423828125, -0.005859375, 0.022705078125, 0.05126953125, 0.079833984375, 0.1083984375, 0.136962890625, 0.16552734375, 0.194091796875, 0.22265625, 0.251220703125, 0.27978515625, 0.308349609375, 0.3369140625, 0.365478515625, 0.39404296875, 0.422607421875, 0.451171875, 0.479736328125, 0.50830078125, 0.536865234375, 0.5654296875, 0.593994140625, 0.62255859375, 0.651123046875, 0.6796875, 0.708251953125, 0.73681640625, 0.765380859375, 0.7939453125, 0.822509765625, 0.85107421875, 0.879638671875, 0.908203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 10.0, 10.0, 11.0, 13.0, 17.0, 22.0, 23.0, 48.0, 98.0, 222.0, 628.0, 2842.0, 32289.0, 8343188.0, 7162.0, 1235.0, 369.0, 147.0, 86.0, 42.0, 33.0, 12.0, 11.0, 14.0, 16.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-10.011630058288574, -9.680545806884766, -9.34946060180664, -9.018376350402832, -8.687292098999023, -8.356207847595215, -8.025123596191406, -7.694038391113281, -7.362954139709473, -7.031869888305664, -6.700785160064697, -6.3697004318237305, -6.038616180419922, -5.707531929016113, -5.3764472007751465, -5.04536247253418, -4.714278221130371, -4.3831939697265625, -4.052109241485596, -3.721024751663208, -3.3899402618408203, -3.0588557720184326, -2.727771282196045, -2.3966867923736572, -2.0656023025512695, -1.7345178127288818, -1.4034333229064941, -1.0723488330841064, -0.7412643432617188, -0.41017985343933105, -0.07909536361694336, 0.25198912620544434, 0.5830726623535156, 0.9141571521759033, 1.245241641998291, 1.5763261318206787, 1.9074106216430664, 2.238495111465454, 2.569579601287842, 2.9006640911102295, 3.231748580932617, 3.562833070755005, 3.8939175605773926, 4.225002288818359, 4.556086540222168, 4.887170791625977, 5.218255519866943, 5.54934024810791, 5.880424499511719, 6.211508750915527, 6.542593479156494, 6.873678207397461, 7.2047624588012695, 7.535846710205078, 7.866931438446045, 8.198016166687012, 8.52910041809082, 8.860184669494629, 9.191268920898438, 9.522354125976562, 9.853438377380371, 10.18452262878418, 10.515607833862305, 10.846692085266113, 11.177776336669922]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 6.0, 11.0, 5.0, 4.0, 2.0, 5.0, 4.0, 3.0, 2.0, 6.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.871780395507812, -14.41817569732666, -13.964570999145508, -13.510966300964355, -13.057361602783203, -12.60375690460205, -12.150152206420898, -11.696547508239746, -11.242942810058594, -10.789338111877441, -10.335733413696289, -9.882128715515137, -9.428524017333984, -8.974919319152832, -8.52131462097168, -8.067709922790527, -7.614105224609375, -7.160500526428223, -6.70689582824707, -6.253291130065918, -5.799686431884766, -5.346081733703613, -4.892477035522461, -4.438872337341309, -3.9852676391601562, -3.531662940979004, -3.0780582427978516, -2.624453544616699, -2.170848846435547, -1.7172441482543945, -1.2636394500732422, -0.8100347518920898, -0.3564291000366211, 0.09717559814453125, 0.5507802963256836, 1.004384994506836, 1.4579896926879883, 1.9115943908691406, 2.365199089050293, 2.8188037872314453, 3.2724084854125977, 3.72601318359375, 4.179617881774902, 4.633222579956055, 5.086827278137207, 5.540431976318359, 5.994036674499512, 6.447641372680664, 6.901246070861816, 7.354850769042969, 7.808455467224121, 8.262060165405273, 8.715664863586426, 9.169269561767578, 9.62287425994873, 10.076478958129883, 10.530083656311035, 10.983688354492188, 11.43729305267334, 11.890897750854492, 12.344502449035645, 12.798107147216797, 13.25171184539795, 13.705316543579102, 14.158921241760254]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 10.0, 18.0, 16.0, 21.0, 34.0, 54.0, 71.0, 75.0, 121.0, 153.0, 232.0, 387.0, 679.0, 1330.0, 3075.0, 8772.0, 26407.0, 85508.0, 208518.0, 127887.0, 40188.0, 12588.0, 4308.0, 1657.0, 759.0, 383.0, 265.0, 188.0, 132.0, 101.0, 65.0, 52.0, 40.0, 35.0, 34.0, 26.0, 19.0, 9.0, 13.0, 5.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.4296875, -6.2200927734375, -6.010498046875, -5.8009033203125, -5.59130859375, -5.3817138671875, -5.172119140625, -4.9625244140625, -4.7529296875, -4.5433349609375, -4.333740234375, -4.1241455078125, -3.91455078125, -3.7049560546875, -3.495361328125, -3.2857666015625, -3.076171875, -2.8665771484375, -2.656982421875, -2.4473876953125, -2.23779296875, -2.0281982421875, -1.818603515625, -1.6090087890625, -1.3994140625, -1.1898193359375, -0.980224609375, -0.7706298828125, -0.56103515625, -0.3514404296875, -0.141845703125, 0.0677490234375, 0.27734375, 0.4869384765625, 0.696533203125, 0.9061279296875, 1.11572265625, 1.3253173828125, 1.534912109375, 1.7445068359375, 1.9541015625, 2.1636962890625, 2.373291015625, 2.5828857421875, 2.79248046875, 3.0020751953125, 3.211669921875, 3.4212646484375, 3.630859375, 3.8404541015625, 4.050048828125, 4.2596435546875, 4.46923828125, 4.6788330078125, 4.888427734375, 5.0980224609375, 5.3076171875, 5.5172119140625, 5.726806640625, 5.9364013671875, 6.14599609375, 6.3555908203125, 6.565185546875, 6.7747802734375, 6.984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 14.0, 18.0, 20.0, 28.0, 45.0, 43.0, 64.0, 92.0, 98.0, 105.0, 87.0, 93.0, 60.0, 53.0, 74.0, 30.0, 15.0, 25.0, 7.0, 12.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8467559814453125, -0.807769775390625, -0.7687835693359375, -0.72979736328125, -0.6908111572265625, -0.651824951171875, -0.6128387451171875, -0.5738525390625, -0.5348663330078125, -0.495880126953125, -0.4568939208984375, -0.41790771484375, -0.3789215087890625, -0.339935302734375, -0.3009490966796875, -0.261962890625, -0.2229766845703125, -0.183990478515625, -0.1450042724609375, -0.10601806640625, -0.0670318603515625, -0.028045654296875, 0.0109405517578125, 0.0499267578125, 0.0889129638671875, 0.127899169921875, 0.1668853759765625, 0.20587158203125, 0.2448577880859375, 0.283843994140625, 0.3228302001953125, 0.36181640625, 0.4008026123046875, 0.439788818359375, 0.4787750244140625, 0.51776123046875, 0.5567474365234375, 0.595733642578125, 0.6347198486328125, 0.6737060546875, 0.7126922607421875, 0.751678466796875, 0.7906646728515625, 0.82965087890625, 0.8686370849609375, 0.907623291015625, 0.9466094970703125, 0.985595703125, 1.0245819091796875, 1.063568115234375, 1.1025543212890625, 1.14154052734375, 1.1805267333984375, 1.219512939453125, 1.2584991455078125, 1.2974853515625, 1.3364715576171875, 1.375457763671875, 1.4144439697265625, 1.45343017578125, 1.4924163818359375, 1.531402587890625, 1.5703887939453125, 1.609375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 12.0, 8.0, 24.0, 35.0, 54.0, 77.0, 71.0, 68.0, 59.0, 34.0, 13.0, 15.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.21453857421875, -7.9825663566589355, -7.750594139099121, -7.518621921539307, -7.286649703979492, -7.054677486419678, -6.822705268859863, -6.590733051300049, -6.358760833740234, -6.12678861618042, -5.8948163986206055, -5.662844181060791, -5.430871963500977, -5.198899745941162, -4.966927528381348, -4.734955310821533, -4.502983093261719, -4.271010875701904, -4.03903865814209, -3.8070664405822754, -3.575094223022461, -3.3431220054626465, -3.111149787902832, -2.8791775703430176, -2.647205352783203, -2.4152331352233887, -2.183260917663574, -1.9512887001037598, -1.7193164825439453, -1.4873442649841309, -1.2553720474243164, -1.023399829864502, -0.7914276123046875, -0.559455394744873, -0.3274831771850586, -0.09551095962524414, 0.1364612579345703, 0.36843347549438477, 0.6004056930541992, 0.8323779106140137, 1.0643501281738281, 1.2963223457336426, 1.528294563293457, 1.7602667808532715, 1.992238998413086, 2.2242112159729004, 2.456183433532715, 2.6881556510925293, 2.9201278686523438, 3.152100086212158, 3.3840723037719727, 3.616044521331787, 3.8480167388916016, 4.079988956451416, 4.3119611740112305, 4.543933391571045, 4.775905609130859, 5.007877826690674, 5.239850044250488, 5.471822261810303, 5.703794479370117, 5.935766696929932, 6.167738914489746, 6.3997111320495605, 6.631683349609375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 6.0, 6.0, 4.0, 5.0, 9.0, 23.0, 58.0, 135.0, 120.0, 51.0, 18.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.148806095123291, -5.946475028991699, -5.744144439697266, -5.541813373565674, -5.339482307434082, -5.137151718139648, -4.934820652008057, -4.732489585876465, -4.530158996582031, -4.3278279304504395, -4.125497341156006, -3.923166275024414, -3.7208352088928223, -3.5185043811798096, -3.316173553466797, -3.113842487335205, -2.9115114212036133, -2.7091805934906006, -2.506849527359009, -2.304518699645996, -2.1021876335144043, -1.8998568058013916, -1.697525978088379, -1.4951950311660767, -1.2928640842437744, -1.0905331373214722, -0.8882022500038147, -0.6858713626861572, -0.483540415763855, -0.28120946884155273, -0.07887864112854004, 0.12345230579376221, 0.32578277587890625, 0.5281137228012085, 0.730444610118866, 0.9327754974365234, 1.1351064443588257, 1.337437391281128, 1.5397682189941406, 1.7420991659164429, 1.9444301128387451, 2.146760940551758, 2.3490920066833496, 2.5514228343963623, 2.753753662109375, 2.956084728240967, 3.1584155559539795, 3.360746383666992, 3.563077449798584, 3.7654082775115967, 3.9677393436431885, 4.170070171356201, 4.372401237487793, 4.574731826782227, 4.777062892913818, 4.97939395904541, 5.181724548339844, 5.3840556144714355, 5.586386203765869, 5.788717269897461, 5.991048336029053, 6.1933794021606445, 6.395709991455078, 6.59804105758667, 6.800372123718262]}, "eval/loss": 5.628564834594727, "eval/wer": 1.5293172212631705, "eval/runtime": 963.4096, "eval/samples_per_second": 2.742, "eval/steps_per_second": 0.344, "train/train_runtime": 28486.3453, "train/train_samples_per_second": 5.009, "train/train_steps_per_second": 0.157, "train/total_flos": 0.0, "train/train_loss": 6.089906092074955} \ No newline at end of file