diff --git "a/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" "b/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220322_102142-3iwtcnsp/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 6.169, "train/learning_rate": 2.9295774647887323e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 8917, "_timestamp": 1647953419, "_step": 1500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 9.0, 9.0, 11.0, 15.0, 19.0, 21.0, 28.0, 38.0, 39.0, 52.0, 40.0, 55.0, 46.0, 59.0, 44.0, 60.0, 47.0, 53.0, 44.0, 40.0, 47.0, 38.0, 22.0, 23.0, 25.0, 20.0, 17.0, 12.0, 13.0, 14.0, 8.0, 4.0, 8.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.31623077392578, -72.91283416748047, -70.50942993164062, -68.10603332519531, -65.70263671875, -63.29923629760742, -60.895835876464844, -58.49243927001953, -56.08903884887695, -53.685638427734375, -51.28224182128906, -48.878841400146484, -46.475440979003906, -44.072044372558594, -41.668643951416016, -39.26524353027344, -36.861846923828125, -34.45844650268555, -32.055049896240234, -29.651649475097656, -27.24825096130371, -24.844852447509766, -22.441452026367188, -20.038053512573242, -17.634654998779297, -15.231256484985352, -12.82785701751709, -10.424457550048828, -8.021059036254883, -5.6176605224609375, -3.214261054992676, -0.8108615875244141, 1.5925369262695312, 3.9959359169006348, 6.399334907531738, 8.802734375, 11.206132888793945, 13.60953140258789, 16.01293182373047, 18.416330337524414, 20.81972885131836, 23.223127365112305, 25.62652587890625, 28.029926300048828, 30.433324813842773, 32.83672332763672, 35.2401237487793, 37.643524169921875, 40.04692077636719, 42.450321197509766, 44.85371780395508, 47.257118225097656, 49.66051483154297, 52.06391525268555, 54.467315673828125, 56.87071228027344, 59.274112701416016, 61.677513122558594, 64.0809097290039, 66.48430633544922, 68.88771057128906, 71.29110717773438, 73.69450378417969, 76.09790802001953, 78.50130462646484]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 4.0, 6.0, 7.0, 10.0, 11.0, 19.0, 18.0, 21.0, 20.0, 24.0, 35.0, 21.0, 32.0, 28.0, 42.0, 41.0, 34.0, 38.0, 33.0, 43.0, 43.0, 33.0, 49.0, 35.0, 38.0, 41.0, 26.0, 31.0, 34.0, 30.0, 23.0, 25.0, 16.0, 5.0, 14.0, 8.0, 8.0, 9.0, 8.0, 8.0, 2.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-70.98054504394531, -68.85433197021484, -66.72811889648438, -64.60191345214844, -62.47570037841797, -60.3494873046875, -58.2232780456543, -56.097068786621094, -53.970855712890625, -51.844642639160156, -49.71843338012695, -47.59222412109375, -45.46601104736328, -43.33979797363281, -41.21358871459961, -39.087379455566406, -36.96116638183594, -34.83495330810547, -32.708744049072266, -30.58253288269043, -28.456321716308594, -26.330110549926758, -24.203899383544922, -22.077688217163086, -19.95147705078125, -17.825265884399414, -15.699054718017578, -13.572843551635742, -11.446632385253906, -9.32042121887207, -7.194210052490234, -5.067998886108398, -2.9417877197265625, -0.8155765533447266, 1.3106346130371094, 3.4368457794189453, 5.563056945800781, 7.689268112182617, 9.815479278564453, 11.941690444946289, 14.067901611328125, 16.19411277770996, 18.320323944091797, 20.446535110473633, 22.57274627685547, 24.698957443237305, 26.82516860961914, 28.951379776000977, 31.077590942382812, 33.20380401611328, 35.330013275146484, 37.45622253417969, 39.582435607910156, 41.708648681640625, 43.83485794067383, 45.96106719970703, 48.0872802734375, 50.21349334716797, 52.33970260620117, 54.465911865234375, 56.592124938964844, 58.71833801269531, 60.844547271728516, 62.97075653076172, 65.09696960449219]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 11.0, 21.0, 22.0, 32.0, 61.0, 74.0, 111.0, 170.0, 235.0, 347.0, 544.0, 812.0, 1235.0, 1852.0, 2936.0, 4699.0, 7550.0, 12381.0, 20737.0, 35593.0, 62323.0, 116794.0, 233638.0, 457231.0, 760199.0, 900650.0, 714252.0, 410371.0, 204565.0, 103984.0, 57030.0, 32374.0, 19208.0, 11567.0, 7362.0, 4627.0, 2838.0, 1970.0, 1307.0, 829.0, 578.0, 378.0, 267.0, 181.0, 120.0, 78.0, 50.0, 32.0, 25.0, 7.0, 12.0, 8.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-50.625, -49.013671875, -47.40234375, -45.791015625, -44.1796875, -42.568359375, -40.95703125, -39.345703125, -37.734375, -36.123046875, -34.51171875, -32.900390625, -31.2890625, -29.677734375, -28.06640625, -26.455078125, -24.84375, -23.232421875, -21.62109375, -20.009765625, -18.3984375, -16.787109375, -15.17578125, -13.564453125, -11.953125, -10.341796875, -8.73046875, -7.119140625, -5.5078125, -3.896484375, -2.28515625, -0.673828125, 0.9375, 2.548828125, 4.16015625, 5.771484375, 7.3828125, 8.994140625, 10.60546875, 12.216796875, 13.828125, 15.439453125, 17.05078125, 18.662109375, 20.2734375, 21.884765625, 23.49609375, 25.107421875, 26.71875, 28.330078125, 29.94140625, 31.552734375, 33.1640625, 34.775390625, 36.38671875, 37.998046875, 39.609375, 41.220703125, 42.83203125, 44.443359375, 46.0546875, 47.666015625, 49.27734375, 50.888671875, 52.5]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 10.0, 7.0, 5.0, 7.0, 15.0, 12.0, 22.0, 17.0, 22.0, 28.0, 31.0, 26.0, 36.0, 22.0, 35.0, 38.0, 32.0, 46.0, 44.0, 39.0, 34.0, 39.0, 44.0, 51.0, 39.0, 35.0, 27.0, 28.0, 24.0, 25.0, 28.0, 13.0, 19.0, 10.0, 10.0, 13.0, 12.0, 9.0, 10.0, 8.0, 5.0, 2.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 4.0], "bins": [-48.46875, -47.07861328125, -45.6884765625, -44.29833984375, -42.908203125, -41.51806640625, -40.1279296875, -38.73779296875, -37.34765625, -35.95751953125, -34.5673828125, -33.17724609375, -31.787109375, -30.39697265625, -29.0068359375, -27.61669921875, -26.2265625, -24.83642578125, -23.4462890625, -22.05615234375, -20.666015625, -19.27587890625, -17.8857421875, -16.49560546875, -15.10546875, -13.71533203125, -12.3251953125, -10.93505859375, -9.544921875, -8.15478515625, -6.7646484375, -5.37451171875, -3.984375, -2.59423828125, -1.2041015625, 0.18603515625, 1.576171875, 2.96630859375, 4.3564453125, 5.74658203125, 7.13671875, 8.52685546875, 9.9169921875, 11.30712890625, 12.697265625, 14.08740234375, 15.4775390625, 16.86767578125, 18.2578125, 19.64794921875, 21.0380859375, 22.42822265625, 23.818359375, 25.20849609375, 26.5986328125, 27.98876953125, 29.37890625, 30.76904296875, 32.1591796875, 33.54931640625, 34.939453125, 36.32958984375, 37.7197265625, 39.10986328125, 40.5]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 18.0, 26.0, 57.0, 57.0, 117.0, 179.0, 261.0, 399.0, 648.0, 1013.0, 1450.0, 2147.0, 3262.0, 5037.0, 7592.0, 11320.0, 17636.0, 26513.0, 40841.0, 62307.0, 94929.0, 143500.0, 218067.0, 325364.0, 479356.0, 643684.0, 648074.0, 485396.0, 329809.0, 220582.0, 146055.0, 95567.0, 62778.0, 41024.0, 27097.0, 17538.0, 11528.0, 7852.0, 5070.0, 3463.0, 2253.0, 1487.0, 981.0, 639.0, 503.0, 290.0, 185.0, 142.0, 89.0, 31.0, 33.0, 26.0, 8.0, 6.0, 4.0, 3.0], "bins": [-42.71875, -41.462890625, -40.20703125, -38.951171875, -37.6953125, -36.439453125, -35.18359375, -33.927734375, -32.671875, -31.416015625, -30.16015625, -28.904296875, -27.6484375, -26.392578125, -25.13671875, -23.880859375, -22.625, -21.369140625, -20.11328125, -18.857421875, -17.6015625, -16.345703125, -15.08984375, -13.833984375, -12.578125, -11.322265625, -10.06640625, -8.810546875, -7.5546875, -6.298828125, -5.04296875, -3.787109375, -2.53125, -1.275390625, -0.01953125, 1.236328125, 2.4921875, 3.748046875, 5.00390625, 6.259765625, 7.515625, 8.771484375, 10.02734375, 11.283203125, 12.5390625, 13.794921875, 15.05078125, 16.306640625, 17.5625, 18.818359375, 20.07421875, 21.330078125, 22.5859375, 23.841796875, 25.09765625, 26.353515625, 27.609375, 28.865234375, 30.12109375, 31.376953125, 32.6328125, 33.888671875, 35.14453125, 36.400390625, 37.65625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 5.0, 7.0, 8.0, 3.0, 9.0, 8.0, 27.0, 17.0, 31.0, 22.0, 34.0, 35.0, 49.0, 63.0, 79.0, 88.0, 114.0, 124.0, 145.0, 177.0, 235.0, 255.0, 297.0, 288.0, 286.0, 296.0, 232.0, 200.0, 189.0, 126.0, 113.0, 101.0, 86.0, 68.0, 50.0, 41.0, 43.0, 25.0, 23.0, 20.0, 13.0, 11.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.71875, -20.089111328125, -19.45947265625, -18.829833984375, -18.2001953125, -17.570556640625, -16.94091796875, -16.311279296875, -15.681640625, -15.052001953125, -14.42236328125, -13.792724609375, -13.1630859375, -12.533447265625, -11.90380859375, -11.274169921875, -10.64453125, -10.014892578125, -9.38525390625, -8.755615234375, -8.1259765625, -7.496337890625, -6.86669921875, -6.237060546875, -5.607421875, -4.977783203125, -4.34814453125, -3.718505859375, -3.0888671875, -2.459228515625, -1.82958984375, -1.199951171875, -0.5703125, 0.059326171875, 0.68896484375, 1.318603515625, 1.9482421875, 2.577880859375, 3.20751953125, 3.837158203125, 4.466796875, 5.096435546875, 5.72607421875, 6.355712890625, 6.9853515625, 7.614990234375, 8.24462890625, 8.874267578125, 9.50390625, 10.133544921875, 10.76318359375, 11.392822265625, 12.0224609375, 12.652099609375, 13.28173828125, 13.911376953125, 14.541015625, 15.170654296875, 15.80029296875, 16.429931640625, 17.0595703125, 17.689208984375, 18.31884765625, 18.948486328125, 19.578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 7.0, 6.0, 11.0, 9.0, 17.0, 24.0, 25.0, 26.0, 27.0, 31.0, 35.0, 47.0, 56.0, 41.0, 42.0, 37.0, 50.0, 38.0, 52.0, 54.0, 50.0, 50.0, 42.0, 32.0, 31.0, 23.0, 33.0, 17.0, 13.0, 12.0, 12.0, 10.0, 8.0, 6.0, 9.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.76505661010742, -42.194217681884766, -40.62337875366211, -39.05253982543945, -37.4817008972168, -35.91086196899414, -34.34001922607422, -32.76918029785156, -31.19834327697754, -29.627504348754883, -28.056665420532227, -26.485824584960938, -24.91498565673828, -23.344146728515625, -21.77330780029297, -20.202468872070312, -18.631629943847656, -17.060791015625, -15.489952087402344, -13.919112205505371, -12.348273277282715, -10.777434349060059, -9.206594467163086, -7.63575553894043, -6.064916610717773, -4.494077682495117, -2.9232382774353027, -1.3523988723754883, 0.21844005584716797, 1.7892789840698242, 3.360118865966797, 4.930957794189453, 6.501792907714844, 8.0726318359375, 9.643470764160156, 11.214310646057129, 12.785149574279785, 14.355988502502441, 15.926828384399414, 17.49766731262207, 19.068506240844727, 20.639345169067383, 22.21018409729004, 23.781024932861328, 25.351863861083984, 26.92270278930664, 28.493541717529297, 30.064380645751953, 31.63521957397461, 33.206058502197266, 34.77689743041992, 36.34773635864258, 37.918575286865234, 39.48941421508789, 41.06025695800781, 42.63109588623047, 44.201934814453125, 45.77277374267578, 47.34361267089844, 48.914451599121094, 50.48529052734375, 52.056129455566406, 53.62696838378906, 55.19780731201172, 56.768646240234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 7.0, 4.0, 2.0, 12.0, 10.0, 14.0, 15.0, 14.0, 17.0, 19.0, 28.0, 25.0, 31.0, 34.0, 32.0, 49.0, 51.0, 50.0, 36.0, 35.0, 45.0, 45.0, 43.0, 40.0, 34.0, 32.0, 40.0, 42.0, 38.0, 23.0, 27.0, 28.0, 14.0, 12.0, 13.0, 8.0, 6.0, 6.0, 2.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-56.3577880859375, -54.805931091308594, -53.25407791137695, -51.70222091674805, -50.150367736816406, -48.5985107421875, -47.046653747558594, -45.49479675292969, -43.94294357299805, -42.39108657836914, -40.8392333984375, -39.287376403808594, -37.73551940917969, -36.18366622924805, -34.63180923461914, -33.0799560546875, -31.528099060058594, -29.97624397277832, -28.424388885498047, -26.87253189086914, -25.320676803588867, -23.768821716308594, -22.216964721679688, -20.665109634399414, -19.11325454711914, -17.561399459838867, -16.009544372558594, -14.457687377929688, -12.905832290649414, -11.35397720336914, -9.80212116241455, -8.250265121459961, -6.6984100341796875, -5.146554470062256, -3.594698905944824, -2.0428433418273926, -0.49098777770996094, 1.0608677864074707, 2.6127233505249023, 4.164579391479492, 5.716434478759766, 7.268290042877197, 8.820145606994629, 10.372001647949219, 11.923856735229492, 13.475711822509766, 15.027567863464355, 16.579423904418945, 18.13127899169922, 19.683134078979492, 21.234989166259766, 22.786846160888672, 24.338701248168945, 25.89055633544922, 27.442413330078125, 28.9942684173584, 30.546123504638672, 32.09798049926758, 33.64983367919922, 35.201690673828125, 36.75354766845703, 38.30540084838867, 39.85725784301758, 41.40911102294922, 42.960968017578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 6.0, 6.0, 14.0, 15.0, 19.0, 37.0, 43.0, 82.0, 89.0, 150.0, 219.0, 279.0, 396.0, 587.0, 800.0, 1201.0, 1728.0, 2422.0, 3635.0, 5337.0, 8070.0, 11717.0, 17851.0, 27499.0, 42145.0, 64786.0, 101494.0, 161766.0, 204647.0, 139423.0, 87544.0, 56166.0, 36372.0, 23882.0, 15657.0, 10412.0, 6979.0, 4686.0, 3141.0, 2261.0, 1512.0, 1029.0, 771.0, 527.0, 346.0, 254.0, 159.0, 126.0, 95.0, 61.0, 46.0, 28.0, 17.0, 13.0, 10.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.875, -12.4361572265625, -11.997314453125, -11.5584716796875, -11.11962890625, -10.6807861328125, -10.241943359375, -9.8031005859375, -9.3642578125, -8.9254150390625, -8.486572265625, -8.0477294921875, -7.60888671875, -7.1700439453125, -6.731201171875, -6.2923583984375, -5.853515625, -5.4146728515625, -4.975830078125, -4.5369873046875, -4.09814453125, -3.6593017578125, -3.220458984375, -2.7816162109375, -2.3427734375, -1.9039306640625, -1.465087890625, -1.0262451171875, -0.58740234375, -0.1485595703125, 0.290283203125, 0.7291259765625, 1.16796875, 1.6068115234375, 2.045654296875, 2.4844970703125, 2.92333984375, 3.3621826171875, 3.801025390625, 4.2398681640625, 4.6787109375, 5.1175537109375, 5.556396484375, 5.9952392578125, 6.43408203125, 6.8729248046875, 7.311767578125, 7.7506103515625, 8.189453125, 8.6282958984375, 9.067138671875, 9.5059814453125, 9.94482421875, 10.3836669921875, 10.822509765625, 11.2613525390625, 11.7001953125, 12.1390380859375, 12.577880859375, 13.0167236328125, 13.45556640625, 13.8944091796875, 14.333251953125, 14.7720947265625, 15.2109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 3.0, 5.0, 8.0, 8.0, 14.0, 9.0, 12.0, 11.0, 16.0, 26.0, 35.0, 18.0, 26.0, 49.0, 28.0, 39.0, 37.0, 30.0, 40.0, 42.0, 47.0, 37.0, 41.0, 32.0, 36.0, 39.0, 44.0, 37.0, 31.0, 28.0, 29.0, 20.0, 18.0, 27.0, 14.0, 8.0, 10.0, 9.0, 10.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0], "bins": [-47.375, -45.9765625, -44.578125, -43.1796875, -41.78125, -40.3828125, -38.984375, -37.5859375, -36.1875, -34.7890625, -33.390625, -31.9921875, -30.59375, -29.1953125, -27.796875, -26.3984375, -25.0, -23.6015625, -22.203125, -20.8046875, -19.40625, -18.0078125, -16.609375, -15.2109375, -13.8125, -12.4140625, -11.015625, -9.6171875, -8.21875, -6.8203125, -5.421875, -4.0234375, -2.625, -1.2265625, 0.171875, 1.5703125, 2.96875, 4.3671875, 5.765625, 7.1640625, 8.5625, 9.9609375, 11.359375, 12.7578125, 14.15625, 15.5546875, 16.953125, 18.3515625, 19.75, 21.1484375, 22.546875, 23.9453125, 25.34375, 26.7421875, 28.140625, 29.5390625, 30.9375, 32.3359375, 33.734375, 35.1328125, 36.53125, 37.9296875, 39.328125, 40.7265625, 42.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 13.0, 5.0, 22.0, 24.0, 28.0, 42.0, 71.0, 96.0, 157.0, 229.0, 340.0, 512.0, 803.0, 1260.0, 1827.0, 3040.0, 5206.0, 8331.0, 14128.0, 24135.0, 42999.0, 80122.0, 160577.0, 285147.0, 199519.0, 97655.0, 51306.0, 28735.0, 16631.0, 9890.0, 5842.0, 3563.0, 2220.0, 1419.0, 866.0, 582.0, 383.0, 235.0, 203.0, 136.0, 71.0, 52.0, 36.0, 24.0, 20.0, 12.0, 12.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.546875, -10.213623046875, -9.88037109375, -9.547119140625, -9.2138671875, -8.880615234375, -8.54736328125, -8.214111328125, -7.880859375, -7.547607421875, -7.21435546875, -6.881103515625, -6.5478515625, -6.214599609375, -5.88134765625, -5.548095703125, -5.21484375, -4.881591796875, -4.54833984375, -4.215087890625, -3.8818359375, -3.548583984375, -3.21533203125, -2.882080078125, -2.548828125, -2.215576171875, -1.88232421875, -1.549072265625, -1.2158203125, -0.882568359375, -0.54931640625, -0.216064453125, 0.1171875, 0.450439453125, 0.78369140625, 1.116943359375, 1.4501953125, 1.783447265625, 2.11669921875, 2.449951171875, 2.783203125, 3.116455078125, 3.44970703125, 3.782958984375, 4.1162109375, 4.449462890625, 4.78271484375, 5.115966796875, 5.44921875, 5.782470703125, 6.11572265625, 6.448974609375, 6.7822265625, 7.115478515625, 7.44873046875, 7.781982421875, 8.115234375, 8.448486328125, 8.78173828125, 9.114990234375, 9.4482421875, 9.781494140625, 10.11474609375, 10.447998046875, 10.78125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 6.0, 8.0, 14.0, 8.0, 19.0, 19.0, 27.0, 17.0, 33.0, 24.0, 28.0, 27.0, 31.0, 48.0, 31.0, 29.0, 30.0, 31.0, 43.0, 42.0, 39.0, 35.0, 37.0, 42.0, 25.0, 31.0, 22.0, 33.0, 20.0, 25.0, 27.0, 17.0, 16.0, 23.0, 10.0, 14.0, 14.0, 8.0, 5.0, 5.0, 3.0, 6.0, 5.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.96875, -30.056640625, -29.14453125, -28.232421875, -27.3203125, -26.408203125, -25.49609375, -24.583984375, -23.671875, -22.759765625, -21.84765625, -20.935546875, -20.0234375, -19.111328125, -18.19921875, -17.287109375, -16.375, -15.462890625, -14.55078125, -13.638671875, -12.7265625, -11.814453125, -10.90234375, -9.990234375, -9.078125, -8.166015625, -7.25390625, -6.341796875, -5.4296875, -4.517578125, -3.60546875, -2.693359375, -1.78125, -0.869140625, 0.04296875, 0.955078125, 1.8671875, 2.779296875, 3.69140625, 4.603515625, 5.515625, 6.427734375, 7.33984375, 8.251953125, 9.1640625, 10.076171875, 10.98828125, 11.900390625, 12.8125, 13.724609375, 14.63671875, 15.548828125, 16.4609375, 17.373046875, 18.28515625, 19.197265625, 20.109375, 21.021484375, 21.93359375, 22.845703125, 23.7578125, 24.669921875, 25.58203125, 26.494140625, 27.40625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 11.0, 19.0, 39.0, 48.0, 78.0, 97.0, 188.0, 271.0, 442.0, 698.0, 1014.0, 1591.0, 2639.0, 4110.0, 6676.0, 10869.0, 17702.0, 29504.0, 49901.0, 86776.0, 151075.0, 253556.0, 180731.0, 102937.0, 59112.0, 34479.0, 20681.0, 12530.0, 7654.0, 4867.0, 2977.0, 1942.0, 1200.0, 757.0, 459.0, 326.0, 222.0, 129.0, 79.0, 50.0, 23.0, 31.0, 20.0, 15.0, 10.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.76904296875, -0.7422027587890625, -0.715362548828125, -0.6885223388671875, -0.66168212890625, -0.6348419189453125, -0.608001708984375, -0.5811614990234375, -0.5543212890625, -0.5274810791015625, -0.500640869140625, -0.4738006591796875, -0.44696044921875, -0.4201202392578125, -0.393280029296875, -0.3664398193359375, -0.339599609375, -0.3127593994140625, -0.285919189453125, -0.2590789794921875, -0.23223876953125, -0.2053985595703125, -0.178558349609375, -0.1517181396484375, -0.1248779296875, -0.0980377197265625, -0.071197509765625, -0.0443572998046875, -0.01751708984375, 0.0093231201171875, 0.036163330078125, 0.0630035400390625, 0.08984375, 0.1166839599609375, 0.143524169921875, 0.1703643798828125, 0.19720458984375, 0.2240447998046875, 0.250885009765625, 0.2777252197265625, 0.3045654296875, 0.3314056396484375, 0.358245849609375, 0.3850860595703125, 0.41192626953125, 0.4387664794921875, 0.465606689453125, 0.4924468994140625, 0.519287109375, 0.5461273193359375, 0.572967529296875, 0.5998077392578125, 0.62664794921875, 0.6534881591796875, 0.680328369140625, 0.7071685791015625, 0.7340087890625, 0.7608489990234375, 0.787689208984375, 0.8145294189453125, 0.84136962890625, 0.8682098388671875, 0.895050048828125, 0.9218902587890625, 0.94873046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 10.0, 6.0, 4.0, 7.0, 10.0, 15.0, 13.0, 29.0, 20.0, 28.0, 35.0, 39.0, 48.0, 64.0, 58.0, 83.0, 81.0, 62.0, 55.0, 42.0, 40.0, 36.0, 34.0, 29.0, 17.0, 17.0, 18.0, 20.0, 21.0, 12.0, 5.0, 6.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0002512931823730469, -0.0002432689070701599, -0.00023524463176727295, -0.00022722035646438599, -0.00021919608116149902, -0.00021117180585861206, -0.0002031475305557251, -0.00019512325525283813, -0.00018709897994995117, -0.0001790747046470642, -0.00017105042934417725, -0.00016302615404129028, -0.00015500187873840332, -0.00014697760343551636, -0.0001389533281326294, -0.00013092905282974243, -0.00012290477752685547, -0.0001148805022239685, -0.00010685622692108154, -9.883195161819458e-05, -9.080767631530762e-05, -8.278340101242065e-05, -7.475912570953369e-05, -6.673485040664673e-05, -5.8710575103759766e-05, -5.06862998008728e-05, -4.266202449798584e-05, -3.463774919509888e-05, -2.6613473892211914e-05, -1.858919858932495e-05, -1.0564923286437988e-05, -2.5406479835510254e-06, 5.4836273193359375e-06, 1.35079026222229e-05, 2.1532177925109863e-05, 2.9556453227996826e-05, 3.758072853088379e-05, 4.560500383377075e-05, 5.3629279136657715e-05, 6.165355443954468e-05, 6.967782974243164e-05, 7.77021050453186e-05, 8.572638034820557e-05, 9.375065565109253e-05, 0.00010177493095397949, 0.00010979920625686646, 0.00011782348155975342, 0.00012584775686264038, 0.00013387203216552734, 0.0001418963074684143, 0.00014992058277130127, 0.00015794485807418823, 0.0001659691333770752, 0.00017399340867996216, 0.00018201768398284912, 0.00019004195928573608, 0.00019806623458862305, 0.00020609050989151, 0.00021411478519439697, 0.00022213906049728394, 0.0002301633358001709, 0.00023818761110305786, 0.0002462118864059448, 0.0002542361617088318, 0.00026226043701171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 15.0, 17.0, 17.0, 29.0, 43.0, 62.0, 88.0, 133.0, 160.0, 208.0, 335.0, 523.0, 818.0, 1361.0, 2089.0, 3534.0, 5807.0, 9754.0, 16264.0, 26988.0, 45080.0, 73361.0, 116678.0, 182328.0, 205922.0, 136279.0, 85920.0, 53430.0, 32129.0, 19426.0, 11573.0, 7051.0, 4150.0, 2530.0, 1541.0, 971.0, 612.0, 399.0, 270.0, 185.0, 134.0, 122.0, 61.0, 49.0, 32.0, 31.0, 14.0, 12.0, 12.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.2998046875, -1.2606201171875, -1.221435546875, -1.1822509765625, -1.14306640625, -1.1038818359375, -1.064697265625, -1.0255126953125, -0.986328125, -0.9471435546875, -0.907958984375, -0.8687744140625, -0.82958984375, -0.7904052734375, -0.751220703125, -0.7120361328125, -0.6728515625, -0.6336669921875, -0.594482421875, -0.5552978515625, -0.51611328125, -0.4769287109375, -0.437744140625, -0.3985595703125, -0.359375, -0.3201904296875, -0.281005859375, -0.2418212890625, -0.20263671875, -0.1634521484375, -0.124267578125, -0.0850830078125, -0.0458984375, -0.0067138671875, 0.032470703125, 0.0716552734375, 0.11083984375, 0.1500244140625, 0.189208984375, 0.2283935546875, 0.267578125, 0.3067626953125, 0.345947265625, 0.3851318359375, 0.42431640625, 0.4635009765625, 0.502685546875, 0.5418701171875, 0.5810546875, 0.6202392578125, 0.659423828125, 0.6986083984375, 0.73779296875, 0.7769775390625, 0.816162109375, 0.8553466796875, 0.89453125, 0.9337158203125, 0.972900390625, 1.0120849609375, 1.05126953125, 1.0904541015625, 1.129638671875, 1.1688232421875, 1.2080078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 16.0, 13.0, 17.0, 16.0, 15.0, 21.0, 25.0, 32.0, 21.0, 24.0, 46.0, 41.0, 43.0, 44.0, 42.0, 52.0, 49.0, 52.0, 53.0, 39.0, 52.0, 31.0, 37.0, 29.0, 16.0, 24.0, 19.0, 21.0, 20.0, 16.0, 12.0, 8.0, 5.0, 6.0, 9.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371337890625, -0.3581695556640625, -0.345001220703125, -0.3318328857421875, -0.31866455078125, -0.3054962158203125, -0.292327880859375, -0.2791595458984375, -0.2659912109375, -0.2528228759765625, -0.239654541015625, -0.2264862060546875, -0.21331787109375, -0.2001495361328125, -0.186981201171875, -0.1738128662109375, -0.16064453125, -0.1474761962890625, -0.134307861328125, -0.1211395263671875, -0.10797119140625, -0.0948028564453125, -0.081634521484375, -0.0684661865234375, -0.0552978515625, -0.0421295166015625, -0.028961181640625, -0.0157928466796875, -0.00262451171875, 0.0105438232421875, 0.023712158203125, 0.0368804931640625, 0.050048828125, 0.0632171630859375, 0.076385498046875, 0.0895538330078125, 0.10272216796875, 0.1158905029296875, 0.129058837890625, 0.1422271728515625, 0.1553955078125, 0.1685638427734375, 0.181732177734375, 0.1949005126953125, 0.20806884765625, 0.2212371826171875, 0.234405517578125, 0.2475738525390625, 0.2607421875, 0.2739105224609375, 0.287078857421875, 0.3002471923828125, 0.31341552734375, 0.3265838623046875, 0.339752197265625, 0.3529205322265625, 0.3660888671875, 0.3792572021484375, 0.392425537109375, 0.4055938720703125, 0.41876220703125, 0.4319305419921875, 0.445098876953125, 0.4582672119140625, 0.471435546875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 7.0, 5.0, 9.0, 10.0, 19.0, 22.0, 22.0, 23.0, 26.0, 30.0, 36.0, 34.0, 46.0, 49.0, 40.0, 44.0, 48.0, 45.0, 50.0, 43.0, 58.0, 48.0, 49.0, 29.0, 35.0, 27.0, 26.0, 25.0, 21.0, 15.0, 10.0, 9.0, 8.0, 8.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.78710174560547, -40.31550598144531, -38.843910217285156, -37.372310638427734, -35.90071487426758, -34.42911911010742, -32.957523345947266, -31.485925674438477, -30.014328002929688, -28.54273223876953, -27.071134567260742, -25.599538803100586, -24.127941131591797, -22.65634536743164, -21.184749603271484, -19.713151931762695, -18.24155616760254, -16.769960403442383, -15.298362731933594, -13.826766967773438, -12.355169296264648, -10.883573532104492, -9.41197681427002, -7.940380096435547, -6.468783378601074, -4.997186660766602, -3.525590181350708, -2.0539937019348145, -0.5823969841003418, 0.8891997337341309, 2.3607959747314453, 3.832392692565918, 5.303989410400391, 6.775586128234863, 8.247182846069336, 9.718778610229492, 11.190376281738281, 12.661972045898438, 14.13356876373291, 15.605165481567383, 17.076763153076172, 18.548358917236328, 20.019956588745117, 21.491552352905273, 22.963150024414062, 24.43474578857422, 25.906341552734375, 27.377939224243164, 28.84953498840332, 30.321130752563477, 31.792728424072266, 33.26432418823242, 34.73591995239258, 36.20751953125, 37.679115295410156, 39.15071105957031, 40.62230682373047, 42.093902587890625, 43.56549835205078, 45.0370979309082, 46.50869369506836, 47.980289459228516, 49.45188522338867, 50.923484802246094, 52.39508056640625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 5.0, 1.0, 15.0, 8.0, 14.0, 17.0, 11.0, 17.0, 26.0, 22.0, 34.0, 26.0, 36.0, 35.0, 52.0, 42.0, 50.0, 37.0, 40.0, 43.0, 36.0, 57.0, 30.0, 35.0, 33.0, 40.0, 48.0, 32.0, 27.0, 23.0, 26.0, 11.0, 15.0, 13.0, 5.0, 8.0, 4.0, 3.0, 5.0, 1.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-52.87858581542969, -51.40857696533203, -49.938568115234375, -48.46855926513672, -46.99855041503906, -45.528541564941406, -44.05853271484375, -42.588523864746094, -41.11851501464844, -39.64850616455078, -38.178497314453125, -36.70848846435547, -35.23847961425781, -33.768470764160156, -32.2984619140625, -30.828453063964844, -29.358442306518555, -27.8884334564209, -26.418424606323242, -24.948415756225586, -23.47840690612793, -22.008398056030273, -20.538387298583984, -19.068378448486328, -17.598369598388672, -16.128360748291016, -14.65835189819336, -13.188343048095703, -11.718334197998047, -10.24832534790039, -8.778315544128418, -7.308306694030762, -5.838298797607422, -4.368289947509766, -2.8982808589935303, -1.428271770477295, 0.04173707962036133, 1.5117459297180176, 2.981755256652832, 4.451764106750488, 5.9217729568481445, 7.391781806945801, 8.861790657043457, 10.33180046081543, 11.801809310913086, 13.271818161010742, 14.741827011108398, 16.211835861206055, 17.68184471130371, 19.151853561401367, 20.621862411499023, 22.09187126159668, 23.561880111694336, 25.031888961791992, 26.50189971923828, 27.971908569335938, 29.441917419433594, 30.91192626953125, 32.381935119628906, 33.85194396972656, 35.32195281982422, 36.791961669921875, 38.26197052001953, 39.73197937011719, 41.201988220214844]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 1.0, 6.0, 12.0, 33.0, 27.0, 48.0, 67.0, 145.0, 178.0, 281.0, 485.0, 746.0, 1203.0, 2110.0, 3331.0, 5638.0, 9705.0, 17129.0, 29746.0, 50874.0, 83627.0, 125590.0, 161567.0, 168764.0, 141216.0, 98099.0, 61708.0, 36370.0, 20993.0, 11799.0, 6883.0, 4041.0, 2328.0, 1467.0, 880.0, 499.0, 355.0, 233.0, 128.0, 82.0, 56.0, 39.0, 22.0, 17.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-51.75, -50.1904296875, -48.630859375, -47.0712890625, -45.51171875, -43.9521484375, -42.392578125, -40.8330078125, -39.2734375, -37.7138671875, -36.154296875, -34.5947265625, -33.03515625, -31.4755859375, -29.916015625, -28.3564453125, -26.796875, -25.2373046875, -23.677734375, -22.1181640625, -20.55859375, -18.9990234375, -17.439453125, -15.8798828125, -14.3203125, -12.7607421875, -11.201171875, -9.6416015625, -8.08203125, -6.5224609375, -4.962890625, -3.4033203125, -1.84375, -0.2841796875, 1.275390625, 2.8349609375, 4.39453125, 5.9541015625, 7.513671875, 9.0732421875, 10.6328125, 12.1923828125, 13.751953125, 15.3115234375, 16.87109375, 18.4306640625, 19.990234375, 21.5498046875, 23.109375, 24.6689453125, 26.228515625, 27.7880859375, 29.34765625, 30.9072265625, 32.466796875, 34.0263671875, 35.5859375, 37.1455078125, 38.705078125, 40.2646484375, 41.82421875, 43.3837890625, 44.943359375, 46.5029296875, 48.0625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 6.0, 9.0, 12.0, 9.0, 17.0, 11.0, 16.0, 19.0, 31.0, 22.0, 32.0, 34.0, 35.0, 37.0, 42.0, 47.0, 31.0, 50.0, 45.0, 44.0, 37.0, 46.0, 33.0, 39.0, 44.0, 30.0, 40.0, 35.0, 29.0, 31.0, 19.0, 16.0, 8.0, 10.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-49.5, -48.18212890625, -46.8642578125, -45.54638671875, -44.228515625, -42.91064453125, -41.5927734375, -40.27490234375, -38.95703125, -37.63916015625, -36.3212890625, -35.00341796875, -33.685546875, -32.36767578125, -31.0498046875, -29.73193359375, -28.4140625, -27.09619140625, -25.7783203125, -24.46044921875, -23.142578125, -21.82470703125, -20.5068359375, -19.18896484375, -17.87109375, -16.55322265625, -15.2353515625, -13.91748046875, -12.599609375, -11.28173828125, -9.9638671875, -8.64599609375, -7.328125, -6.01025390625, -4.6923828125, -3.37451171875, -2.056640625, -0.73876953125, 0.5791015625, 1.89697265625, 3.21484375, 4.53271484375, 5.8505859375, 7.16845703125, 8.486328125, 9.80419921875, 11.1220703125, 12.43994140625, 13.7578125, 15.07568359375, 16.3935546875, 17.71142578125, 19.029296875, 20.34716796875, 21.6650390625, 22.98291015625, 24.30078125, 25.61865234375, 26.9365234375, 28.25439453125, 29.572265625, 30.89013671875, 32.2080078125, 33.52587890625, 34.84375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 7.0, 7.0, 11.0, 20.0, 27.0, 52.0, 62.0, 93.0, 199.0, 279.0, 350.0, 556.0, 711.0, 1065.0, 1510.0, 2170.0, 3022.0, 4463.0, 6121.0, 8562.0, 12091.0, 16459.0, 22345.0, 30106.0, 39125.0, 51536.0, 64031.0, 76914.0, 87622.0, 93421.0, 93716.0, 88141.0, 77077.0, 63913.0, 51309.0, 39856.0, 30300.0, 22603.0, 16681.0, 12130.0, 8731.0, 6345.0, 4503.0, 3125.0, 2192.0, 1584.0, 1122.0, 756.0, 507.0, 338.0, 233.0, 168.0, 98.0, 89.0, 38.0, 36.0, 20.0, 9.0, 8.0, 2.0, 1.0, 1.0, 2.0], "bins": [-28.796875, -27.868408203125, -26.93994140625, -26.011474609375, -25.0830078125, -24.154541015625, -23.22607421875, -22.297607421875, -21.369140625, -20.440673828125, -19.51220703125, -18.583740234375, -17.6552734375, -16.726806640625, -15.79833984375, -14.869873046875, -13.94140625, -13.012939453125, -12.08447265625, -11.156005859375, -10.2275390625, -9.299072265625, -8.37060546875, -7.442138671875, -6.513671875, -5.585205078125, -4.65673828125, -3.728271484375, -2.7998046875, -1.871337890625, -0.94287109375, -0.014404296875, 0.9140625, 1.842529296875, 2.77099609375, 3.699462890625, 4.6279296875, 5.556396484375, 6.48486328125, 7.413330078125, 8.341796875, 9.270263671875, 10.19873046875, 11.127197265625, 12.0556640625, 12.984130859375, 13.91259765625, 14.841064453125, 15.76953125, 16.697998046875, 17.62646484375, 18.554931640625, 19.4833984375, 20.411865234375, 21.34033203125, 22.268798828125, 23.197265625, 24.125732421875, 25.05419921875, 25.982666015625, 26.9111328125, 27.839599609375, 28.76806640625, 29.696533203125, 30.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 3.0, 6.0, 11.0, 7.0, 8.0, 19.0, 13.0, 18.0, 20.0, 19.0, 23.0, 25.0, 21.0, 23.0, 33.0, 27.0, 32.0, 30.0, 41.0, 32.0, 36.0, 39.0, 27.0, 26.0, 35.0, 37.0, 29.0, 33.0, 30.0, 37.0, 30.0, 13.0, 20.0, 19.0, 22.0, 16.0, 15.0, 16.0, 14.0, 14.0, 10.0, 14.0, 15.0, 7.0, 9.0, 5.0, 6.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-21.03125, -20.325439453125, -19.61962890625, -18.913818359375, -18.2080078125, -17.502197265625, -16.79638671875, -16.090576171875, -15.384765625, -14.678955078125, -13.97314453125, -13.267333984375, -12.5615234375, -11.855712890625, -11.14990234375, -10.444091796875, -9.73828125, -9.032470703125, -8.32666015625, -7.620849609375, -6.9150390625, -6.209228515625, -5.50341796875, -4.797607421875, -4.091796875, -3.385986328125, -2.68017578125, -1.974365234375, -1.2685546875, -0.562744140625, 0.14306640625, 0.848876953125, 1.5546875, 2.260498046875, 2.96630859375, 3.672119140625, 4.3779296875, 5.083740234375, 5.78955078125, 6.495361328125, 7.201171875, 7.906982421875, 8.61279296875, 9.318603515625, 10.0244140625, 10.730224609375, 11.43603515625, 12.141845703125, 12.84765625, 13.553466796875, 14.25927734375, 14.965087890625, 15.6708984375, 16.376708984375, 17.08251953125, 17.788330078125, 18.494140625, 19.199951171875, 19.90576171875, 20.611572265625, 21.3173828125, 22.023193359375, 22.72900390625, 23.434814453125, 24.140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 10.0, 3.0, 11.0, 12.0, 20.0, 42.0, 33.0, 86.0, 124.0, 179.0, 250.0, 406.0, 570.0, 920.0, 1392.0, 1980.0, 2987.0, 4702.0, 7187.0, 10660.0, 15976.0, 24155.0, 36271.0, 51727.0, 72775.0, 95998.0, 115627.0, 125433.0, 119687.0, 102229.0, 79298.0, 57381.0, 39963.0, 26931.0, 18021.0, 11852.0, 8108.0, 5355.0, 3461.0, 2194.0, 1528.0, 1004.0, 662.0, 452.0, 279.0, 218.0, 161.0, 93.0, 52.0, 40.0, 29.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.21484375, -6.98681640625, -6.7587890625, -6.53076171875, -6.302734375, -6.07470703125, -5.8466796875, -5.61865234375, -5.390625, -5.16259765625, -4.9345703125, -4.70654296875, -4.478515625, -4.25048828125, -4.0224609375, -3.79443359375, -3.56640625, -3.33837890625, -3.1103515625, -2.88232421875, -2.654296875, -2.42626953125, -2.1982421875, -1.97021484375, -1.7421875, -1.51416015625, -1.2861328125, -1.05810546875, -0.830078125, -0.60205078125, -0.3740234375, -0.14599609375, 0.08203125, 0.31005859375, 0.5380859375, 0.76611328125, 0.994140625, 1.22216796875, 1.4501953125, 1.67822265625, 1.90625, 2.13427734375, 2.3623046875, 2.59033203125, 2.818359375, 3.04638671875, 3.2744140625, 3.50244140625, 3.73046875, 3.95849609375, 4.1865234375, 4.41455078125, 4.642578125, 4.87060546875, 5.0986328125, 5.32666015625, 5.5546875, 5.78271484375, 6.0107421875, 6.23876953125, 6.466796875, 6.69482421875, 6.9228515625, 7.15087890625, 7.37890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 11.0, 3.0, 5.0, 12.0, 7.0, 9.0, 10.0, 18.0, 20.0, 23.0, 24.0, 22.0, 27.0, 32.0, 44.0, 31.0, 45.0, 46.0, 40.0, 44.0, 59.0, 55.0, 47.0, 40.0, 43.0, 28.0, 35.0, 26.0, 23.0, 28.0, 19.0, 12.0, 16.0, 21.0, 15.0, 8.0, 8.0, 9.0, 5.0, 9.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006685256958007812, -0.0006450265645980835, -0.0006215274333953857, -0.000598028302192688, -0.0005745291709899902, -0.0005510300397872925, -0.0005275309085845947, -0.000504031777381897, -0.0004805326461791992, -0.00045703351497650146, -0.0004335343837738037, -0.00041003525257110596, -0.0003865361213684082, -0.00036303699016571045, -0.0003395378589630127, -0.00031603872776031494, -0.0002925395965576172, -0.00026904046535491943, -0.0002455413341522217, -0.00022204220294952393, -0.00019854307174682617, -0.00017504394054412842, -0.00015154480934143066, -0.0001280456781387329, -0.00010454654693603516, -8.10474157333374e-05, -5.754828453063965e-05, -3.4049153327941895e-05, -1.055002212524414e-05, 1.2949109077453613e-05, 3.644824028015137e-05, 5.994737148284912e-05, 8.344650268554688e-05, 0.00010694563388824463, 0.00013044476509094238, 0.00015394389629364014, 0.0001774430274963379, 0.00020094215869903564, 0.0002244412899017334, 0.00024794042110443115, 0.0002714395523071289, 0.00029493868350982666, 0.0003184378147125244, 0.00034193694591522217, 0.0003654360771179199, 0.0003889352083206177, 0.00041243433952331543, 0.0004359334707260132, 0.00045943260192871094, 0.0004829317331314087, 0.0005064308643341064, 0.0005299299955368042, 0.000553429126739502, 0.0005769282579421997, 0.0006004273891448975, 0.0006239265203475952, 0.000647425651550293, 0.0006709247827529907, 0.0006944239139556885, 0.0007179230451583862, 0.000741422176361084, 0.0007649213075637817, 0.0007884204387664795, 0.0008119195699691772, 0.000835418701171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 5.0, 5.0, 13.0, 12.0, 24.0, 38.0, 44.0, 67.0, 109.0, 162.0, 228.0, 374.0, 534.0, 823.0, 1270.0, 2102.0, 3312.0, 5503.0, 8907.0, 14634.0, 24363.0, 39060.0, 61832.0, 90645.0, 123907.0, 146160.0, 147265.0, 122911.0, 90659.0, 61566.0, 39039.0, 24544.0, 14940.0, 8777.0, 5515.0, 3410.0, 2097.0, 1287.0, 805.0, 540.0, 358.0, 229.0, 155.0, 109.0, 67.0, 49.0, 42.0, 28.0, 11.0, 15.0, 9.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.9375, -8.658203125, -8.37890625, -8.099609375, -7.8203125, -7.541015625, -7.26171875, -6.982421875, -6.703125, -6.423828125, -6.14453125, -5.865234375, -5.5859375, -5.306640625, -5.02734375, -4.748046875, -4.46875, -4.189453125, -3.91015625, -3.630859375, -3.3515625, -3.072265625, -2.79296875, -2.513671875, -2.234375, -1.955078125, -1.67578125, -1.396484375, -1.1171875, -0.837890625, -0.55859375, -0.279296875, 0.0, 0.279296875, 0.55859375, 0.837890625, 1.1171875, 1.396484375, 1.67578125, 1.955078125, 2.234375, 2.513671875, 2.79296875, 3.072265625, 3.3515625, 3.630859375, 3.91015625, 4.189453125, 4.46875, 4.748046875, 5.02734375, 5.306640625, 5.5859375, 5.865234375, 6.14453125, 6.423828125, 6.703125, 6.982421875, 7.26171875, 7.541015625, 7.8203125, 8.099609375, 8.37890625, 8.658203125, 8.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 3.0, 6.0, 8.0, 14.0, 15.0, 26.0, 22.0, 23.0, 26.0, 31.0, 50.0, 44.0, 68.0, 47.0, 39.0, 62.0, 64.0, 68.0, 45.0, 53.0, 42.0, 43.0, 36.0, 28.0, 22.0, 19.0, 18.0, 17.0, 19.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.359375, -4.2379150390625, -4.116455078125, -3.9949951171875, -3.87353515625, -3.7520751953125, -3.630615234375, -3.5091552734375, -3.3876953125, -3.2662353515625, -3.144775390625, -3.0233154296875, -2.90185546875, -2.7803955078125, -2.658935546875, -2.5374755859375, -2.416015625, -2.2945556640625, -2.173095703125, -2.0516357421875, -1.93017578125, -1.8087158203125, -1.687255859375, -1.5657958984375, -1.4443359375, -1.3228759765625, -1.201416015625, -1.0799560546875, -0.95849609375, -0.8370361328125, -0.715576171875, -0.5941162109375, -0.47265625, -0.3511962890625, -0.229736328125, -0.1082763671875, 0.01318359375, 0.1346435546875, 0.256103515625, 0.3775634765625, 0.4990234375, 0.6204833984375, 0.741943359375, 0.8634033203125, 0.98486328125, 1.1063232421875, 1.227783203125, 1.3492431640625, 1.470703125, 1.5921630859375, 1.713623046875, 1.8350830078125, 1.95654296875, 2.0780029296875, 2.199462890625, 2.3209228515625, 2.4423828125, 2.5638427734375, 2.685302734375, 2.8067626953125, 2.92822265625, 3.0496826171875, 3.171142578125, 3.2926025390625, 3.4140625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 5.0, 3.0, 15.0, 20.0, 17.0, 26.0, 24.0, 33.0, 23.0, 33.0, 42.0, 53.0, 49.0, 61.0, 53.0, 50.0, 63.0, 63.0, 57.0, 45.0, 37.0, 43.0, 26.0, 37.0, 22.0, 16.0, 18.0, 17.0, 13.0, 2.0, 3.0, 9.0, 4.0, 2.0, 0.0, 8.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.36299133300781, -35.89435958862305, -34.42573165893555, -32.95709991455078, -31.48847198486328, -30.019840240478516, -28.551210403442383, -27.08258056640625, -25.613950729370117, -24.145320892333984, -22.67669105529785, -21.20806121826172, -19.739429473876953, -18.270801544189453, -16.802169799804688, -15.333539962768555, -13.864910125732422, -12.396280288696289, -10.927650451660156, -9.459019660949707, -7.990389823913574, -6.521759986877441, -5.053129196166992, -3.5844993591308594, -2.1158695220947266, -0.6472394466400146, 0.8213906288146973, 2.2900209426879883, 3.758650779724121, 5.227280616760254, 6.695911407470703, 8.164541244506836, 9.633174896240234, 11.101804733276367, 12.5704345703125, 14.03906536102295, 15.507695198059082, 16.97632598876953, 18.444955825805664, 19.913585662841797, 21.38221549987793, 22.850845336914062, 24.319475173950195, 25.788105010986328, 27.256736755371094, 28.725364685058594, 30.19399642944336, 31.662626266479492, 33.131256103515625, 34.59988784790039, 36.06851577758789, 37.537147521972656, 39.005775451660156, 40.47440719604492, 41.94303894042969, 43.41166687011719, 44.88029479980469, 46.34892654418945, 47.81755447387695, 49.28618621826172, 50.75481414794922, 52.223445892333984, 53.69207763671875, 55.16070556640625, 56.629337310791016]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 12.0, 4.0, 8.0, 15.0, 10.0, 18.0, 16.0, 14.0, 22.0, 17.0, 26.0, 31.0, 29.0, 27.0, 36.0, 26.0, 39.0, 36.0, 37.0, 37.0, 45.0, 33.0, 43.0, 37.0, 34.0, 37.0, 36.0, 28.0, 34.0, 25.0, 31.0, 32.0, 24.0, 26.0, 15.0, 12.0, 7.0, 10.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 6.0, 1.0, 3.0], "bins": [-47.087921142578125, -45.79851150512695, -44.50910186767578, -43.219688415527344, -41.93027877807617, -40.640869140625, -39.35145950317383, -38.062049865722656, -36.77263641357422, -35.48322677612305, -34.193817138671875, -32.90440368652344, -31.614994049072266, -30.325584411621094, -29.036174774169922, -27.74676513671875, -26.457355499267578, -25.167945861816406, -23.8785343170166, -22.58912467956543, -21.299713134765625, -20.010303497314453, -18.72089385986328, -17.43148422241211, -16.142072677612305, -14.852662086486816, -13.563251495361328, -12.273841857910156, -10.984431266784668, -9.69502067565918, -8.405611038208008, -7.1162004470825195, -5.826786041259766, -4.537375450134277, -3.2479653358459473, -1.958554983139038, -0.6691446304321289, 0.6202659606933594, 1.9096760749816895, 3.1990861892700195, 4.488496780395508, 5.777907371520996, 7.067317485809326, 8.356727600097656, 9.646138191223145, 10.935548782348633, 12.224958419799805, 13.514369010925293, 14.803779602050781, 16.093189239501953, 17.382600784301758, 18.67201042175293, 19.961421966552734, 21.250831604003906, 22.540241241455078, 23.82965087890625, 25.119062423706055, 26.408472061157227, 27.69788360595703, 28.987293243408203, 30.276702880859375, 31.56611442565918, 32.855525970458984, 34.144935607910156, 35.43434524536133]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 12.0, 11.0, 20.0, 26.0, 50.0, 75.0, 113.0, 166.0, 259.0, 397.0, 597.0, 968.0, 1489.0, 2377.0, 3686.0, 5914.0, 9127.0, 14320.0, 22305.0, 35596.0, 55859.0, 87970.0, 137647.0, 214006.0, 320197.0, 451876.0, 562098.0, 591976.0, 521768.0, 394919.0, 270973.0, 177335.0, 113321.0, 72673.0, 45461.0, 29010.0, 18345.0, 11329.0, 7313.0, 4643.0, 2885.0, 1853.0, 1192.0, 780.0, 490.0, 314.0, 197.0, 134.0, 82.0, 65.0, 33.0, 16.0, 8.0, 10.0, 3.0, 1.0, 3.0], "bins": [-31.234375, -30.3232421875, -29.412109375, -28.5009765625, -27.58984375, -26.6787109375, -25.767578125, -24.8564453125, -23.9453125, -23.0341796875, -22.123046875, -21.2119140625, -20.30078125, -19.3896484375, -18.478515625, -17.5673828125, -16.65625, -15.7451171875, -14.833984375, -13.9228515625, -13.01171875, -12.1005859375, -11.189453125, -10.2783203125, -9.3671875, -8.4560546875, -7.544921875, -6.6337890625, -5.72265625, -4.8115234375, -3.900390625, -2.9892578125, -2.078125, -1.1669921875, -0.255859375, 0.6552734375, 1.56640625, 2.4775390625, 3.388671875, 4.2998046875, 5.2109375, 6.1220703125, 7.033203125, 7.9443359375, 8.85546875, 9.7666015625, 10.677734375, 11.5888671875, 12.5, 13.4111328125, 14.322265625, 15.2333984375, 16.14453125, 17.0556640625, 17.966796875, 18.8779296875, 19.7890625, 20.7001953125, 21.611328125, 22.5224609375, 23.43359375, 24.3447265625, 25.255859375, 26.1669921875, 27.078125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 12.0, 16.0, 19.0, 10.0, 12.0, 27.0, 18.0, 25.0, 34.0, 28.0, 30.0, 30.0, 28.0, 30.0, 42.0, 41.0, 47.0, 45.0, 38.0, 44.0, 38.0, 32.0, 27.0, 43.0, 29.0, 38.0, 34.0, 29.0, 34.0, 19.0, 18.0, 13.0, 6.0, 11.0, 7.0, 2.0, 4.0, 7.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-32.84375, -31.942138671875, -31.04052734375, -30.138916015625, -29.2373046875, -28.335693359375, -27.43408203125, -26.532470703125, -25.630859375, -24.729248046875, -23.82763671875, -22.926025390625, -22.0244140625, -21.122802734375, -20.22119140625, -19.319580078125, -18.41796875, -17.516357421875, -16.61474609375, -15.713134765625, -14.8115234375, -13.909912109375, -13.00830078125, -12.106689453125, -11.205078125, -10.303466796875, -9.40185546875, -8.500244140625, -7.5986328125, -6.697021484375, -5.79541015625, -4.893798828125, -3.9921875, -3.090576171875, -2.18896484375, -1.287353515625, -0.3857421875, 0.515869140625, 1.41748046875, 2.319091796875, 3.220703125, 4.122314453125, 5.02392578125, 5.925537109375, 6.8271484375, 7.728759765625, 8.63037109375, 9.531982421875, 10.43359375, 11.335205078125, 12.23681640625, 13.138427734375, 14.0400390625, 14.941650390625, 15.84326171875, 16.744873046875, 17.646484375, 18.548095703125, 19.44970703125, 20.351318359375, 21.2529296875, 22.154541015625, 23.05615234375, 23.957763671875, 24.859375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 10.0, 24.0, 24.0, 33.0, 64.0, 96.0, 158.0, 278.0, 434.0, 750.0, 1243.0, 2108.0, 3534.0, 5844.0, 9964.0, 16807.0, 27848.0, 46526.0, 76122.0, 121388.0, 185891.0, 274957.0, 380561.0, 481305.0, 541954.0, 529412.0, 453440.0, 348278.0, 246499.0, 165672.0, 106216.0, 66234.0, 39918.0, 24221.0, 14603.0, 8956.0, 5145.0, 3130.0, 1820.0, 1085.0, 667.0, 388.0, 289.0, 154.0, 95.0, 58.0, 34.0, 23.0, 12.0, 3.0, 7.0, 3.0, 5.0, 0.0, 2.0], "bins": [-29.921875, -29.0380859375, -28.154296875, -27.2705078125, -26.38671875, -25.5029296875, -24.619140625, -23.7353515625, -22.8515625, -21.9677734375, -21.083984375, -20.2001953125, -19.31640625, -18.4326171875, -17.548828125, -16.6650390625, -15.78125, -14.8974609375, -14.013671875, -13.1298828125, -12.24609375, -11.3623046875, -10.478515625, -9.5947265625, -8.7109375, -7.8271484375, -6.943359375, -6.0595703125, -5.17578125, -4.2919921875, -3.408203125, -2.5244140625, -1.640625, -0.7568359375, 0.126953125, 1.0107421875, 1.89453125, 2.7783203125, 3.662109375, 4.5458984375, 5.4296875, 6.3134765625, 7.197265625, 8.0810546875, 8.96484375, 9.8486328125, 10.732421875, 11.6162109375, 12.5, 13.3837890625, 14.267578125, 15.1513671875, 16.03515625, 16.9189453125, 17.802734375, 18.6865234375, 19.5703125, 20.4541015625, 21.337890625, 22.2216796875, 23.10546875, 23.9892578125, 24.873046875, 25.7568359375, 26.640625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 9.0, 9.0, 17.0, 21.0, 28.0, 41.0, 36.0, 41.0, 48.0, 59.0, 77.0, 101.0, 129.0, 142.0, 147.0, 194.0, 198.0, 235.0, 232.0, 235.0, 238.0, 219.0, 218.0, 235.0, 195.0, 187.0, 160.0, 127.0, 112.0, 93.0, 57.0, 63.0, 40.0, 32.0, 15.0, 23.0, 18.0, 14.0, 11.0, 5.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.4453125, -14.976318359375, -14.50732421875, -14.038330078125, -13.5693359375, -13.100341796875, -12.63134765625, -12.162353515625, -11.693359375, -11.224365234375, -10.75537109375, -10.286376953125, -9.8173828125, -9.348388671875, -8.87939453125, -8.410400390625, -7.94140625, -7.472412109375, -7.00341796875, -6.534423828125, -6.0654296875, -5.596435546875, -5.12744140625, -4.658447265625, -4.189453125, -3.720458984375, -3.25146484375, -2.782470703125, -2.3134765625, -1.844482421875, -1.37548828125, -0.906494140625, -0.4375, 0.031494140625, 0.50048828125, 0.969482421875, 1.4384765625, 1.907470703125, 2.37646484375, 2.845458984375, 3.314453125, 3.783447265625, 4.25244140625, 4.721435546875, 5.1904296875, 5.659423828125, 6.12841796875, 6.597412109375, 7.06640625, 7.535400390625, 8.00439453125, 8.473388671875, 8.9423828125, 9.411376953125, 9.88037109375, 10.349365234375, 10.818359375, 11.287353515625, 11.75634765625, 12.225341796875, 12.6943359375, 13.163330078125, 13.63232421875, 14.101318359375, 14.5703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 6.0, 6.0, 8.0, 17.0, 18.0, 22.0, 17.0, 20.0, 24.0, 26.0, 32.0, 32.0, 44.0, 45.0, 44.0, 39.0, 51.0, 41.0, 52.0, 43.0, 39.0, 48.0, 44.0, 32.0, 24.0, 37.0, 23.0, 22.0, 29.0, 20.0, 17.0, 11.0, 13.0, 9.0, 7.0, 5.0, 9.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.593976974487305, -26.68051528930664, -25.76705551147461, -24.853593826293945, -23.94013214111328, -23.02667236328125, -22.113210678100586, -21.199748992919922, -20.28628921508789, -19.372827529907227, -18.459367752075195, -17.54590606689453, -16.6324462890625, -15.718984603881836, -14.805522918701172, -13.892062187194824, -12.978601455688477, -12.065140724182129, -11.151679992675781, -10.238218307495117, -9.32475757598877, -8.411296844482422, -7.497835636138916, -6.58437442779541, -5.6709136962890625, -4.757452964782715, -3.843991756439209, -2.9305307865142822, -2.0170698165893555, -1.1036090850830078, -0.19014787673950195, 0.7233133316040039, 1.6367759704589844, 2.550236940383911, 3.463697910308838, 4.377159118652344, 5.290619850158691, 6.204080581665039, 7.117541790008545, 8.03100299835205, 8.944463729858398, 9.857924461364746, 10.771385192871094, 11.684846878051758, 12.598307609558105, 13.511768341064453, 14.425230026245117, 15.338690757751465, 16.252151489257812, 17.165613174438477, 18.079072952270508, 18.992534637451172, 19.905994415283203, 20.819456100463867, 21.73291778564453, 22.646377563476562, 23.559839248657227, 24.47330093383789, 25.386760711669922, 26.300222396850586, 27.21368408203125, 28.12714385986328, 29.040605545043945, 29.95406723022461, 30.86752700805664]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 6.0, 3.0, 5.0, 4.0, 4.0, 4.0, 9.0, 12.0, 13.0, 7.0, 15.0, 14.0, 20.0, 22.0, 19.0, 28.0, 30.0, 28.0, 36.0, 33.0, 38.0, 36.0, 33.0, 40.0, 40.0, 30.0, 28.0, 35.0, 46.0, 38.0, 38.0, 34.0, 36.0, 25.0, 29.0, 24.0, 20.0, 22.0, 25.0, 17.0, 11.0, 10.0, 12.0, 4.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.56411361694336, -28.58710289001465, -27.610090255737305, -26.633079528808594, -25.656068801879883, -24.679058074951172, -23.702045440673828, -22.725034713745117, -21.748023986816406, -20.771013259887695, -19.79400062561035, -18.81698989868164, -17.83997917175293, -16.86296844482422, -15.885955810546875, -14.908945083618164, -13.93193244934082, -12.954920768737793, -11.977910041809082, -11.000898361206055, -10.023887634277344, -9.046875953674316, -8.069864273071289, -7.09285306930542, -6.115841865539551, -5.138830661773682, -4.1618194580078125, -3.184807777404785, -2.207796573638916, -1.2307853698730469, -0.25377368927001953, 0.7232375144958496, 1.7002487182617188, 2.677259922027588, 3.654271364212036, 4.631282806396484, 5.6082940101623535, 6.585305213928223, 7.56231689453125, 8.539327621459961, 9.516339302062988, 10.493350982666016, 11.470361709594727, 12.447373390197754, 13.424385070800781, 14.401395797729492, 15.37840747833252, 16.355419158935547, 17.332429885864258, 18.30944061279297, 19.286453247070312, 20.263463973999023, 21.240474700927734, 22.217487335205078, 23.19449806213379, 24.1715087890625, 25.148521423339844, 26.125532150268555, 27.1025447845459, 28.07955551147461, 29.05656623840332, 30.03357696533203, 31.010589599609375, 31.987600326538086, 32.9646110534668]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 1.0, 2.0, 7.0, 22.0, 20.0, 18.0, 28.0, 54.0, 76.0, 107.0, 166.0, 286.0, 551.0, 1013.0, 1826.0, 3599.0, 7074.0, 14465.0, 29432.0, 61891.0, 133749.0, 278654.0, 269686.0, 129696.0, 59537.0, 28412.0, 13862.0, 6715.0, 3468.0, 1839.0, 933.0, 485.0, 332.0, 200.0, 107.0, 59.0, 60.0, 27.0, 24.0, 26.0, 12.0, 12.0, 7.0, 4.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6796875, -12.295166015625, -11.91064453125, -11.526123046875, -11.1416015625, -10.757080078125, -10.37255859375, -9.988037109375, -9.603515625, -9.218994140625, -8.83447265625, -8.449951171875, -8.0654296875, -7.680908203125, -7.29638671875, -6.911865234375, -6.52734375, -6.142822265625, -5.75830078125, -5.373779296875, -4.9892578125, -4.604736328125, -4.22021484375, -3.835693359375, -3.451171875, -3.066650390625, -2.68212890625, -2.297607421875, -1.9130859375, -1.528564453125, -1.14404296875, -0.759521484375, -0.375, 0.009521484375, 0.39404296875, 0.778564453125, 1.1630859375, 1.547607421875, 1.93212890625, 2.316650390625, 2.701171875, 3.085693359375, 3.47021484375, 3.854736328125, 4.2392578125, 4.623779296875, 5.00830078125, 5.392822265625, 5.77734375, 6.161865234375, 6.54638671875, 6.930908203125, 7.3154296875, 7.699951171875, 8.08447265625, 8.468994140625, 8.853515625, 9.238037109375, 9.62255859375, 10.007080078125, 10.3916015625, 10.776123046875, 11.16064453125, 11.545166015625, 11.9296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 3.0, 2.0, 4.0, 9.0, 6.0, 12.0, 8.0, 16.0, 13.0, 20.0, 22.0, 13.0, 22.0, 25.0, 27.0, 26.0, 26.0, 29.0, 31.0, 30.0, 39.0, 41.0, 35.0, 29.0, 26.0, 36.0, 44.0, 23.0, 37.0, 32.0, 24.0, 33.0, 36.0, 26.0, 30.0, 23.0, 19.0, 21.0, 17.0, 15.0, 14.0, 7.0, 11.0, 7.0, 6.0, 3.0, 4.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-28.0, -27.09765625, -26.1953125, -25.29296875, -24.390625, -23.48828125, -22.5859375, -21.68359375, -20.78125, -19.87890625, -18.9765625, -18.07421875, -17.171875, -16.26953125, -15.3671875, -14.46484375, -13.5625, -12.66015625, -11.7578125, -10.85546875, -9.953125, -9.05078125, -8.1484375, -7.24609375, -6.34375, -5.44140625, -4.5390625, -3.63671875, -2.734375, -1.83203125, -0.9296875, -0.02734375, 0.875, 1.77734375, 2.6796875, 3.58203125, 4.484375, 5.38671875, 6.2890625, 7.19140625, 8.09375, 8.99609375, 9.8984375, 10.80078125, 11.703125, 12.60546875, 13.5078125, 14.41015625, 15.3125, 16.21484375, 17.1171875, 18.01953125, 18.921875, 19.82421875, 20.7265625, 21.62890625, 22.53125, 23.43359375, 24.3359375, 25.23828125, 26.140625, 27.04296875, 27.9453125, 28.84765625, 29.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 10.0, 16.0, 15.0, 23.0, 19.0, 38.0, 65.0, 114.0, 134.0, 233.0, 355.0, 536.0, 833.0, 1276.0, 2142.0, 3505.0, 6046.0, 10522.0, 19395.0, 35758.0, 69650.0, 140792.0, 268910.0, 239542.0, 118638.0, 59328.0, 30985.0, 16771.0, 9387.0, 5259.0, 3126.0, 1933.0, 1109.0, 714.0, 442.0, 286.0, 200.0, 143.0, 108.0, 53.0, 34.0, 23.0, 34.0, 15.0, 11.0, 8.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.82421875, -6.61669921875, -6.4091796875, -6.20166015625, -5.994140625, -5.78662109375, -5.5791015625, -5.37158203125, -5.1640625, -4.95654296875, -4.7490234375, -4.54150390625, -4.333984375, -4.12646484375, -3.9189453125, -3.71142578125, -3.50390625, -3.29638671875, -3.0888671875, -2.88134765625, -2.673828125, -2.46630859375, -2.2587890625, -2.05126953125, -1.84375, -1.63623046875, -1.4287109375, -1.22119140625, -1.013671875, -0.80615234375, -0.5986328125, -0.39111328125, -0.18359375, 0.02392578125, 0.2314453125, 0.43896484375, 0.646484375, 0.85400390625, 1.0615234375, 1.26904296875, 1.4765625, 1.68408203125, 1.8916015625, 2.09912109375, 2.306640625, 2.51416015625, 2.7216796875, 2.92919921875, 3.13671875, 3.34423828125, 3.5517578125, 3.75927734375, 3.966796875, 4.17431640625, 4.3818359375, 4.58935546875, 4.796875, 5.00439453125, 5.2119140625, 5.41943359375, 5.626953125, 5.83447265625, 6.0419921875, 6.24951171875, 6.45703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 5.0, 5.0, 8.0, 11.0, 7.0, 23.0, 19.0, 25.0, 27.0, 23.0, 28.0, 24.0, 30.0, 31.0, 42.0, 37.0, 31.0, 43.0, 39.0, 35.0, 40.0, 39.0, 34.0, 37.0, 48.0, 36.0, 41.0, 32.0, 29.0, 25.0, 22.0, 20.0, 14.0, 16.0, 15.0, 14.0, 9.0, 3.0, 6.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.21875, -22.5, -21.78125, -21.0625, -20.34375, -19.625, -18.90625, -18.1875, -17.46875, -16.75, -16.03125, -15.3125, -14.59375, -13.875, -13.15625, -12.4375, -11.71875, -11.0, -10.28125, -9.5625, -8.84375, -8.125, -7.40625, -6.6875, -5.96875, -5.25, -4.53125, -3.8125, -3.09375, -2.375, -1.65625, -0.9375, -0.21875, 0.5, 1.21875, 1.9375, 2.65625, 3.375, 4.09375, 4.8125, 5.53125, 6.25, 6.96875, 7.6875, 8.40625, 9.125, 9.84375, 10.5625, 11.28125, 12.0, 12.71875, 13.4375, 14.15625, 14.875, 15.59375, 16.3125, 17.03125, 17.75, 18.46875, 19.1875, 19.90625, 20.625, 21.34375, 22.0625, 22.78125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 6.0, 10.0, 18.0, 18.0, 32.0, 46.0, 46.0, 72.0, 109.0, 133.0, 231.0, 332.0, 474.0, 628.0, 1018.0, 1522.0, 2225.0, 3332.0, 5182.0, 8014.0, 12608.0, 20778.0, 34866.0, 61106.0, 117162.0, 251753.0, 253020.0, 119066.0, 62004.0, 35120.0, 21069.0, 12760.0, 8147.0, 5194.0, 3472.0, 2201.0, 1513.0, 1004.0, 719.0, 483.0, 311.0, 207.0, 147.0, 121.0, 90.0, 71.0, 34.0, 31.0, 15.0, 11.0, 11.0, 9.0, 2.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.462890625, -0.4474639892578125, -0.432037353515625, -0.4166107177734375, -0.40118408203125, -0.3857574462890625, -0.370330810546875, -0.3549041748046875, -0.3394775390625, -0.3240509033203125, -0.308624267578125, -0.2931976318359375, -0.27777099609375, -0.2623443603515625, -0.246917724609375, -0.2314910888671875, -0.216064453125, -0.2006378173828125, -0.185211181640625, -0.1697845458984375, -0.15435791015625, -0.1389312744140625, -0.123504638671875, -0.1080780029296875, -0.0926513671875, -0.0772247314453125, -0.061798095703125, -0.0463714599609375, -0.03094482421875, -0.0155181884765625, -9.1552734375e-05, 0.0153350830078125, 0.03076171875, 0.0461883544921875, 0.061614990234375, 0.0770416259765625, 0.09246826171875, 0.1078948974609375, 0.123321533203125, 0.1387481689453125, 0.1541748046875, 0.1696014404296875, 0.185028076171875, 0.2004547119140625, 0.21588134765625, 0.2313079833984375, 0.246734619140625, 0.2621612548828125, 0.277587890625, 0.2930145263671875, 0.308441162109375, 0.3238677978515625, 0.33929443359375, 0.3547210693359375, 0.370147705078125, 0.3855743408203125, 0.4010009765625, 0.4164276123046875, 0.431854248046875, 0.4472808837890625, 0.46270751953125, 0.4781341552734375, 0.493560791015625, 0.5089874267578125, 0.5244140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 2.0, 9.0, 9.0, 16.0, 16.0, 19.0, 25.0, 44.0, 36.0, 45.0, 58.0, 71.0, 73.0, 69.0, 76.0, 81.0, 73.0, 45.0, 49.0, 32.0, 28.0, 23.0, 26.0, 12.0, 10.0, 12.0, 12.0, 3.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00014197826385498047, -0.00013800431042909622, -0.00013403035700321198, -0.00013005640357732773, -0.00012608245015144348, -0.00012210849672555923, -0.00011813454329967499, -0.00011416058987379074, -0.0001101866364479065, -0.00010621268302202225, -0.000102238729596138, -9.826477617025375e-05, -9.429082274436951e-05, -9.031686931848526e-05, -8.634291589260101e-05, -8.236896246671677e-05, -7.839500904083252e-05, -7.442105561494827e-05, -7.044710218906403e-05, -6.647314876317978e-05, -6.249919533729553e-05, -5.8525241911411285e-05, -5.455128848552704e-05, -5.057733505964279e-05, -4.6603381633758545e-05, -4.26294282078743e-05, -3.865547478199005e-05, -3.4681521356105804e-05, -3.070756793022156e-05, -2.673361450433731e-05, -2.2759661078453064e-05, -1.8785707652568817e-05, -1.481175422668457e-05, -1.0837800800800323e-05, -6.863847374916077e-06, -2.88989394903183e-06, 1.084059476852417e-06, 5.058012902736664e-06, 9.03196632862091e-06, 1.3005919754505157e-05, 1.6979873180389404e-05, 2.095382660627365e-05, 2.4927780032157898e-05, 2.8901733458042145e-05, 3.287568688392639e-05, 3.684964030981064e-05, 4.0823593735694885e-05, 4.479754716157913e-05, 4.877150058746338e-05, 5.2745454013347626e-05, 5.671940743923187e-05, 6.069336086511612e-05, 6.466731429100037e-05, 6.864126771688461e-05, 7.261522114276886e-05, 7.65891745686531e-05, 8.056312799453735e-05, 8.45370814204216e-05, 8.851103484630585e-05, 9.24849882721901e-05, 9.645894169807434e-05, 0.00010043289512395859, 0.00010440684854984283, 0.00010838080197572708, 0.00011235475540161133]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 1.0, 8.0, 9.0, 15.0, 17.0, 35.0, 58.0, 85.0, 114.0, 160.0, 204.0, 348.0, 513.0, 734.0, 1101.0, 1676.0, 2330.0, 3482.0, 5136.0, 7458.0, 11168.0, 16083.0, 24244.0, 35621.0, 55817.0, 91758.0, 171107.0, 263408.0, 135319.0, 76700.0, 47596.0, 31024.0, 20859.0, 14157.0, 9512.0, 6572.0, 4414.0, 2994.0, 2167.0, 1429.0, 998.0, 740.0, 457.0, 297.0, 216.0, 136.0, 101.0, 67.0, 38.0, 32.0, 19.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2724609375, -1.231842041015625, -1.19122314453125, -1.150604248046875, -1.1099853515625, -1.069366455078125, -1.02874755859375, -0.988128662109375, -0.947509765625, -0.906890869140625, -0.86627197265625, -0.825653076171875, -0.7850341796875, -0.744415283203125, -0.70379638671875, -0.663177490234375, -0.62255859375, -0.581939697265625, -0.54132080078125, -0.500701904296875, -0.4600830078125, -0.419464111328125, -0.37884521484375, -0.338226318359375, -0.297607421875, -0.256988525390625, -0.21636962890625, -0.175750732421875, -0.1351318359375, -0.094512939453125, -0.05389404296875, -0.013275146484375, 0.02734375, 0.067962646484375, 0.10858154296875, 0.149200439453125, 0.1898193359375, 0.230438232421875, 0.27105712890625, 0.311676025390625, 0.352294921875, 0.392913818359375, 0.43353271484375, 0.474151611328125, 0.5147705078125, 0.555389404296875, 0.59600830078125, 0.636627197265625, 0.67724609375, 0.717864990234375, 0.75848388671875, 0.799102783203125, 0.8397216796875, 0.880340576171875, 0.92095947265625, 0.961578369140625, 1.002197265625, 1.042816162109375, 1.08343505859375, 1.124053955078125, 1.1646728515625, 1.205291748046875, 1.24591064453125, 1.286529541015625, 1.3271484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 7.0, 13.0, 15.0, 11.0, 13.0, 15.0, 21.0, 23.0, 16.0, 27.0, 25.0, 28.0, 30.0, 36.0, 54.0, 57.0, 53.0, 70.0, 65.0, 47.0, 52.0, 47.0, 26.0, 22.0, 26.0, 26.0, 31.0, 17.0, 26.0, 18.0, 14.0, 13.0, 8.0, 9.0, 6.0, 5.0, 1.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.51611328125, -0.5005073547363281, -0.48490142822265625, -0.4692955017089844, -0.4536895751953125, -0.4380836486816406, -0.42247772216796875, -0.4068717956542969, -0.391265869140625, -0.3756599426269531, -0.36005401611328125, -0.3444480895996094, -0.3288421630859375, -0.3132362365722656, -0.29763031005859375, -0.2820243835449219, -0.26641845703125, -0.2508125305175781, -0.23520660400390625, -0.21960067749023438, -0.2039947509765625, -0.18838882446289062, -0.17278289794921875, -0.15717697143554688, -0.141571044921875, -0.12596511840820312, -0.11035919189453125, -0.09475326538085938, -0.0791473388671875, -0.06354141235351562, -0.04793548583984375, -0.032329559326171875, -0.0167236328125, -0.001117706298828125, 0.01448822021484375, 0.030094146728515625, 0.0457000732421875, 0.061305999755859375, 0.07691192626953125, 0.09251785278320312, 0.108123779296875, 0.12372970581054688, 0.13933563232421875, 0.15494155883789062, 0.1705474853515625, 0.18615341186523438, 0.20175933837890625, 0.21736526489257812, 0.23297119140625, 0.24857711791992188, 0.26418304443359375, 0.2797889709472656, 0.2953948974609375, 0.3110008239746094, 0.32660675048828125, 0.3422126770019531, 0.357818603515625, 0.3734245300292969, 0.38903045654296875, 0.4046363830566406, 0.4202423095703125, 0.4358482360839844, 0.45145416259765625, 0.4670600891113281, 0.482666015625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 10.0, 17.0, 12.0, 26.0, 22.0, 23.0, 18.0, 36.0, 23.0, 33.0, 47.0, 42.0, 35.0, 43.0, 51.0, 46.0, 49.0, 43.0, 37.0, 43.0, 40.0, 37.0, 26.0, 30.0, 28.0, 20.0, 27.0, 22.0, 23.0, 11.0, 5.0, 7.0, 10.0, 4.0, 9.0, 5.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.90628433227539, -25.035118103027344, -24.16395378112793, -23.292787551879883, -22.421621322631836, -21.550457000732422, -20.679290771484375, -19.808124542236328, -18.93695831298828, -18.065792083740234, -17.19462776184082, -16.323461532592773, -15.452295303344727, -14.581130027770996, -13.709964752197266, -12.838798522949219, -11.967634201049805, -11.096468925476074, -10.225302696228027, -9.354137420654297, -8.48297119140625, -7.6118059158325195, -6.740640640258789, -5.8694748878479, -4.998309135437012, -4.127143383026123, -3.2559778690338135, -2.384812355041504, -1.5136466026306152, -0.6424808502197266, 0.2286844253540039, 1.0998501777648926, 1.971017837524414, 2.8421835899353027, 3.7133491039276123, 4.584514617919922, 5.4556803703308105, 6.326846122741699, 7.19801139831543, 8.069177627563477, 8.940342903137207, 9.811508178710938, 10.682674407958984, 11.553839683532715, 12.425004959106445, 13.296171188354492, 14.167336463928223, 15.038501739501953, 15.90966796875, 16.780834197998047, 17.65199851989746, 18.523164749145508, 19.394330978393555, 20.26549530029297, 21.136661529541016, 22.007827758789062, 22.87899398803711, 23.750160217285156, 24.62132453918457, 25.492490768432617, 26.363656997680664, 27.234821319580078, 28.105987548828125, 28.977153778076172, 29.848318099975586]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 3.0, 5.0, 6.0, 6.0, 14.0, 13.0, 9.0, 10.0, 21.0, 18.0, 21.0, 24.0, 26.0, 29.0, 25.0, 37.0, 34.0, 40.0, 35.0, 36.0, 39.0, 38.0, 30.0, 27.0, 35.0, 41.0, 45.0, 36.0, 35.0, 35.0, 27.0, 26.0, 24.0, 25.0, 20.0, 24.0, 12.0, 14.0, 8.0, 12.0, 4.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.470666885375977, -27.520793914794922, -26.570919036865234, -25.621044158935547, -24.671171188354492, -23.721298217773438, -22.77142333984375, -21.821548461914062, -20.871675491333008, -19.921802520751953, -18.971927642822266, -18.022052764892578, -17.072179794311523, -16.12230682373047, -15.172431945800781, -14.22255802154541, -13.272684097290039, -12.322810173034668, -11.372936248779297, -10.423062324523926, -9.473188400268555, -8.523314476013184, -7.5734405517578125, -6.623566627502441, -5.67369270324707, -4.723818778991699, -3.773944854736328, -2.824070930480957, -1.874197006225586, -0.9243230819702148, 0.02555084228515625, 0.9754247665405273, 1.9252967834472656, 2.8751707077026367, 3.825044631958008, 4.774918556213379, 5.72479248046875, 6.674666404724121, 7.624540328979492, 8.574414253234863, 9.524288177490234, 10.474162101745605, 11.424036026000977, 12.373909950256348, 13.323783874511719, 14.27365779876709, 15.223531723022461, 16.173404693603516, 17.123279571533203, 18.07315444946289, 19.023027420043945, 19.972900390625, 20.922775268554688, 21.872650146484375, 22.82252311706543, 23.772396087646484, 24.722270965576172, 25.67214584350586, 26.622018814086914, 27.57189178466797, 28.521766662597656, 29.471641540527344, 30.4215145111084, 31.371387481689453, 32.32126235961914]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 12.0, 20.0, 38.0, 42.0, 63.0, 96.0, 146.0, 259.0, 381.0, 555.0, 795.0, 1237.0, 1782.0, 2662.0, 3974.0, 6019.0, 8945.0, 13053.0, 19244.0, 27619.0, 38187.0, 52174.0, 67736.0, 83866.0, 96931.0, 104767.0, 104382.0, 95323.0, 81337.0, 66056.0, 50535.0, 37175.0, 26384.0, 18458.0, 12505.0, 8697.0, 5655.0, 3793.0, 2482.0, 1670.0, 1101.0, 775.0, 554.0, 320.0, 265.0, 174.0, 117.0, 62.0, 35.0, 35.0, 22.0, 17.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0], "bins": [-21.46875, -20.796630859375, -20.12451171875, -19.452392578125, -18.7802734375, -18.108154296875, -17.43603515625, -16.763916015625, -16.091796875, -15.419677734375, -14.74755859375, -14.075439453125, -13.4033203125, -12.731201171875, -12.05908203125, -11.386962890625, -10.71484375, -10.042724609375, -9.37060546875, -8.698486328125, -8.0263671875, -7.354248046875, -6.68212890625, -6.010009765625, -5.337890625, -4.665771484375, -3.99365234375, -3.321533203125, -2.6494140625, -1.977294921875, -1.30517578125, -0.633056640625, 0.0390625, 0.711181640625, 1.38330078125, 2.055419921875, 2.7275390625, 3.399658203125, 4.07177734375, 4.743896484375, 5.416015625, 6.088134765625, 6.76025390625, 7.432373046875, 8.1044921875, 8.776611328125, 9.44873046875, 10.120849609375, 10.79296875, 11.465087890625, 12.13720703125, 12.809326171875, 13.4814453125, 14.153564453125, 14.82568359375, 15.497802734375, 16.169921875, 16.842041015625, 17.51416015625, 18.186279296875, 18.8583984375, 19.530517578125, 20.20263671875, 20.874755859375, 21.546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 9.0, 9.0, 8.0, 11.0, 11.0, 12.0, 16.0, 20.0, 21.0, 22.0, 17.0, 22.0, 29.0, 29.0, 44.0, 28.0, 50.0, 31.0, 37.0, 43.0, 28.0, 45.0, 39.0, 43.0, 39.0, 37.0, 41.0, 40.0, 26.0, 15.0, 30.0, 24.0, 20.0, 21.0, 14.0, 8.0, 8.0, 11.0, 8.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.15625, -28.2197265625, -27.283203125, -26.3466796875, -25.41015625, -24.4736328125, -23.537109375, -22.6005859375, -21.6640625, -20.7275390625, -19.791015625, -18.8544921875, -17.91796875, -16.9814453125, -16.044921875, -15.1083984375, -14.171875, -13.2353515625, -12.298828125, -11.3623046875, -10.42578125, -9.4892578125, -8.552734375, -7.6162109375, -6.6796875, -5.7431640625, -4.806640625, -3.8701171875, -2.93359375, -1.9970703125, -1.060546875, -0.1240234375, 0.8125, 1.7490234375, 2.685546875, 3.6220703125, 4.55859375, 5.4951171875, 6.431640625, 7.3681640625, 8.3046875, 9.2412109375, 10.177734375, 11.1142578125, 12.05078125, 12.9873046875, 13.923828125, 14.8603515625, 15.796875, 16.7333984375, 17.669921875, 18.6064453125, 19.54296875, 20.4794921875, 21.416015625, 22.3525390625, 23.2890625, 24.2255859375, 25.162109375, 26.0986328125, 27.03515625, 27.9716796875, 28.908203125, 29.8447265625, 30.78125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 3.0, 5.0, 16.0, 29.0, 25.0, 56.0, 66.0, 102.0, 181.0, 244.0, 378.0, 519.0, 793.0, 1103.0, 1692.0, 2434.0, 3611.0, 5145.0, 7866.0, 11854.0, 17179.0, 24898.0, 34919.0, 48458.0, 64006.0, 81250.0, 96224.0, 105333.0, 106554.0, 99182.0, 85711.0, 69676.0, 52603.0, 39066.0, 27525.0, 19068.0, 12983.0, 8819.0, 6209.0, 4083.0, 2829.0, 1890.0, 1320.0, 824.0, 576.0, 401.0, 305.0, 171.0, 140.0, 83.0, 52.0, 40.0, 31.0, 9.0, 8.0, 10.0, 7.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.796875, -21.09716796875, -20.3974609375, -19.69775390625, -18.998046875, -18.29833984375, -17.5986328125, -16.89892578125, -16.19921875, -15.49951171875, -14.7998046875, -14.10009765625, -13.400390625, -12.70068359375, -12.0009765625, -11.30126953125, -10.6015625, -9.90185546875, -9.2021484375, -8.50244140625, -7.802734375, -7.10302734375, -6.4033203125, -5.70361328125, -5.00390625, -4.30419921875, -3.6044921875, -2.90478515625, -2.205078125, -1.50537109375, -0.8056640625, -0.10595703125, 0.59375, 1.29345703125, 1.9931640625, 2.69287109375, 3.392578125, 4.09228515625, 4.7919921875, 5.49169921875, 6.19140625, 6.89111328125, 7.5908203125, 8.29052734375, 8.990234375, 9.68994140625, 10.3896484375, 11.08935546875, 11.7890625, 12.48876953125, 13.1884765625, 13.88818359375, 14.587890625, 15.28759765625, 15.9873046875, 16.68701171875, 17.38671875, 18.08642578125, 18.7861328125, 19.48583984375, 20.185546875, 20.88525390625, 21.5849609375, 22.28466796875, 22.984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 6.0, 9.0, 5.0, 10.0, 16.0, 13.0, 13.0, 4.0, 17.0, 32.0, 31.0, 24.0, 30.0, 36.0, 39.0, 44.0, 45.0, 46.0, 30.0, 52.0, 47.0, 45.0, 51.0, 29.0, 42.0, 28.0, 33.0, 29.0, 29.0, 27.0, 16.0, 23.0, 17.0, 21.0, 16.0, 9.0, 4.0, 5.0, 7.0, 4.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.898193359375, -20.24951171875, -19.600830078125, -18.9521484375, -18.303466796875, -17.65478515625, -17.006103515625, -16.357421875, -15.708740234375, -15.06005859375, -14.411376953125, -13.7626953125, -13.114013671875, -12.46533203125, -11.816650390625, -11.16796875, -10.519287109375, -9.87060546875, -9.221923828125, -8.5732421875, -7.924560546875, -7.27587890625, -6.627197265625, -5.978515625, -5.329833984375, -4.68115234375, -4.032470703125, -3.3837890625, -2.735107421875, -2.08642578125, -1.437744140625, -0.7890625, -0.140380859375, 0.50830078125, 1.156982421875, 1.8056640625, 2.454345703125, 3.10302734375, 3.751708984375, 4.400390625, 5.049072265625, 5.69775390625, 6.346435546875, 6.9951171875, 7.643798828125, 8.29248046875, 8.941162109375, 9.58984375, 10.238525390625, 10.88720703125, 11.535888671875, 12.1845703125, 12.833251953125, 13.48193359375, 14.130615234375, 14.779296875, 15.427978515625, 16.07666015625, 16.725341796875, 17.3740234375, 18.022705078125, 18.67138671875, 19.320068359375, 19.96875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 7.0, 2.0, 6.0, 12.0, 24.0, 21.0, 42.0, 53.0, 90.0, 137.0, 203.0, 345.0, 554.0, 939.0, 1557.0, 2606.0, 4454.0, 7528.0, 12881.0, 22176.0, 37748.0, 60214.0, 92277.0, 127205.0, 151798.0, 151716.0, 128526.0, 92858.0, 60950.0, 37469.0, 22349.0, 13016.0, 7539.0, 4506.0, 2620.0, 1624.0, 944.0, 604.0, 307.0, 234.0, 143.0, 87.0, 74.0, 32.0, 22.0, 17.0, 13.0, 12.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0], "bins": [-8.25, -8.00006103515625, -7.7501220703125, -7.50018310546875, -7.250244140625, -7.00030517578125, -6.7503662109375, -6.50042724609375, -6.25048828125, -6.00054931640625, -5.7506103515625, -5.50067138671875, -5.250732421875, -5.00079345703125, -4.7508544921875, -4.50091552734375, -4.2509765625, -4.00103759765625, -3.7510986328125, -3.50115966796875, -3.251220703125, -3.00128173828125, -2.7513427734375, -2.50140380859375, -2.25146484375, -2.00152587890625, -1.7515869140625, -1.50164794921875, -1.251708984375, -1.00177001953125, -0.7518310546875, -0.50189208984375, -0.251953125, -0.00201416015625, 0.2479248046875, 0.49786376953125, 0.747802734375, 0.99774169921875, 1.2476806640625, 1.49761962890625, 1.74755859375, 1.99749755859375, 2.2474365234375, 2.49737548828125, 2.747314453125, 2.99725341796875, 3.2471923828125, 3.49713134765625, 3.7470703125, 3.99700927734375, 4.2469482421875, 4.49688720703125, 4.746826171875, 4.99676513671875, 5.2467041015625, 5.49664306640625, 5.74658203125, 5.99652099609375, 6.2464599609375, 6.49639892578125, 6.746337890625, 6.99627685546875, 7.2462158203125, 7.49615478515625, 7.74609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 5.0, 11.0, 4.0, 9.0, 13.0, 11.0, 21.0, 24.0, 36.0, 27.0, 27.0, 53.0, 51.0, 43.0, 55.0, 53.0, 51.0, 70.0, 56.0, 54.0, 41.0, 33.0, 46.0, 31.0, 39.0, 25.0, 24.0, 14.0, 23.0, 14.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005884170532226562, -0.0005662664771080017, -0.0005441159009933472, -0.0005219653248786926, -0.0004998147487640381, -0.00047766417264938354, -0.000455513596534729, -0.00043336302042007446, -0.0004112124443054199, -0.0003890618681907654, -0.00036691129207611084, -0.0003447607159614563, -0.00032261013984680176, -0.0003004595637321472, -0.0002783089876174927, -0.00025615841150283813, -0.0002340078353881836, -0.00021185725927352905, -0.0001897066831588745, -0.00016755610704421997, -0.00014540553092956543, -0.0001232549548149109, -0.00010110437870025635, -7.89538025856018e-05, -5.6803226470947266e-05, -3.4652650356292725e-05, -1.2502074241638184e-05, 9.648501873016357e-06, 3.17990779876709e-05, 5.394965410232544e-05, 7.610023021697998e-05, 9.825080633163452e-05, 0.00012040138244628906, 0.0001425519585609436, 0.00016470253467559814, 0.00018685311079025269, 0.00020900368690490723, 0.00023115426301956177, 0.0002533048391342163, 0.00027545541524887085, 0.0002976059913635254, 0.00031975656747817993, 0.00034190714359283447, 0.000364057719707489, 0.00038620829582214355, 0.0004083588719367981, 0.00043050944805145264, 0.0004526600241661072, 0.0004748106002807617, 0.0004969611763954163, 0.0005191117525100708, 0.0005412623286247253, 0.0005634129047393799, 0.0005855634808540344, 0.000607714056968689, 0.0006298646330833435, 0.000652015209197998, 0.0006741657853126526, 0.0006963163614273071, 0.0007184669375419617, 0.0007406175136566162, 0.0007627680897712708, 0.0007849186658859253, 0.0008070692420005798, 0.0008292198181152344]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 5.0, 10.0, 10.0, 15.0, 27.0, 42.0, 67.0, 103.0, 168.0, 241.0, 325.0, 560.0, 808.0, 1154.0, 1875.0, 3002.0, 4603.0, 7311.0, 11407.0, 18161.0, 28649.0, 43960.0, 64883.0, 90803.0, 116568.0, 132763.0, 133412.0, 115574.0, 89016.0, 63186.0, 42836.0, 27831.0, 17953.0, 11320.0, 7100.0, 4563.0, 2990.0, 1840.0, 1226.0, 742.0, 488.0, 341.0, 223.0, 122.0, 86.0, 70.0, 47.0, 25.0, 14.0, 14.0, 9.0, 5.0, 4.0, 4.0, 0.0, 3.0], "bins": [-7.6328125, -7.40814208984375, -7.1834716796875, -6.95880126953125, -6.734130859375, -6.50946044921875, -6.2847900390625, -6.06011962890625, -5.83544921875, -5.61077880859375, -5.3861083984375, -5.16143798828125, -4.936767578125, -4.71209716796875, -4.4874267578125, -4.26275634765625, -4.0380859375, -3.81341552734375, -3.5887451171875, -3.36407470703125, -3.139404296875, -2.91473388671875, -2.6900634765625, -2.46539306640625, -2.24072265625, -2.01605224609375, -1.7913818359375, -1.56671142578125, -1.342041015625, -1.11737060546875, -0.8927001953125, -0.66802978515625, -0.443359375, -0.21868896484375, 0.0059814453125, 0.23065185546875, 0.455322265625, 0.67999267578125, 0.9046630859375, 1.12933349609375, 1.35400390625, 1.57867431640625, 1.8033447265625, 2.02801513671875, 2.252685546875, 2.47735595703125, 2.7020263671875, 2.92669677734375, 3.1513671875, 3.37603759765625, 3.6007080078125, 3.82537841796875, 4.050048828125, 4.27471923828125, 4.4993896484375, 4.72406005859375, 4.94873046875, 5.17340087890625, 5.3980712890625, 5.62274169921875, 5.847412109375, 6.07208251953125, 6.2967529296875, 6.52142333984375, 6.74609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 7.0, 11.0, 4.0, 12.0, 6.0, 20.0, 14.0, 15.0, 38.0, 38.0, 39.0, 47.0, 60.0, 55.0, 56.0, 51.0, 64.0, 59.0, 52.0, 49.0, 47.0, 52.0, 37.0, 29.0, 19.0, 19.0, 23.0, 17.0, 11.0, 11.0, 7.0, 3.0, 5.0, 4.0, 5.0, 6.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96484375, -2.84429931640625, -2.7237548828125, -2.60321044921875, -2.482666015625, -2.36212158203125, -2.2415771484375, -2.12103271484375, -2.00048828125, -1.87994384765625, -1.7593994140625, -1.63885498046875, -1.518310546875, -1.39776611328125, -1.2772216796875, -1.15667724609375, -1.0361328125, -0.91558837890625, -0.7950439453125, -0.67449951171875, -0.553955078125, -0.43341064453125, -0.3128662109375, -0.19232177734375, -0.07177734375, 0.04876708984375, 0.1693115234375, 0.28985595703125, 0.410400390625, 0.53094482421875, 0.6514892578125, 0.77203369140625, 0.892578125, 1.01312255859375, 1.1336669921875, 1.25421142578125, 1.374755859375, 1.49530029296875, 1.6158447265625, 1.73638916015625, 1.85693359375, 1.97747802734375, 2.0980224609375, 2.21856689453125, 2.339111328125, 2.45965576171875, 2.5802001953125, 2.70074462890625, 2.8212890625, 2.94183349609375, 3.0623779296875, 3.18292236328125, 3.303466796875, 3.42401123046875, 3.5445556640625, 3.66510009765625, 3.78564453125, 3.90618896484375, 4.0267333984375, 4.14727783203125, 4.267822265625, 4.38836669921875, 4.5089111328125, 4.62945556640625, 4.75]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 3.0, 9.0, 11.0, 18.0, 11.0, 8.0, 20.0, 19.0, 29.0, 37.0, 29.0, 40.0, 30.0, 46.0, 46.0, 45.0, 66.0, 49.0, 49.0, 49.0, 52.0, 58.0, 22.0, 42.0, 31.0, 36.0, 20.0, 28.0, 14.0, 19.0, 15.0, 10.0, 12.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.106853485107422, -26.15304183959961, -25.199230194091797, -24.245418548583984, -23.291606903076172, -22.33779525756836, -21.38398551940918, -20.430173873901367, -19.476362228393555, -18.522550582885742, -17.56873893737793, -16.614927291870117, -15.661116600036621, -14.707304954528809, -13.753494262695312, -12.7996826171875, -11.845870971679688, -10.892059326171875, -9.938247680664062, -8.984436988830566, -8.030625343322754, -7.076813697814941, -6.123002529144287, -5.169191360473633, -4.21537971496582, -3.261568307876587, -2.3077569007873535, -1.3539454936981201, -0.4001340866088867, 0.5536775588989258, 1.50748872756958, 2.4612998962402344, 3.415111541748047, 4.368923187255859, 5.322734355926514, 6.276545524597168, 7.2303571701049805, 8.184168815612793, 9.137979507446289, 10.091791152954102, 11.045602798461914, 11.999414443969727, 12.953226089477539, 13.907036781311035, 14.860848426818848, 15.81466007232666, 16.768470764160156, 17.72228240966797, 18.67609405517578, 19.629905700683594, 20.583717346191406, 21.53752899169922, 22.49134063720703, 23.445152282714844, 24.398962020874023, 25.352773666381836, 26.30658531188965, 27.26039695739746, 28.214208602905273, 29.168020248413086, 30.121829986572266, 31.075641632080078, 32.02945327758789, 32.9832649230957, 33.937076568603516]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 16.0, 6.0, 11.0, 9.0, 17.0, 22.0, 18.0, 23.0, 16.0, 32.0, 23.0, 46.0, 36.0, 37.0, 32.0, 36.0, 40.0, 31.0, 42.0, 53.0, 49.0, 53.0, 32.0, 27.0, 32.0, 35.0, 34.0, 27.0, 24.0, 14.0, 29.0, 9.0, 13.0, 16.0, 12.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.512569427490234, -32.47273254394531, -31.43289566040039, -30.39305877685547, -29.353221893310547, -28.313385009765625, -27.273550033569336, -26.233713150024414, -25.193876266479492, -24.15403938293457, -23.11420249938965, -22.074365615844727, -21.034530639648438, -19.994693756103516, -18.954856872558594, -17.915019989013672, -16.87518310546875, -15.835346221923828, -14.795509338378906, -13.7556734085083, -12.715836524963379, -11.675999641418457, -10.636163711547852, -9.59632682800293, -8.556489944458008, -7.516653060913086, -6.476816654205322, -5.436980247497559, -4.397143363952637, -3.357306480407715, -2.317470073699951, -1.2776336669921875, -0.23780059814453125, 0.8020360469818115, 1.8418726921081543, 2.881709337234497, 3.92154598236084, 4.961382865905762, 6.001219272613525, 7.041055679321289, 8.080892562866211, 9.120729446411133, 10.160566329956055, 11.20040225982666, 12.240239143371582, 13.280076026916504, 14.31991195678711, 15.359748840332031, 16.399585723876953, 17.439422607421875, 18.479259490966797, 19.51909637451172, 20.55893325805664, 21.598770141601562, 22.63860511779785, 23.678442001342773, 24.718278884887695, 25.758115768432617, 26.79795265197754, 27.83778953552246, 28.87762451171875, 29.917461395263672, 30.957298278808594, 31.997135162353516, 33.03697204589844]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 7.0, 21.0, 28.0, 50.0, 101.0, 153.0, 270.0, 484.0, 778.0, 1378.0, 2351.0, 3922.0, 6518.0, 11088.0, 18566.0, 30284.0, 50692.0, 83157.0, 134644.0, 212355.0, 318622.0, 444717.0, 550084.0, 586011.0, 531357.0, 414176.0, 292011.0, 191906.0, 120844.0, 74128.0, 45528.0, 27206.0, 16552.0, 9649.0, 5829.0, 3531.0, 2074.0, 1240.0, 796.0, 487.0, 239.0, 159.0, 109.0, 75.0, 44.0, 20.0, 12.0, 13.0, 4.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.3125, -21.552978515625, -20.79345703125, -20.033935546875, -19.2744140625, -18.514892578125, -17.75537109375, -16.995849609375, -16.236328125, -15.476806640625, -14.71728515625, -13.957763671875, -13.1982421875, -12.438720703125, -11.67919921875, -10.919677734375, -10.16015625, -9.400634765625, -8.64111328125, -7.881591796875, -7.1220703125, -6.362548828125, -5.60302734375, -4.843505859375, -4.083984375, -3.324462890625, -2.56494140625, -1.805419921875, -1.0458984375, -0.286376953125, 0.47314453125, 1.232666015625, 1.9921875, 2.751708984375, 3.51123046875, 4.270751953125, 5.0302734375, 5.789794921875, 6.54931640625, 7.308837890625, 8.068359375, 8.827880859375, 9.58740234375, 10.346923828125, 11.1064453125, 11.865966796875, 12.62548828125, 13.385009765625, 14.14453125, 14.904052734375, 15.66357421875, 16.423095703125, 17.1826171875, 17.942138671875, 18.70166015625, 19.461181640625, 20.220703125, 20.980224609375, 21.73974609375, 22.499267578125, 23.2587890625, 24.018310546875, 24.77783203125, 25.537353515625, 26.296875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 16.0, 9.0, 7.0, 11.0, 11.0, 12.0, 17.0, 19.0, 27.0, 24.0, 31.0, 25.0, 24.0, 30.0, 33.0, 35.0, 44.0, 49.0, 37.0, 40.0, 46.0, 40.0, 39.0, 35.0, 34.0, 39.0, 29.0, 32.0, 25.0, 22.0, 22.0, 25.0, 20.0, 24.0, 13.0, 5.0, 14.0, 5.0, 1.0, 6.0, 1.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.6083984375, -19.904296875, -19.2001953125, -18.49609375, -17.7919921875, -17.087890625, -16.3837890625, -15.6796875, -14.9755859375, -14.271484375, -13.5673828125, -12.86328125, -12.1591796875, -11.455078125, -10.7509765625, -10.046875, -9.3427734375, -8.638671875, -7.9345703125, -7.23046875, -6.5263671875, -5.822265625, -5.1181640625, -4.4140625, -3.7099609375, -3.005859375, -2.3017578125, -1.59765625, -0.8935546875, -0.189453125, 0.5146484375, 1.21875, 1.9228515625, 2.626953125, 3.3310546875, 4.03515625, 4.7392578125, 5.443359375, 6.1474609375, 6.8515625, 7.5556640625, 8.259765625, 8.9638671875, 9.66796875, 10.3720703125, 11.076171875, 11.7802734375, 12.484375, 13.1884765625, 13.892578125, 14.5966796875, 15.30078125, 16.0048828125, 16.708984375, 17.4130859375, 18.1171875, 18.8212890625, 19.525390625, 20.2294921875, 20.93359375, 21.6376953125, 22.341796875, 23.0458984375, 23.75]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [4.0, 6.0, 8.0, 16.0, 16.0, 34.0, 72.0, 103.0, 142.0, 280.0, 380.0, 675.0, 1022.0, 1613.0, 2763.0, 4236.0, 6949.0, 11128.0, 17898.0, 27988.0, 43356.0, 65901.0, 98278.0, 141862.0, 197600.0, 263431.0, 330904.0, 388613.0, 428629.0, 432294.0, 402726.0, 349929.0, 281892.0, 215711.0, 157678.0, 109779.0, 74177.0, 49482.0, 32000.0, 20501.0, 12849.0, 8003.0, 5087.0, 3095.0, 1930.0, 1195.0, 728.0, 522.0, 284.0, 193.0, 135.0, 84.0, 41.0, 27.0, 22.0, 7.0, 15.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.765625, -16.1904296875, -15.615234375, -15.0400390625, -14.46484375, -13.8896484375, -13.314453125, -12.7392578125, -12.1640625, -11.5888671875, -11.013671875, -10.4384765625, -9.86328125, -9.2880859375, -8.712890625, -8.1376953125, -7.5625, -6.9873046875, -6.412109375, -5.8369140625, -5.26171875, -4.6865234375, -4.111328125, -3.5361328125, -2.9609375, -2.3857421875, -1.810546875, -1.2353515625, -0.66015625, -0.0849609375, 0.490234375, 1.0654296875, 1.640625, 2.2158203125, 2.791015625, 3.3662109375, 3.94140625, 4.5166015625, 5.091796875, 5.6669921875, 6.2421875, 6.8173828125, 7.392578125, 7.9677734375, 8.54296875, 9.1181640625, 9.693359375, 10.2685546875, 10.84375, 11.4189453125, 11.994140625, 12.5693359375, 13.14453125, 13.7197265625, 14.294921875, 14.8701171875, 15.4453125, 16.0205078125, 16.595703125, 17.1708984375, 17.74609375, 18.3212890625, 18.896484375, 19.4716796875, 20.046875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 6.0, 6.0, 6.0, 14.0, 13.0, 15.0, 16.0, 15.0, 37.0, 31.0, 36.0, 55.0, 64.0, 71.0, 68.0, 87.0, 120.0, 113.0, 128.0, 135.0, 138.0, 168.0, 166.0, 182.0, 193.0, 184.0, 155.0, 177.0, 169.0, 149.0, 180.0, 162.0, 155.0, 112.0, 127.0, 108.0, 77.0, 79.0, 65.0, 59.0, 51.0, 31.0, 31.0, 26.0, 22.0, 18.0, 17.0, 6.0, 7.0, 5.0, 10.0, 5.0, 3.0, 1.0, 3.0, 2.0], "bins": [-10.2421875, -9.946044921875, -9.64990234375, -9.353759765625, -9.0576171875, -8.761474609375, -8.46533203125, -8.169189453125, -7.873046875, -7.576904296875, -7.28076171875, -6.984619140625, -6.6884765625, -6.392333984375, -6.09619140625, -5.800048828125, -5.50390625, -5.207763671875, -4.91162109375, -4.615478515625, -4.3193359375, -4.023193359375, -3.72705078125, -3.430908203125, -3.134765625, -2.838623046875, -2.54248046875, -2.246337890625, -1.9501953125, -1.654052734375, -1.35791015625, -1.061767578125, -0.765625, -0.469482421875, -0.17333984375, 0.122802734375, 0.4189453125, 0.715087890625, 1.01123046875, 1.307373046875, 1.603515625, 1.899658203125, 2.19580078125, 2.491943359375, 2.7880859375, 3.084228515625, 3.38037109375, 3.676513671875, 3.97265625, 4.268798828125, 4.56494140625, 4.861083984375, 5.1572265625, 5.453369140625, 5.74951171875, 6.045654296875, 6.341796875, 6.637939453125, 6.93408203125, 7.230224609375, 7.5263671875, 7.822509765625, 8.11865234375, 8.414794921875, 8.7109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 5.0, 11.0, 12.0, 12.0, 11.0, 20.0, 12.0, 26.0, 26.0, 20.0, 34.0, 42.0, 39.0, 35.0, 63.0, 50.0, 48.0, 53.0, 53.0, 59.0, 38.0, 48.0, 37.0, 32.0, 37.0, 24.0, 18.0, 20.0, 17.0, 18.0, 15.0, 9.0, 11.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-26.09819984436035, -25.360565185546875, -24.6229305267334, -23.885295867919922, -23.147663116455078, -22.4100284576416, -21.672393798828125, -20.93475914001465, -20.197124481201172, -19.459489822387695, -18.72185516357422, -17.984222412109375, -17.2465877532959, -16.508953094482422, -15.771318435668945, -15.033683776855469, -14.296051025390625, -13.558416366577148, -12.820782661437988, -12.083148002624512, -11.345514297485352, -10.607879638671875, -9.870244979858398, -9.132610321044922, -8.394976615905762, -7.657342433929443, -6.919708251953125, -6.182073593139648, -5.44443941116333, -4.706805229187012, -3.969170570373535, -3.231536388397217, -2.4939022064208984, -1.7562679052352905, -1.0186336040496826, -0.28099918365478516, 0.4566349983215332, 1.1942691802978516, 1.9319038391113281, 2.6695380210876465, 3.407172203063965, 4.144806385040283, 4.882440567016602, 5.620075225830078, 6.3577094078063965, 7.095343589782715, 7.832978248596191, 8.570611953735352, 9.308246612548828, 10.045881271362305, 10.783514976501465, 11.521149635314941, 12.258783340454102, 12.996417999267578, 13.734052658081055, 14.471687316894531, 15.209321022033691, 15.946955680847168, 16.684589385986328, 17.422224044799805, 18.15985870361328, 18.897491455078125, 19.635128021240234, 20.372760772705078, 21.110395431518555]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 4.0, 4.0, 2.0, 9.0, 8.0, 13.0, 6.0, 13.0, 23.0, 25.0, 34.0, 33.0, 26.0, 21.0, 26.0, 34.0, 34.0, 45.0, 47.0, 47.0, 55.0, 38.0, 37.0, 39.0, 42.0, 49.0, 40.0, 30.0, 21.0, 21.0, 34.0, 28.0, 26.0, 20.0, 7.0, 13.0, 8.0, 9.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.70098304748535, -26.826419830322266, -25.951858520507812, -25.077295303344727, -24.20273208618164, -23.328170776367188, -22.4536075592041, -21.579044342041016, -20.704483032226562, -19.829919815063477, -18.955358505249023, -18.080795288085938, -17.20623207092285, -16.331668853759766, -15.457107543945312, -14.582544326782227, -13.70798110961914, -12.833418846130371, -11.958855628967285, -11.084293365478516, -10.20973014831543, -9.33516788482666, -8.46060562133789, -7.586042881011963, -6.711480140686035, -5.836917400360107, -4.96235466003418, -4.08779239654541, -3.2132296562194824, -2.3386669158935547, -1.4641046524047852, -0.5895419120788574, 0.2850189208984375, 1.1595815420150757, 2.034144163131714, 2.9087066650390625, 3.7832694053649902, 4.657832145690918, 5.5323944091796875, 6.406957149505615, 7.281519889831543, 8.156082153320312, 9.030645370483398, 9.905207633972168, 10.779769897460938, 11.654333114624023, 12.528895378112793, 13.403457641601562, 14.278020858764648, 15.152583122253418, 16.027145385742188, 16.901708602905273, 17.77627182006836, 18.650833129882812, 19.5253963470459, 20.399959564208984, 21.274520874023438, 22.149084091186523, 23.023645401000977, 23.898208618164062, 24.77277183532715, 25.647335052490234, 26.521896362304688, 27.396459579467773, 28.27102279663086]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 15.0, 13.0, 24.0, 62.0, 80.0, 114.0, 192.0, 284.0, 403.0, 680.0, 1020.0, 1568.0, 2577.0, 3929.0, 6250.0, 9890.0, 15985.0, 26367.0, 42962.0, 71426.0, 115557.0, 174242.0, 195997.0, 143694.0, 91285.0, 55469.0, 33683.0, 20520.0, 12803.0, 7758.0, 4938.0, 3221.0, 1987.0, 1275.0, 751.0, 574.0, 375.0, 218.0, 142.0, 81.0, 53.0, 31.0, 23.0, 11.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.99334716796875, -4.8226318359375, -4.65191650390625, -4.481201171875, -4.31048583984375, -4.1397705078125, -3.96905517578125, -3.79833984375, -3.62762451171875, -3.4569091796875, -3.28619384765625, -3.115478515625, -2.94476318359375, -2.7740478515625, -2.60333251953125, -2.4326171875, -2.26190185546875, -2.0911865234375, -1.92047119140625, -1.749755859375, -1.57904052734375, -1.4083251953125, -1.23760986328125, -1.06689453125, -0.89617919921875, -0.7254638671875, -0.55474853515625, -0.384033203125, -0.21331787109375, -0.0426025390625, 0.12811279296875, 0.298828125, 0.46954345703125, 0.6402587890625, 0.81097412109375, 0.981689453125, 1.15240478515625, 1.3231201171875, 1.49383544921875, 1.66455078125, 1.83526611328125, 2.0059814453125, 2.17669677734375, 2.347412109375, 2.51812744140625, 2.6888427734375, 2.85955810546875, 3.0302734375, 3.20098876953125, 3.3717041015625, 3.54241943359375, 3.713134765625, 3.88385009765625, 4.0545654296875, 4.22528076171875, 4.39599609375, 4.56671142578125, 4.7374267578125, 4.90814208984375, 5.078857421875, 5.24957275390625, 5.4202880859375, 5.59100341796875, 5.76171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 4.0, 9.0, 5.0, 10.0, 11.0, 10.0, 11.0, 12.0, 18.0, 22.0, 26.0, 27.0, 26.0, 29.0, 26.0, 38.0, 37.0, 39.0, 43.0, 42.0, 53.0, 40.0, 49.0, 26.0, 40.0, 43.0, 32.0, 32.0, 34.0, 21.0, 29.0, 29.0, 27.0, 16.0, 18.0, 8.0, 14.0, 7.0, 5.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-26.21875, -25.3720703125, -24.525390625, -23.6787109375, -22.83203125, -21.9853515625, -21.138671875, -20.2919921875, -19.4453125, -18.5986328125, -17.751953125, -16.9052734375, -16.05859375, -15.2119140625, -14.365234375, -13.5185546875, -12.671875, -11.8251953125, -10.978515625, -10.1318359375, -9.28515625, -8.4384765625, -7.591796875, -6.7451171875, -5.8984375, -5.0517578125, -4.205078125, -3.3583984375, -2.51171875, -1.6650390625, -0.818359375, 0.0283203125, 0.875, 1.7216796875, 2.568359375, 3.4150390625, 4.26171875, 5.1083984375, 5.955078125, 6.8017578125, 7.6484375, 8.4951171875, 9.341796875, 10.1884765625, 11.03515625, 11.8818359375, 12.728515625, 13.5751953125, 14.421875, 15.2685546875, 16.115234375, 16.9619140625, 17.80859375, 18.6552734375, 19.501953125, 20.3486328125, 21.1953125, 22.0419921875, 22.888671875, 23.7353515625, 24.58203125, 25.4287109375, 26.275390625, 27.1220703125, 27.96875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 6.0, 10.0, 18.0, 29.0, 43.0, 45.0, 96.0, 102.0, 229.0, 360.0, 508.0, 753.0, 1277.0, 2061.0, 3214.0, 5376.0, 8795.0, 15301.0, 25990.0, 46255.0, 83913.0, 161235.0, 262803.0, 196582.0, 102611.0, 55031.0, 31327.0, 17827.0, 10414.0, 6277.0, 3770.0, 2304.0, 1428.0, 879.0, 610.0, 372.0, 245.0, 145.0, 98.0, 68.0, 52.0, 29.0, 21.0, 19.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.85546875, -4.706787109375, -4.55810546875, -4.409423828125, -4.2607421875, -4.112060546875, -3.96337890625, -3.814697265625, -3.666015625, -3.517333984375, -3.36865234375, -3.219970703125, -3.0712890625, -2.922607421875, -2.77392578125, -2.625244140625, -2.4765625, -2.327880859375, -2.17919921875, -2.030517578125, -1.8818359375, -1.733154296875, -1.58447265625, -1.435791015625, -1.287109375, -1.138427734375, -0.98974609375, -0.841064453125, -0.6923828125, -0.543701171875, -0.39501953125, -0.246337890625, -0.09765625, 0.051025390625, 0.19970703125, 0.348388671875, 0.4970703125, 0.645751953125, 0.79443359375, 0.943115234375, 1.091796875, 1.240478515625, 1.38916015625, 1.537841796875, 1.6865234375, 1.835205078125, 1.98388671875, 2.132568359375, 2.28125, 2.429931640625, 2.57861328125, 2.727294921875, 2.8759765625, 3.024658203125, 3.17333984375, 3.322021484375, 3.470703125, 3.619384765625, 3.76806640625, 3.916748046875, 4.0654296875, 4.214111328125, 4.36279296875, 4.511474609375, 4.66015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 3.0, 4.0, 4.0, 9.0, 8.0, 11.0, 19.0, 20.0, 20.0, 21.0, 18.0, 24.0, 30.0, 24.0, 19.0, 35.0, 32.0, 27.0, 54.0, 43.0, 46.0, 44.0, 47.0, 43.0, 41.0, 42.0, 42.0, 24.0, 28.0, 31.0, 29.0, 15.0, 24.0, 16.0, 19.0, 16.0, 10.0, 16.0, 9.0, 10.0, 12.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.09375, -17.52978515625, -16.9658203125, -16.40185546875, -15.837890625, -15.27392578125, -14.7099609375, -14.14599609375, -13.58203125, -13.01806640625, -12.4541015625, -11.89013671875, -11.326171875, -10.76220703125, -10.1982421875, -9.63427734375, -9.0703125, -8.50634765625, -7.9423828125, -7.37841796875, -6.814453125, -6.25048828125, -5.6865234375, -5.12255859375, -4.55859375, -3.99462890625, -3.4306640625, -2.86669921875, -2.302734375, -1.73876953125, -1.1748046875, -0.61083984375, -0.046875, 0.51708984375, 1.0810546875, 1.64501953125, 2.208984375, 2.77294921875, 3.3369140625, 3.90087890625, 4.46484375, 5.02880859375, 5.5927734375, 6.15673828125, 6.720703125, 7.28466796875, 7.8486328125, 8.41259765625, 8.9765625, 9.54052734375, 10.1044921875, 10.66845703125, 11.232421875, 11.79638671875, 12.3603515625, 12.92431640625, 13.48828125, 14.05224609375, 14.6162109375, 15.18017578125, 15.744140625, 16.30810546875, 16.8720703125, 17.43603515625, 18.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 21.0, 15.0, 24.0, 45.0, 57.0, 85.0, 134.0, 155.0, 305.0, 446.0, 747.0, 1290.0, 2062.0, 3610.0, 6585.0, 12398.0, 24081.0, 49740.0, 116895.0, 356308.0, 287252.0, 97503.0, 42877.0, 20964.0, 10864.0, 5941.0, 3289.0, 1817.0, 1128.0, 674.0, 434.0, 286.0, 152.0, 95.0, 77.0, 52.0, 41.0, 22.0, 23.0, 14.0, 10.0, 3.0, 5.0, 1.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4873046875, -0.47153472900390625, -0.4557647705078125, -0.43999481201171875, -0.424224853515625, -0.40845489501953125, -0.3926849365234375, -0.37691497802734375, -0.36114501953125, -0.34537506103515625, -0.3296051025390625, -0.31383514404296875, -0.298065185546875, -0.28229522705078125, -0.2665252685546875, -0.25075531005859375, -0.2349853515625, -0.21921539306640625, -0.2034454345703125, -0.18767547607421875, -0.171905517578125, -0.15613555908203125, -0.1403656005859375, -0.12459564208984375, -0.10882568359375, -0.09305572509765625, -0.0772857666015625, -0.06151580810546875, -0.045745849609375, -0.02997589111328125, -0.0142059326171875, 0.00156402587890625, 0.017333984375, 0.03310394287109375, 0.0488739013671875, 0.06464385986328125, 0.080413818359375, 0.09618377685546875, 0.1119537353515625, 0.12772369384765625, 0.14349365234375, 0.15926361083984375, 0.1750335693359375, 0.19080352783203125, 0.206573486328125, 0.22234344482421875, 0.2381134033203125, 0.25388336181640625, 0.2696533203125, 0.28542327880859375, 0.3011932373046875, 0.31696319580078125, 0.332733154296875, 0.34850311279296875, 0.3642730712890625, 0.38004302978515625, 0.39581298828125, 0.41158294677734375, 0.4273529052734375, 0.44312286376953125, 0.458892822265625, 0.47466278076171875, 0.4904327392578125, 0.5062026977539062, 0.52197265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 9.0, 10.0, 8.0, 19.0, 16.0, 12.0, 36.0, 36.0, 44.0, 48.0, 77.0, 85.0, 103.0, 89.0, 88.0, 69.0, 56.0, 54.0, 28.0, 24.0, 20.0, 13.0, 9.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00012046098709106445, -0.00011718831956386566, -0.00011391565203666687, -0.00011064298450946808, -0.00010737031698226929, -0.0001040976494550705, -0.0001008249819278717, -9.755231440067291e-05, -9.427964687347412e-05, -9.100697934627533e-05, -8.773431181907654e-05, -8.446164429187775e-05, -8.118897676467896e-05, -7.791630923748016e-05, -7.464364171028137e-05, -7.137097418308258e-05, -6.809830665588379e-05, -6.4825639128685e-05, -6.15529716014862e-05, -5.8280304074287415e-05, -5.500763654708862e-05, -5.173496901988983e-05, -4.846230149269104e-05, -4.518963396549225e-05, -4.191696643829346e-05, -3.8644298911094666e-05, -3.5371631383895874e-05, -3.209896385669708e-05, -2.882629632949829e-05, -2.55536288022995e-05, -2.2280961275100708e-05, -1.9008293747901917e-05, -1.5735626220703125e-05, -1.2462958693504333e-05, -9.190291166305542e-06, -5.9176236391067505e-06, -2.644956111907959e-06, 6.277114152908325e-07, 3.900378942489624e-06, 7.1730464696884155e-06, 1.0445713996887207e-05, 1.3718381524085999e-05, 1.699104905128479e-05, 2.026371657848358e-05, 2.3536384105682373e-05, 2.6809051632881165e-05, 3.0081719160079956e-05, 3.335438668727875e-05, 3.662705421447754e-05, 3.989972174167633e-05, 4.317238926887512e-05, 4.6445056796073914e-05, 4.9717724323272705e-05, 5.2990391850471497e-05, 5.626305937767029e-05, 5.953572690486908e-05, 6.280839443206787e-05, 6.608106195926666e-05, 6.935372948646545e-05, 7.262639701366425e-05, 7.589906454086304e-05, 7.917173206806183e-05, 8.244439959526062e-05, 8.571706712245941e-05, 8.89897346496582e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 8.0, 5.0, 15.0, 26.0, 33.0, 43.0, 67.0, 73.0, 108.0, 163.0, 228.0, 302.0, 413.0, 623.0, 768.0, 1178.0, 1622.0, 2340.0, 3215.0, 4571.0, 6506.0, 9665.0, 14082.0, 21252.0, 33415.0, 53549.0, 91714.0, 178501.0, 280216.0, 136658.0, 75294.0, 45051.0, 28448.0, 18178.0, 12152.0, 8271.0, 5805.0, 4044.0, 2804.0, 2081.0, 1420.0, 1010.0, 702.0, 588.0, 369.0, 308.0, 174.0, 161.0, 111.0, 78.0, 53.0, 34.0, 24.0, 21.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.91259765625, -0.8824996948242188, -0.8524017333984375, -0.8223037719726562, -0.792205810546875, -0.7621078491210938, -0.7320098876953125, -0.7019119262695312, -0.67181396484375, -0.6417160034179688, -0.6116180419921875, -0.5815200805664062, -0.551422119140625, -0.5213241577148438, -0.4912261962890625, -0.46112823486328125, -0.4310302734375, -0.40093231201171875, -0.3708343505859375, -0.34073638916015625, -0.310638427734375, -0.28054046630859375, -0.2504425048828125, -0.22034454345703125, -0.19024658203125, -0.16014862060546875, -0.1300506591796875, -0.09995269775390625, -0.069854736328125, -0.03975677490234375, -0.0096588134765625, 0.02043914794921875, 0.050537109375, 0.08063507080078125, 0.1107330322265625, 0.14083099365234375, 0.170928955078125, 0.20102691650390625, 0.2311248779296875, 0.26122283935546875, 0.29132080078125, 0.32141876220703125, 0.3515167236328125, 0.38161468505859375, 0.411712646484375, 0.44181060791015625, 0.4719085693359375, 0.5020065307617188, 0.5321044921875, 0.5622024536132812, 0.5923004150390625, 0.6223983764648438, 0.652496337890625, 0.6825942993164062, 0.7126922607421875, 0.7427902221679688, 0.77288818359375, 0.8029861450195312, 0.8330841064453125, 0.8631820678710938, 0.893280029296875, 0.9233779907226562, 0.9534759521484375, 0.9835739135742188, 1.013671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 2.0, 5.0, 12.0, 9.0, 11.0, 18.0, 22.0, 25.0, 23.0, 32.0, 36.0, 18.0, 38.0, 27.0, 43.0, 59.0, 60.0, 90.0, 63.0, 55.0, 42.0, 41.0, 31.0, 24.0, 33.0, 26.0, 27.0, 18.0, 20.0, 13.0, 5.0, 11.0, 8.0, 7.0, 4.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.33251953125, -0.32281494140625, -0.3131103515625, -0.30340576171875, -0.293701171875, -0.28399658203125, -0.2742919921875, -0.26458740234375, -0.2548828125, -0.24517822265625, -0.2354736328125, -0.22576904296875, -0.216064453125, -0.20635986328125, -0.1966552734375, -0.18695068359375, -0.17724609375, -0.16754150390625, -0.1578369140625, -0.14813232421875, -0.138427734375, -0.12872314453125, -0.1190185546875, -0.10931396484375, -0.099609375, -0.08990478515625, -0.0802001953125, -0.07049560546875, -0.060791015625, -0.05108642578125, -0.0413818359375, -0.03167724609375, -0.02197265625, -0.01226806640625, -0.0025634765625, 0.00714111328125, 0.016845703125, 0.02655029296875, 0.0362548828125, 0.04595947265625, 0.0556640625, 0.06536865234375, 0.0750732421875, 0.08477783203125, 0.094482421875, 0.10418701171875, 0.1138916015625, 0.12359619140625, 0.13330078125, 0.14300537109375, 0.1527099609375, 0.16241455078125, 0.172119140625, 0.18182373046875, 0.1915283203125, 0.20123291015625, 0.2109375, 0.22064208984375, 0.2303466796875, 0.24005126953125, 0.249755859375, 0.25946044921875, 0.2691650390625, 0.27886962890625, 0.28857421875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 7.0, 6.0, 16.0, 12.0, 7.0, 22.0, 12.0, 23.0, 26.0, 17.0, 28.0, 42.0, 31.0, 45.0, 54.0, 56.0, 43.0, 50.0, 55.0, 47.0, 51.0, 36.0, 46.0, 38.0, 24.0, 33.0, 27.0, 19.0, 16.0, 16.0, 16.0, 16.0, 12.0, 8.0, 4.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.600421905517578, -23.88871955871582, -23.177017211914062, -22.465316772460938, -21.75361442565918, -21.041912078857422, -20.330211639404297, -19.61850929260254, -18.90680694580078, -18.195104598999023, -17.483402252197266, -16.77170181274414, -16.059999465942383, -15.348297119140625, -14.636595726013184, -13.924894332885742, -13.213191986083984, -12.501489639282227, -11.789788246154785, -11.078086853027344, -10.366384506225586, -9.654682159423828, -8.942980766296387, -8.231279373168945, -7.5195770263671875, -6.807875156402588, -6.096173286437988, -5.384471416473389, -4.672769546508789, -3.9610676765441895, -3.24936580657959, -2.5376639366149902, -1.8259639739990234, -1.1142621040344238, -0.4025602340698242, 0.3091416358947754, 1.020843505859375, 1.7325453758239746, 2.444247245788574, 3.155949115753174, 3.8676509857177734, 4.579352855682373, 5.291054725646973, 6.002756595611572, 6.714458465576172, 7.4261603355407715, 8.137862205505371, 8.849563598632812, 9.56126594543457, 10.272968292236328, 10.98466968536377, 11.696371078491211, 12.408073425292969, 13.119775772094727, 13.831477165222168, 14.54317855834961, 15.254880905151367, 15.966583251953125, 16.67828369140625, 17.389986038208008, 18.101688385009766, 18.813390731811523, 19.52509307861328, 20.236793518066406, 20.948495864868164]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 5.0, 4.0, 3.0, 9.0, 8.0, 10.0, 7.0, 14.0, 23.0, 28.0, 33.0, 31.0, 27.0, 23.0, 27.0, 38.0, 31.0, 44.0, 47.0, 45.0, 56.0, 40.0, 39.0, 35.0, 42.0, 49.0, 37.0, 29.0, 20.0, 28.0, 26.0, 34.0, 23.0, 17.0, 11.0, 12.0, 8.0, 9.0, 4.0, 6.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.148395538330078, -26.28829574584961, -25.428197860717773, -24.568099975585938, -23.70800018310547, -22.847900390625, -21.987802505493164, -21.127704620361328, -20.26760482788086, -19.40750503540039, -18.547407150268555, -17.68730926513672, -16.82720947265625, -15.967110633850098, -15.107011795043945, -14.246912956237793, -13.38681411743164, -12.526715278625488, -11.666616439819336, -10.806517601013184, -9.946418762207031, -9.086319923400879, -8.226221084594727, -7.366122245788574, -6.506023406982422, -5.6459245681762695, -4.785825729370117, -3.925726890563965, -3.0656280517578125, -2.20552921295166, -1.3454303741455078, -0.48533153533935547, 0.37476539611816406, 1.2348642349243164, 2.0949630737304688, 2.955061912536621, 3.8151607513427734, 4.675259590148926, 5.535358428955078, 6.3954572677612305, 7.255556106567383, 8.115654945373535, 8.975753784179688, 9.83585262298584, 10.695951461791992, 11.556050300598145, 12.416149139404297, 13.27624797821045, 14.136346817016602, 14.996445655822754, 15.856544494628906, 16.716644287109375, 17.57674217224121, 18.436840057373047, 19.296939849853516, 20.157039642333984, 21.01713752746582, 21.877235412597656, 22.737335205078125, 23.597434997558594, 24.45753288269043, 25.317630767822266, 26.177730560302734, 27.037830352783203, 27.89792823791504]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 7.0, 6.0, 10.0, 13.0, 24.0, 24.0, 43.0, 57.0, 100.0, 151.0, 207.0, 391.0, 539.0, 847.0, 1243.0, 1933.0, 3000.0, 4519.0, 6981.0, 10594.0, 15733.0, 22808.0, 32622.0, 44912.0, 59931.0, 76300.0, 91066.0, 100981.0, 105049.0, 100933.0, 90119.0, 75021.0, 59095.0, 44429.0, 31576.0, 22381.0, 14940.0, 10210.0, 6782.0, 4410.0, 2997.0, 1904.0, 1246.0, 871.0, 581.0, 328.0, 238.0, 136.0, 89.0, 69.0, 43.0, 29.0, 25.0, 8.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0], "bins": [-17.078125, -16.535400390625, -15.99267578125, -15.449951171875, -14.9072265625, -14.364501953125, -13.82177734375, -13.279052734375, -12.736328125, -12.193603515625, -11.65087890625, -11.108154296875, -10.5654296875, -10.022705078125, -9.47998046875, -8.937255859375, -8.39453125, -7.851806640625, -7.30908203125, -6.766357421875, -6.2236328125, -5.680908203125, -5.13818359375, -4.595458984375, -4.052734375, -3.510009765625, -2.96728515625, -2.424560546875, -1.8818359375, -1.339111328125, -0.79638671875, -0.253662109375, 0.2890625, 0.831787109375, 1.37451171875, 1.917236328125, 2.4599609375, 3.002685546875, 3.54541015625, 4.088134765625, 4.630859375, 5.173583984375, 5.71630859375, 6.259033203125, 6.8017578125, 7.344482421875, 7.88720703125, 8.429931640625, 8.97265625, 9.515380859375, 10.05810546875, 10.600830078125, 11.1435546875, 11.686279296875, 12.22900390625, 12.771728515625, 13.314453125, 13.857177734375, 14.39990234375, 14.942626953125, 15.4853515625, 16.028076171875, 16.57080078125, 17.113525390625, 17.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 5.0, 3.0, 6.0, 5.0, 6.0, 4.0, 8.0, 11.0, 12.0, 15.0, 26.0, 16.0, 19.0, 31.0, 39.0, 25.0, 26.0, 40.0, 34.0, 42.0, 37.0, 39.0, 44.0, 46.0, 45.0, 39.0, 45.0, 41.0, 32.0, 42.0, 28.0, 31.0, 28.0, 22.0, 15.0, 20.0, 18.0, 8.0, 13.0, 7.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.5, -25.67041015625, -24.8408203125, -24.01123046875, -23.181640625, -22.35205078125, -21.5224609375, -20.69287109375, -19.86328125, -19.03369140625, -18.2041015625, -17.37451171875, -16.544921875, -15.71533203125, -14.8857421875, -14.05615234375, -13.2265625, -12.39697265625, -11.5673828125, -10.73779296875, -9.908203125, -9.07861328125, -8.2490234375, -7.41943359375, -6.58984375, -5.76025390625, -4.9306640625, -4.10107421875, -3.271484375, -2.44189453125, -1.6123046875, -0.78271484375, 0.046875, 0.87646484375, 1.7060546875, 2.53564453125, 3.365234375, 4.19482421875, 5.0244140625, 5.85400390625, 6.68359375, 7.51318359375, 8.3427734375, 9.17236328125, 10.001953125, 10.83154296875, 11.6611328125, 12.49072265625, 13.3203125, 14.14990234375, 14.9794921875, 15.80908203125, 16.638671875, 17.46826171875, 18.2978515625, 19.12744140625, 19.95703125, 20.78662109375, 21.6162109375, 22.44580078125, 23.275390625, 24.10498046875, 24.9345703125, 25.76416015625, 26.59375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 9.0, 6.0, 10.0, 19.0, 24.0, 42.0, 64.0, 90.0, 158.0, 241.0, 319.0, 496.0, 700.0, 1093.0, 1612.0, 2313.0, 3556.0, 5385.0, 7919.0, 11314.0, 16307.0, 23865.0, 33267.0, 44829.0, 58701.0, 73421.0, 86906.0, 96453.0, 100428.0, 97257.0, 88248.0, 75057.0, 59491.0, 46026.0, 34199.0, 24620.0, 17245.0, 11883.0, 8044.0, 5710.0, 3667.0, 2517.0, 1694.0, 1092.0, 759.0, 480.0, 315.0, 252.0, 160.0, 112.0, 63.0, 47.0, 22.0, 29.0, 9.0, 10.0, 5.0, 2.0, 1.0, 0.0, 4.0], "bins": [-16.4375, -15.91650390625, -15.3955078125, -14.87451171875, -14.353515625, -13.83251953125, -13.3115234375, -12.79052734375, -12.26953125, -11.74853515625, -11.2275390625, -10.70654296875, -10.185546875, -9.66455078125, -9.1435546875, -8.62255859375, -8.1015625, -7.58056640625, -7.0595703125, -6.53857421875, -6.017578125, -5.49658203125, -4.9755859375, -4.45458984375, -3.93359375, -3.41259765625, -2.8916015625, -2.37060546875, -1.849609375, -1.32861328125, -0.8076171875, -0.28662109375, 0.234375, 0.75537109375, 1.2763671875, 1.79736328125, 2.318359375, 2.83935546875, 3.3603515625, 3.88134765625, 4.40234375, 4.92333984375, 5.4443359375, 5.96533203125, 6.486328125, 7.00732421875, 7.5283203125, 8.04931640625, 8.5703125, 9.09130859375, 9.6123046875, 10.13330078125, 10.654296875, 11.17529296875, 11.6962890625, 12.21728515625, 12.73828125, 13.25927734375, 13.7802734375, 14.30126953125, 14.822265625, 15.34326171875, 15.8642578125, 16.38525390625, 16.90625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 8.0, 5.0, 11.0, 17.0, 20.0, 18.0, 16.0, 19.0, 27.0, 20.0, 25.0, 19.0, 29.0, 33.0, 30.0, 33.0, 30.0, 29.0, 28.0, 43.0, 42.0, 50.0, 40.0, 40.0, 36.0, 34.0, 39.0, 27.0, 24.0, 21.0, 27.0, 15.0, 19.0, 11.0, 13.0, 13.0, 18.0, 8.0, 11.0, 11.0, 7.0, 5.0, 4.0, 3.0, 0.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.15625, -14.6834716796875, -14.210693359375, -13.7379150390625, -13.26513671875, -12.7923583984375, -12.319580078125, -11.8468017578125, -11.3740234375, -10.9012451171875, -10.428466796875, -9.9556884765625, -9.48291015625, -9.0101318359375, -8.537353515625, -8.0645751953125, -7.591796875, -7.1190185546875, -6.646240234375, -6.1734619140625, -5.70068359375, -5.2279052734375, -4.755126953125, -4.2823486328125, -3.8095703125, -3.3367919921875, -2.864013671875, -2.3912353515625, -1.91845703125, -1.4456787109375, -0.972900390625, -0.5001220703125, -0.02734375, 0.4454345703125, 0.918212890625, 1.3909912109375, 1.86376953125, 2.3365478515625, 2.809326171875, 3.2821044921875, 3.7548828125, 4.2276611328125, 4.700439453125, 5.1732177734375, 5.64599609375, 6.1187744140625, 6.591552734375, 7.0643310546875, 7.537109375, 8.0098876953125, 8.482666015625, 8.9554443359375, 9.42822265625, 9.9010009765625, 10.373779296875, 10.8465576171875, 11.3193359375, 11.7921142578125, 12.264892578125, 12.7376708984375, 13.21044921875, 13.6832275390625, 14.156005859375, 14.6287841796875, 15.1015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 10.0, 12.0, 26.0, 38.0, 53.0, 74.0, 122.0, 206.0, 337.0, 586.0, 1043.0, 1813.0, 3346.0, 6431.0, 11610.0, 21871.0, 38398.0, 66547.0, 105494.0, 146613.0, 169008.0, 159129.0, 122755.0, 82001.0, 49814.0, 27960.0, 15145.0, 8215.0, 4346.0, 2353.0, 1341.0, 778.0, 414.0, 253.0, 152.0, 89.0, 60.0, 32.0, 25.0, 15.0, 16.0, 11.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.57421875, -7.33538818359375, -7.0965576171875, -6.85772705078125, -6.618896484375, -6.38006591796875, -6.1412353515625, -5.90240478515625, -5.66357421875, -5.42474365234375, -5.1859130859375, -4.94708251953125, -4.708251953125, -4.46942138671875, -4.2305908203125, -3.99176025390625, -3.7529296875, -3.51409912109375, -3.2752685546875, -3.03643798828125, -2.797607421875, -2.55877685546875, -2.3199462890625, -2.08111572265625, -1.84228515625, -1.60345458984375, -1.3646240234375, -1.12579345703125, -0.886962890625, -0.64813232421875, -0.4093017578125, -0.17047119140625, 0.068359375, 0.30718994140625, 0.5460205078125, 0.78485107421875, 1.023681640625, 1.26251220703125, 1.5013427734375, 1.74017333984375, 1.97900390625, 2.21783447265625, 2.4566650390625, 2.69549560546875, 2.934326171875, 3.17315673828125, 3.4119873046875, 3.65081787109375, 3.8896484375, 4.12847900390625, 4.3673095703125, 4.60614013671875, 4.844970703125, 5.08380126953125, 5.3226318359375, 5.56146240234375, 5.80029296875, 6.03912353515625, 6.2779541015625, 6.51678466796875, 6.755615234375, 6.99444580078125, 7.2332763671875, 7.47210693359375, 7.7109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 8.0, 11.0, 13.0, 15.0, 22.0, 16.0, 15.0, 33.0, 32.0, 39.0, 40.0, 47.0, 47.0, 42.0, 41.0, 62.0, 49.0, 50.0, 38.0, 49.0, 38.0, 36.0, 29.0, 33.0, 41.0, 24.0, 20.0, 14.0, 12.0, 14.0, 11.0, 6.0, 8.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005679130554199219, -0.0005493834614753723, -0.0005308538675308228, -0.0005123242735862732, -0.0004937946796417236, -0.00047526508569717407, -0.0004567354917526245, -0.00043820589780807495, -0.0004196763038635254, -0.00040114670991897583, -0.00038261711597442627, -0.0003640875220298767, -0.00034555792808532715, -0.0003270283341407776, -0.00030849874019622803, -0.00028996914625167847, -0.0002714395523071289, -0.00025290995836257935, -0.00023438036441802979, -0.00021585077047348022, -0.00019732117652893066, -0.0001787915825843811, -0.00016026198863983154, -0.00014173239469528198, -0.00012320280075073242, -0.00010467320680618286, -8.61436128616333e-05, -6.761401891708374e-05, -4.908442497253418e-05, -3.055483102798462e-05, -1.2025237083435059e-05, 6.504356861114502e-06, 2.5033950805664062e-05, 4.356354475021362e-05, 6.209313869476318e-05, 8.062273263931274e-05, 9.91523265838623e-05, 0.00011768192052841187, 0.00013621151447296143, 0.00015474110841751099, 0.00017327070236206055, 0.0001918002963066101, 0.00021032989025115967, 0.00022885948419570923, 0.0002473890781402588, 0.00026591867208480835, 0.0002844482660293579, 0.00030297785997390747, 0.00032150745391845703, 0.0003400370478630066, 0.00035856664180755615, 0.0003770962357521057, 0.0003956258296966553, 0.00041415542364120483, 0.0004326850175857544, 0.00045121461153030396, 0.0004697442054748535, 0.0004882737994194031, 0.0005068033933639526, 0.0005253329873085022, 0.0005438625812530518, 0.0005623921751976013, 0.0005809217691421509, 0.0005994513630867004, 0.00061798095703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 7.0, 8.0, 12.0, 15.0, 32.0, 44.0, 81.0, 104.0, 193.0, 279.0, 494.0, 713.0, 1185.0, 1994.0, 3210.0, 5537.0, 9181.0, 15398.0, 25255.0, 39870.0, 60866.0, 86920.0, 114126.0, 134115.0, 136600.0, 122845.0, 97486.0, 69950.0, 46606.0, 29691.0, 18350.0, 10868.0, 6575.0, 3879.0, 2306.0, 1398.0, 887.0, 526.0, 344.0, 204.0, 141.0, 92.0, 60.0, 46.0, 24.0, 17.0, 8.0, 10.0, 5.0, 3.0, 2.0, 1.0], "bins": [-7.51171875, -7.3040771484375, -7.096435546875, -6.8887939453125, -6.68115234375, -6.4735107421875, -6.265869140625, -6.0582275390625, -5.8505859375, -5.6429443359375, -5.435302734375, -5.2276611328125, -5.02001953125, -4.8123779296875, -4.604736328125, -4.3970947265625, -4.189453125, -3.9818115234375, -3.774169921875, -3.5665283203125, -3.35888671875, -3.1512451171875, -2.943603515625, -2.7359619140625, -2.5283203125, -2.3206787109375, -2.113037109375, -1.9053955078125, -1.69775390625, -1.4901123046875, -1.282470703125, -1.0748291015625, -0.8671875, -0.6595458984375, -0.451904296875, -0.2442626953125, -0.03662109375, 0.1710205078125, 0.378662109375, 0.5863037109375, 0.7939453125, 1.0015869140625, 1.209228515625, 1.4168701171875, 1.62451171875, 1.8321533203125, 2.039794921875, 2.2474365234375, 2.455078125, 2.6627197265625, 2.870361328125, 3.0780029296875, 3.28564453125, 3.4932861328125, 3.700927734375, 3.9085693359375, 4.1162109375, 4.3238525390625, 4.531494140625, 4.7391357421875, 4.94677734375, 5.1544189453125, 5.362060546875, 5.5697021484375, 5.77734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 5.0, 10.0, 7.0, 12.0, 16.0, 21.0, 19.0, 13.0, 27.0, 29.0, 43.0, 42.0, 31.0, 43.0, 48.0, 48.0, 55.0, 47.0, 54.0, 53.0, 66.0, 39.0, 43.0, 33.0, 31.0, 27.0, 15.0, 18.0, 18.0, 18.0, 17.0, 10.0, 7.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.84375, -2.75030517578125, -2.6568603515625, -2.56341552734375, -2.469970703125, -2.37652587890625, -2.2830810546875, -2.18963623046875, -2.09619140625, -2.00274658203125, -1.9093017578125, -1.81585693359375, -1.722412109375, -1.62896728515625, -1.5355224609375, -1.44207763671875, -1.3486328125, -1.25518798828125, -1.1617431640625, -1.06829833984375, -0.974853515625, -0.88140869140625, -0.7879638671875, -0.69451904296875, -0.60107421875, -0.50762939453125, -0.4141845703125, -0.32073974609375, -0.227294921875, -0.13385009765625, -0.0404052734375, 0.05303955078125, 0.146484375, 0.23992919921875, 0.3333740234375, 0.42681884765625, 0.520263671875, 0.61370849609375, 0.7071533203125, 0.80059814453125, 0.89404296875, 0.98748779296875, 1.0809326171875, 1.17437744140625, 1.267822265625, 1.36126708984375, 1.4547119140625, 1.54815673828125, 1.6416015625, 1.73504638671875, 1.8284912109375, 1.92193603515625, 2.015380859375, 2.10882568359375, 2.2022705078125, 2.29571533203125, 2.38916015625, 2.48260498046875, 2.5760498046875, 2.66949462890625, 2.762939453125, 2.85638427734375, 2.9498291015625, 3.04327392578125, 3.13671875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 2.0, 7.0, 4.0, 6.0, 10.0, 8.0, 6.0, 16.0, 17.0, 25.0, 29.0, 18.0, 29.0, 38.0, 30.0, 47.0, 51.0, 46.0, 50.0, 44.0, 56.0, 67.0, 35.0, 43.0, 42.0, 31.0, 45.0, 27.0, 21.0, 25.0, 21.0, 19.0, 16.0, 17.0, 10.0, 7.0, 9.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.900941848754883, -23.196670532226562, -22.492401123046875, -21.788129806518555, -21.083858489990234, -20.379589080810547, -19.675317764282227, -18.971046447753906, -18.26677703857422, -17.5625057220459, -16.85823631286621, -16.15396499633789, -15.449694633483887, -14.745424270629883, -14.041152954101562, -13.336882591247559, -12.632612228393555, -11.92834186553955, -11.224071502685547, -10.519800186157227, -9.815529823303223, -9.111259460449219, -8.406988143920898, -7.7027177810668945, -6.998447418212891, -6.294177055358887, -5.589906215667725, -4.8856353759765625, -4.181365013122559, -3.4770944118499756, -2.7728238105773926, -2.0685529708862305, -1.3642845153808594, -0.6600139141082764, 0.04425668716430664, 0.7485272884368896, 1.4527978897094727, 2.1570684909820557, 2.8613390922546387, 3.565609931945801, 4.269880294799805, 4.974150657653809, 5.678421497344971, 6.382692337036133, 7.086962699890137, 7.791233062744141, 8.495504379272461, 9.199774742126465, 9.904045104980469, 10.608315467834473, 11.312585830688477, 12.016857147216797, 12.7211275100708, 13.425397872924805, 14.129669189453125, 14.833939552307129, 15.538209915161133, 16.242481231689453, 16.94675064086914, 17.65102195739746, 18.35529327392578, 19.05956268310547, 19.76383399963379, 20.46810531616211, 21.172374725341797]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 6.0, 6.0, 7.0, 12.0, 8.0, 17.0, 16.0, 19.0, 19.0, 20.0, 24.0, 32.0, 27.0, 28.0, 33.0, 45.0, 38.0, 28.0, 55.0, 40.0, 44.0, 34.0, 40.0, 36.0, 29.0, 39.0, 32.0, 30.0, 32.0, 28.0, 24.0, 23.0, 20.0, 18.0, 17.0, 12.0, 7.0, 7.0, 9.0, 10.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.045042037963867, -23.230960845947266, -22.416881561279297, -21.602800369262695, -20.788719177246094, -19.974639892578125, -19.160558700561523, -18.346477508544922, -17.532398223876953, -16.71831703186035, -15.904236793518066, -15.090156555175781, -14.27607536315918, -13.461995124816895, -12.64791488647461, -11.833833694458008, -11.019752502441406, -10.205672264099121, -9.39159107208252, -8.577510833740234, -7.763430118560791, -6.949349403381348, -6.1352691650390625, -5.321188449859619, -4.507107734680176, -3.6930270195007324, -2.878946542739868, -2.064866065979004, -1.2507853507995605, -0.4367046356201172, 0.37737560272216797, 1.1914563179016113, 2.0055389404296875, 2.819619655609131, 3.633700132369995, 4.447780609130859, 5.261861324310303, 6.075942039489746, 6.890022277832031, 7.704102993011475, 8.518183708190918, 9.332263946533203, 10.146345138549805, 10.96042537689209, 11.774505615234375, 12.588586807250977, 13.402667045593262, 14.216747283935547, 15.030828475952148, 15.844908714294434, 16.65898895263672, 17.47307014465332, 18.287151336669922, 19.10123062133789, 19.915311813354492, 20.729393005371094, 21.543472290039062, 22.357553482055664, 23.171632766723633, 23.985713958740234, 24.799795150756836, 25.613876342773438, 26.427955627441406, 27.242036819458008, 28.05611801147461]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [5.0, 3.0, 8.0, 15.0, 29.0, 33.0, 50.0, 64.0, 121.0, 210.0, 334.0, 517.0, 860.0, 1385.0, 2080.0, 3484.0, 5595.0, 8930.0, 14401.0, 22351.0, 35620.0, 55633.0, 86604.0, 131257.0, 194133.0, 275969.0, 370630.0, 453945.0, 502938.0, 493926.0, 432693.0, 340834.0, 252761.0, 174634.0, 117972.0, 77383.0, 49597.0, 32110.0, 20155.0, 12954.0, 7953.0, 5112.0, 3313.0, 1989.0, 1361.0, 878.0, 523.0, 328.0, 230.0, 143.0, 104.0, 58.0, 41.0, 15.0, 13.0, 8.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.171875, -15.611572265625, -15.05126953125, -14.490966796875, -13.9306640625, -13.370361328125, -12.81005859375, -12.249755859375, -11.689453125, -11.129150390625, -10.56884765625, -10.008544921875, -9.4482421875, -8.887939453125, -8.32763671875, -7.767333984375, -7.20703125, -6.646728515625, -6.08642578125, -5.526123046875, -4.9658203125, -4.405517578125, -3.84521484375, -3.284912109375, -2.724609375, -2.164306640625, -1.60400390625, -1.043701171875, -0.4833984375, 0.076904296875, 0.63720703125, 1.197509765625, 1.7578125, 2.318115234375, 2.87841796875, 3.438720703125, 3.9990234375, 4.559326171875, 5.11962890625, 5.679931640625, 6.240234375, 6.800537109375, 7.36083984375, 7.921142578125, 8.4814453125, 9.041748046875, 9.60205078125, 10.162353515625, 10.72265625, 11.282958984375, 11.84326171875, 12.403564453125, 12.9638671875, 13.524169921875, 14.08447265625, 14.644775390625, 15.205078125, 15.765380859375, 16.32568359375, 16.885986328125, 17.4462890625, 18.006591796875, 18.56689453125, 19.127197265625, 19.6875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 8.0, 7.0, 9.0, 10.0, 14.0, 17.0, 14.0, 19.0, 31.0, 37.0, 35.0, 38.0, 30.0, 36.0, 36.0, 36.0, 42.0, 43.0, 55.0, 46.0, 42.0, 44.0, 29.0, 47.0, 37.0, 24.0, 31.0, 34.0, 23.0, 16.0, 19.0, 14.0, 10.0, 12.0, 7.0, 6.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.0, -18.349853515625, -17.69970703125, -17.049560546875, -16.3994140625, -15.749267578125, -15.09912109375, -14.448974609375, -13.798828125, -13.148681640625, -12.49853515625, -11.848388671875, -11.1982421875, -10.548095703125, -9.89794921875, -9.247802734375, -8.59765625, -7.947509765625, -7.29736328125, -6.647216796875, -5.9970703125, -5.346923828125, -4.69677734375, -4.046630859375, -3.396484375, -2.746337890625, -2.09619140625, -1.446044921875, -0.7958984375, -0.145751953125, 0.50439453125, 1.154541015625, 1.8046875, 2.454833984375, 3.10498046875, 3.755126953125, 4.4052734375, 5.055419921875, 5.70556640625, 6.355712890625, 7.005859375, 7.656005859375, 8.30615234375, 8.956298828125, 9.6064453125, 10.256591796875, 10.90673828125, 11.556884765625, 12.20703125, 12.857177734375, 13.50732421875, 14.157470703125, 14.8076171875, 15.457763671875, 16.10791015625, 16.758056640625, 17.408203125, 18.058349609375, 18.70849609375, 19.358642578125, 20.0087890625, 20.658935546875, 21.30908203125, 21.959228515625, 22.609375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 9.0, 13.0, 20.0, 43.0, 59.0, 96.0, 164.0, 257.0, 436.0, 731.0, 1313.0, 2193.0, 3665.0, 6121.0, 10192.0, 16761.0, 27300.0, 43981.0, 69806.0, 106494.0, 157553.0, 223436.0, 299336.0, 374806.0, 436955.0, 463122.0, 450467.0, 400731.0, 327970.0, 249918.0, 179856.0, 123473.0, 81611.0, 52500.0, 32909.0, 19956.0, 12151.0, 7204.0, 4286.0, 2559.0, 1537.0, 899.0, 576.0, 340.0, 209.0, 116.0, 67.0, 42.0, 18.0, 11.0, 10.0, 11.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5546875, -15.0306396484375, -14.506591796875, -13.9825439453125, -13.45849609375, -12.9344482421875, -12.410400390625, -11.8863525390625, -11.3623046875, -10.8382568359375, -10.314208984375, -9.7901611328125, -9.26611328125, -8.7420654296875, -8.218017578125, -7.6939697265625, -7.169921875, -6.6458740234375, -6.121826171875, -5.5977783203125, -5.07373046875, -4.5496826171875, -4.025634765625, -3.5015869140625, -2.9775390625, -2.4534912109375, -1.929443359375, -1.4053955078125, -0.88134765625, -0.3572998046875, 0.166748046875, 0.6907958984375, 1.21484375, 1.7388916015625, 2.262939453125, 2.7869873046875, 3.31103515625, 3.8350830078125, 4.359130859375, 4.8831787109375, 5.4072265625, 5.9312744140625, 6.455322265625, 6.9793701171875, 7.50341796875, 8.0274658203125, 8.551513671875, 9.0755615234375, 9.599609375, 10.1236572265625, 10.647705078125, 11.1717529296875, 11.69580078125, 12.2198486328125, 12.743896484375, 13.2679443359375, 13.7919921875, 14.3160400390625, 14.840087890625, 15.3641357421875, 15.88818359375, 16.4122314453125, 16.936279296875, 17.4603271484375, 17.984375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 6.0, 15.0, 18.0, 20.0, 16.0, 20.0, 32.0, 39.0, 39.0, 79.0, 60.0, 51.0, 83.0, 107.0, 141.0, 127.0, 154.0, 169.0, 175.0, 177.0, 202.0, 215.0, 203.0, 207.0, 186.0, 188.0, 174.0, 156.0, 157.0, 134.0, 120.0, 113.0, 101.0, 73.0, 54.0, 57.0, 43.0, 27.0, 22.0, 22.0, 16.0, 18.0, 12.0, 10.0, 5.0, 13.0, 2.0, 3.0, 2.0, 3.0, 3.0], "bins": [-10.1171875, -9.832763671875, -9.54833984375, -9.263916015625, -8.9794921875, -8.695068359375, -8.41064453125, -8.126220703125, -7.841796875, -7.557373046875, -7.27294921875, -6.988525390625, -6.7041015625, -6.419677734375, -6.13525390625, -5.850830078125, -5.56640625, -5.281982421875, -4.99755859375, -4.713134765625, -4.4287109375, -4.144287109375, -3.85986328125, -3.575439453125, -3.291015625, -3.006591796875, -2.72216796875, -2.437744140625, -2.1533203125, -1.868896484375, -1.58447265625, -1.300048828125, -1.015625, -0.731201171875, -0.44677734375, -0.162353515625, 0.1220703125, 0.406494140625, 0.69091796875, 0.975341796875, 1.259765625, 1.544189453125, 1.82861328125, 2.113037109375, 2.3974609375, 2.681884765625, 2.96630859375, 3.250732421875, 3.53515625, 3.819580078125, 4.10400390625, 4.388427734375, 4.6728515625, 4.957275390625, 5.24169921875, 5.526123046875, 5.810546875, 6.094970703125, 6.37939453125, 6.663818359375, 6.9482421875, 7.232666015625, 7.51708984375, 7.801513671875, 8.0859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 4.0, 5.0, 6.0, 10.0, 14.0, 5.0, 16.0, 12.0, 19.0, 19.0, 37.0, 25.0, 35.0, 27.0, 49.0, 59.0, 40.0, 43.0, 43.0, 50.0, 60.0, 39.0, 45.0, 30.0, 36.0, 45.0, 32.0, 23.0, 19.0, 16.0, 24.0, 15.0, 21.0, 10.0, 11.0, 12.0, 7.0, 10.0, 3.0, 6.0, 2.0, 1.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.732458114624023, -17.11579704284668, -16.499135971069336, -15.882474899291992, -15.265813827514648, -14.649152755737305, -14.032491683959961, -13.415830612182617, -12.799169540405273, -12.18250846862793, -11.565847396850586, -10.949186325073242, -10.332525253295898, -9.715864181518555, -9.099203109741211, -8.482542037963867, -7.865880966186523, -7.24921989440918, -6.632558822631836, -6.015897750854492, -5.399236679077148, -4.782575607299805, -4.165914535522461, -3.549253463745117, -2.9325923919677734, -2.3159313201904297, -1.699270248413086, -1.0826091766357422, -0.46594810485839844, 0.1507129669189453, 0.7673740386962891, 1.3840351104736328, 2.0006942749023438, 2.6173553466796875, 3.2340164184570312, 3.850677490234375, 4.467338562011719, 5.0839996337890625, 5.700660705566406, 6.31732177734375, 6.933982849121094, 7.5506439208984375, 8.167304992675781, 8.783966064453125, 9.400627136230469, 10.017288208007812, 10.633949279785156, 11.2506103515625, 11.867271423339844, 12.483932495117188, 13.100593566894531, 13.717254638671875, 14.333915710449219, 14.950576782226562, 15.567237854003906, 16.18389892578125, 16.800559997558594, 17.417221069335938, 18.03388214111328, 18.650543212890625, 19.26720428466797, 19.883865356445312, 20.500526428222656, 21.1171875, 21.733848571777344]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 3.0, 8.0, 10.0, 13.0, 15.0, 15.0, 14.0, 17.0, 19.0, 26.0, 26.0, 27.0, 23.0, 35.0, 35.0, 49.0, 36.0, 38.0, 41.0, 47.0, 35.0, 43.0, 39.0, 52.0, 25.0, 35.0, 29.0, 39.0, 32.0, 27.0, 30.0, 17.0, 21.0, 9.0, 11.0, 11.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.07156753540039, -21.348522186279297, -20.625476837158203, -19.90243148803711, -19.17938804626465, -18.456342697143555, -17.73329734802246, -17.010251998901367, -16.287208557128906, -15.564163208007812, -14.841118812561035, -14.118073463439941, -13.395029067993164, -12.67198371887207, -11.948938369750977, -11.225893020629883, -10.502847671508789, -9.779802322387695, -9.056757926940918, -8.333712577819824, -7.610667705535889, -6.887622833251953, -6.164577484130859, -5.441532611846924, -4.718487739562988, -3.9954428672790527, -3.272397756576538, -2.5493526458740234, -1.826307773590088, -1.1032629013061523, -0.3802175521850586, 0.34282732009887695, 1.0658721923828125, 1.7889171838760376, 2.5119621753692627, 3.2350072860717773, 3.958052158355713, 4.681097030639648, 5.404142379760742, 6.127187252044678, 6.850232124328613, 7.573276996612549, 8.296321868896484, 9.019367218017578, 9.742412567138672, 10.46545696258545, 11.188502311706543, 11.91154670715332, 12.634592056274414, 13.357637405395508, 14.080681800842285, 14.803727149963379, 15.526771545410156, 16.24981689453125, 16.972862243652344, 17.695907592773438, 18.41895294189453, 19.141998291015625, 19.86504364013672, 20.588088989257812, 21.311132431030273, 22.034177780151367, 22.75722312927246, 23.480268478393555, 24.203311920166016]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 18.0, 18.0, 32.0, 48.0, 66.0, 93.0, 130.0, 184.0, 277.0, 400.0, 629.0, 873.0, 1316.0, 1892.0, 2821.0, 4235.0, 6402.0, 9904.0, 14936.0, 23448.0, 37786.0, 60498.0, 95904.0, 147841.0, 195939.0, 158484.0, 104042.0, 65837.0, 41041.0, 25863.0, 16328.0, 10320.0, 6960.0, 4601.0, 2978.0, 2008.0, 1391.0, 900.0, 649.0, 450.0, 301.0, 199.0, 178.0, 88.0, 68.0, 63.0, 25.0, 19.0, 24.0, 20.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-3.8359375, -3.714508056640625, -3.59307861328125, -3.471649169921875, -3.3502197265625, -3.228790283203125, -3.10736083984375, -2.985931396484375, -2.864501953125, -2.743072509765625, -2.62164306640625, -2.500213623046875, -2.3787841796875, -2.257354736328125, -2.13592529296875, -2.014495849609375, -1.89306640625, -1.771636962890625, -1.65020751953125, -1.528778076171875, -1.4073486328125, -1.285919189453125, -1.16448974609375, -1.043060302734375, -0.921630859375, -0.800201416015625, -0.67877197265625, -0.557342529296875, -0.4359130859375, -0.314483642578125, -0.19305419921875, -0.071624755859375, 0.0498046875, 0.171234130859375, 0.29266357421875, 0.414093017578125, 0.5355224609375, 0.656951904296875, 0.77838134765625, 0.899810791015625, 1.021240234375, 1.142669677734375, 1.26409912109375, 1.385528564453125, 1.5069580078125, 1.628387451171875, 1.74981689453125, 1.871246337890625, 1.99267578125, 2.114105224609375, 2.23553466796875, 2.356964111328125, 2.4783935546875, 2.599822998046875, 2.72125244140625, 2.842681884765625, 2.964111328125, 3.085540771484375, 3.20697021484375, 3.328399658203125, 3.4498291015625, 3.571258544921875, 3.69268798828125, 3.814117431640625, 3.935546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 9.0, 11.0, 15.0, 15.0, 20.0, 14.0, 18.0, 15.0, 20.0, 24.0, 21.0, 23.0, 34.0, 36.0, 40.0, 37.0, 42.0, 39.0, 39.0, 45.0, 38.0, 52.0, 36.0, 35.0, 30.0, 27.0, 30.0, 36.0, 24.0, 36.0, 21.0, 17.0, 13.0, 11.0, 11.0, 15.0, 9.0, 6.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.21875, -19.49658203125, -18.7744140625, -18.05224609375, -17.330078125, -16.60791015625, -15.8857421875, -15.16357421875, -14.44140625, -13.71923828125, -12.9970703125, -12.27490234375, -11.552734375, -10.83056640625, -10.1083984375, -9.38623046875, -8.6640625, -7.94189453125, -7.2197265625, -6.49755859375, -5.775390625, -5.05322265625, -4.3310546875, -3.60888671875, -2.88671875, -2.16455078125, -1.4423828125, -0.72021484375, 0.001953125, 0.72412109375, 1.4462890625, 2.16845703125, 2.890625, 3.61279296875, 4.3349609375, 5.05712890625, 5.779296875, 6.50146484375, 7.2236328125, 7.94580078125, 8.66796875, 9.39013671875, 10.1123046875, 10.83447265625, 11.556640625, 12.27880859375, 13.0009765625, 13.72314453125, 14.4453125, 15.16748046875, 15.8896484375, 16.61181640625, 17.333984375, 18.05615234375, 18.7783203125, 19.50048828125, 20.22265625, 20.94482421875, 21.6669921875, 22.38916015625, 23.111328125, 23.83349609375, 24.5556640625, 25.27783203125, 26.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 12.0, 18.0, 29.0, 29.0, 55.0, 94.0, 131.0, 230.0, 332.0, 582.0, 877.0, 1339.0, 2114.0, 3514.0, 5887.0, 9978.0, 16806.0, 29348.0, 52397.0, 97171.0, 187935.0, 271645.0, 168547.0, 87558.0, 47323.0, 26628.0, 15205.0, 8922.0, 5359.0, 3292.0, 1896.0, 1225.0, 725.0, 491.0, 322.0, 213.0, 115.0, 76.0, 59.0, 25.0, 11.0, 21.0, 11.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.33203125, -4.202392578125, -4.07275390625, -3.943115234375, -3.8134765625, -3.683837890625, -3.55419921875, -3.424560546875, -3.294921875, -3.165283203125, -3.03564453125, -2.906005859375, -2.7763671875, -2.646728515625, -2.51708984375, -2.387451171875, -2.2578125, -2.128173828125, -1.99853515625, -1.868896484375, -1.7392578125, -1.609619140625, -1.47998046875, -1.350341796875, -1.220703125, -1.091064453125, -0.96142578125, -0.831787109375, -0.7021484375, -0.572509765625, -0.44287109375, -0.313232421875, -0.18359375, -0.053955078125, 0.07568359375, 0.205322265625, 0.3349609375, 0.464599609375, 0.59423828125, 0.723876953125, 0.853515625, 0.983154296875, 1.11279296875, 1.242431640625, 1.3720703125, 1.501708984375, 1.63134765625, 1.760986328125, 1.890625, 2.020263671875, 2.14990234375, 2.279541015625, 2.4091796875, 2.538818359375, 2.66845703125, 2.798095703125, 2.927734375, 3.057373046875, 3.18701171875, 3.316650390625, 3.4462890625, 3.575927734375, 3.70556640625, 3.835205078125, 3.96484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 7.0, 8.0, 6.0, 3.0, 3.0, 7.0, 5.0, 14.0, 13.0, 19.0, 21.0, 29.0, 31.0, 25.0, 16.0, 27.0, 33.0, 45.0, 38.0, 39.0, 38.0, 41.0, 45.0, 38.0, 46.0, 40.0, 53.0, 29.0, 45.0, 33.0, 22.0, 20.0, 28.0, 21.0, 19.0, 23.0, 17.0, 18.0, 9.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.45751953125, -12.9775390625, -12.49755859375, -12.017578125, -11.53759765625, -11.0576171875, -10.57763671875, -10.09765625, -9.61767578125, -9.1376953125, -8.65771484375, -8.177734375, -7.69775390625, -7.2177734375, -6.73779296875, -6.2578125, -5.77783203125, -5.2978515625, -4.81787109375, -4.337890625, -3.85791015625, -3.3779296875, -2.89794921875, -2.41796875, -1.93798828125, -1.4580078125, -0.97802734375, -0.498046875, -0.01806640625, 0.4619140625, 0.94189453125, 1.421875, 1.90185546875, 2.3818359375, 2.86181640625, 3.341796875, 3.82177734375, 4.3017578125, 4.78173828125, 5.26171875, 5.74169921875, 6.2216796875, 6.70166015625, 7.181640625, 7.66162109375, 8.1416015625, 8.62158203125, 9.1015625, 9.58154296875, 10.0615234375, 10.54150390625, 11.021484375, 11.50146484375, 11.9814453125, 12.46142578125, 12.94140625, 13.42138671875, 13.9013671875, 14.38134765625, 14.861328125, 15.34130859375, 15.8212890625, 16.30126953125, 16.78125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 7.0, 2.0, 3.0, 8.0, 6.0, 8.0, 19.0, 21.0, 35.0, 51.0, 78.0, 93.0, 134.0, 164.0, 247.0, 339.0, 529.0, 765.0, 1060.0, 1505.0, 2376.0, 3424.0, 5241.0, 8154.0, 12614.0, 20724.0, 34925.0, 63336.0, 128071.0, 292836.0, 236625.0, 101664.0, 52605.0, 30236.0, 18167.0, 11098.0, 7112.0, 4561.0, 2999.0, 2065.0, 1443.0, 957.0, 660.0, 472.0, 316.0, 224.0, 161.0, 120.0, 81.0, 60.0, 40.0, 40.0, 25.0, 18.0, 16.0, 11.0, 9.0, 2.0, 5.0, 4.0, 3.0], "bins": [-0.276611328125, -0.2681922912597656, -0.25977325439453125, -0.2513542175292969, -0.2429351806640625, -0.23451614379882812, -0.22609710693359375, -0.21767807006835938, -0.209259033203125, -0.20083999633789062, -0.19242095947265625, -0.18400192260742188, -0.1755828857421875, -0.16716384887695312, -0.15874481201171875, -0.15032577514648438, -0.14190673828125, -0.13348770141601562, -0.12506866455078125, -0.11664962768554688, -0.1082305908203125, -0.09981155395507812, -0.09139251708984375, -0.08297348022460938, -0.074554443359375, -0.06613540649414062, -0.05771636962890625, -0.049297332763671875, -0.0408782958984375, -0.032459259033203125, -0.02404022216796875, -0.015621185302734375, -0.0072021484375, 0.001216888427734375, 0.00963592529296875, 0.018054962158203125, 0.0264739990234375, 0.034893035888671875, 0.04331207275390625, 0.051731109619140625, 0.060150146484375, 0.06856918334960938, 0.07698822021484375, 0.08540725708007812, 0.0938262939453125, 0.10224533081054688, 0.11066436767578125, 0.11908340454101562, 0.12750244140625, 0.13592147827148438, 0.14434051513671875, 0.15275955200195312, 0.1611785888671875, 0.16959762573242188, 0.17801666259765625, 0.18643569946289062, 0.194854736328125, 0.20327377319335938, 0.21169281005859375, 0.22011184692382812, 0.2285308837890625, 0.23694992065429688, 0.24536895751953125, 0.2537879943847656, 0.26220703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 8.0, 15.0, 19.0, 21.0, 28.0, 25.0, 39.0, 37.0, 38.0, 59.0, 46.0, 55.0, 50.0, 65.0, 60.0, 60.0, 59.0, 43.0, 45.0, 54.0, 22.0, 30.0, 18.0, 23.0, 10.0, 6.0, 14.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8041343688964844e-05, -4.660803824663162e-05, -4.51747328042984e-05, -4.374142736196518e-05, -4.230812191963196e-05, -4.0874816477298737e-05, -3.9441511034965515e-05, -3.8008205592632294e-05, -3.657490015029907e-05, -3.514159470796585e-05, -3.370828926563263e-05, -3.227498382329941e-05, -3.0841678380966187e-05, -2.9408372938632965e-05, -2.7975067496299744e-05, -2.6541762053966522e-05, -2.51084566116333e-05, -2.367515116930008e-05, -2.2241845726966858e-05, -2.0808540284633636e-05, -1.9375234842300415e-05, -1.7941929399967194e-05, -1.6508623957633972e-05, -1.507531851530075e-05, -1.364201307296753e-05, -1.2208707630634308e-05, -1.0775402188301086e-05, -9.342096745967865e-06, -7.908791303634644e-06, -6.475485861301422e-06, -5.042180418968201e-06, -3.6088749766349792e-06, -2.175569534301758e-06, -7.422640919685364e-07, 6.910413503646851e-07, 2.1243467926979065e-06, 3.557652235031128e-06, 4.990957677364349e-06, 6.424263119697571e-06, 7.857568562030792e-06, 9.290874004364014e-06, 1.0724179446697235e-05, 1.2157484889030457e-05, 1.3590790331363678e-05, 1.50240957736969e-05, 1.645740121603012e-05, 1.7890706658363342e-05, 1.9324012100696564e-05, 2.0757317543029785e-05, 2.2190622985363007e-05, 2.3623928427696228e-05, 2.505723387002945e-05, 2.649053931236267e-05, 2.7923844754695892e-05, 2.9357150197029114e-05, 3.0790455639362335e-05, 3.222376108169556e-05, 3.365706652402878e-05, 3.5090371966362e-05, 3.652367740869522e-05, 3.795698285102844e-05, 3.9390288293361664e-05, 4.0823593735694885e-05, 4.225689917802811e-05, 4.369020462036133e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 9.0, 5.0, 15.0, 25.0, 41.0, 68.0, 88.0, 140.0, 188.0, 325.0, 411.0, 709.0, 1024.0, 1503.0, 2260.0, 3430.0, 5388.0, 8301.0, 13218.0, 21459.0, 36230.0, 61623.0, 115788.0, 275348.0, 247030.0, 106490.0, 58012.0, 33740.0, 20278.0, 12479.0, 8049.0, 5011.0, 3283.0, 2274.0, 1513.0, 905.0, 628.0, 424.0, 272.0, 210.0, 123.0, 82.0, 69.0, 30.0, 25.0, 14.0, 10.0, 7.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77685546875, -0.7532730102539062, -0.7296905517578125, -0.7061080932617188, -0.682525634765625, -0.6589431762695312, -0.6353607177734375, -0.6117782592773438, -0.58819580078125, -0.5646133422851562, -0.5410308837890625, -0.5174484252929688, -0.493865966796875, -0.47028350830078125, -0.4467010498046875, -0.42311859130859375, -0.3995361328125, -0.37595367431640625, -0.3523712158203125, -0.32878875732421875, -0.305206298828125, -0.28162384033203125, -0.2580413818359375, -0.23445892333984375, -0.21087646484375, -0.18729400634765625, -0.1637115478515625, -0.14012908935546875, -0.116546630859375, -0.09296417236328125, -0.0693817138671875, -0.04579925537109375, -0.022216796875, 0.00136566162109375, 0.0249481201171875, 0.04853057861328125, 0.072113037109375, 0.09569549560546875, 0.1192779541015625, 0.14286041259765625, 0.16644287109375, 0.19002532958984375, 0.2136077880859375, 0.23719024658203125, 0.260772705078125, 0.28435516357421875, 0.3079376220703125, 0.33152008056640625, 0.3551025390625, 0.37868499755859375, 0.4022674560546875, 0.42584991455078125, 0.449432373046875, 0.47301483154296875, 0.4965972900390625, 0.5201797485351562, 0.54376220703125, 0.5673446655273438, 0.5909271240234375, 0.6145095825195312, 0.638092041015625, 0.6616744995117188, 0.6852569580078125, 0.7088394165039062, 0.732421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 5.0, 11.0, 8.0, 5.0, 10.0, 15.0, 12.0, 33.0, 27.0, 30.0, 31.0, 37.0, 35.0, 56.0, 82.0, 106.0, 105.0, 75.0, 65.0, 39.0, 31.0, 29.0, 27.0, 24.0, 16.0, 11.0, 14.0, 16.0, 10.0, 12.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.44775390625, -0.4352684020996094, -0.42278289794921875, -0.4102973937988281, -0.3978118896484375, -0.3853263854980469, -0.37284088134765625, -0.3603553771972656, -0.347869873046875, -0.3353843688964844, -0.32289886474609375, -0.3104133605957031, -0.2979278564453125, -0.2854423522949219, -0.27295684814453125, -0.2604713439941406, -0.24798583984375, -0.23550033569335938, -0.22301483154296875, -0.21052932739257812, -0.1980438232421875, -0.18555831909179688, -0.17307281494140625, -0.16058731079101562, -0.148101806640625, -0.13561630249023438, -0.12313079833984375, -0.11064529418945312, -0.0981597900390625, -0.08567428588867188, -0.07318878173828125, -0.060703277587890625, -0.0482177734375, -0.035732269287109375, -0.02324676513671875, -0.010761260986328125, 0.0017242431640625, 0.014209747314453125, 0.02669525146484375, 0.039180755615234375, 0.051666259765625, 0.06415176391601562, 0.07663726806640625, 0.08912277221679688, 0.1016082763671875, 0.11409378051757812, 0.12657928466796875, 0.13906478881835938, 0.15155029296875, 0.16403579711914062, 0.17652130126953125, 0.18900680541992188, 0.2014923095703125, 0.21397781372070312, 0.22646331787109375, 0.23894882202148438, 0.251434326171875, 0.2639198303222656, 0.27640533447265625, 0.2888908386230469, 0.3013763427734375, 0.3138618469238281, 0.32634735107421875, 0.3388328552246094, 0.351318359375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 0.0, 6.0, 2.0, 2.0, 5.0, 4.0, 5.0, 3.0, 10.0, 13.0, 10.0, 4.0, 18.0, 16.0, 17.0, 23.0, 25.0, 30.0, 39.0, 33.0, 43.0, 51.0, 42.0, 45.0, 37.0, 61.0, 44.0, 41.0, 38.0, 36.0, 37.0, 37.0, 32.0, 28.0, 24.0, 13.0, 19.0, 18.0, 19.0, 14.0, 12.0, 11.0, 8.0, 10.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.975675582885742, -16.385644912719727, -15.795613288879395, -15.205582618713379, -14.615550994873047, -14.025520324707031, -13.435489654541016, -12.845458984375, -12.255427360534668, -11.665396690368652, -11.07536506652832, -10.485334396362305, -9.895303726196289, -9.305272102355957, -8.715241432189941, -8.12520980834961, -7.535179138183594, -6.94514799118042, -6.355116844177246, -5.7650861740112305, -5.175055027008057, -4.585023880004883, -3.994992971420288, -3.4049620628356934, -2.8149309158325195, -2.2248997688293457, -1.634868860244751, -1.0448378324508667, -0.4548068046569824, 0.1352243423461914, 0.7252552509307861, 1.3152861595153809, 1.9053192138671875, 2.4953503608703613, 3.085381269454956, 3.675412178039551, 4.265443325042725, 4.855474472045898, 5.445505142211914, 6.035536289215088, 6.625567436218262, 7.2155985832214355, 7.805629730224609, 8.395660400390625, 8.98569107055664, 9.575722694396973, 10.165753364562988, 10.75578498840332, 11.345815658569336, 11.935846328735352, 12.525877952575684, 13.1159086227417, 13.705940246582031, 14.295970916748047, 14.886001586914062, 15.476032257080078, 16.066062927246094, 16.65609359741211, 17.246124267578125, 17.836156845092773, 18.42618751525879, 19.016218185424805, 19.60624885559082, 20.196279525756836, 20.786312103271484]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 2.0, 11.0, 6.0, 14.0, 13.0, 13.0, 20.0, 14.0, 18.0, 26.0, 25.0, 27.0, 22.0, 29.0, 40.0, 38.0, 43.0, 36.0, 46.0, 34.0, 42.0, 40.0, 42.0, 50.0, 36.0, 26.0, 35.0, 32.0, 37.0, 27.0, 26.0, 27.0, 12.0, 18.0, 12.0, 8.0, 9.0, 11.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.029541015625, -21.3182315826416, -20.606924057006836, -19.895614624023438, -19.18430519104004, -18.47299575805664, -17.761688232421875, -17.050378799438477, -16.339069366455078, -15.627760887145996, -14.916451454162598, -14.205142974853516, -13.493833541870117, -12.782525062561035, -12.071216583251953, -11.359907150268555, -10.648599624633789, -9.937291145324707, -9.225981712341309, -8.514673233032227, -7.803364276885986, -7.092055320739746, -6.380746841430664, -5.669437885284424, -4.958128929138184, -4.246819972991943, -3.5355112552642822, -2.824202537536621, -2.112893581390381, -1.4015846252441406, -0.6902761459350586, 0.02103281021118164, 0.7323398590087891, 1.4436486959457397, 2.1549575328826904, 2.8662662506103516, 3.577575206756592, 4.288884162902832, 5.000192642211914, 5.711501598358154, 6.4228105545043945, 7.134119510650635, 7.845428466796875, 8.556736946105957, 9.268045425415039, 9.979354858398438, 10.69066333770752, 11.401971817016602, 12.11328125, 12.824589729309082, 13.53589916229248, 14.247207641601562, 14.958517074584961, 15.669825553894043, 16.381134033203125, 17.092443466186523, 17.803752899169922, 18.51506233215332, 19.226369857788086, 19.937679290771484, 20.648988723754883, 21.36029815673828, 22.071605682373047, 22.782915115356445, 23.49422264099121]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 11.0, 25.0, 20.0, 24.0, 50.0, 68.0, 97.0, 148.0, 242.0, 348.0, 527.0, 812.0, 1268.0, 1903.0, 2998.0, 4504.0, 6926.0, 10882.0, 15985.0, 23698.0, 33894.0, 46093.0, 61897.0, 78232.0, 93243.0, 103147.0, 106082.0, 100920.0, 89005.0, 73115.0, 57091.0, 42675.0, 30405.0, 20891.0, 14291.0, 9323.0, 6093.0, 4063.0, 2640.0, 1683.0, 1153.0, 725.0, 486.0, 301.0, 188.0, 128.0, 83.0, 69.0, 35.0, 30.0, 16.0, 12.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0], "bins": [-14.5625, -14.1123046875, -13.662109375, -13.2119140625, -12.76171875, -12.3115234375, -11.861328125, -11.4111328125, -10.9609375, -10.5107421875, -10.060546875, -9.6103515625, -9.16015625, -8.7099609375, -8.259765625, -7.8095703125, -7.359375, -6.9091796875, -6.458984375, -6.0087890625, -5.55859375, -5.1083984375, -4.658203125, -4.2080078125, -3.7578125, -3.3076171875, -2.857421875, -2.4072265625, -1.95703125, -1.5068359375, -1.056640625, -0.6064453125, -0.15625, 0.2939453125, 0.744140625, 1.1943359375, 1.64453125, 2.0947265625, 2.544921875, 2.9951171875, 3.4453125, 3.8955078125, 4.345703125, 4.7958984375, 5.24609375, 5.6962890625, 6.146484375, 6.5966796875, 7.046875, 7.4970703125, 7.947265625, 8.3974609375, 8.84765625, 9.2978515625, 9.748046875, 10.1982421875, 10.6484375, 11.0986328125, 11.548828125, 11.9990234375, 12.44921875, 12.8994140625, 13.349609375, 13.7998046875, 14.25]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 5.0, 7.0, 15.0, 8.0, 11.0, 17.0, 19.0, 31.0, 28.0, 16.0, 30.0, 30.0, 34.0, 31.0, 37.0, 46.0, 42.0, 45.0, 34.0, 55.0, 46.0, 35.0, 40.0, 46.0, 42.0, 45.0, 27.0, 34.0, 19.0, 21.0, 21.0, 16.0, 14.0, 9.0, 13.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.3125, -22.54833984375, -21.7841796875, -21.02001953125, -20.255859375, -19.49169921875, -18.7275390625, -17.96337890625, -17.19921875, -16.43505859375, -15.6708984375, -14.90673828125, -14.142578125, -13.37841796875, -12.6142578125, -11.85009765625, -11.0859375, -10.32177734375, -9.5576171875, -8.79345703125, -8.029296875, -7.26513671875, -6.5009765625, -5.73681640625, -4.97265625, -4.20849609375, -3.4443359375, -2.68017578125, -1.916015625, -1.15185546875, -0.3876953125, 0.37646484375, 1.140625, 1.90478515625, 2.6689453125, 3.43310546875, 4.197265625, 4.96142578125, 5.7255859375, 6.48974609375, 7.25390625, 8.01806640625, 8.7822265625, 9.54638671875, 10.310546875, 11.07470703125, 11.8388671875, 12.60302734375, 13.3671875, 14.13134765625, 14.8955078125, 15.65966796875, 16.423828125, 17.18798828125, 17.9521484375, 18.71630859375, 19.48046875, 20.24462890625, 21.0087890625, 21.77294921875, 22.537109375, 23.30126953125, 24.0654296875, 24.82958984375, 25.59375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 6.0, 7.0, 9.0, 18.0, 28.0, 47.0, 67.0, 104.0, 155.0, 281.0, 402.0, 630.0, 1103.0, 1737.0, 3001.0, 4823.0, 7719.0, 12526.0, 19708.0, 30481.0, 45227.0, 64571.0, 86510.0, 105724.0, 120711.0, 121862.0, 111201.0, 93039.0, 71247.0, 50701.0, 34672.0, 22626.0, 14280.0, 8924.0, 5591.0, 3371.0, 2133.0, 1347.0, 742.0, 455.0, 314.0, 186.0, 95.0, 65.0, 36.0, 32.0, 17.0, 12.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-17.1875, -16.6690673828125, -16.150634765625, -15.6322021484375, -15.11376953125, -14.5953369140625, -14.076904296875, -13.5584716796875, -13.0400390625, -12.5216064453125, -12.003173828125, -11.4847412109375, -10.96630859375, -10.4478759765625, -9.929443359375, -9.4110107421875, -8.892578125, -8.3741455078125, -7.855712890625, -7.3372802734375, -6.81884765625, -6.3004150390625, -5.781982421875, -5.2635498046875, -4.7451171875, -4.2266845703125, -3.708251953125, -3.1898193359375, -2.67138671875, -2.1529541015625, -1.634521484375, -1.1160888671875, -0.59765625, -0.0792236328125, 0.439208984375, 0.9576416015625, 1.47607421875, 1.9945068359375, 2.512939453125, 3.0313720703125, 3.5498046875, 4.0682373046875, 4.586669921875, 5.1051025390625, 5.62353515625, 6.1419677734375, 6.660400390625, 7.1788330078125, 7.697265625, 8.2156982421875, 8.734130859375, 9.2525634765625, 9.77099609375, 10.2894287109375, 10.807861328125, 11.3262939453125, 11.8447265625, 12.3631591796875, 12.881591796875, 13.4000244140625, 13.91845703125, 14.4368896484375, 14.955322265625, 15.4737548828125, 15.9921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 5.0, 5.0, 10.0, 6.0, 4.0, 13.0, 18.0, 13.0, 32.0, 29.0, 16.0, 22.0, 24.0, 31.0, 40.0, 22.0, 41.0, 39.0, 36.0, 38.0, 48.0, 46.0, 44.0, 33.0, 35.0, 43.0, 30.0, 29.0, 25.0, 34.0, 24.0, 25.0, 33.0, 16.0, 11.0, 16.0, 11.0, 12.0, 7.0, 8.0, 4.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.53125, -13.092529296875, -12.65380859375, -12.215087890625, -11.7763671875, -11.337646484375, -10.89892578125, -10.460205078125, -10.021484375, -9.582763671875, -9.14404296875, -8.705322265625, -8.2666015625, -7.827880859375, -7.38916015625, -6.950439453125, -6.51171875, -6.072998046875, -5.63427734375, -5.195556640625, -4.7568359375, -4.318115234375, -3.87939453125, -3.440673828125, -3.001953125, -2.563232421875, -2.12451171875, -1.685791015625, -1.2470703125, -0.808349609375, -0.36962890625, 0.069091796875, 0.5078125, 0.946533203125, 1.38525390625, 1.823974609375, 2.2626953125, 2.701416015625, 3.14013671875, 3.578857421875, 4.017578125, 4.456298828125, 4.89501953125, 5.333740234375, 5.7724609375, 6.211181640625, 6.64990234375, 7.088623046875, 7.52734375, 7.966064453125, 8.40478515625, 8.843505859375, 9.2822265625, 9.720947265625, 10.15966796875, 10.598388671875, 11.037109375, 11.475830078125, 11.91455078125, 12.353271484375, 12.7919921875, 13.230712890625, 13.66943359375, 14.108154296875, 14.546875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 18.0, 33.0, 44.0, 82.0, 153.0, 182.0, 262.0, 462.0, 715.0, 1098.0, 1705.0, 2948.0, 4596.0, 7470.0, 11714.0, 18991.0, 29066.0, 43897.0, 62389.0, 84717.0, 105703.0, 119541.0, 123002.0, 113273.0, 94886.0, 72497.0, 51984.0, 35046.0, 22844.0, 14477.0, 9243.0, 5781.0, 3587.0, 2235.0, 1402.0, 937.0, 557.0, 349.0, 242.0, 167.0, 74.0, 58.0, 32.0, 21.0, 17.0, 11.0, 13.0, 8.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.2802734375, -4.138671875, -3.9970703125, -3.85546875, -3.7138671875, -3.572265625, -3.4306640625, -3.2890625, -3.1474609375, -3.005859375, -2.8642578125, -2.72265625, -2.5810546875, -2.439453125, -2.2978515625, -2.15625, -2.0146484375, -1.873046875, -1.7314453125, -1.58984375, -1.4482421875, -1.306640625, -1.1650390625, -1.0234375, -0.8818359375, -0.740234375, -0.5986328125, -0.45703125, -0.3154296875, -0.173828125, -0.0322265625, 0.109375, 0.2509765625, 0.392578125, 0.5341796875, 0.67578125, 0.8173828125, 0.958984375, 1.1005859375, 1.2421875, 1.3837890625, 1.525390625, 1.6669921875, 1.80859375, 1.9501953125, 2.091796875, 2.2333984375, 2.375, 2.5166015625, 2.658203125, 2.7998046875, 2.94140625, 3.0830078125, 3.224609375, 3.3662109375, 3.5078125, 3.6494140625, 3.791015625, 3.9326171875, 4.07421875, 4.2158203125, 4.357421875, 4.4990234375, 4.640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 5.0, 12.0, 7.0, 12.0, 13.0, 17.0, 26.0, 24.0, 37.0, 36.0, 38.0, 45.0, 41.0, 54.0, 47.0, 54.0, 38.0, 40.0, 42.0, 34.0, 41.0, 40.0, 32.0, 22.0, 40.0, 30.0, 29.0, 20.0, 25.0, 17.0, 15.0, 15.0, 5.0, 13.0, 4.0, 2.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040340423583984375, -0.0003894492983818054, -0.0003754943609237671, -0.00036153942346572876, -0.00034758448600769043, -0.0003336295485496521, -0.00031967461109161377, -0.00030571967363357544, -0.0002917647361755371, -0.0002778097987174988, -0.00026385486125946045, -0.0002498999238014221, -0.0002359449863433838, -0.00022199004888534546, -0.00020803511142730713, -0.0001940801739692688, -0.00018012523651123047, -0.00016617029905319214, -0.0001522153615951538, -0.00013826042413711548, -0.00012430548667907715, -0.00011035054922103882, -9.639561176300049e-05, -8.244067430496216e-05, -6.848573684692383e-05, -5.45307993888855e-05, -4.057586193084717e-05, -2.6620924472808838e-05, -1.2665987014770508e-05, 1.2889504432678223e-06, 1.5243887901306152e-05, 2.9198825359344482e-05, 4.315376281738281e-05, 5.710870027542114e-05, 7.106363773345947e-05, 8.50185751914978e-05, 9.897351264953613e-05, 0.00011292845010757446, 0.0001268833875656128, 0.00014083832502365112, 0.00015479326248168945, 0.00016874819993972778, 0.0001827031373977661, 0.00019665807485580444, 0.00021061301231384277, 0.0002245679497718811, 0.00023852288722991943, 0.00025247782468795776, 0.0002664327621459961, 0.0002803876996040344, 0.00029434263706207275, 0.0003082975745201111, 0.0003222525119781494, 0.00033620744943618774, 0.0003501623868942261, 0.0003641173243522644, 0.00037807226181030273, 0.00039202719926834106, 0.0004059821367263794, 0.0004199370741844177, 0.00043389201164245605, 0.0004478469491004944, 0.0004618018865585327, 0.00047575682401657104, 0.0004897117614746094]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 9.0, 10.0, 12.0, 17.0, 24.0, 38.0, 45.0, 60.0, 102.0, 160.0, 242.0, 363.0, 598.0, 913.0, 1378.0, 2106.0, 3398.0, 5576.0, 8796.0, 14558.0, 22824.0, 36460.0, 54787.0, 78026.0, 104328.0, 124743.0, 133656.0, 124484.0, 103535.0, 77329.0, 54232.0, 35626.0, 22484.0, 14206.0, 8575.0, 5412.0, 3440.0, 2096.0, 1344.0, 851.0, 585.0, 382.0, 236.0, 177.0, 97.0, 75.0, 56.0, 46.0, 20.0, 18.0, 10.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0], "bins": [-5.47265625, -5.3092041015625, -5.145751953125, -4.9822998046875, -4.81884765625, -4.6553955078125, -4.491943359375, -4.3284912109375, -4.1650390625, -4.0015869140625, -3.838134765625, -3.6746826171875, -3.51123046875, -3.3477783203125, -3.184326171875, -3.0208740234375, -2.857421875, -2.6939697265625, -2.530517578125, -2.3670654296875, -2.20361328125, -2.0401611328125, -1.876708984375, -1.7132568359375, -1.5498046875, -1.3863525390625, -1.222900390625, -1.0594482421875, -0.89599609375, -0.7325439453125, -0.569091796875, -0.4056396484375, -0.2421875, -0.0787353515625, 0.084716796875, 0.2481689453125, 0.41162109375, 0.5750732421875, 0.738525390625, 0.9019775390625, 1.0654296875, 1.2288818359375, 1.392333984375, 1.5557861328125, 1.71923828125, 1.8826904296875, 2.046142578125, 2.2095947265625, 2.373046875, 2.5364990234375, 2.699951171875, 2.8634033203125, 3.02685546875, 3.1903076171875, 3.353759765625, 3.5172119140625, 3.6806640625, 3.8441162109375, 4.007568359375, 4.1710205078125, 4.33447265625, 4.4979248046875, 4.661376953125, 4.8248291015625, 4.98828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 9.0, 7.0, 5.0, 14.0, 13.0, 19.0, 22.0, 24.0, 33.0, 34.0, 35.0, 46.0, 40.0, 46.0, 51.0, 58.0, 51.0, 55.0, 37.0, 57.0, 47.0, 41.0, 39.0, 40.0, 26.0, 35.0, 22.0, 15.0, 18.0, 12.0, 7.0, 10.0, 6.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.94921875, -2.866851806640625, -2.78448486328125, -2.702117919921875, -2.6197509765625, -2.537384033203125, -2.45501708984375, -2.372650146484375, -2.290283203125, -2.207916259765625, -2.12554931640625, -2.043182373046875, -1.9608154296875, -1.878448486328125, -1.79608154296875, -1.713714599609375, -1.63134765625, -1.548980712890625, -1.46661376953125, -1.384246826171875, -1.3018798828125, -1.219512939453125, -1.13714599609375, -1.054779052734375, -0.972412109375, -0.890045166015625, -0.80767822265625, -0.725311279296875, -0.6429443359375, -0.560577392578125, -0.47821044921875, -0.395843505859375, -0.3134765625, -0.231109619140625, -0.14874267578125, -0.066375732421875, 0.0159912109375, 0.098358154296875, 0.18072509765625, 0.263092041015625, 0.345458984375, 0.427825927734375, 0.51019287109375, 0.592559814453125, 0.6749267578125, 0.757293701171875, 0.83966064453125, 0.922027587890625, 1.00439453125, 1.086761474609375, 1.16912841796875, 1.251495361328125, 1.3338623046875, 1.416229248046875, 1.49859619140625, 1.580963134765625, 1.663330078125, 1.745697021484375, 1.82806396484375, 1.910430908203125, 1.9927978515625, 2.075164794921875, 2.15753173828125, 2.239898681640625, 2.322265625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 2.0, 8.0, 11.0, 14.0, 13.0, 8.0, 14.0, 28.0, 20.0, 34.0, 34.0, 35.0, 44.0, 52.0, 50.0, 60.0, 52.0, 60.0, 36.0, 39.0, 45.0, 50.0, 35.0, 43.0, 30.0, 29.0, 22.0, 18.0, 13.0, 13.0, 14.0, 14.0, 12.0, 7.0, 6.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-20.028152465820312, -19.368614196777344, -18.709077835083008, -18.049541473388672, -17.390003204345703, -16.730464935302734, -16.0709285736084, -15.411391258239746, -14.751853942871094, -14.092316627502441, -13.432779312133789, -12.773241996765137, -12.113704681396484, -11.454167366027832, -10.79463005065918, -10.135092735290527, -9.475555419921875, -8.816018104553223, -8.15648078918457, -7.496943473815918, -6.837406158447266, -6.177868843078613, -5.518331527709961, -4.858794212341309, -4.199256896972656, -3.539719581604004, -2.8801822662353516, -2.220644950866699, -1.5611076354980469, -0.9015703201293945, -0.2420330047607422, 0.41750431060791016, 1.0770397186279297, 1.736577033996582, 2.3961143493652344, 3.0556516647338867, 3.715188980102539, 4.374726295471191, 5.034263610839844, 5.693800926208496, 6.353338241577148, 7.012875556945801, 7.672412872314453, 8.331950187683105, 8.991487503051758, 9.65102481842041, 10.310562133789062, 10.970099449157715, 11.629636764526367, 12.28917407989502, 12.948711395263672, 13.608248710632324, 14.267786026000977, 14.927323341369629, 15.586860656738281, 16.24639892578125, 16.905935287475586, 17.565471649169922, 18.22500991821289, 18.88454818725586, 19.544084548950195, 20.20362091064453, 20.8631591796875, 21.52269744873047, 22.182233810424805]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 4.0, 7.0, 12.0, 7.0, 10.0, 17.0, 8.0, 7.0, 22.0, 25.0, 24.0, 22.0, 31.0, 21.0, 46.0, 33.0, 43.0, 36.0, 40.0, 33.0, 28.0, 47.0, 27.0, 45.0, 43.0, 43.0, 36.0, 42.0, 35.0, 29.0, 28.0, 16.0, 21.0, 18.0, 18.0, 10.0, 13.0, 8.0, 9.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.120607376098633, -22.418781280517578, -21.716955184936523, -21.01512908935547, -20.31330108642578, -19.611474990844727, -18.909648895263672, -18.207822799682617, -17.505996704101562, -16.804170608520508, -16.102344512939453, -15.400517463684082, -14.698690414428711, -13.996864318847656, -13.295038223266602, -12.593212127685547, -11.89138412475586, -11.189558029174805, -10.487730979919434, -9.785904884338379, -9.084077835083008, -8.382251739501953, -7.680425643920898, -6.9785990715026855, -6.276772499084473, -5.57494592666626, -4.873119354248047, -4.171293258666992, -3.4694666862487793, -2.7676401138305664, -2.0658140182495117, -1.3639874458312988, -0.6621589660644531, 0.039667487144470215, 0.7414939403533936, 1.4433202743530273, 2.1451468467712402, 2.846973419189453, 3.548799514770508, 4.250626087188721, 4.952452659606934, 5.6542792320251465, 6.356105804443359, 7.057931900024414, 7.759758472442627, 8.46158504486084, 9.163411140441895, 9.865238189697266, 10.56706428527832, 11.268890380859375, 11.970717430114746, 12.6725435256958, 13.374370574951172, 14.076196670532227, 14.778022766113281, 15.479848861694336, 16.18167495727539, 16.883501052856445, 17.5853271484375, 18.287155151367188, 18.988981246948242, 19.690807342529297, 20.39263343811035, 21.094459533691406, 21.796287536621094]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 19.0, 33.0, 43.0, 68.0, 106.0, 173.0, 264.0, 438.0, 742.0, 1073.0, 1877.0, 2853.0, 4711.0, 7600.0, 12137.0, 19266.0, 30981.0, 48276.0, 75909.0, 116064.0, 171454.0, 246278.0, 333164.0, 420729.0, 482471.0, 495343.0, 454626.0, 377461.0, 288027.0, 206313.0, 140629.0, 93252.0, 60172.0, 38633.0, 23920.0, 14831.0, 9348.0, 5860.0, 3499.0, 2137.0, 1362.0, 768.0, 523.0, 328.0, 193.0, 146.0, 80.0, 53.0, 28.0, 11.0, 9.0, 1.0, 2.0, 2.0, 2.0], "bins": [-16.734375, -16.2457275390625, -15.757080078125, -15.2684326171875, -14.77978515625, -14.2911376953125, -13.802490234375, -13.3138427734375, -12.8251953125, -12.3365478515625, -11.847900390625, -11.3592529296875, -10.87060546875, -10.3819580078125, -9.893310546875, -9.4046630859375, -8.916015625, -8.4273681640625, -7.938720703125, -7.4500732421875, -6.96142578125, -6.4727783203125, -5.984130859375, -5.4954833984375, -5.0068359375, -4.5181884765625, -4.029541015625, -3.5408935546875, -3.05224609375, -2.5635986328125, -2.074951171875, -1.5863037109375, -1.09765625, -0.6090087890625, -0.120361328125, 0.3682861328125, 0.85693359375, 1.3455810546875, 1.834228515625, 2.3228759765625, 2.8115234375, 3.3001708984375, 3.788818359375, 4.2774658203125, 4.76611328125, 5.2547607421875, 5.743408203125, 6.2320556640625, 6.720703125, 7.2093505859375, 7.697998046875, 8.1866455078125, 8.67529296875, 9.1639404296875, 9.652587890625, 10.1412353515625, 10.6298828125, 11.1185302734375, 11.607177734375, 12.0958251953125, 12.58447265625, 13.0731201171875, 13.561767578125, 14.0504150390625, 14.5390625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 6.0, 6.0, 5.0, 5.0, 9.0, 7.0, 8.0, 14.0, 12.0, 17.0, 21.0, 31.0, 24.0, 22.0, 43.0, 28.0, 31.0, 27.0, 40.0, 43.0, 27.0, 28.0, 41.0, 32.0, 40.0, 39.0, 29.0, 39.0, 30.0, 33.0, 40.0, 29.0, 27.0, 33.0, 17.0, 14.0, 16.0, 10.0, 11.0, 12.0, 11.0, 11.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-16.25, -15.75390625, -15.2578125, -14.76171875, -14.265625, -13.76953125, -13.2734375, -12.77734375, -12.28125, -11.78515625, -11.2890625, -10.79296875, -10.296875, -9.80078125, -9.3046875, -8.80859375, -8.3125, -7.81640625, -7.3203125, -6.82421875, -6.328125, -5.83203125, -5.3359375, -4.83984375, -4.34375, -3.84765625, -3.3515625, -2.85546875, -2.359375, -1.86328125, -1.3671875, -0.87109375, -0.375, 0.12109375, 0.6171875, 1.11328125, 1.609375, 2.10546875, 2.6015625, 3.09765625, 3.59375, 4.08984375, 4.5859375, 5.08203125, 5.578125, 6.07421875, 6.5703125, 7.06640625, 7.5625, 8.05859375, 8.5546875, 9.05078125, 9.546875, 10.04296875, 10.5390625, 11.03515625, 11.53125, 12.02734375, 12.5234375, 13.01953125, 13.515625, 14.01171875, 14.5078125, 15.00390625, 15.5]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 7.0, 1.0, 15.0, 30.0, 58.0, 81.0, 133.0, 211.0, 351.0, 561.0, 945.0, 1503.0, 2425.0, 4054.0, 6538.0, 10522.0, 16345.0, 26076.0, 39629.0, 59569.0, 87844.0, 124988.0, 172410.0, 227684.0, 287788.0, 344226.0, 385396.0, 406391.0, 397522.0, 364757.0, 314969.0, 255882.0, 197915.0, 146756.0, 104056.0, 72157.0, 48206.0, 31521.0, 20369.0, 13205.0, 8152.0, 5120.0, 3128.0, 1852.0, 1199.0, 708.0, 391.0, 269.0, 158.0, 85.0, 61.0, 27.0, 18.0, 11.0, 8.0, 8.0, 2.0, 1.0, 2.0, 2.0], "bins": [-13.125, -12.71142578125, -12.2978515625, -11.88427734375, -11.470703125, -11.05712890625, -10.6435546875, -10.22998046875, -9.81640625, -9.40283203125, -8.9892578125, -8.57568359375, -8.162109375, -7.74853515625, -7.3349609375, -6.92138671875, -6.5078125, -6.09423828125, -5.6806640625, -5.26708984375, -4.853515625, -4.43994140625, -4.0263671875, -3.61279296875, -3.19921875, -2.78564453125, -2.3720703125, -1.95849609375, -1.544921875, -1.13134765625, -0.7177734375, -0.30419921875, 0.109375, 0.52294921875, 0.9365234375, 1.35009765625, 1.763671875, 2.17724609375, 2.5908203125, 3.00439453125, 3.41796875, 3.83154296875, 4.2451171875, 4.65869140625, 5.072265625, 5.48583984375, 5.8994140625, 6.31298828125, 6.7265625, 7.14013671875, 7.5537109375, 7.96728515625, 8.380859375, 8.79443359375, 9.2080078125, 9.62158203125, 10.03515625, 10.44873046875, 10.8623046875, 11.27587890625, 11.689453125, 12.10302734375, 12.5166015625, 12.93017578125, 13.34375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 11.0, 0.0, 6.0, 11.0, 17.0, 28.0, 22.0, 35.0, 28.0, 42.0, 55.0, 73.0, 71.0, 88.0, 70.0, 102.0, 116.0, 136.0, 147.0, 132.0, 181.0, 159.0, 158.0, 186.0, 197.0, 191.0, 164.0, 176.0, 165.0, 156.0, 136.0, 165.0, 130.0, 87.0, 95.0, 84.0, 83.0, 67.0, 53.0, 57.0, 38.0, 26.0, 22.0, 20.0, 19.0, 22.0, 15.0, 4.0, 6.0, 5.0, 4.0, 8.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.71875, -6.5015869140625, -6.284423828125, -6.0672607421875, -5.85009765625, -5.6329345703125, -5.415771484375, -5.1986083984375, -4.9814453125, -4.7642822265625, -4.547119140625, -4.3299560546875, -4.11279296875, -3.8956298828125, -3.678466796875, -3.4613037109375, -3.244140625, -3.0269775390625, -2.809814453125, -2.5926513671875, -2.37548828125, -2.1583251953125, -1.941162109375, -1.7239990234375, -1.5068359375, -1.2896728515625, -1.072509765625, -0.8553466796875, -0.63818359375, -0.4210205078125, -0.203857421875, 0.0133056640625, 0.23046875, 0.4476318359375, 0.664794921875, 0.8819580078125, 1.09912109375, 1.3162841796875, 1.533447265625, 1.7506103515625, 1.9677734375, 2.1849365234375, 2.402099609375, 2.6192626953125, 2.83642578125, 3.0535888671875, 3.270751953125, 3.4879150390625, 3.705078125, 3.9222412109375, 4.139404296875, 4.3565673828125, 4.57373046875, 4.7908935546875, 5.008056640625, 5.2252197265625, 5.4423828125, 5.6595458984375, 5.876708984375, 6.0938720703125, 6.31103515625, 6.5281982421875, 6.745361328125, 6.9625244140625, 7.1796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 8.0, 14.0, 14.0, 12.0, 10.0, 27.0, 19.0, 24.0, 31.0, 28.0, 31.0, 45.0, 59.0, 48.0, 39.0, 39.0, 50.0, 36.0, 39.0, 50.0, 40.0, 39.0, 39.0, 34.0, 18.0, 37.0, 18.0, 22.0, 17.0, 17.0, 13.0, 16.0, 10.0, 10.0, 6.0, 6.0, 3.0, 6.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.5313777923584, -16.966203689575195, -16.401029586791992, -15.835855484008789, -15.270681381225586, -14.705507278442383, -14.14033317565918, -13.575159072875977, -13.009984970092773, -12.44481086730957, -11.879636764526367, -11.314462661743164, -10.749288558959961, -10.184114456176758, -9.618940353393555, -9.053766250610352, -8.488592147827148, -7.923418045043945, -7.358243942260742, -6.793069839477539, -6.227895736694336, -5.662721633911133, -5.09754753112793, -4.532373428344727, -3.9671993255615234, -3.4020252227783203, -2.836851119995117, -2.271677017211914, -1.706502914428711, -1.1413288116455078, -0.5761547088623047, -0.010980606079101562, 0.5541915893554688, 1.1193656921386719, 1.684539794921875, 2.249713897705078, 2.8148880004882812, 3.3800621032714844, 3.9452362060546875, 4.510410308837891, 5.075584411621094, 5.640758514404297, 6.2059326171875, 6.771106719970703, 7.336280822753906, 7.901454925537109, 8.466629028320312, 9.031803131103516, 9.596977233886719, 10.162151336669922, 10.727325439453125, 11.292499542236328, 11.857673645019531, 12.422847747802734, 12.988021850585938, 13.55319595336914, 14.118370056152344, 14.683544158935547, 15.24871826171875, 15.813892364501953, 16.379066467285156, 16.94424057006836, 17.509414672851562, 18.074588775634766, 18.63976287841797]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 8.0, 5.0, 12.0, 11.0, 8.0, 15.0, 15.0, 18.0, 20.0, 13.0, 20.0, 17.0, 31.0, 35.0, 27.0, 32.0, 23.0, 36.0, 37.0, 33.0, 26.0, 36.0, 43.0, 40.0, 37.0, 38.0, 26.0, 39.0, 39.0, 28.0, 29.0, 33.0, 34.0, 20.0, 21.0, 15.0, 15.0, 9.0, 9.0, 8.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-19.478485107421875, -18.89680290222168, -18.31511878967285, -17.733436584472656, -17.151752471923828, -16.570070266723633, -15.988387107849121, -15.40670394897461, -14.825020790100098, -14.243337631225586, -13.661654472351074, -13.079971313476562, -12.498289108276367, -11.916604995727539, -11.334922790527344, -10.753239631652832, -10.17155647277832, -9.589873313903809, -9.008190155029297, -8.426506996154785, -7.844824314117432, -7.26314115524292, -6.681458473205566, -6.099775314331055, -5.518092155456543, -4.936408996582031, -4.3547258377075195, -3.773043155670166, -3.1913599967956543, -2.6096768379211426, -2.02799391746521, -1.4463109970092773, -0.8646297454833984, -0.28294670581817627, 0.2987363338470459, 0.8804193735122681, 1.4621024131774902, 2.043785572052002, 2.6254684925079346, 3.207151412963867, 3.788834571838379, 4.370517730712891, 4.952200889587402, 5.533883571624756, 6.115566730499268, 6.697249889373779, 7.278932571411133, 7.8606157302856445, 8.442298889160156, 9.023982048034668, 9.60566520690918, 10.187348365783691, 10.769031524658203, 11.350713729858398, 11.93239688873291, 12.514080047607422, 13.095763206481934, 13.677446365356445, 14.259129524230957, 14.840812683105469, 15.422494888305664, 16.004179000854492, 16.585861206054688, 17.167545318603516, 17.74922752380371]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 22.0, 16.0, 25.0, 54.0, 53.0, 77.0, 131.0, 196.0, 274.0, 383.0, 603.0, 860.0, 1172.0, 1814.0, 2663.0, 3881.0, 5788.0, 8356.0, 12711.0, 18857.0, 28815.0, 43810.0, 68217.0, 105414.0, 155890.0, 184158.0, 138520.0, 91590.0, 59219.0, 38489.0, 25648.0, 16461.0, 11185.0, 7370.0, 5025.0, 3406.0, 2338.0, 1568.0, 1110.0, 735.0, 530.0, 349.0, 233.0, 166.0, 126.0, 88.0, 57.0, 33.0, 22.0, 14.0, 7.0, 9.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.05078125, -2.956451416015625, -2.86212158203125, -2.767791748046875, -2.6734619140625, -2.579132080078125, -2.48480224609375, -2.390472412109375, -2.296142578125, -2.201812744140625, -2.10748291015625, -2.013153076171875, -1.9188232421875, -1.824493408203125, -1.73016357421875, -1.635833740234375, -1.54150390625, -1.447174072265625, -1.35284423828125, -1.258514404296875, -1.1641845703125, -1.069854736328125, -0.97552490234375, -0.881195068359375, -0.786865234375, -0.692535400390625, -0.59820556640625, -0.503875732421875, -0.4095458984375, -0.315216064453125, -0.22088623046875, -0.126556396484375, -0.0322265625, 0.062103271484375, 0.15643310546875, 0.250762939453125, 0.3450927734375, 0.439422607421875, 0.53375244140625, 0.628082275390625, 0.722412109375, 0.816741943359375, 0.91107177734375, 1.005401611328125, 1.0997314453125, 1.194061279296875, 1.28839111328125, 1.382720947265625, 1.47705078125, 1.571380615234375, 1.66571044921875, 1.760040283203125, 1.8543701171875, 1.948699951171875, 2.04302978515625, 2.137359619140625, 2.231689453125, 2.326019287109375, 2.42034912109375, 2.514678955078125, 2.6090087890625, 2.703338623046875, 2.79766845703125, 2.891998291015625, 2.986328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 4.0, 11.0, 9.0, 8.0, 11.0, 13.0, 17.0, 20.0, 24.0, 25.0, 22.0, 26.0, 32.0, 35.0, 36.0, 28.0, 30.0, 34.0, 40.0, 55.0, 35.0, 47.0, 38.0, 42.0, 35.0, 38.0, 38.0, 37.0, 27.0, 31.0, 29.0, 22.0, 17.0, 10.0, 17.0, 9.0, 6.0, 14.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.34375, -21.682373046875, -21.02099609375, -20.359619140625, -19.6982421875, -19.036865234375, -18.37548828125, -17.714111328125, -17.052734375, -16.391357421875, -15.72998046875, -15.068603515625, -14.4072265625, -13.745849609375, -13.08447265625, -12.423095703125, -11.76171875, -11.100341796875, -10.43896484375, -9.777587890625, -9.1162109375, -8.454833984375, -7.79345703125, -7.132080078125, -6.470703125, -5.809326171875, -5.14794921875, -4.486572265625, -3.8251953125, -3.163818359375, -2.50244140625, -1.841064453125, -1.1796875, -0.518310546875, 0.14306640625, 0.804443359375, 1.4658203125, 2.127197265625, 2.78857421875, 3.449951171875, 4.111328125, 4.772705078125, 5.43408203125, 6.095458984375, 6.7568359375, 7.418212890625, 8.07958984375, 8.740966796875, 9.40234375, 10.063720703125, 10.72509765625, 11.386474609375, 12.0478515625, 12.709228515625, 13.37060546875, 14.031982421875, 14.693359375, 15.354736328125, 16.01611328125, 16.677490234375, 17.3388671875, 18.000244140625, 18.66162109375, 19.322998046875, 19.984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 11.0, 19.0, 18.0, 33.0, 50.0, 59.0, 96.0, 144.0, 230.0, 286.0, 457.0, 689.0, 1046.0, 1619.0, 2486.0, 3979.0, 5928.0, 9476.0, 15351.0, 24734.0, 40250.0, 67158.0, 116038.0, 196990.0, 219778.0, 137184.0, 79599.0, 47171.0, 28876.0, 17762.0, 11080.0, 7030.0, 4470.0, 2937.0, 1856.0, 1215.0, 796.0, 567.0, 335.0, 267.0, 160.0, 105.0, 65.0, 43.0, 41.0, 28.0, 18.0, 12.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.904296875, -2.81396484375, -2.7236328125, -2.63330078125, -2.54296875, -2.45263671875, -2.3623046875, -2.27197265625, -2.181640625, -2.09130859375, -2.0009765625, -1.91064453125, -1.8203125, -1.72998046875, -1.6396484375, -1.54931640625, -1.458984375, -1.36865234375, -1.2783203125, -1.18798828125, -1.09765625, -1.00732421875, -0.9169921875, -0.82666015625, -0.736328125, -0.64599609375, -0.5556640625, -0.46533203125, -0.375, -0.28466796875, -0.1943359375, -0.10400390625, -0.013671875, 0.07666015625, 0.1669921875, 0.25732421875, 0.34765625, 0.43798828125, 0.5283203125, 0.61865234375, 0.708984375, 0.79931640625, 0.8896484375, 0.97998046875, 1.0703125, 1.16064453125, 1.2509765625, 1.34130859375, 1.431640625, 1.52197265625, 1.6123046875, 1.70263671875, 1.79296875, 1.88330078125, 1.9736328125, 2.06396484375, 2.154296875, 2.24462890625, 2.3349609375, 2.42529296875, 2.515625, 2.60595703125, 2.6962890625, 2.78662109375, 2.876953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 1.0, 3.0, 12.0, 5.0, 10.0, 16.0, 8.0, 9.0, 29.0, 17.0, 20.0, 28.0, 29.0, 27.0, 30.0, 42.0, 42.0, 45.0, 34.0, 49.0, 40.0, 41.0, 44.0, 42.0, 38.0, 35.0, 38.0, 36.0, 33.0, 24.0, 25.0, 17.0, 21.0, 12.0, 20.0, 13.0, 13.0, 11.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-15.2734375, -14.8433837890625, -14.413330078125, -13.9832763671875, -13.55322265625, -13.1231689453125, -12.693115234375, -12.2630615234375, -11.8330078125, -11.4029541015625, -10.972900390625, -10.5428466796875, -10.11279296875, -9.6827392578125, -9.252685546875, -8.8226318359375, -8.392578125, -7.9625244140625, -7.532470703125, -7.1024169921875, -6.67236328125, -6.2423095703125, -5.812255859375, -5.3822021484375, -4.9521484375, -4.5220947265625, -4.092041015625, -3.6619873046875, -3.23193359375, -2.8018798828125, -2.371826171875, -1.9417724609375, -1.51171875, -1.0816650390625, -0.651611328125, -0.2215576171875, 0.20849609375, 0.6385498046875, 1.068603515625, 1.4986572265625, 1.9287109375, 2.3587646484375, 2.788818359375, 3.2188720703125, 3.64892578125, 4.0789794921875, 4.509033203125, 4.9390869140625, 5.369140625, 5.7991943359375, 6.229248046875, 6.6593017578125, 7.08935546875, 7.5194091796875, 7.949462890625, 8.3795166015625, 8.8095703125, 9.2396240234375, 9.669677734375, 10.0997314453125, 10.52978515625, 10.9598388671875, 11.389892578125, 11.8199462890625, 12.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 15.0, 22.0, 30.0, 42.0, 53.0, 110.0, 202.0, 259.0, 438.0, 692.0, 1073.0, 1727.0, 2904.0, 4911.0, 8505.0, 14605.0, 27582.0, 54945.0, 124445.0, 327763.0, 270909.0, 103594.0, 47648.0, 24133.0, 13107.0, 7533.0, 4351.0, 2630.0, 1561.0, 1026.0, 647.0, 385.0, 246.0, 153.0, 94.0, 77.0, 35.0, 37.0, 12.0, 19.0, 12.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24902725219726562, -0.24121856689453125, -0.23340988159179688, -0.2256011962890625, -0.21779251098632812, -0.20998382568359375, -0.20217514038085938, -0.194366455078125, -0.18655776977539062, -0.17874908447265625, -0.17094039916992188, -0.1631317138671875, -0.15532302856445312, -0.14751434326171875, -0.13970565795898438, -0.13189697265625, -0.12408828735351562, -0.11627960205078125, -0.10847091674804688, -0.1006622314453125, -0.09285354614257812, -0.08504486083984375, -0.07723617553710938, -0.069427490234375, -0.061618804931640625, -0.05381011962890625, -0.046001434326171875, -0.0381927490234375, -0.030384063720703125, -0.02257537841796875, -0.014766693115234375, -0.0069580078125, 0.000850677490234375, 0.00865936279296875, 0.016468048095703125, 0.0242767333984375, 0.032085418701171875, 0.03989410400390625, 0.047702789306640625, 0.055511474609375, 0.06332015991210938, 0.07112884521484375, 0.07893753051757812, 0.0867462158203125, 0.09455490112304688, 0.10236358642578125, 0.11017227172851562, 0.11798095703125, 0.12578964233398438, 0.13359832763671875, 0.14140701293945312, 0.1492156982421875, 0.15702438354492188, 0.16483306884765625, 0.17264175415039062, 0.180450439453125, 0.18825912475585938, 0.19606781005859375, 0.20387649536132812, 0.2116851806640625, 0.21949386596679688, 0.22730255126953125, 0.23511123657226562, 0.242919921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 4.0, 9.0, 10.0, 11.0, 10.0, 18.0, 12.0, 27.0, 18.0, 26.0, 25.0, 28.0, 34.0, 40.0, 46.0, 42.0, 39.0, 41.0, 45.0, 64.0, 52.0, 38.0, 52.0, 38.0, 33.0, 35.0, 30.0, 30.0, 24.0, 13.0, 14.0, 17.0, 5.0, 9.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0], "bins": [-2.849102020263672e-05, -2.7602538466453552e-05, -2.6714056730270386e-05, -2.582557499408722e-05, -2.4937093257904053e-05, -2.4048611521720886e-05, -2.316012978553772e-05, -2.2271648049354553e-05, -2.1383166313171387e-05, -2.049468457698822e-05, -1.9606202840805054e-05, -1.8717721104621887e-05, -1.782923936843872e-05, -1.6940757632255554e-05, -1.6052275896072388e-05, -1.5163794159889221e-05, -1.4275312423706055e-05, -1.3386830687522888e-05, -1.2498348951339722e-05, -1.1609867215156555e-05, -1.0721385478973389e-05, -9.832903742790222e-06, -8.944422006607056e-06, -8.05594027042389e-06, -7.167458534240723e-06, -6.278976798057556e-06, -5.39049506187439e-06, -4.502013325691223e-06, -3.6135315895080566e-06, -2.72504985332489e-06, -1.8365681171417236e-06, -9.480863809585571e-07, -5.960464477539063e-08, 8.288770914077759e-07, 1.7173588275909424e-06, 2.605840563774109e-06, 3.4943222999572754e-06, 4.382804036140442e-06, 5.271285772323608e-06, 6.159767508506775e-06, 7.048249244689941e-06, 7.936730980873108e-06, 8.825212717056274e-06, 9.713694453239441e-06, 1.0602176189422607e-05, 1.1490657925605774e-05, 1.237913966178894e-05, 1.3267621397972107e-05, 1.4156103134155273e-05, 1.504458487033844e-05, 1.5933066606521606e-05, 1.6821548342704773e-05, 1.771003007888794e-05, 1.8598511815071106e-05, 1.9486993551254272e-05, 2.037547528743744e-05, 2.1263957023620605e-05, 2.2152438759803772e-05, 2.304092049598694e-05, 2.3929402232170105e-05, 2.481788396835327e-05, 2.5706365704536438e-05, 2.6594847440719604e-05, 2.748332917690277e-05, 2.8371810913085938e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 13.0, 19.0, 28.0, 50.0, 57.0, 75.0, 130.0, 199.0, 249.0, 336.0, 475.0, 626.0, 848.0, 1225.0, 1740.0, 2460.0, 3480.0, 4760.0, 7182.0, 10421.0, 15423.0, 23120.0, 35407.0, 56206.0, 92618.0, 174822.0, 264256.0, 134963.0, 76603.0, 47376.0, 30133.0, 19739.0, 13475.0, 8864.0, 6180.0, 4296.0, 3136.0, 2166.0, 1544.0, 1071.0, 805.0, 534.0, 430.0, 292.0, 212.0, 147.0, 108.0, 78.0, 74.0, 29.0, 25.0, 23.0, 10.0, 7.0, 4.0, 0.0, 3.0, 6.0], "bins": [-0.459228515625, -0.4450187683105469, -0.43080902099609375, -0.4165992736816406, -0.4023895263671875, -0.3881797790527344, -0.37397003173828125, -0.3597602844238281, -0.345550537109375, -0.3313407897949219, -0.31713104248046875, -0.3029212951660156, -0.2887115478515625, -0.2745018005371094, -0.26029205322265625, -0.24608230590820312, -0.23187255859375, -0.21766281127929688, -0.20345306396484375, -0.18924331665039062, -0.1750335693359375, -0.16082382202148438, -0.14661407470703125, -0.13240432739257812, -0.118194580078125, -0.10398483276367188, -0.08977508544921875, -0.07556533813476562, -0.0613555908203125, -0.047145843505859375, -0.03293609619140625, -0.018726348876953125, -0.0045166015625, 0.009693145751953125, 0.02390289306640625, 0.038112640380859375, 0.0523223876953125, 0.06653213500976562, 0.08074188232421875, 0.09495162963867188, 0.109161376953125, 0.12337112426757812, 0.13758087158203125, 0.15179061889648438, 0.1660003662109375, 0.18021011352539062, 0.19441986083984375, 0.20862960815429688, 0.22283935546875, 0.23704910278320312, 0.25125885009765625, 0.2654685974121094, 0.2796783447265625, 0.2938880920410156, 0.30809783935546875, 0.3223075866699219, 0.336517333984375, 0.3507270812988281, 0.36493682861328125, 0.3791465759277344, 0.3933563232421875, 0.4075660705566406, 0.42177581787109375, 0.4359855651855469, 0.4501953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 3.0, 2.0, 6.0, 4.0, 9.0, 11.0, 10.0, 13.0, 12.0, 16.0, 18.0, 23.0, 26.0, 35.0, 41.0, 35.0, 52.0, 70.0, 84.0, 85.0, 68.0, 60.0, 57.0, 49.0, 35.0, 15.0, 20.0, 22.0, 22.0, 19.0, 16.0, 6.0, 14.0, 9.0, 3.0, 10.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.163330078125, -0.15808486938476562, -0.15283966064453125, -0.14759445190429688, -0.1423492431640625, -0.13710403442382812, -0.13185882568359375, -0.12661361694335938, -0.121368408203125, -0.11612319946289062, -0.11087799072265625, -0.10563278198242188, -0.1003875732421875, -0.09514236450195312, -0.08989715576171875, -0.08465194702148438, -0.07940673828125, -0.07416152954101562, -0.06891632080078125, -0.06367111206054688, -0.0584259033203125, -0.053180694580078125, -0.04793548583984375, -0.042690277099609375, -0.037445068359375, -0.032199859619140625, -0.02695465087890625, -0.021709442138671875, -0.0164642333984375, -0.011219024658203125, -0.00597381591796875, -0.000728607177734375, 0.0045166015625, 0.009761810302734375, 0.01500701904296875, 0.020252227783203125, 0.0254974365234375, 0.030742645263671875, 0.03598785400390625, 0.041233062744140625, 0.046478271484375, 0.051723480224609375, 0.05696868896484375, 0.062213897705078125, 0.0674591064453125, 0.07270431518554688, 0.07794952392578125, 0.08319473266601562, 0.08843994140625, 0.09368515014648438, 0.09893035888671875, 0.10417556762695312, 0.1094207763671875, 0.11466598510742188, 0.11991119384765625, 0.12515640258789062, 0.130401611328125, 0.13564682006835938, 0.14089202880859375, 0.14613723754882812, 0.1513824462890625, 0.15662765502929688, 0.16187286376953125, 0.16711807250976562, 0.17236328125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 15.0, 10.0, 12.0, 26.0, 21.0, 21.0, 22.0, 36.0, 34.0, 44.0, 59.0, 42.0, 34.0, 47.0, 50.0, 39.0, 48.0, 45.0, 41.0, 41.0, 30.0, 30.0, 33.0, 33.0, 16.0, 19.0, 19.0, 15.0, 12.0, 20.0, 10.0, 10.0, 5.0, 6.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.553495407104492, -16.988121032714844, -16.422746658325195, -15.857373237609863, -15.291998863220215, -14.726625442504883, -14.161251068115234, -13.595876693725586, -13.030502319335938, -12.465127944946289, -11.899754524230957, -11.334380149841309, -10.76900577545166, -10.203632354736328, -9.63825798034668, -9.072883605957031, -8.5075101852417, -7.942136287689209, -7.3767619132995605, -6.81138801574707, -6.246013641357422, -5.680639743804932, -5.115265846252441, -4.549891471862793, -3.9845175743103027, -3.4191434383392334, -2.853769302368164, -2.288395404815674, -1.7230212688446045, -1.1576471328735352, -0.5922732353210449, -0.026899099349975586, 0.5384750366210938, 1.103849172592163, 1.6692231893539429, 2.2345972061157227, 2.799971342086792, 3.3653454780578613, 3.9307193756103516, 4.49609375, 5.06146764755249, 5.6268415451049805, 6.192215919494629, 6.757589817047119, 7.322963714599609, 7.888338088989258, 8.453712463378906, 9.019085884094238, 9.584460258483887, 10.149834632873535, 10.715208053588867, 11.280582427978516, 11.845956802368164, 12.411331176757812, 12.976704597473145, 13.542078971862793, 14.107452392578125, 14.672826766967773, 15.238200187683105, 15.803574562072754, 16.368947982788086, 16.934322357177734, 17.499696731567383, 18.06507110595703, 18.63044548034668]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 5.0, 6.0, 14.0, 9.0, 7.0, 16.0, 15.0, 18.0, 18.0, 15.0, 21.0, 20.0, 29.0, 33.0, 29.0, 28.0, 29.0, 40.0, 28.0, 32.0, 29.0, 36.0, 43.0, 43.0, 35.0, 34.0, 30.0, 36.0, 37.0, 28.0, 31.0, 34.0, 30.0, 22.0, 19.0, 18.0, 14.0, 9.0, 9.0, 8.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-19.341848373413086, -18.765254974365234, -18.188661575317383, -17.612070083618164, -17.035476684570312, -16.45888328552246, -15.88228988647461, -15.305697441101074, -14.729104995727539, -14.152511596679688, -13.575919151306152, -12.9993257522583, -12.422733306884766, -11.846139907836914, -11.269546508789062, -10.692954063415527, -10.116360664367676, -9.539767265319824, -8.963174819946289, -8.386581420898438, -7.809988975524902, -7.233395576477051, -6.656802654266357, -6.080209732055664, -5.503616809844971, -4.927023887634277, -4.350430965423584, -3.7738378047943115, -3.197244882583618, -2.620651960372925, -2.0440587997436523, -1.467465877532959, -0.8908729553222656, -0.3142799735069275, 0.26231300830841064, 0.8389060497283936, 1.415498971939087, 1.9920918941497803, 2.5686850547790527, 3.145277976989746, 3.7218708992004395, 4.298463821411133, 4.875056743621826, 5.4516496658325195, 6.028243064880371, 6.604835510253906, 7.181428909301758, 7.758021831512451, 8.334614753723145, 8.911208152770996, 9.487800598144531, 10.064393997192383, 10.640986442565918, 11.21757984161377, 11.794172286987305, 12.370765686035156, 12.947359085083008, 13.52395248413086, 14.100544929504395, 14.677138328552246, 15.253730773925781, 15.830324172973633, 16.406917572021484, 16.983509063720703, 17.560102462768555]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 7.0, 7.0, 11.0, 20.0, 31.0, 45.0, 89.0, 173.0, 237.0, 368.0, 682.0, 1016.0, 1807.0, 2702.0, 4405.0, 6933.0, 11076.0, 16966.0, 25637.0, 38944.0, 54369.0, 72927.0, 92464.0, 108184.0, 115224.0, 112591.0, 100597.0, 82609.0, 63299.0, 45540.0, 31652.0, 20975.0, 13534.0, 8805.0, 5550.0, 3578.0, 2117.0, 1313.0, 794.0, 496.0, 308.0, 188.0, 116.0, 72.0, 47.0, 31.0, 13.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.984375, -13.5438232421875, -13.103271484375, -12.6627197265625, -12.22216796875, -11.7816162109375, -11.341064453125, -10.9005126953125, -10.4599609375, -10.0194091796875, -9.578857421875, -9.1383056640625, -8.69775390625, -8.2572021484375, -7.816650390625, -7.3760986328125, -6.935546875, -6.4949951171875, -6.054443359375, -5.6138916015625, -5.17333984375, -4.7327880859375, -4.292236328125, -3.8516845703125, -3.4111328125, -2.9705810546875, -2.530029296875, -2.0894775390625, -1.64892578125, -1.2083740234375, -0.767822265625, -0.3272705078125, 0.11328125, 0.5538330078125, 0.994384765625, 1.4349365234375, 1.87548828125, 2.3160400390625, 2.756591796875, 3.1971435546875, 3.6376953125, 4.0782470703125, 4.518798828125, 4.9593505859375, 5.39990234375, 5.8404541015625, 6.281005859375, 6.7215576171875, 7.162109375, 7.6026611328125, 8.043212890625, 8.4837646484375, 8.92431640625, 9.3648681640625, 9.805419921875, 10.2459716796875, 10.6865234375, 11.1270751953125, 11.567626953125, 12.0081787109375, 12.44873046875, 12.8892822265625, 13.329833984375, 13.7703857421875, 14.2109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 7.0, 7.0, 12.0, 8.0, 4.0, 9.0, 13.0, 24.0, 23.0, 16.0, 13.0, 19.0, 22.0, 30.0, 33.0, 26.0, 26.0, 33.0, 39.0, 33.0, 34.0, 35.0, 32.0, 47.0, 34.0, 52.0, 38.0, 32.0, 23.0, 38.0, 33.0, 32.0, 24.0, 21.0, 19.0, 21.0, 18.0, 8.0, 11.0, 12.0, 7.0, 7.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.59375, -19.000732421875, -18.40771484375, -17.814697265625, -17.2216796875, -16.628662109375, -16.03564453125, -15.442626953125, -14.849609375, -14.256591796875, -13.66357421875, -13.070556640625, -12.4775390625, -11.884521484375, -11.29150390625, -10.698486328125, -10.10546875, -9.512451171875, -8.91943359375, -8.326416015625, -7.7333984375, -7.140380859375, -6.54736328125, -5.954345703125, -5.361328125, -4.768310546875, -4.17529296875, -3.582275390625, -2.9892578125, -2.396240234375, -1.80322265625, -1.210205078125, -0.6171875, -0.024169921875, 0.56884765625, 1.161865234375, 1.7548828125, 2.347900390625, 2.94091796875, 3.533935546875, 4.126953125, 4.719970703125, 5.31298828125, 5.906005859375, 6.4990234375, 7.092041015625, 7.68505859375, 8.278076171875, 8.87109375, 9.464111328125, 10.05712890625, 10.650146484375, 11.2431640625, 11.836181640625, 12.42919921875, 13.022216796875, 13.615234375, 14.208251953125, 14.80126953125, 15.394287109375, 15.9873046875, 16.580322265625, 17.17333984375, 17.766357421875, 18.359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 13.0, 21.0, 27.0, 46.0, 60.0, 73.0, 130.0, 189.0, 279.0, 482.0, 693.0, 1100.0, 1616.0, 2619.0, 3979.0, 5992.0, 8999.0, 13513.0, 19720.0, 28265.0, 39910.0, 53233.0, 69415.0, 84836.0, 97528.0, 103891.0, 102771.0, 94723.0, 81702.0, 65468.0, 50194.0, 37056.0, 25970.0, 18020.0, 12049.0, 8235.0, 5420.0, 3574.0, 2326.0, 1549.0, 995.0, 671.0, 389.0, 282.0, 182.0, 116.0, 82.0, 55.0, 42.0, 13.0, 15.0, 11.0, 7.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-12.7578125, -12.357666015625, -11.95751953125, -11.557373046875, -11.1572265625, -10.757080078125, -10.35693359375, -9.956787109375, -9.556640625, -9.156494140625, -8.75634765625, -8.356201171875, -7.9560546875, -7.555908203125, -7.15576171875, -6.755615234375, -6.35546875, -5.955322265625, -5.55517578125, -5.155029296875, -4.7548828125, -4.354736328125, -3.95458984375, -3.554443359375, -3.154296875, -2.754150390625, -2.35400390625, -1.953857421875, -1.5537109375, -1.153564453125, -0.75341796875, -0.353271484375, 0.046875, 0.447021484375, 0.84716796875, 1.247314453125, 1.6474609375, 2.047607421875, 2.44775390625, 2.847900390625, 3.248046875, 3.648193359375, 4.04833984375, 4.448486328125, 4.8486328125, 5.248779296875, 5.64892578125, 6.049072265625, 6.44921875, 6.849365234375, 7.24951171875, 7.649658203125, 8.0498046875, 8.449951171875, 8.85009765625, 9.250244140625, 9.650390625, 10.050537109375, 10.45068359375, 10.850830078125, 11.2509765625, 11.651123046875, 12.05126953125, 12.451416015625, 12.8515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 4.0, 11.0, 17.0, 4.0, 15.0, 16.0, 24.0, 21.0, 22.0, 26.0, 29.0, 21.0, 30.0, 37.0, 47.0, 40.0, 30.0, 41.0, 35.0, 45.0, 52.0, 38.0, 37.0, 43.0, 28.0, 34.0, 34.0, 29.0, 29.0, 14.0, 17.0, 15.0, 25.0, 14.0, 10.0, 14.0, 6.0, 7.0, 6.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.4140625, -12.0147705078125, -11.615478515625, -11.2161865234375, -10.81689453125, -10.4176025390625, -10.018310546875, -9.6190185546875, -9.2197265625, -8.8204345703125, -8.421142578125, -8.0218505859375, -7.62255859375, -7.2232666015625, -6.823974609375, -6.4246826171875, -6.025390625, -5.6260986328125, -5.226806640625, -4.8275146484375, -4.42822265625, -4.0289306640625, -3.629638671875, -3.2303466796875, -2.8310546875, -2.4317626953125, -2.032470703125, -1.6331787109375, -1.23388671875, -0.8345947265625, -0.435302734375, -0.0360107421875, 0.36328125, 0.7625732421875, 1.161865234375, 1.5611572265625, 1.96044921875, 2.3597412109375, 2.759033203125, 3.1583251953125, 3.5576171875, 3.9569091796875, 4.356201171875, 4.7554931640625, 5.15478515625, 5.5540771484375, 5.953369140625, 6.3526611328125, 6.751953125, 7.1512451171875, 7.550537109375, 7.9498291015625, 8.34912109375, 8.7484130859375, 9.147705078125, 9.5469970703125, 9.9462890625, 10.3455810546875, 10.744873046875, 11.1441650390625, 11.54345703125, 11.9427490234375, 12.342041015625, 12.7413330078125, 13.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 18.0, 21.0, 25.0, 47.0, 82.0, 90.0, 144.0, 258.0, 428.0, 660.0, 1091.0, 1885.0, 3342.0, 5846.0, 10244.0, 18290.0, 31165.0, 53244.0, 83252.0, 118347.0, 146438.0, 155852.0, 138329.0, 105258.0, 70340.0, 43558.0, 25571.0, 14855.0, 8386.0, 4748.0, 2699.0, 1611.0, 931.0, 562.0, 339.0, 198.0, 131.0, 94.0, 54.0, 39.0, 22.0, 19.0, 11.0, 7.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.4375, -5.25811767578125, -5.0787353515625, -4.89935302734375, -4.719970703125, -4.54058837890625, -4.3612060546875, -4.18182373046875, -4.00244140625, -3.82305908203125, -3.6436767578125, -3.46429443359375, -3.284912109375, -3.10552978515625, -2.9261474609375, -2.74676513671875, -2.5673828125, -2.38800048828125, -2.2086181640625, -2.02923583984375, -1.849853515625, -1.67047119140625, -1.4910888671875, -1.31170654296875, -1.13232421875, -0.95294189453125, -0.7735595703125, -0.59417724609375, -0.414794921875, -0.23541259765625, -0.0560302734375, 0.12335205078125, 0.302734375, 0.48211669921875, 0.6614990234375, 0.84088134765625, 1.020263671875, 1.19964599609375, 1.3790283203125, 1.55841064453125, 1.73779296875, 1.91717529296875, 2.0965576171875, 2.27593994140625, 2.455322265625, 2.63470458984375, 2.8140869140625, 2.99346923828125, 3.1728515625, 3.35223388671875, 3.5316162109375, 3.71099853515625, 3.890380859375, 4.06976318359375, 4.2491455078125, 4.42852783203125, 4.60791015625, 4.78729248046875, 4.9666748046875, 5.14605712890625, 5.325439453125, 5.50482177734375, 5.6842041015625, 5.86358642578125, 6.04296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 4.0, 6.0, 15.0, 12.0, 18.0, 20.0, 15.0, 39.0, 26.0, 23.0, 31.0, 27.0, 57.0, 41.0, 62.0, 49.0, 57.0, 55.0, 41.0, 64.0, 45.0, 37.0, 42.0, 26.0, 35.0, 22.0, 24.0, 21.0, 13.0, 14.0, 10.0, 10.0, 6.0, 2.0, 5.0, 5.0, 5.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005044937133789062, -0.00048752129077911377, -0.0004705488681793213, -0.0004535764455795288, -0.00043660402297973633, -0.00041963160037994385, -0.00040265917778015137, -0.0003856867551803589, -0.0003687143325805664, -0.0003517419099807739, -0.00033476948738098145, -0.00031779706478118896, -0.0003008246421813965, -0.000283852219581604, -0.0002668797969818115, -0.00024990737438201904, -0.00023293495178222656, -0.00021596252918243408, -0.0001989901065826416, -0.00018201768398284912, -0.00016504526138305664, -0.00014807283878326416, -0.00013110041618347168, -0.0001141279935836792, -9.715557098388672e-05, -8.018314838409424e-05, -6.321072578430176e-05, -4.623830318450928e-05, -2.9265880584716797e-05, -1.2293457984924316e-05, 4.678964614868164e-06, 2.1651387214660645e-05, 3.8623809814453125e-05, 5.5596232414245605e-05, 7.256865501403809e-05, 8.954107761383057e-05, 0.00010651350021362305, 0.00012348592281341553, 0.000140458345413208, 0.0001574307680130005, 0.00017440319061279297, 0.00019137561321258545, 0.00020834803581237793, 0.0002253204584121704, 0.0002422928810119629, 0.00025926530361175537, 0.00027623772621154785, 0.00029321014881134033, 0.0003101825714111328, 0.0003271549940109253, 0.0003441274166107178, 0.00036109983921051025, 0.00037807226181030273, 0.0003950446844100952, 0.0004120171070098877, 0.0004289895296096802, 0.00044596195220947266, 0.00046293437480926514, 0.0004799067974090576, 0.0004968792200088501, 0.0005138516426086426, 0.0005308240652084351, 0.0005477964878082275, 0.00056476891040802, 0.0005817413330078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 1.0, 14.0, 24.0, 34.0, 41.0, 57.0, 109.0, 143.0, 195.0, 276.0, 484.0, 699.0, 1082.0, 1743.0, 2847.0, 4634.0, 7904.0, 13229.0, 22082.0, 36458.0, 58002.0, 86945.0, 118104.0, 141369.0, 146121.0, 129068.0, 98438.0, 67830.0, 43607.0, 26601.0, 16091.0, 9391.0, 5663.0, 3516.0, 2035.0, 1324.0, 838.0, 558.0, 327.0, 247.0, 136.0, 104.0, 61.0, 43.0, 32.0, 19.0, 13.0, 14.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.61297607421875, -5.4329833984375, -5.25299072265625, -5.072998046875, -4.89300537109375, -4.7130126953125, -4.53302001953125, -4.35302734375, -4.17303466796875, -3.9930419921875, -3.81304931640625, -3.633056640625, -3.45306396484375, -3.2730712890625, -3.09307861328125, -2.9130859375, -2.73309326171875, -2.5531005859375, -2.37310791015625, -2.193115234375, -2.01312255859375, -1.8331298828125, -1.65313720703125, -1.47314453125, -1.29315185546875, -1.1131591796875, -0.93316650390625, -0.753173828125, -0.57318115234375, -0.3931884765625, -0.21319580078125, -0.033203125, 0.14678955078125, 0.3267822265625, 0.50677490234375, 0.686767578125, 0.86676025390625, 1.0467529296875, 1.22674560546875, 1.40673828125, 1.58673095703125, 1.7667236328125, 1.94671630859375, 2.126708984375, 2.30670166015625, 2.4866943359375, 2.66668701171875, 2.8466796875, 3.02667236328125, 3.2066650390625, 3.38665771484375, 3.566650390625, 3.74664306640625, 3.9266357421875, 4.10662841796875, 4.28662109375, 4.46661376953125, 4.6466064453125, 4.82659912109375, 5.006591796875, 5.18658447265625, 5.3665771484375, 5.54656982421875, 5.7265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 7.0, 13.0, 13.0, 11.0, 13.0, 13.0, 25.0, 30.0, 42.0, 42.0, 41.0, 61.0, 70.0, 73.0, 58.0, 72.0, 48.0, 73.0, 45.0, 44.0, 35.0, 34.0, 21.0, 26.0, 25.0, 16.0, 11.0, 5.0, 11.0, 4.0, 6.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0], "bins": [-3.95703125, -3.858062744140625, -3.75909423828125, -3.660125732421875, -3.5611572265625, -3.462188720703125, -3.36322021484375, -3.264251708984375, -3.165283203125, -3.066314697265625, -2.96734619140625, -2.868377685546875, -2.7694091796875, -2.670440673828125, -2.57147216796875, -2.472503662109375, -2.37353515625, -2.274566650390625, -2.17559814453125, -2.076629638671875, -1.9776611328125, -1.878692626953125, -1.77972412109375, -1.680755615234375, -1.581787109375, -1.482818603515625, -1.38385009765625, -1.284881591796875, -1.1859130859375, -1.086944580078125, -0.98797607421875, -0.889007568359375, -0.7900390625, -0.691070556640625, -0.59210205078125, -0.493133544921875, -0.3941650390625, -0.295196533203125, -0.19622802734375, -0.097259521484375, 0.001708984375, 0.100677490234375, 0.19964599609375, 0.298614501953125, 0.3975830078125, 0.496551513671875, 0.59552001953125, 0.694488525390625, 0.79345703125, 0.892425537109375, 0.99139404296875, 1.090362548828125, 1.1893310546875, 1.288299560546875, 1.38726806640625, 1.486236572265625, 1.585205078125, 1.684173583984375, 1.78314208984375, 1.882110595703125, 1.9810791015625, 2.080047607421875, 2.17901611328125, 2.277984619140625, 2.376953125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 3.0, 4.0, 7.0, 7.0, 10.0, 11.0, 8.0, 9.0, 10.0, 15.0, 24.0, 21.0, 32.0, 38.0, 35.0, 40.0, 42.0, 52.0, 39.0, 46.0, 52.0, 48.0, 42.0, 43.0, 36.0, 50.0, 37.0, 37.0, 28.0, 27.0, 22.0, 18.0, 21.0, 20.0, 12.0, 5.0, 8.0, 9.0, 10.0, 4.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.937471389770508, -18.364242553710938, -17.791011810302734, -17.21778106689453, -16.64455223083496, -16.07132339477539, -15.498092651367188, -14.9248628616333, -14.351633071899414, -13.778403282165527, -13.20517349243164, -12.631943702697754, -12.058713912963867, -11.48548412322998, -10.912254333496094, -10.339024543762207, -9.76579475402832, -9.192564964294434, -8.619335174560547, -8.04610538482666, -7.472875595092773, -6.899645805358887, -6.326416015625, -5.753186225891113, -5.179956436157227, -4.60672664642334, -4.033496856689453, -3.4602670669555664, -2.8870372772216797, -2.313807487487793, -1.7405776977539062, -1.1673479080200195, -0.5941200256347656, -0.020890235900878906, 0.5523395538330078, 1.1255693435668945, 1.6987991333007812, 2.272028923034668, 2.8452587127685547, 3.4184885025024414, 3.991718292236328, 4.564948081970215, 5.138177871704102, 5.711407661437988, 6.284637451171875, 6.857867240905762, 7.431097030639648, 8.004326820373535, 8.577556610107422, 9.150786399841309, 9.724016189575195, 10.297245979309082, 10.870475769042969, 11.443705558776855, 12.016935348510742, 12.590165138244629, 13.163394927978516, 13.736624717712402, 14.309854507446289, 14.883084297180176, 15.456314086914062, 16.029544830322266, 16.602773666381836, 17.176002502441406, 17.74923324584961]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 6.0, 4.0, 4.0, 4.0, 4.0, 6.0, 17.0, 6.0, 8.0, 14.0, 16.0, 18.0, 22.0, 24.0, 24.0, 18.0, 29.0, 33.0, 28.0, 33.0, 36.0, 30.0, 36.0, 31.0, 44.0, 39.0, 42.0, 49.0, 36.0, 37.0, 37.0, 33.0, 24.0, 30.0, 31.0, 24.0, 22.0, 21.0, 18.0, 8.0, 16.0, 10.0, 7.0, 8.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0], "bins": [-21.505176544189453, -20.888151168823242, -20.27112579345703, -19.654102325439453, -19.037076950073242, -18.42005157470703, -17.803028106689453, -17.186002731323242, -16.56897735595703, -15.95195198059082, -15.334927558898926, -14.717903137207031, -14.10087776184082, -13.48385238647461, -12.866827964782715, -12.24980354309082, -11.63277816772461, -11.015752792358398, -10.398728370666504, -9.78170394897461, -9.164678573608398, -8.547653198242188, -7.930628776550293, -7.31360387802124, -6.6965789794921875, -6.079554080963135, -5.462529182434082, -4.845504283905029, -4.228479385375977, -3.611454486846924, -2.994429588317871, -2.3774046897888184, -1.7603778839111328, -1.14335298538208, -0.5263280868530273, 0.09069681167602539, 0.7077217102050781, 1.3247466087341309, 1.9417715072631836, 2.5587964057922363, 3.175821304321289, 3.792846202850342, 4.4098711013793945, 5.026895999908447, 5.6439208984375, 6.260945796966553, 6.8779706954956055, 7.494995594024658, 8.112020492553711, 8.729045867919922, 9.346070289611816, 9.963094711303711, 10.580120086669922, 11.197145462036133, 11.814169883728027, 12.431194305419922, 13.048219680786133, 13.665245056152344, 14.282269477844238, 14.899293899536133, 15.516319274902344, 16.133344650268555, 16.750370025634766, 17.367393493652344, 17.984418869018555]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 6.0, 8.0, 8.0, 19.0, 40.0, 66.0, 96.0, 142.0, 241.0, 389.0, 651.0, 1031.0, 1674.0, 2717.0, 4508.0, 6879.0, 11073.0, 17145.0, 27290.0, 42491.0, 64995.0, 97653.0, 144083.0, 205704.0, 280755.0, 359132.0, 427700.0, 465213.0, 458787.0, 410538.0, 338673.0, 259786.0, 187597.0, 130275.0, 87671.0, 57636.0, 37533.0, 24131.0, 15153.0, 9439.0, 5976.0, 3579.0, 2302.0, 1407.0, 803.0, 496.0, 328.0, 218.0, 103.0, 61.0, 45.0, 18.0, 12.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-13.65625, -13.2275390625, -12.798828125, -12.3701171875, -11.94140625, -11.5126953125, -11.083984375, -10.6552734375, -10.2265625, -9.7978515625, -9.369140625, -8.9404296875, -8.51171875, -8.0830078125, -7.654296875, -7.2255859375, -6.796875, -6.3681640625, -5.939453125, -5.5107421875, -5.08203125, -4.6533203125, -4.224609375, -3.7958984375, -3.3671875, -2.9384765625, -2.509765625, -2.0810546875, -1.65234375, -1.2236328125, -0.794921875, -0.3662109375, 0.0625, 0.4912109375, 0.919921875, 1.3486328125, 1.77734375, 2.2060546875, 2.634765625, 3.0634765625, 3.4921875, 3.9208984375, 4.349609375, 4.7783203125, 5.20703125, 5.6357421875, 6.064453125, 6.4931640625, 6.921875, 7.3505859375, 7.779296875, 8.2080078125, 8.63671875, 9.0654296875, 9.494140625, 9.9228515625, 10.3515625, 10.7802734375, 11.208984375, 11.6376953125, 12.06640625, 12.4951171875, 12.923828125, 13.3525390625, 13.78125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 10.0, 10.0, 11.0, 11.0, 20.0, 19.0, 24.0, 14.0, 23.0, 32.0, 30.0, 39.0, 36.0, 36.0, 29.0, 37.0, 36.0, 44.0, 49.0, 39.0, 45.0, 32.0, 36.0, 36.0, 36.0, 31.0, 23.0, 36.0, 22.0, 25.0, 21.0, 9.0, 19.0, 11.0, 9.0, 8.0, 7.0, 9.0, 6.0, 1.0, 1.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.665771484375, -15.17529296875, -14.684814453125, -14.1943359375, -13.703857421875, -13.21337890625, -12.722900390625, -12.232421875, -11.741943359375, -11.25146484375, -10.760986328125, -10.2705078125, -9.780029296875, -9.28955078125, -8.799072265625, -8.30859375, -7.818115234375, -7.32763671875, -6.837158203125, -6.3466796875, -5.856201171875, -5.36572265625, -4.875244140625, -4.384765625, -3.894287109375, -3.40380859375, -2.913330078125, -2.4228515625, -1.932373046875, -1.44189453125, -0.951416015625, -0.4609375, 0.029541015625, 0.52001953125, 1.010498046875, 1.5009765625, 1.991455078125, 2.48193359375, 2.972412109375, 3.462890625, 3.953369140625, 4.44384765625, 4.934326171875, 5.4248046875, 5.915283203125, 6.40576171875, 6.896240234375, 7.38671875, 7.877197265625, 8.36767578125, 8.858154296875, 9.3486328125, 9.839111328125, 10.32958984375, 10.820068359375, 11.310546875, 11.801025390625, 12.29150390625, 12.781982421875, 13.2724609375, 13.762939453125, 14.25341796875, 14.743896484375, 15.234375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 10.0, 7.0, 15.0, 29.0, 47.0, 103.0, 170.0, 290.0, 556.0, 905.0, 1533.0, 2806.0, 4833.0, 8412.0, 14313.0, 23750.0, 38852.0, 62052.0, 95152.0, 142542.0, 203074.0, 273146.0, 345539.0, 408333.0, 444954.0, 448352.0, 413384.0, 353292.0, 281967.0, 210228.0, 148638.0, 100349.0, 65110.0, 40765.0, 24802.0, 15086.0, 8840.0, 5249.0, 2974.0, 1637.0, 921.0, 550.0, 301.0, 196.0, 101.0, 59.0, 25.0, 20.0, 11.0, 3.0, 10.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.3203125, -13.8870849609375, -13.453857421875, -13.0206298828125, -12.58740234375, -12.1541748046875, -11.720947265625, -11.2877197265625, -10.8544921875, -10.4212646484375, -9.988037109375, -9.5548095703125, -9.12158203125, -8.6883544921875, -8.255126953125, -7.8218994140625, -7.388671875, -6.9554443359375, -6.522216796875, -6.0889892578125, -5.65576171875, -5.2225341796875, -4.789306640625, -4.3560791015625, -3.9228515625, -3.4896240234375, -3.056396484375, -2.6231689453125, -2.18994140625, -1.7567138671875, -1.323486328125, -0.8902587890625, -0.45703125, -0.0238037109375, 0.409423828125, 0.8426513671875, 1.27587890625, 1.7091064453125, 2.142333984375, 2.5755615234375, 3.0087890625, 3.4420166015625, 3.875244140625, 4.3084716796875, 4.74169921875, 5.1749267578125, 5.608154296875, 6.0413818359375, 6.474609375, 6.9078369140625, 7.341064453125, 7.7742919921875, 8.20751953125, 8.6407470703125, 9.073974609375, 9.5072021484375, 9.9404296875, 10.3736572265625, 10.806884765625, 11.2401123046875, 11.67333984375, 12.1065673828125, 12.539794921875, 12.9730224609375, 13.40625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 12.0, 9.0, 16.0, 20.0, 28.0, 28.0, 45.0, 45.0, 51.0, 69.0, 94.0, 89.0, 105.0, 127.0, 156.0, 187.0, 194.0, 176.0, 206.0, 204.0, 215.0, 218.0, 193.0, 214.0, 197.0, 167.0, 146.0, 130.0, 120.0, 117.0, 98.0, 73.0, 56.0, 54.0, 52.0, 35.0, 24.0, 20.0, 18.0, 10.0, 15.0, 8.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.1875, -7.9456787109375, -7.703857421875, -7.4620361328125, -7.22021484375, -6.9783935546875, -6.736572265625, -6.4947509765625, -6.2529296875, -6.0111083984375, -5.769287109375, -5.5274658203125, -5.28564453125, -5.0438232421875, -4.802001953125, -4.5601806640625, -4.318359375, -4.0765380859375, -3.834716796875, -3.5928955078125, -3.35107421875, -3.1092529296875, -2.867431640625, -2.6256103515625, -2.3837890625, -2.1419677734375, -1.900146484375, -1.6583251953125, -1.41650390625, -1.1746826171875, -0.932861328125, -0.6910400390625, -0.44921875, -0.2073974609375, 0.034423828125, 0.2762451171875, 0.51806640625, 0.7598876953125, 1.001708984375, 1.2435302734375, 1.4853515625, 1.7271728515625, 1.968994140625, 2.2108154296875, 2.45263671875, 2.6944580078125, 2.936279296875, 3.1781005859375, 3.419921875, 3.6617431640625, 3.903564453125, 4.1453857421875, 4.38720703125, 4.6290283203125, 4.870849609375, 5.1126708984375, 5.3544921875, 5.5963134765625, 5.838134765625, 6.0799560546875, 6.32177734375, 6.5635986328125, 6.805419921875, 7.0472412109375, 7.2890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 11.0, 6.0, 14.0, 7.0, 17.0, 30.0, 27.0, 29.0, 25.0, 45.0, 30.0, 47.0, 51.0, 68.0, 48.0, 61.0, 61.0, 45.0, 56.0, 45.0, 41.0, 46.0, 35.0, 26.0, 30.0, 27.0, 8.0, 11.0, 5.0, 9.0, 13.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.800466537475586, -19.15241241455078, -18.504356384277344, -17.85630226135254, -17.2082462310791, -16.560192108154297, -15.912137031555176, -15.264081954956055, -14.616026878356934, -13.967971801757812, -13.319916725158691, -12.67186164855957, -12.023807525634766, -11.375751495361328, -10.727697372436523, -10.079642295837402, -9.431587219238281, -8.78353214263916, -8.135477066040039, -7.487422466278076, -6.839367389678955, -6.191312313079834, -5.543257713317871, -4.89520263671875, -4.247147560119629, -3.599092483520508, -2.951037645339966, -2.302982807159424, -1.6549277305603027, -1.0068726539611816, -0.35881781578063965, 0.28923702239990234, 0.9372940063476562, 1.5853489637374878, 2.2334039211273193, 2.8814587593078613, 3.5295138359069824, 4.1775689125061035, 4.825623512268066, 5.4736785888671875, 6.121733665466309, 6.76978874206543, 7.417843818664551, 8.065898895263672, 8.713953018188477, 9.362009048461914, 10.010063171386719, 10.65811824798584, 11.306173324584961, 11.954228401184082, 12.602283477783203, 13.250338554382324, 13.898393630981445, 14.54644775390625, 15.194502830505371, 15.842557907104492, 16.490612030029297, 17.1386661529541, 17.78672218322754, 18.434776306152344, 19.08283233642578, 19.730886459350586, 20.378942489624023, 21.026996612548828, 21.675052642822266]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 2.0, 2.0, 5.0, 10.0, 12.0, 5.0, 11.0, 16.0, 16.0, 15.0, 16.0, 23.0, 23.0, 28.0, 34.0, 33.0, 48.0, 32.0, 43.0, 49.0, 42.0, 36.0, 33.0, 39.0, 42.0, 41.0, 37.0, 30.0, 36.0, 38.0, 38.0, 20.0, 33.0, 17.0, 20.0, 18.0, 16.0, 10.0, 10.0, 9.0, 7.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.51458740234375, -19.896921157836914, -19.279253005981445, -18.66158676147461, -18.04391860961914, -17.426252365112305, -16.808584213256836, -16.19091796875, -15.573250770568848, -14.955583572387695, -14.337916374206543, -13.72024917602539, -13.102582931518555, -12.484914779663086, -11.86724853515625, -11.249581336975098, -10.631914138793945, -10.014246940612793, -9.39657974243164, -8.778912544250488, -8.161245346069336, -7.543578624725342, -6.925911903381348, -6.308244705200195, -5.690577507019043, -5.072910308837891, -4.455243110656738, -3.837576389312744, -3.219909191131592, -2.6022419929504395, -1.9845750331878662, -1.366908073425293, -0.7492408752441406, -0.13157379627227783, 0.48609328269958496, 1.1037603616714478, 1.7214274406433105, 2.339094638824463, 2.956761598587036, 3.5744285583496094, 4.192095756530762, 4.809762954711914, 5.427430152893066, 6.0450968742370605, 6.662764072418213, 7.280431270599365, 7.898097991943359, 8.515765190124512, 9.133432388305664, 9.751099586486816, 10.368766784667969, 10.986433982849121, 11.604101181030273, 12.22176742553711, 12.839434623718262, 13.457101821899414, 14.074769020080566, 14.692436218261719, 15.310103416442871, 15.927770614624023, 16.54543685913086, 17.163105010986328, 17.780771255493164, 18.3984375, 19.01610565185547]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 12.0, 15.0, 45.0, 45.0, 67.0, 94.0, 129.0, 199.0, 311.0, 380.0, 602.0, 857.0, 1168.0, 1694.0, 2515.0, 3724.0, 5178.0, 7746.0, 11387.0, 17138.0, 25948.0, 39814.0, 63043.0, 100954.0, 158685.0, 197439.0, 147692.0, 91621.0, 58352.0, 37259.0, 24537.0, 15954.0, 10707.0, 7368.0, 4916.0, 3372.0, 2345.0, 1565.0, 1113.0, 824.0, 556.0, 398.0, 249.0, 162.0, 125.0, 81.0, 56.0, 33.0, 26.0, 11.0, 12.0, 12.0, 6.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.904296875, -2.814697265625, -2.72509765625, -2.635498046875, -2.5458984375, -2.456298828125, -2.36669921875, -2.277099609375, -2.1875, -2.097900390625, -2.00830078125, -1.918701171875, -1.8291015625, -1.739501953125, -1.64990234375, -1.560302734375, -1.470703125, -1.381103515625, -1.29150390625, -1.201904296875, -1.1123046875, -1.022705078125, -0.93310546875, -0.843505859375, -0.75390625, -0.664306640625, -0.57470703125, -0.485107421875, -0.3955078125, -0.305908203125, -0.21630859375, -0.126708984375, -0.037109375, 0.052490234375, 0.14208984375, 0.231689453125, 0.3212890625, 0.410888671875, 0.50048828125, 0.590087890625, 0.6796875, 0.769287109375, 0.85888671875, 0.948486328125, 1.0380859375, 1.127685546875, 1.21728515625, 1.306884765625, 1.396484375, 1.486083984375, 1.57568359375, 1.665283203125, 1.7548828125, 1.844482421875, 1.93408203125, 2.023681640625, 2.11328125, 2.202880859375, 2.29248046875, 2.382080078125, 2.4716796875, 2.561279296875, 2.65087890625, 2.740478515625, 2.830078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 6.0, 3.0, 8.0, 10.0, 15.0, 12.0, 12.0, 6.0, 20.0, 24.0, 24.0, 28.0, 31.0, 26.0, 36.0, 41.0, 35.0, 30.0, 33.0, 40.0, 32.0, 39.0, 38.0, 41.0, 29.0, 43.0, 31.0, 29.0, 37.0, 29.0, 27.0, 37.0, 23.0, 21.0, 13.0, 13.0, 19.0, 13.0, 7.0, 5.0, 5.0, 4.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-19.796875, -19.217529296875, -18.63818359375, -18.058837890625, -17.4794921875, -16.900146484375, -16.32080078125, -15.741455078125, -15.162109375, -14.582763671875, -14.00341796875, -13.424072265625, -12.8447265625, -12.265380859375, -11.68603515625, -11.106689453125, -10.52734375, -9.947998046875, -9.36865234375, -8.789306640625, -8.2099609375, -7.630615234375, -7.05126953125, -6.471923828125, -5.892578125, -5.313232421875, -4.73388671875, -4.154541015625, -3.5751953125, -2.995849609375, -2.41650390625, -1.837158203125, -1.2578125, -0.678466796875, -0.09912109375, 0.480224609375, 1.0595703125, 1.638916015625, 2.21826171875, 2.797607421875, 3.376953125, 3.956298828125, 4.53564453125, 5.114990234375, 5.6943359375, 6.273681640625, 6.85302734375, 7.432373046875, 8.01171875, 8.591064453125, 9.17041015625, 9.749755859375, 10.3291015625, 10.908447265625, 11.48779296875, 12.067138671875, 12.646484375, 13.225830078125, 13.80517578125, 14.384521484375, 14.9638671875, 15.543212890625, 16.12255859375, 16.701904296875, 17.28125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 7.0, 8.0, 7.0, 10.0, 17.0, 21.0, 42.0, 63.0, 62.0, 101.0, 147.0, 261.0, 352.0, 556.0, 781.0, 1220.0, 1827.0, 2811.0, 4199.0, 6427.0, 9930.0, 15313.0, 24128.0, 37988.0, 62263.0, 103194.0, 173169.0, 216582.0, 149848.0, 89236.0, 54052.0, 33516.0, 21006.0, 13578.0, 8685.0, 5834.0, 3780.0, 2485.0, 1678.0, 1094.0, 677.0, 511.0, 359.0, 245.0, 169.0, 107.0, 71.0, 51.0, 36.0, 24.0, 12.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0], "bins": [-2.61328125, -2.529937744140625, -2.44659423828125, -2.363250732421875, -2.2799072265625, -2.196563720703125, -2.11322021484375, -2.029876708984375, -1.946533203125, -1.863189697265625, -1.77984619140625, -1.696502685546875, -1.6131591796875, -1.529815673828125, -1.44647216796875, -1.363128662109375, -1.27978515625, -1.196441650390625, -1.11309814453125, -1.029754638671875, -0.9464111328125, -0.863067626953125, -0.77972412109375, -0.696380615234375, -0.613037109375, -0.529693603515625, -0.44635009765625, -0.363006591796875, -0.2796630859375, -0.196319580078125, -0.11297607421875, -0.029632568359375, 0.0537109375, 0.137054443359375, 0.22039794921875, 0.303741455078125, 0.3870849609375, 0.470428466796875, 0.55377197265625, 0.637115478515625, 0.720458984375, 0.803802490234375, 0.88714599609375, 0.970489501953125, 1.0538330078125, 1.137176513671875, 1.22052001953125, 1.303863525390625, 1.38720703125, 1.470550537109375, 1.55389404296875, 1.637237548828125, 1.7205810546875, 1.803924560546875, 1.88726806640625, 1.970611572265625, 2.053955078125, 2.137298583984375, 2.22064208984375, 2.303985595703125, 2.3873291015625, 2.470672607421875, 2.55401611328125, 2.637359619140625, 2.720703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 15.0, 9.0, 12.0, 12.0, 18.0, 14.0, 12.0, 15.0, 19.0, 28.0, 37.0, 31.0, 35.0, 36.0, 46.0, 40.0, 38.0, 31.0, 32.0, 40.0, 49.0, 39.0, 51.0, 32.0, 33.0, 31.0, 28.0, 29.0, 28.0, 14.0, 28.0, 19.0, 15.0, 13.0, 17.0, 12.0, 5.0, 8.0, 5.0, 7.0, 0.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-12.1171875, -11.7501220703125, -11.383056640625, -11.0159912109375, -10.64892578125, -10.2818603515625, -9.914794921875, -9.5477294921875, -9.1806640625, -8.8135986328125, -8.446533203125, -8.0794677734375, -7.71240234375, -7.3453369140625, -6.978271484375, -6.6112060546875, -6.244140625, -5.8770751953125, -5.510009765625, -5.1429443359375, -4.77587890625, -4.4088134765625, -4.041748046875, -3.6746826171875, -3.3076171875, -2.9405517578125, -2.573486328125, -2.2064208984375, -1.83935546875, -1.4722900390625, -1.105224609375, -0.7381591796875, -0.37109375, -0.0040283203125, 0.363037109375, 0.7301025390625, 1.09716796875, 1.4642333984375, 1.831298828125, 2.1983642578125, 2.5654296875, 2.9324951171875, 3.299560546875, 3.6666259765625, 4.03369140625, 4.4007568359375, 4.767822265625, 5.1348876953125, 5.501953125, 5.8690185546875, 6.236083984375, 6.6031494140625, 6.97021484375, 7.3372802734375, 7.704345703125, 8.0714111328125, 8.4384765625, 8.8055419921875, 9.172607421875, 9.5396728515625, 9.90673828125, 10.2738037109375, 10.640869140625, 11.0079345703125, 11.375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 10.0, 10.0, 12.0, 22.0, 42.0, 32.0, 75.0, 89.0, 129.0, 198.0, 253.0, 352.0, 567.0, 800.0, 1159.0, 1830.0, 2825.0, 4425.0, 6961.0, 11390.0, 19355.0, 34119.0, 63647.0, 134668.0, 318263.0, 233029.0, 97268.0, 48522.0, 26813.0, 15813.0, 9304.0, 5812.0, 3707.0, 2304.0, 1486.0, 1045.0, 688.0, 450.0, 317.0, 211.0, 155.0, 119.0, 85.0, 50.0, 37.0, 33.0, 19.0, 11.0, 10.0, 12.0, 5.0, 6.0, 7.0, 2.0, 1.0, 2.0], "bins": [-0.171630859375, -0.1663970947265625, -0.161163330078125, -0.1559295654296875, -0.15069580078125, -0.1454620361328125, -0.140228271484375, -0.1349945068359375, -0.1297607421875, -0.1245269775390625, -0.119293212890625, -0.1140594482421875, -0.10882568359375, -0.1035919189453125, -0.098358154296875, -0.0931243896484375, -0.087890625, -0.0826568603515625, -0.077423095703125, -0.0721893310546875, -0.06695556640625, -0.0617218017578125, -0.056488037109375, -0.0512542724609375, -0.0460205078125, -0.0407867431640625, -0.035552978515625, -0.0303192138671875, -0.02508544921875, -0.0198516845703125, -0.014617919921875, -0.0093841552734375, -0.004150390625, 0.0010833740234375, 0.006317138671875, 0.0115509033203125, 0.01678466796875, 0.0220184326171875, 0.027252197265625, 0.0324859619140625, 0.0377197265625, 0.0429534912109375, 0.048187255859375, 0.0534210205078125, 0.05865478515625, 0.0638885498046875, 0.069122314453125, 0.0743560791015625, 0.07958984375, 0.0848236083984375, 0.090057373046875, 0.0952911376953125, 0.10052490234375, 0.1057586669921875, 0.110992431640625, 0.1162261962890625, 0.1214599609375, 0.1266937255859375, 0.131927490234375, 0.1371612548828125, 0.14239501953125, 0.1476287841796875, 0.152862548828125, 0.1580963134765625, 0.163330078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 3.0, 7.0, 8.0, 7.0, 12.0, 16.0, 18.0, 26.0, 25.0, 41.0, 40.0, 59.0, 51.0, 76.0, 58.0, 69.0, 72.0, 67.0, 64.0, 38.0, 51.0, 49.0, 28.0, 22.0, 27.0, 16.0, 22.0, 13.0, 8.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4928321838378906e-05, -3.3882446587085724e-05, -3.283657133579254e-05, -3.179069608449936e-05, -3.074482083320618e-05, -2.9698945581912994e-05, -2.8653070330619812e-05, -2.760719507932663e-05, -2.6561319828033447e-05, -2.5515444576740265e-05, -2.4469569325447083e-05, -2.34236940741539e-05, -2.2377818822860718e-05, -2.1331943571567535e-05, -2.0286068320274353e-05, -1.924019306898117e-05, -1.8194317817687988e-05, -1.7148442566394806e-05, -1.6102567315101624e-05, -1.5056692063808441e-05, -1.4010816812515259e-05, -1.2964941561222076e-05, -1.1919066309928894e-05, -1.0873191058635712e-05, -9.82731580734253e-06, -8.781440556049347e-06, -7.735565304756165e-06, -6.689690053462982e-06, -5.6438148021698e-06, -4.5979395508766174e-06, -3.552064299583435e-06, -2.5061890482902527e-06, -1.4603137969970703e-06, -4.1443854570388794e-07, 6.314367055892944e-07, 1.6773119568824768e-06, 2.723187208175659e-06, 3.7690624594688416e-06, 4.814937710762024e-06, 5.860812962055206e-06, 6.906688213348389e-06, 7.952563464641571e-06, 8.998438715934753e-06, 1.0044313967227936e-05, 1.1090189218521118e-05, 1.21360644698143e-05, 1.3181939721107483e-05, 1.4227814972400665e-05, 1.5273690223693848e-05, 1.631956547498703e-05, 1.7365440726280212e-05, 1.8411315977573395e-05, 1.9457191228866577e-05, 2.050306648015976e-05, 2.1548941731452942e-05, 2.2594816982746124e-05, 2.3640692234039307e-05, 2.468656748533249e-05, 2.573244273662567e-05, 2.6778317987918854e-05, 2.7824193239212036e-05, 2.887006849050522e-05, 2.99159437417984e-05, 3.096181899309158e-05, 3.2007694244384766e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 4.0, 6.0, 8.0, 11.0, 8.0, 18.0, 17.0, 29.0, 29.0, 62.0, 75.0, 91.0, 134.0, 167.0, 259.0, 369.0, 461.0, 718.0, 959.0, 1456.0, 2216.0, 3410.0, 5446.0, 8903.0, 14855.0, 26149.0, 47141.0, 91489.0, 207895.0, 338681.0, 139744.0, 68229.0, 36652.0, 20621.0, 11820.0, 7131.0, 4469.0, 2819.0, 1809.0, 1241.0, 828.0, 597.0, 411.0, 311.0, 242.0, 151.0, 116.0, 77.0, 52.0, 54.0, 32.0, 23.0, 19.0, 11.0, 10.0, 9.0, 4.0, 3.0, 4.0, 6.0, 3.0], "bins": [-0.415771484375, -0.40289306640625, -0.3900146484375, -0.37713623046875, -0.3642578125, -0.35137939453125, -0.3385009765625, -0.32562255859375, -0.312744140625, -0.29986572265625, -0.2869873046875, -0.27410888671875, -0.26123046875, -0.24835205078125, -0.2354736328125, -0.22259521484375, -0.209716796875, -0.19683837890625, -0.1839599609375, -0.17108154296875, -0.158203125, -0.14532470703125, -0.1324462890625, -0.11956787109375, -0.106689453125, -0.09381103515625, -0.0809326171875, -0.06805419921875, -0.05517578125, -0.04229736328125, -0.0294189453125, -0.01654052734375, -0.003662109375, 0.00921630859375, 0.0220947265625, 0.03497314453125, 0.0478515625, 0.06072998046875, 0.0736083984375, 0.08648681640625, 0.099365234375, 0.11224365234375, 0.1251220703125, 0.13800048828125, 0.15087890625, 0.16375732421875, 0.1766357421875, 0.18951416015625, 0.202392578125, 0.21527099609375, 0.2281494140625, 0.24102783203125, 0.25390625, 0.26678466796875, 0.2796630859375, 0.29254150390625, 0.305419921875, 0.31829833984375, 0.3311767578125, 0.34405517578125, 0.35693359375, 0.36981201171875, 0.3826904296875, 0.39556884765625, 0.408447265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 8.0, 9.0, 8.0, 14.0, 20.0, 16.0, 27.0, 23.0, 41.0, 51.0, 71.0, 81.0, 94.0, 92.0, 85.0, 62.0, 53.0, 40.0, 46.0, 34.0, 31.0, 15.0, 14.0, 13.0, 11.0, 11.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130859375, -0.1268157958984375, -0.122772216796875, -0.1187286376953125, -0.11468505859375, -0.1106414794921875, -0.106597900390625, -0.1025543212890625, -0.0985107421875, -0.0944671630859375, -0.090423583984375, -0.0863800048828125, -0.08233642578125, -0.0782928466796875, -0.074249267578125, -0.0702056884765625, -0.066162109375, -0.0621185302734375, -0.058074951171875, -0.0540313720703125, -0.04998779296875, -0.0459442138671875, -0.041900634765625, -0.0378570556640625, -0.0338134765625, -0.0297698974609375, -0.025726318359375, -0.0216827392578125, -0.01763916015625, -0.0135955810546875, -0.009552001953125, -0.0055084228515625, -0.00146484375, 0.0025787353515625, 0.006622314453125, 0.0106658935546875, 0.01470947265625, 0.0187530517578125, 0.022796630859375, 0.0268402099609375, 0.0308837890625, 0.0349273681640625, 0.038970947265625, 0.0430145263671875, 0.04705810546875, 0.0511016845703125, 0.055145263671875, 0.0591888427734375, 0.063232421875, 0.0672760009765625, 0.071319580078125, 0.0753631591796875, 0.07940673828125, 0.0834503173828125, 0.087493896484375, 0.0915374755859375, 0.0955810546875, 0.0996246337890625, 0.103668212890625, 0.1077117919921875, 0.11175537109375, 0.1157989501953125, 0.119842529296875, 0.1238861083984375, 0.1279296875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 9.0, 6.0, 15.0, 10.0, 17.0, 27.0, 31.0, 22.0, 30.0, 39.0, 35.0, 52.0, 52.0, 63.0, 47.0, 61.0, 61.0, 46.0, 59.0, 46.0, 44.0, 37.0, 32.0, 28.0, 33.0, 22.0, 10.0, 11.0, 9.0, 8.0, 11.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.753684997558594, -19.107946395874023, -18.462209701538086, -17.816471099853516, -17.170734405517578, -16.524995803833008, -15.879258155822754, -15.2335205078125, -14.587782859802246, -13.942045211791992, -13.296307563781738, -12.650569915771484, -12.004831314086914, -11.359094619750977, -10.713356018066406, -10.067618370056152, -9.421880722045898, -8.776143074035645, -8.13040542602539, -7.4846673011779785, -6.838929653167725, -6.193192005157471, -5.547453880310059, -4.901716232299805, -4.255978584289551, -3.610240936279297, -2.964503049850464, -2.318765163421631, -1.673027515411377, -1.027289867401123, -0.38155198097229004, 0.26418590545654297, 0.9099235534667969, 1.5556613206863403, 2.201399087905884, 2.847136974334717, 3.4928746223449707, 4.138612270355225, 4.784350395202637, 5.430088043212891, 6.0758256912231445, 6.721563339233398, 7.367300987243652, 8.013038635253906, 8.658777236938477, 9.304513931274414, 9.950252532958984, 10.595990180969238, 11.241727828979492, 11.887465476989746, 12.533203125, 13.178940773010254, 13.824678421020508, 14.470417022705078, 15.116154670715332, 15.761892318725586, 16.407630920410156, 17.053369522094727, 17.699106216430664, 18.344844818115234, 18.990581512451172, 19.636320114135742, 20.28205680847168, 20.92779541015625, 21.573532104492188]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 2.0, 2.0, 5.0, 11.0, 10.0, 6.0, 11.0, 14.0, 18.0, 15.0, 15.0, 25.0, 23.0, 26.0, 34.0, 34.0, 46.0, 34.0, 43.0, 51.0, 38.0, 38.0, 33.0, 39.0, 46.0, 38.0, 37.0, 29.0, 37.0, 35.0, 38.0, 24.0, 31.0, 17.0, 20.0, 16.0, 19.0, 9.0, 10.0, 9.0, 7.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.323606491088867, -19.70870018005371, -19.093795776367188, -18.47888946533203, -17.863983154296875, -17.24907684326172, -16.634172439575195, -16.01926612854004, -15.404359817504883, -14.789454460144043, -14.174548149108887, -13.559642791748047, -12.94473648071289, -12.32983112335205, -11.714925765991211, -11.100019454956055, -10.485114097595215, -9.870208740234375, -9.255302429199219, -8.640397071838379, -8.025490760803223, -7.410585403442383, -6.795679569244385, -6.180773735046387, -5.565867900848389, -4.950962066650391, -4.336056232452393, -3.7211506366729736, -3.1062448024749756, -2.4913389682769775, -1.8764333724975586, -1.2615275382995605, -0.6466217041015625, -0.03171592950820923, 0.583189845085144, 1.1980955600738525, 1.8130013942718506, 2.4279072284698486, 3.0428128242492676, 3.6577186584472656, 4.272624492645264, 4.887530326843262, 5.50243616104126, 6.117341995239258, 6.732247352600098, 7.347153663635254, 7.962059020996094, 8.57696533203125, 9.19187068939209, 9.80677604675293, 10.421682357788086, 11.036587715148926, 11.651494026184082, 12.266399383544922, 12.881305694580078, 13.496211051940918, 14.111116409301758, 14.726021766662598, 15.340928077697754, 15.955833435058594, 16.57073974609375, 17.185646057128906, 17.80055046081543, 18.415456771850586, 19.030363082885742]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 7.0, 6.0, 8.0, 15.0, 23.0, 39.0, 66.0, 118.0, 148.0, 271.0, 380.0, 625.0, 980.0, 1503.0, 2258.0, 3723.0, 5560.0, 8663.0, 12581.0, 18700.0, 26827.0, 37164.0, 49549.0, 64844.0, 78285.0, 90931.0, 98786.0, 100507.0, 95751.0, 84444.0, 70423.0, 56255.0, 42556.0, 30906.0, 21690.0, 15041.0, 9879.0, 6672.0, 4342.0, 2917.0, 1759.0, 1232.0, 765.0, 506.0, 309.0, 195.0, 129.0, 88.0, 46.0, 35.0, 24.0, 18.0, 8.0, 6.0, 1.0, 1.0, 2.0], "bins": [-12.1328125, -11.7781982421875, -11.423583984375, -11.0689697265625, -10.71435546875, -10.3597412109375, -10.005126953125, -9.6505126953125, -9.2958984375, -8.9412841796875, -8.586669921875, -8.2320556640625, -7.87744140625, -7.5228271484375, -7.168212890625, -6.8135986328125, -6.458984375, -6.1043701171875, -5.749755859375, -5.3951416015625, -5.04052734375, -4.6859130859375, -4.331298828125, -3.9766845703125, -3.6220703125, -3.2674560546875, -2.912841796875, -2.5582275390625, -2.20361328125, -1.8489990234375, -1.494384765625, -1.1397705078125, -0.78515625, -0.4305419921875, -0.075927734375, 0.2786865234375, 0.63330078125, 0.9879150390625, 1.342529296875, 1.6971435546875, 2.0517578125, 2.4063720703125, 2.760986328125, 3.1156005859375, 3.47021484375, 3.8248291015625, 4.179443359375, 4.5340576171875, 4.888671875, 5.2432861328125, 5.597900390625, 5.9525146484375, 6.30712890625, 6.6617431640625, 7.016357421875, 7.3709716796875, 7.7255859375, 8.0802001953125, 8.434814453125, 8.7894287109375, 9.14404296875, 9.4986572265625, 9.853271484375, 10.2078857421875, 10.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 2.0, 5.0, 10.0, 7.0, 9.0, 11.0, 7.0, 19.0, 16.0, 25.0, 20.0, 17.0, 24.0, 28.0, 39.0, 44.0, 30.0, 27.0, 34.0, 38.0, 49.0, 33.0, 38.0, 37.0, 39.0, 40.0, 27.0, 31.0, 34.0, 33.0, 33.0, 15.0, 35.0, 19.0, 26.0, 16.0, 11.0, 16.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 6.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.625, -18.061767578125, -17.49853515625, -16.935302734375, -16.3720703125, -15.808837890625, -15.24560546875, -14.682373046875, -14.119140625, -13.555908203125, -12.99267578125, -12.429443359375, -11.8662109375, -11.302978515625, -10.73974609375, -10.176513671875, -9.61328125, -9.050048828125, -8.48681640625, -7.923583984375, -7.3603515625, -6.797119140625, -6.23388671875, -5.670654296875, -5.107421875, -4.544189453125, -3.98095703125, -3.417724609375, -2.8544921875, -2.291259765625, -1.72802734375, -1.164794921875, -0.6015625, -0.038330078125, 0.52490234375, 1.088134765625, 1.6513671875, 2.214599609375, 2.77783203125, 3.341064453125, 3.904296875, 4.467529296875, 5.03076171875, 5.593994140625, 6.1572265625, 6.720458984375, 7.28369140625, 7.846923828125, 8.41015625, 8.973388671875, 9.53662109375, 10.099853515625, 10.6630859375, 11.226318359375, 11.78955078125, 12.352783203125, 12.916015625, 13.479248046875, 14.04248046875, 14.605712890625, 15.1689453125, 15.732177734375, 16.29541015625, 16.858642578125, 17.421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [7.0, 5.0, 12.0, 13.0, 22.0, 49.0, 60.0, 88.0, 165.0, 223.0, 368.0, 506.0, 825.0, 1165.0, 1796.0, 2708.0, 3829.0, 5513.0, 8082.0, 11628.0, 16451.0, 22680.0, 30432.0, 40625.0, 51924.0, 63340.0, 74730.0, 83746.0, 89442.0, 90193.0, 86256.0, 77617.0, 66850.0, 55210.0, 44078.0, 33519.0, 25085.0, 17794.0, 12909.0, 9074.0, 6413.0, 4397.0, 2925.0, 1997.0, 1267.0, 851.0, 604.0, 395.0, 240.0, 155.0, 91.0, 69.0, 50.0, 44.0, 17.0, 16.0, 12.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.3515625, -9.03076171875, -8.7099609375, -8.38916015625, -8.068359375, -7.74755859375, -7.4267578125, -7.10595703125, -6.78515625, -6.46435546875, -6.1435546875, -5.82275390625, -5.501953125, -5.18115234375, -4.8603515625, -4.53955078125, -4.21875, -3.89794921875, -3.5771484375, -3.25634765625, -2.935546875, -2.61474609375, -2.2939453125, -1.97314453125, -1.65234375, -1.33154296875, -1.0107421875, -0.68994140625, -0.369140625, -0.04833984375, 0.2724609375, 0.59326171875, 0.9140625, 1.23486328125, 1.5556640625, 1.87646484375, 2.197265625, 2.51806640625, 2.8388671875, 3.15966796875, 3.48046875, 3.80126953125, 4.1220703125, 4.44287109375, 4.763671875, 5.08447265625, 5.4052734375, 5.72607421875, 6.046875, 6.36767578125, 6.6884765625, 7.00927734375, 7.330078125, 7.65087890625, 7.9716796875, 8.29248046875, 8.61328125, 8.93408203125, 9.2548828125, 9.57568359375, 9.896484375, 10.21728515625, 10.5380859375, 10.85888671875, 11.1796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 6.0, 10.0, 3.0, 9.0, 10.0, 10.0, 6.0, 9.0, 14.0, 20.0, 16.0, 20.0, 23.0, 21.0, 20.0, 37.0, 22.0, 35.0, 29.0, 28.0, 40.0, 24.0, 29.0, 33.0, 31.0, 33.0, 34.0, 35.0, 36.0, 29.0, 33.0, 29.0, 23.0, 21.0, 28.0, 24.0, 19.0, 17.0, 20.0, 16.0, 13.0, 8.0, 16.0, 7.0, 12.0, 6.0, 8.0, 5.0, 7.0, 4.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0], "bins": [-10.328125, -10.0126953125, -9.697265625, -9.3818359375, -9.06640625, -8.7509765625, -8.435546875, -8.1201171875, -7.8046875, -7.4892578125, -7.173828125, -6.8583984375, -6.54296875, -6.2275390625, -5.912109375, -5.5966796875, -5.28125, -4.9658203125, -4.650390625, -4.3349609375, -4.01953125, -3.7041015625, -3.388671875, -3.0732421875, -2.7578125, -2.4423828125, -2.126953125, -1.8115234375, -1.49609375, -1.1806640625, -0.865234375, -0.5498046875, -0.234375, 0.0810546875, 0.396484375, 0.7119140625, 1.02734375, 1.3427734375, 1.658203125, 1.9736328125, 2.2890625, 2.6044921875, 2.919921875, 3.2353515625, 3.55078125, 3.8662109375, 4.181640625, 4.4970703125, 4.8125, 5.1279296875, 5.443359375, 5.7587890625, 6.07421875, 6.3896484375, 6.705078125, 7.0205078125, 7.3359375, 7.6513671875, 7.966796875, 8.2822265625, 8.59765625, 8.9130859375, 9.228515625, 9.5439453125, 9.859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 12.0, 15.0, 36.0, 48.0, 82.0, 125.0, 186.0, 267.0, 424.0, 605.0, 944.0, 1521.0, 2424.0, 3984.0, 6123.0, 9508.0, 15156.0, 22577.0, 33953.0, 49389.0, 67398.0, 87527.0, 104621.0, 115470.0, 115398.0, 105852.0, 88348.0, 67941.0, 49748.0, 34042.0, 22977.0, 15107.0, 9737.0, 6090.0, 4019.0, 2413.0, 1555.0, 1062.0, 661.0, 445.0, 267.0, 186.0, 121.0, 63.0, 59.0, 24.0, 18.0, 10.0, 3.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 4.0], "bins": [-3.66015625, -3.5382080078125, -3.416259765625, -3.2943115234375, -3.17236328125, -3.0504150390625, -2.928466796875, -2.8065185546875, -2.6845703125, -2.5626220703125, -2.440673828125, -2.3187255859375, -2.19677734375, -2.0748291015625, -1.952880859375, -1.8309326171875, -1.708984375, -1.5870361328125, -1.465087890625, -1.3431396484375, -1.22119140625, -1.0992431640625, -0.977294921875, -0.8553466796875, -0.7333984375, -0.6114501953125, -0.489501953125, -0.3675537109375, -0.24560546875, -0.1236572265625, -0.001708984375, 0.1202392578125, 0.2421875, 0.3641357421875, 0.486083984375, 0.6080322265625, 0.72998046875, 0.8519287109375, 0.973876953125, 1.0958251953125, 1.2177734375, 1.3397216796875, 1.461669921875, 1.5836181640625, 1.70556640625, 1.8275146484375, 1.949462890625, 2.0714111328125, 2.193359375, 2.3153076171875, 2.437255859375, 2.5592041015625, 2.68115234375, 2.8031005859375, 2.925048828125, 3.0469970703125, 3.1689453125, 3.2908935546875, 3.412841796875, 3.5347900390625, 3.65673828125, 3.7786865234375, 3.900634765625, 4.0225830078125, 4.14453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 10.0, 8.0, 10.0, 14.0, 10.0, 17.0, 26.0, 24.0, 24.0, 30.0, 32.0, 33.0, 34.0, 36.0, 53.0, 50.0, 51.0, 44.0, 50.0, 50.0, 43.0, 43.0, 40.0, 31.0, 37.0, 30.0, 27.0, 34.0, 22.0, 21.0, 17.0, 5.0, 6.0, 8.0, 4.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004680156707763672, -0.00045404955744743347, -0.00044008344411849976, -0.00042611733078956604, -0.0004121512174606323, -0.0003981851041316986, -0.0003842189908027649, -0.0003702528774738312, -0.00035628676414489746, -0.00034232065081596375, -0.00032835453748703003, -0.0003143884241580963, -0.0003004223108291626, -0.0002864561975002289, -0.00027249008417129517, -0.00025852397084236145, -0.00024455785751342773, -0.00023059174418449402, -0.0002166256308555603, -0.0002026595175266266, -0.00018869340419769287, -0.00017472729086875916, -0.00016076117753982544, -0.00014679506421089172, -0.000132828950881958, -0.00011886283755302429, -0.00010489672422409058, -9.093061089515686e-05, -7.696449756622314e-05, -6.299838423728943e-05, -4.903227090835571e-05, -3.5066157579422e-05, -2.110004425048828e-05, -7.1339309215545654e-06, 6.83218240737915e-06, 2.0798295736312866e-05, 3.476440906524658e-05, 4.87305223941803e-05, 6.269663572311401e-05, 7.666274905204773e-05, 9.062886238098145e-05, 0.00010459497570991516, 0.00011856108903884888, 0.0001325272023677826, 0.0001464933156967163, 0.00016045942902565002, 0.00017442554235458374, 0.00018839165568351746, 0.00020235776901245117, 0.0002163238823413849, 0.0002302899956703186, 0.0002442561089992523, 0.00025822222232818604, 0.00027218833565711975, 0.00028615444898605347, 0.0003001205623149872, 0.0003140866756439209, 0.0003280527889728546, 0.00034201890230178833, 0.00035598501563072205, 0.00036995112895965576, 0.0003839172422885895, 0.0003978833556175232, 0.0004118494689464569, 0.0004258155822753906]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 4.0, 13.0, 25.0, 45.0, 69.0, 97.0, 147.0, 223.0, 401.0, 582.0, 921.0, 1501.0, 2435.0, 4031.0, 6626.0, 10669.0, 17254.0, 27499.0, 42566.0, 62790.0, 87169.0, 110564.0, 126278.0, 129335.0, 117116.0, 96053.0, 70929.0, 48892.0, 31905.0, 20082.0, 12517.0, 7608.0, 4706.0, 2800.0, 1760.0, 1079.0, 691.0, 423.0, 283.0, 161.0, 123.0, 62.0, 43.0, 18.0, 32.0, 6.0, 10.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2734375, -4.13177490234375, -3.9901123046875, -3.84844970703125, -3.706787109375, -3.56512451171875, -3.4234619140625, -3.28179931640625, -3.14013671875, -2.99847412109375, -2.8568115234375, -2.71514892578125, -2.573486328125, -2.43182373046875, -2.2901611328125, -2.14849853515625, -2.0068359375, -1.86517333984375, -1.7235107421875, -1.58184814453125, -1.440185546875, -1.29852294921875, -1.1568603515625, -1.01519775390625, -0.87353515625, -0.73187255859375, -0.5902099609375, -0.44854736328125, -0.306884765625, -0.16522216796875, -0.0235595703125, 0.11810302734375, 0.259765625, 0.40142822265625, 0.5430908203125, 0.68475341796875, 0.826416015625, 0.96807861328125, 1.1097412109375, 1.25140380859375, 1.39306640625, 1.53472900390625, 1.6763916015625, 1.81805419921875, 1.959716796875, 2.10137939453125, 2.2430419921875, 2.38470458984375, 2.5263671875, 2.66802978515625, 2.8096923828125, 2.95135498046875, 3.093017578125, 3.23468017578125, 3.3763427734375, 3.51800537109375, 3.65966796875, 3.80133056640625, 3.9429931640625, 4.08465576171875, 4.226318359375, 4.36798095703125, 4.5096435546875, 4.65130615234375, 4.79296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 9.0, 7.0, 13.0, 11.0, 12.0, 16.0, 24.0, 13.0, 25.0, 26.0, 34.0, 32.0, 33.0, 34.0, 48.0, 40.0, 49.0, 45.0, 48.0, 50.0, 56.0, 53.0, 43.0, 37.0, 26.0, 40.0, 23.0, 28.0, 17.0, 19.0, 14.0, 13.0, 8.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9931640625, -1.9305267333984375, -1.867889404296875, -1.8052520751953125, -1.74261474609375, -1.6799774169921875, -1.617340087890625, -1.5547027587890625, -1.4920654296875, -1.4294281005859375, -1.366790771484375, -1.3041534423828125, -1.24151611328125, -1.1788787841796875, -1.116241455078125, -1.0536041259765625, -0.990966796875, -0.9283294677734375, -0.865692138671875, -0.8030548095703125, -0.74041748046875, -0.6777801513671875, -0.615142822265625, -0.5525054931640625, -0.4898681640625, -0.4272308349609375, -0.364593505859375, -0.3019561767578125, -0.23931884765625, -0.1766815185546875, -0.114044189453125, -0.0514068603515625, 0.01123046875, 0.0738677978515625, 0.136505126953125, 0.1991424560546875, 0.26177978515625, 0.3244171142578125, 0.387054443359375, 0.4496917724609375, 0.5123291015625, 0.5749664306640625, 0.637603759765625, 0.7002410888671875, 0.76287841796875, 0.8255157470703125, 0.888153076171875, 0.9507904052734375, 1.013427734375, 1.0760650634765625, 1.138702392578125, 1.2013397216796875, 1.26397705078125, 1.3266143798828125, 1.389251708984375, 1.4518890380859375, 1.5145263671875, 1.5771636962890625, 1.639801025390625, 1.7024383544921875, 1.76507568359375, 1.8277130126953125, 1.890350341796875, 1.9529876708984375, 2.015625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 8.0, 6.0, 9.0, 12.0, 14.0, 17.0, 11.0, 19.0, 18.0, 28.0, 29.0, 41.0, 46.0, 43.0, 40.0, 44.0, 42.0, 55.0, 52.0, 53.0, 56.0, 51.0, 49.0, 31.0, 29.0, 26.0, 27.0, 20.0, 19.0, 23.0, 18.0, 11.0, 12.0, 8.0, 8.0, 4.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.630645751953125, -18.050676345825195, -17.470706939697266, -16.890737533569336, -16.310768127441406, -15.730798721313477, -15.150829315185547, -14.570859909057617, -13.990890502929688, -13.410921096801758, -12.830951690673828, -12.250982284545898, -11.671012878417969, -11.091043472290039, -10.51107406616211, -9.93110466003418, -9.351134300231934, -8.771164894104004, -8.191195487976074, -7.6112260818481445, -7.031256675720215, -6.451287269592285, -5.871317386627197, -5.291347980499268, -4.711378574371338, -4.131409168243408, -3.5514397621154785, -2.9714701175689697, -2.39150071144104, -1.8115313053131104, -1.2315616607666016, -0.6515922546386719, -0.07162284851074219, 0.5083466172218323, 1.0883160829544067, 1.668285608291626, 2.2482550144195557, 2.8282244205474854, 3.408194065093994, 3.988163471221924, 4.5681328773498535, 5.148102283477783, 5.728071689605713, 6.308041572570801, 6.8880109786987305, 7.46798038482666, 8.04794979095459, 8.62791919708252, 9.20788860321045, 9.787858009338379, 10.367827415466309, 10.947796821594238, 11.527766227722168, 12.107735633850098, 12.687705993652344, 13.267675399780273, 13.847644805908203, 14.427614212036133, 15.007583618164062, 15.587553024291992, 16.167522430419922, 16.74749183654785, 17.32746124267578, 17.90743064880371, 18.48740005493164]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 9.0, 10.0, 18.0, 25.0, 10.0, 18.0, 20.0, 25.0, 19.0, 27.0, 33.0, 33.0, 39.0, 39.0, 37.0, 42.0, 36.0, 33.0, 39.0, 32.0, 38.0, 44.0, 41.0, 34.0, 29.0, 37.0, 32.0, 22.0, 23.0, 27.0, 23.0, 15.0, 26.0, 9.0, 9.0, 5.0, 7.0, 7.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.912578582763672, -18.298572540283203, -17.6845645904541, -17.070558547973633, -16.45655059814453, -15.842544555664062, -15.228537559509277, -14.614530563354492, -14.000523567199707, -13.386516571044922, -12.772509574890137, -12.158502578735352, -11.544496536254883, -10.930488586425781, -10.316482543945312, -9.702475547790527, -9.088468551635742, -8.474461555480957, -7.860454559326172, -7.246448040008545, -6.63244104385376, -6.018434047698975, -5.404427528381348, -4.7904205322265625, -4.176413536071777, -3.562406539916992, -2.948399782180786, -2.33439302444458, -1.720386028289795, -1.1063790321350098, -0.4923722743988037, 0.12163448333740234, 0.7356395721435547, 1.3496464490890503, 1.963653326034546, 2.577660083770752, 3.191667079925537, 3.8056740760803223, 4.419680595397949, 5.033687591552734, 5.6476945877075195, 6.261701583862305, 6.87570858001709, 7.489715099334717, 8.103721618652344, 8.717729568481445, 9.331735610961914, 9.9457426071167, 10.559749603271484, 11.17375659942627, 11.787763595581055, 12.40177059173584, 13.015777587890625, 13.629783630371094, 14.243790626525879, 14.857797622680664, 15.47180461883545, 16.085811614990234, 16.699817657470703, 17.313825607299805, 17.927831649780273, 18.541839599609375, 19.155845642089844, 19.769851684570312, 20.383859634399414]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 6.0, 11.0, 34.0, 39.0, 100.0, 156.0, 257.0, 452.0, 747.0, 1198.0, 2097.0, 3556.0, 5996.0, 10343.0, 16886.0, 27958.0, 44940.0, 72153.0, 111810.0, 166500.0, 239409.0, 322277.0, 407163.0, 467205.0, 487982.0, 458313.0, 389800.0, 305592.0, 223747.0, 155079.0, 102291.0, 66150.0, 41300.0, 25569.0, 15396.0, 8960.0, 5391.0, 3198.0, 1740.0, 1008.0, 655.0, 347.0, 185.0, 112.0, 58.0, 53.0, 30.0, 10.0, 11.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.234375, -13.7950439453125, -13.355712890625, -12.9163818359375, -12.47705078125, -12.0377197265625, -11.598388671875, -11.1590576171875, -10.7197265625, -10.2803955078125, -9.841064453125, -9.4017333984375, -8.96240234375, -8.5230712890625, -8.083740234375, -7.6444091796875, -7.205078125, -6.7657470703125, -6.326416015625, -5.8870849609375, -5.44775390625, -5.0084228515625, -4.569091796875, -4.1297607421875, -3.6904296875, -3.2510986328125, -2.811767578125, -2.3724365234375, -1.93310546875, -1.4937744140625, -1.054443359375, -0.6151123046875, -0.17578125, 0.2635498046875, 0.702880859375, 1.1422119140625, 1.58154296875, 2.0208740234375, 2.460205078125, 2.8995361328125, 3.3388671875, 3.7781982421875, 4.217529296875, 4.6568603515625, 5.09619140625, 5.5355224609375, 5.974853515625, 6.4141845703125, 6.853515625, 7.2928466796875, 7.732177734375, 8.1715087890625, 8.61083984375, 9.0501708984375, 9.489501953125, 9.9288330078125, 10.3681640625, 10.8074951171875, 11.246826171875, 11.6861572265625, 12.12548828125, 12.5648193359375, 13.004150390625, 13.4434814453125, 13.8828125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 6.0, 5.0, 4.0, 3.0, 3.0, 6.0, 7.0, 11.0, 8.0, 9.0, 15.0, 14.0, 17.0, 14.0, 18.0, 13.0, 30.0, 23.0, 27.0, 33.0, 28.0, 27.0, 32.0, 46.0, 29.0, 30.0, 34.0, 28.0, 30.0, 36.0, 35.0, 29.0, 35.0, 30.0, 30.0, 31.0, 30.0, 26.0, 14.0, 28.0, 17.0, 22.0, 22.0, 17.0, 12.0, 14.0, 6.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-13.75, -13.3253173828125, -12.900634765625, -12.4759521484375, -12.05126953125, -11.6265869140625, -11.201904296875, -10.7772216796875, -10.3525390625, -9.9278564453125, -9.503173828125, -9.0784912109375, -8.65380859375, -8.2291259765625, -7.804443359375, -7.3797607421875, -6.955078125, -6.5303955078125, -6.105712890625, -5.6810302734375, -5.25634765625, -4.8316650390625, -4.406982421875, -3.9822998046875, -3.5576171875, -3.1329345703125, -2.708251953125, -2.2835693359375, -1.85888671875, -1.4342041015625, -1.009521484375, -0.5848388671875, -0.16015625, 0.2645263671875, 0.689208984375, 1.1138916015625, 1.53857421875, 1.9632568359375, 2.387939453125, 2.8126220703125, 3.2373046875, 3.6619873046875, 4.086669921875, 4.5113525390625, 4.93603515625, 5.3607177734375, 5.785400390625, 6.2100830078125, 6.634765625, 7.0594482421875, 7.484130859375, 7.9088134765625, 8.33349609375, 8.7581787109375, 9.182861328125, 9.6075439453125, 10.0322265625, 10.4569091796875, 10.881591796875, 11.3062744140625, 11.73095703125, 12.1556396484375, 12.580322265625, 13.0050048828125, 13.4296875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 13.0, 11.0, 32.0, 50.0, 78.0, 147.0, 211.0, 355.0, 581.0, 935.0, 1641.0, 2647.0, 4269.0, 6910.0, 10991.0, 17106.0, 25953.0, 39649.0, 59018.0, 85163.0, 118643.0, 161566.0, 210533.0, 262318.0, 313501.0, 352629.0, 376627.0, 378524.0, 359979.0, 324347.0, 274830.0, 224013.0, 172349.0, 128091.0, 92645.0, 64616.0, 43489.0, 28909.0, 18890.0, 12042.0, 7740.0, 4628.0, 2944.0, 1844.0, 1084.0, 698.0, 427.0, 242.0, 152.0, 77.0, 56.0, 37.0, 27.0, 16.0, 4.0, 4.0, 6.0, 2.0], "bins": [-11.90625, -11.5467529296875, -11.187255859375, -10.8277587890625, -10.46826171875, -10.1087646484375, -9.749267578125, -9.3897705078125, -9.0302734375, -8.6707763671875, -8.311279296875, -7.9517822265625, -7.59228515625, -7.2327880859375, -6.873291015625, -6.5137939453125, -6.154296875, -5.7947998046875, -5.435302734375, -5.0758056640625, -4.71630859375, -4.3568115234375, -3.997314453125, -3.6378173828125, -3.2783203125, -2.9188232421875, -2.559326171875, -2.1998291015625, -1.84033203125, -1.4808349609375, -1.121337890625, -0.7618408203125, -0.40234375, -0.0428466796875, 0.316650390625, 0.6761474609375, 1.03564453125, 1.3951416015625, 1.754638671875, 2.1141357421875, 2.4736328125, 2.8331298828125, 3.192626953125, 3.5521240234375, 3.91162109375, 4.2711181640625, 4.630615234375, 4.9901123046875, 5.349609375, 5.7091064453125, 6.068603515625, 6.4281005859375, 6.78759765625, 7.1470947265625, 7.506591796875, 7.8660888671875, 8.2255859375, 8.5850830078125, 8.944580078125, 9.3040771484375, 9.66357421875, 10.0230712890625, 10.382568359375, 10.7420654296875, 11.1015625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 10.0, 11.0, 25.0, 23.0, 32.0, 30.0, 31.0, 39.0, 58.0, 68.0, 82.0, 96.0, 98.0, 132.0, 142.0, 175.0, 170.0, 166.0, 189.0, 188.0, 221.0, 206.0, 193.0, 187.0, 168.0, 177.0, 146.0, 161.0, 127.0, 114.0, 107.0, 94.0, 74.0, 63.0, 58.0, 36.0, 29.0, 29.0, 23.0, 17.0, 17.0, 13.0, 6.0, 4.0, 11.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4453125, -6.222900390625, -6.00048828125, -5.778076171875, -5.5556640625, -5.333251953125, -5.11083984375, -4.888427734375, -4.666015625, -4.443603515625, -4.22119140625, -3.998779296875, -3.7763671875, -3.553955078125, -3.33154296875, -3.109130859375, -2.88671875, -2.664306640625, -2.44189453125, -2.219482421875, -1.9970703125, -1.774658203125, -1.55224609375, -1.329833984375, -1.107421875, -0.885009765625, -0.66259765625, -0.440185546875, -0.2177734375, 0.004638671875, 0.22705078125, 0.449462890625, 0.671875, 0.894287109375, 1.11669921875, 1.339111328125, 1.5615234375, 1.783935546875, 2.00634765625, 2.228759765625, 2.451171875, 2.673583984375, 2.89599609375, 3.118408203125, 3.3408203125, 3.563232421875, 3.78564453125, 4.008056640625, 4.23046875, 4.452880859375, 4.67529296875, 4.897705078125, 5.1201171875, 5.342529296875, 5.56494140625, 5.787353515625, 6.009765625, 6.232177734375, 6.45458984375, 6.677001953125, 6.8994140625, 7.121826171875, 7.34423828125, 7.566650390625, 7.7890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 2.0, 8.0, 7.0, 7.0, 7.0, 6.0, 18.0, 6.0, 19.0, 19.0, 18.0, 29.0, 26.0, 34.0, 23.0, 31.0, 30.0, 34.0, 38.0, 47.0, 69.0, 43.0, 61.0, 37.0, 35.0, 35.0, 41.0, 27.0, 35.0, 35.0, 16.0, 29.0, 13.0, 20.0, 19.0, 16.0, 12.0, 7.0, 10.0, 3.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.981654167175293, -13.473119735717773, -12.96458625793457, -12.456052780151367, -11.947518348693848, -11.438983917236328, -10.930450439453125, -10.421916961669922, -9.913382530212402, -9.404848098754883, -8.89631462097168, -8.387781143188477, -7.879246711730957, -7.370712757110596, -6.862178802490234, -6.353644847869873, -5.845110893249512, -5.33657693862915, -4.828042984008789, -4.319509029388428, -3.8109750747680664, -3.302441120147705, -2.7939071655273438, -2.2853732109069824, -1.776839256286621, -1.2683053016662598, -0.7597713470458984, -0.2512373924255371, 0.2572965621948242, 0.7658305168151855, 1.2743644714355469, 1.7828984260559082, 2.291433334350586, 2.7999672889709473, 3.3085012435913086, 3.81703519821167, 4.325569152832031, 4.834103107452393, 5.342637062072754, 5.851171016693115, 6.359704971313477, 6.868238925933838, 7.376772880554199, 7.8853068351745605, 8.393840789794922, 8.902374267578125, 9.410908699035645, 9.919443130493164, 10.427976608276367, 10.93651008605957, 11.44504451751709, 11.95357894897461, 12.462112426757812, 12.970645904541016, 13.479180335998535, 13.987714767456055, 14.496248245239258, 15.004781723022461, 15.51331615447998, 16.0218505859375, 16.530384063720703, 17.038917541503906, 17.54745101928711, 18.055986404418945, 18.56451988220215]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 8.0, 14.0, 7.0, 9.0, 14.0, 9.0, 16.0, 21.0, 26.0, 24.0, 20.0, 30.0, 36.0, 31.0, 35.0, 47.0, 35.0, 33.0, 51.0, 40.0, 32.0, 51.0, 42.0, 43.0, 45.0, 36.0, 40.0, 32.0, 35.0, 21.0, 22.0, 13.0, 20.0, 9.0, 9.0, 16.0, 8.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.922182083129883, -20.296356201171875, -19.670530319213867, -19.044702529907227, -18.41887664794922, -17.79305076599121, -17.167224884033203, -16.541399002075195, -15.915572166442871, -15.289746284484863, -14.663919448852539, -14.038093566894531, -13.412267684936523, -12.7864408493042, -12.160614967346191, -11.534788131713867, -10.90896224975586, -10.283136367797852, -9.657309532165527, -9.03148365020752, -8.405656814575195, -7.7798309326171875, -7.15400505065918, -6.528178691864014, -5.902352333068848, -5.276525974273682, -4.650699615478516, -4.024873733520508, -3.399047374725342, -2.773221015930176, -2.147394895553589, -1.521568775177002, -0.8957405090332031, -0.26991426944732666, 0.3559119701385498, 0.9817382097244263, 1.6075644493103027, 2.2333908081054688, 2.8592169284820557, 3.4850430488586426, 4.110869407653809, 4.736695766448975, 5.362522125244141, 5.988348007202148, 6.6141743659973145, 7.2400007247924805, 7.865826606750488, 8.491653442382812, 9.11747932434082, 9.743305206298828, 10.369132041931152, 10.99495792388916, 11.620784759521484, 12.246610641479492, 12.8724365234375, 13.498262405395508, 14.124089241027832, 14.74991512298584, 15.375741958618164, 16.001567840576172, 16.62739372253418, 17.253219604492188, 17.879047393798828, 18.504873275756836, 19.130699157714844]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 13.0, 20.0, 16.0, 28.0, 48.0, 64.0, 111.0, 142.0, 213.0, 318.0, 472.0, 637.0, 1064.0, 1562.0, 2432.0, 3669.0, 5655.0, 8762.0, 13784.0, 22172.0, 35106.0, 55707.0, 89847.0, 143732.0, 204154.0, 169817.0, 107901.0, 66783.0, 41543.0, 26294.0, 16558.0, 10570.0, 6778.0, 4248.0, 2836.0, 1868.0, 1175.0, 825.0, 507.0, 352.0, 231.0, 176.0, 107.0, 84.0, 59.0, 44.0, 26.0, 14.0, 10.0, 11.0, 9.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.998046875, -2.9090576171875, -2.820068359375, -2.7310791015625, -2.64208984375, -2.5531005859375, -2.464111328125, -2.3751220703125, -2.2861328125, -2.1971435546875, -2.108154296875, -2.0191650390625, -1.93017578125, -1.8411865234375, -1.752197265625, -1.6632080078125, -1.57421875, -1.4852294921875, -1.396240234375, -1.3072509765625, -1.21826171875, -1.1292724609375, -1.040283203125, -0.9512939453125, -0.8623046875, -0.7733154296875, -0.684326171875, -0.5953369140625, -0.50634765625, -0.4173583984375, -0.328369140625, -0.2393798828125, -0.150390625, -0.0614013671875, 0.027587890625, 0.1165771484375, 0.20556640625, 0.2945556640625, 0.383544921875, 0.4725341796875, 0.5615234375, 0.6505126953125, 0.739501953125, 0.8284912109375, 0.91748046875, 1.0064697265625, 1.095458984375, 1.1844482421875, 1.2734375, 1.3624267578125, 1.451416015625, 1.5404052734375, 1.62939453125, 1.7183837890625, 1.807373046875, 1.8963623046875, 1.9853515625, 2.0743408203125, 2.163330078125, 2.2523193359375, 2.34130859375, 2.4302978515625, 2.519287109375, 2.6082763671875, 2.697265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 8.0, 7.0, 7.0, 9.0, 9.0, 13.0, 21.0, 14.0, 20.0, 27.0, 21.0, 26.0, 25.0, 34.0, 28.0, 35.0, 29.0, 33.0, 43.0, 54.0, 35.0, 35.0, 47.0, 51.0, 51.0, 46.0, 29.0, 39.0, 24.0, 38.0, 26.0, 23.0, 15.0, 12.0, 12.0, 11.0, 13.0, 5.0, 7.0, 6.0, 5.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.90625, -20.263916015625, -19.62158203125, -18.979248046875, -18.3369140625, -17.694580078125, -17.05224609375, -16.409912109375, -15.767578125, -15.125244140625, -14.48291015625, -13.840576171875, -13.1982421875, -12.555908203125, -11.91357421875, -11.271240234375, -10.62890625, -9.986572265625, -9.34423828125, -8.701904296875, -8.0595703125, -7.417236328125, -6.77490234375, -6.132568359375, -5.490234375, -4.847900390625, -4.20556640625, -3.563232421875, -2.9208984375, -2.278564453125, -1.63623046875, -0.993896484375, -0.3515625, 0.290771484375, 0.93310546875, 1.575439453125, 2.2177734375, 2.860107421875, 3.50244140625, 4.144775390625, 4.787109375, 5.429443359375, 6.07177734375, 6.714111328125, 7.3564453125, 7.998779296875, 8.64111328125, 9.283447265625, 9.92578125, 10.568115234375, 11.21044921875, 11.852783203125, 12.4951171875, 13.137451171875, 13.77978515625, 14.422119140625, 15.064453125, 15.706787109375, 16.34912109375, 16.991455078125, 17.6337890625, 18.276123046875, 18.91845703125, 19.560791015625, 20.203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 13.0, 12.0, 38.0, 29.0, 37.0, 72.0, 102.0, 125.0, 156.0, 246.0, 421.0, 641.0, 878.0, 1246.0, 1907.0, 2889.0, 4458.0, 6826.0, 10670.0, 16713.0, 26808.0, 43820.0, 73331.0, 125581.0, 204707.0, 206188.0, 126874.0, 73994.0, 44476.0, 27413.0, 16672.0, 10721.0, 6946.0, 4465.0, 2988.0, 1999.0, 1232.0, 875.0, 629.0, 458.0, 285.0, 163.0, 132.0, 103.0, 56.0, 56.0, 38.0, 25.0, 17.0, 10.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0], "bins": [-3.00390625, -2.91290283203125, -2.8218994140625, -2.73089599609375, -2.639892578125, -2.54888916015625, -2.4578857421875, -2.36688232421875, -2.27587890625, -2.18487548828125, -2.0938720703125, -2.00286865234375, -1.911865234375, -1.82086181640625, -1.7298583984375, -1.63885498046875, -1.5478515625, -1.45684814453125, -1.3658447265625, -1.27484130859375, -1.183837890625, -1.09283447265625, -1.0018310546875, -0.91082763671875, -0.81982421875, -0.72882080078125, -0.6378173828125, -0.54681396484375, -0.455810546875, -0.36480712890625, -0.2738037109375, -0.18280029296875, -0.091796875, -0.00079345703125, 0.0902099609375, 0.18121337890625, 0.272216796875, 0.36322021484375, 0.4542236328125, 0.54522705078125, 0.63623046875, 0.72723388671875, 0.8182373046875, 0.90924072265625, 1.000244140625, 1.09124755859375, 1.1822509765625, 1.27325439453125, 1.3642578125, 1.45526123046875, 1.5462646484375, 1.63726806640625, 1.728271484375, 1.81927490234375, 1.9102783203125, 2.00128173828125, 2.09228515625, 2.18328857421875, 2.2742919921875, 2.36529541015625, 2.456298828125, 2.54730224609375, 2.6383056640625, 2.72930908203125, 2.8203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 8.0, 10.0, 10.0, 16.0, 21.0, 7.0, 17.0, 13.0, 22.0, 26.0, 27.0, 39.0, 38.0, 38.0, 47.0, 23.0, 51.0, 48.0, 40.0, 38.0, 39.0, 37.0, 38.0, 35.0, 33.0, 31.0, 26.0, 32.0, 26.0, 29.0, 19.0, 27.0, 12.0, 11.0, 14.0, 8.0, 6.0, 4.0, 8.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.66650390625, -10.2626953125, -9.85888671875, -9.455078125, -9.05126953125, -8.6474609375, -8.24365234375, -7.83984375, -7.43603515625, -7.0322265625, -6.62841796875, -6.224609375, -5.82080078125, -5.4169921875, -5.01318359375, -4.609375, -4.20556640625, -3.8017578125, -3.39794921875, -2.994140625, -2.59033203125, -2.1865234375, -1.78271484375, -1.37890625, -0.97509765625, -0.5712890625, -0.16748046875, 0.236328125, 0.64013671875, 1.0439453125, 1.44775390625, 1.8515625, 2.25537109375, 2.6591796875, 3.06298828125, 3.466796875, 3.87060546875, 4.2744140625, 4.67822265625, 5.08203125, 5.48583984375, 5.8896484375, 6.29345703125, 6.697265625, 7.10107421875, 7.5048828125, 7.90869140625, 8.3125, 8.71630859375, 9.1201171875, 9.52392578125, 9.927734375, 10.33154296875, 10.7353515625, 11.13916015625, 11.54296875, 11.94677734375, 12.3505859375, 12.75439453125, 13.158203125, 13.56201171875, 13.9658203125, 14.36962890625, 14.7734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 10.0, 12.0, 17.0, 29.0, 33.0, 59.0, 88.0, 156.0, 245.0, 399.0, 631.0, 960.0, 1636.0, 2834.0, 4906.0, 8524.0, 15150.0, 29048.0, 60086.0, 152340.0, 388844.0, 222256.0, 79980.0, 36557.0, 19002.0, 10384.0, 5862.0, 3398.0, 1960.0, 1195.0, 758.0, 423.0, 251.0, 165.0, 114.0, 74.0, 67.0, 24.0, 28.0, 8.0, 11.0, 8.0, 10.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1669921875, -0.1618804931640625, -0.156768798828125, -0.1516571044921875, -0.14654541015625, -0.1414337158203125, -0.136322021484375, -0.1312103271484375, -0.1260986328125, -0.1209869384765625, -0.115875244140625, -0.1107635498046875, -0.10565185546875, -0.1005401611328125, -0.095428466796875, -0.0903167724609375, -0.085205078125, -0.0800933837890625, -0.074981689453125, -0.0698699951171875, -0.06475830078125, -0.0596466064453125, -0.054534912109375, -0.0494232177734375, -0.0443115234375, -0.0391998291015625, -0.034088134765625, -0.0289764404296875, -0.02386474609375, -0.0187530517578125, -0.013641357421875, -0.0085296630859375, -0.00341796875, 0.0016937255859375, 0.006805419921875, 0.0119171142578125, 0.01702880859375, 0.0221405029296875, 0.027252197265625, 0.0323638916015625, 0.0374755859375, 0.0425872802734375, 0.047698974609375, 0.0528106689453125, 0.05792236328125, 0.0630340576171875, 0.068145751953125, 0.0732574462890625, 0.078369140625, 0.0834808349609375, 0.088592529296875, 0.0937042236328125, 0.09881591796875, 0.1039276123046875, 0.109039306640625, 0.1141510009765625, 0.1192626953125, 0.1243743896484375, 0.129486083984375, 0.1345977783203125, 0.13970947265625, 0.1448211669921875, 0.149932861328125, 0.1550445556640625, 0.16015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 8.0, 15.0, 9.0, 14.0, 15.0, 23.0, 17.0, 23.0, 25.0, 54.0, 37.0, 49.0, 35.0, 47.0, 48.0, 54.0, 54.0, 52.0, 52.0, 50.0, 46.0, 39.0, 36.0, 37.0, 22.0, 29.0, 18.0, 19.0, 15.0, 12.0, 10.0, 7.0, 3.0, 7.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.2530555725097656e-05, -2.186838537454605e-05, -2.1206215023994446e-05, -2.054404467344284e-05, -1.9881874322891235e-05, -1.921970397233963e-05, -1.8557533621788025e-05, -1.789536327123642e-05, -1.7233192920684814e-05, -1.657102257013321e-05, -1.5908852219581604e-05, -1.5246681869029999e-05, -1.4584511518478394e-05, -1.3922341167926788e-05, -1.3260170817375183e-05, -1.2598000466823578e-05, -1.1935830116271973e-05, -1.1273659765720367e-05, -1.0611489415168762e-05, -9.949319064617157e-06, -9.287148714065552e-06, -8.624978363513947e-06, -7.962808012962341e-06, -7.300637662410736e-06, -6.638467311859131e-06, -5.976296961307526e-06, -5.31412661075592e-06, -4.651956260204315e-06, -3.98978590965271e-06, -3.3276155591011047e-06, -2.6654452085494995e-06, -2.0032748579978943e-06, -1.341104507446289e-06, -6.789341568946838e-07, -1.6763806343078613e-08, 6.454065442085266e-07, 1.3075768947601318e-06, 1.969747245311737e-06, 2.6319175958633423e-06, 3.2940879464149475e-06, 3.956258296966553e-06, 4.618428647518158e-06, 5.280598998069763e-06, 5.942769348621368e-06, 6.604939699172974e-06, 7.267110049724579e-06, 7.929280400276184e-06, 8.59145075082779e-06, 9.253621101379395e-06, 9.915791451931e-06, 1.0577961802482605e-05, 1.124013215303421e-05, 1.1902302503585815e-05, 1.256447285413742e-05, 1.3226643204689026e-05, 1.3888813555240631e-05, 1.4550983905792236e-05, 1.5213154256343842e-05, 1.5875324606895447e-05, 1.6537494957447052e-05, 1.7199665307998657e-05, 1.7861835658550262e-05, 1.8524006009101868e-05, 1.9186176359653473e-05, 1.9848346710205078e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 10.0, 18.0, 16.0, 27.0, 64.0, 64.0, 118.0, 186.0, 246.0, 373.0, 560.0, 779.0, 1090.0, 1653.0, 2396.0, 3603.0, 5310.0, 7945.0, 12304.0, 18741.0, 30108.0, 49710.0, 89696.0, 185924.0, 303306.0, 143751.0, 73428.0, 42469.0, 25916.0, 16658.0, 10599.0, 7117.0, 4658.0, 3016.0, 2155.0, 1490.0, 938.0, 660.0, 474.0, 301.0, 235.0, 140.0, 102.0, 71.0, 38.0, 42.0, 14.0, 13.0, 11.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.25244140625, -0.24412155151367188, -0.23580169677734375, -0.22748184204101562, -0.2191619873046875, -0.21084213256835938, -0.20252227783203125, -0.19420242309570312, -0.185882568359375, -0.17756271362304688, -0.16924285888671875, -0.16092300415039062, -0.1526031494140625, -0.14428329467773438, -0.13596343994140625, -0.12764358520507812, -0.11932373046875, -0.11100387573242188, -0.10268402099609375, -0.09436416625976562, -0.0860443115234375, -0.07772445678710938, -0.06940460205078125, -0.061084747314453125, -0.052764892578125, -0.044445037841796875, -0.03612518310546875, -0.027805328369140625, -0.0194854736328125, -0.011165618896484375, -0.00284576416015625, 0.005474090576171875, 0.0137939453125, 0.022113800048828125, 0.03043365478515625, 0.038753509521484375, 0.0470733642578125, 0.055393218994140625, 0.06371307373046875, 0.07203292846679688, 0.080352783203125, 0.08867263793945312, 0.09699249267578125, 0.10531234741210938, 0.1136322021484375, 0.12195205688476562, 0.13027191162109375, 0.13859176635742188, 0.14691162109375, 0.15523147583007812, 0.16355133056640625, 0.17187118530273438, 0.1801910400390625, 0.18851089477539062, 0.19683074951171875, 0.20515060424804688, 0.213470458984375, 0.22179031372070312, 0.23011016845703125, 0.23843002319335938, 0.2467498779296875, 0.2550697326660156, 0.26338958740234375, 0.2717094421386719, 0.280029296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 3.0, 6.0, 4.0, 4.0, 1.0, 6.0, 8.0, 12.0, 9.0, 13.0, 20.0, 33.0, 41.0, 49.0, 81.0, 103.0, 106.0, 97.0, 112.0, 49.0, 50.0, 40.0, 34.0, 22.0, 21.0, 15.0, 13.0, 6.0, 7.0, 9.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.082275390625, -0.07898902893066406, -0.07570266723632812, -0.07241630554199219, -0.06912994384765625, -0.06584358215332031, -0.06255722045898438, -0.05927085876464844, -0.0559844970703125, -0.05269813537597656, -0.049411773681640625, -0.04612541198730469, -0.04283905029296875, -0.03955268859863281, -0.036266326904296875, -0.03297996520996094, -0.029693603515625, -0.026407241821289062, -0.023120880126953125, -0.019834518432617188, -0.01654815673828125, -0.013261795043945312, -0.009975433349609375, -0.0066890716552734375, -0.0034027099609375, -0.0001163482666015625, 0.003170013427734375, 0.0064563751220703125, 0.00974273681640625, 0.013029098510742188, 0.016315460205078125, 0.019601821899414062, 0.02288818359375, 0.026174545288085938, 0.029460906982421875, 0.03274726867675781, 0.03603363037109375, 0.03931999206542969, 0.042606353759765625, 0.04589271545410156, 0.0491790771484375, 0.05246543884277344, 0.055751800537109375, 0.05903816223144531, 0.06232452392578125, 0.06561088562011719, 0.06889724731445312, 0.07218360900878906, 0.075469970703125, 0.07875633239746094, 0.08204269409179688, 0.08532905578613281, 0.08861541748046875, 0.09190177917480469, 0.09518814086914062, 0.09847450256347656, 0.1017608642578125, 0.10504722595214844, 0.10833358764648438, 0.11161994934082031, 0.11490631103515625, 0.11819267272949219, 0.12147903442382812, 0.12476539611816406, 0.1280517578125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 7.0, 9.0, 6.0, 6.0, 11.0, 11.0, 9.0, 19.0, 17.0, 21.0, 27.0, 27.0, 34.0, 22.0, 35.0, 26.0, 35.0, 40.0, 43.0, 63.0, 48.0, 53.0, 44.0, 33.0, 36.0, 42.0, 32.0, 37.0, 26.0, 16.0, 29.0, 17.0, 22.0, 13.0, 18.0, 13.0, 7.0, 9.0, 9.0, 5.0, 2.0, 7.0, 0.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.900808334350586, -13.398384094238281, -12.895960807800293, -12.393537521362305, -11.89111328125, -11.388689041137695, -10.886265754699707, -10.383842468261719, -9.881418228149414, -9.37899398803711, -8.876570701599121, -8.374147415161133, -7.871723175048828, -7.369299411773682, -6.866875648498535, -6.364451885223389, -5.862028121948242, -5.359604358673096, -4.857180595397949, -4.354756832122803, -3.8523330688476562, -3.3499093055725098, -2.8474855422973633, -2.345061779022217, -1.8426380157470703, -1.3402142524719238, -0.8377904891967773, -0.33536672592163086, 0.16705703735351562, 0.6694808006286621, 1.1719045639038086, 1.674328327178955, 2.1767520904541016, 2.679175853729248, 3.1815996170043945, 3.684023380279541, 4.1864471435546875, 4.688870906829834, 5.1912946701049805, 5.693718433380127, 6.196142196655273, 6.69856595993042, 7.200989723205566, 7.703413486480713, 8.20583724975586, 8.708261489868164, 9.210684776306152, 9.71310806274414, 10.215532302856445, 10.71795654296875, 11.220379829406738, 11.722803115844727, 12.225227355957031, 12.727651596069336, 13.230074882507324, 13.732498168945312, 14.234922409057617, 14.737346649169922, 15.23976993560791, 15.742193222045898, 16.244617462158203, 16.747041702270508, 17.249465942382812, 17.751888275146484, 18.25431251525879]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 8.0, 14.0, 7.0, 8.0, 15.0, 7.0, 17.0, 21.0, 26.0, 25.0, 17.0, 32.0, 37.0, 30.0, 32.0, 47.0, 37.0, 30.0, 49.0, 47.0, 27.0, 53.0, 42.0, 44.0, 44.0, 31.0, 46.0, 30.0, 36.0, 21.0, 23.0, 14.0, 16.0, 14.0, 7.0, 16.0, 8.0, 8.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.8687801361084, -20.247539520263672, -19.626298904418945, -19.00505828857422, -18.383819580078125, -17.7625789642334, -17.141338348388672, -16.520097732543945, -15.898857116699219, -15.277616500854492, -14.656375885009766, -14.035136222839355, -13.413895606994629, -12.792654991149902, -12.171415328979492, -11.550174713134766, -10.928934097290039, -10.307693481445312, -9.686452865600586, -9.065213203430176, -8.44397258758545, -7.822731971740723, -7.201491832733154, -6.580251693725586, -5.959011077880859, -5.337770462036133, -4.7165303230285645, -4.095290184020996, -3.4740495681762695, -2.852809190750122, -2.2315688133239746, -1.6103286743164062, -0.9890861511230469, -0.3678457736968994, 0.25339460372924805, 0.8746349811553955, 1.495875358581543, 2.1171157360076904, 2.738356113433838, 3.3595962524414062, 3.980836868286133, 4.602077484130859, 5.223317623138428, 5.844557762145996, 6.465798377990723, 7.087038993835449, 7.708279132843018, 8.329519271850586, 8.950759887695312, 9.572000503540039, 10.193241119384766, 10.814480781555176, 11.435721397399902, 12.056962013244629, 12.678201675415039, 13.299442291259766, 13.920682907104492, 14.541923522949219, 15.163164138793945, 15.784403800964355, 16.405643463134766, 17.026884078979492, 17.64812469482422, 18.269365310668945, 18.890605926513672]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 15.0, 23.0, 38.0, 69.0, 96.0, 173.0, 269.0, 405.0, 711.0, 1203.0, 1865.0, 3153.0, 4744.0, 7500.0, 11803.0, 17744.0, 26522.0, 38288.0, 52886.0, 69976.0, 86697.0, 100435.0, 107988.0, 106860.0, 98640.0, 84842.0, 66979.0, 50253.0, 36622.0, 25147.0, 16688.0, 11183.0, 7118.0, 4423.0, 2723.0, 1635.0, 1065.0, 655.0, 439.0, 274.0, 166.0, 85.0, 61.0, 33.0, 13.0, 11.0, 13.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.390625, -11.0338134765625, -10.677001953125, -10.3201904296875, -9.96337890625, -9.6065673828125, -9.249755859375, -8.8929443359375, -8.5361328125, -8.1793212890625, -7.822509765625, -7.4656982421875, -7.10888671875, -6.7520751953125, -6.395263671875, -6.0384521484375, -5.681640625, -5.3248291015625, -4.968017578125, -4.6112060546875, -4.25439453125, -3.8975830078125, -3.540771484375, -3.1839599609375, -2.8271484375, -2.4703369140625, -2.113525390625, -1.7567138671875, -1.39990234375, -1.0430908203125, -0.686279296875, -0.3294677734375, 0.02734375, 0.3841552734375, 0.740966796875, 1.0977783203125, 1.45458984375, 1.8114013671875, 2.168212890625, 2.5250244140625, 2.8818359375, 3.2386474609375, 3.595458984375, 3.9522705078125, 4.30908203125, 4.6658935546875, 5.022705078125, 5.3795166015625, 5.736328125, 6.0931396484375, 6.449951171875, 6.8067626953125, 7.16357421875, 7.5203857421875, 7.877197265625, 8.2340087890625, 8.5908203125, 8.9476318359375, 9.304443359375, 9.6612548828125, 10.01806640625, 10.3748779296875, 10.731689453125, 11.0885009765625, 11.4453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 6.0, 3.0, 12.0, 11.0, 7.0, 11.0, 20.0, 8.0, 19.0, 28.0, 19.0, 29.0, 32.0, 36.0, 32.0, 35.0, 39.0, 45.0, 49.0, 47.0, 59.0, 34.0, 40.0, 57.0, 41.0, 37.0, 35.0, 36.0, 33.0, 25.0, 22.0, 22.0, 20.0, 18.0, 13.0, 7.0, 3.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.39404296875, -20.7255859375, -20.05712890625, -19.388671875, -18.72021484375, -18.0517578125, -17.38330078125, -16.71484375, -16.04638671875, -15.3779296875, -14.70947265625, -14.041015625, -13.37255859375, -12.7041015625, -12.03564453125, -11.3671875, -10.69873046875, -10.0302734375, -9.36181640625, -8.693359375, -8.02490234375, -7.3564453125, -6.68798828125, -6.01953125, -5.35107421875, -4.6826171875, -4.01416015625, -3.345703125, -2.67724609375, -2.0087890625, -1.34033203125, -0.671875, -0.00341796875, 0.6650390625, 1.33349609375, 2.001953125, 2.67041015625, 3.3388671875, 4.00732421875, 4.67578125, 5.34423828125, 6.0126953125, 6.68115234375, 7.349609375, 8.01806640625, 8.6865234375, 9.35498046875, 10.0234375, 10.69189453125, 11.3603515625, 12.02880859375, 12.697265625, 13.36572265625, 14.0341796875, 14.70263671875, 15.37109375, 16.03955078125, 16.7080078125, 17.37646484375, 18.044921875, 18.71337890625, 19.3818359375, 20.05029296875, 20.71875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 6.0, 8.0, 10.0, 10.0, 17.0, 31.0, 43.0, 61.0, 105.0, 166.0, 249.0, 417.0, 742.0, 1108.0, 1809.0, 2913.0, 4598.0, 7077.0, 11311.0, 17152.0, 25526.0, 37228.0, 51391.0, 67667.0, 83806.0, 97278.0, 105902.0, 106375.0, 98703.0, 85899.0, 69760.0, 53623.0, 39036.0, 27387.0, 18214.0, 11890.0, 7732.0, 4931.0, 3133.0, 1952.0, 1208.0, 801.0, 498.0, 318.0, 177.0, 119.0, 61.0, 50.0, 24.0, 15.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.890625, -10.5401611328125, -10.189697265625, -9.8392333984375, -9.48876953125, -9.1383056640625, -8.787841796875, -8.4373779296875, -8.0869140625, -7.7364501953125, -7.385986328125, -7.0355224609375, -6.68505859375, -6.3345947265625, -5.984130859375, -5.6336669921875, -5.283203125, -4.9327392578125, -4.582275390625, -4.2318115234375, -3.88134765625, -3.5308837890625, -3.180419921875, -2.8299560546875, -2.4794921875, -2.1290283203125, -1.778564453125, -1.4281005859375, -1.07763671875, -0.7271728515625, -0.376708984375, -0.0262451171875, 0.32421875, 0.6746826171875, 1.025146484375, 1.3756103515625, 1.72607421875, 2.0765380859375, 2.427001953125, 2.7774658203125, 3.1279296875, 3.4783935546875, 3.828857421875, 4.1793212890625, 4.52978515625, 4.8802490234375, 5.230712890625, 5.5811767578125, 5.931640625, 6.2821044921875, 6.632568359375, 6.9830322265625, 7.33349609375, 7.6839599609375, 8.034423828125, 8.3848876953125, 8.7353515625, 9.0858154296875, 9.436279296875, 9.7867431640625, 10.13720703125, 10.4876708984375, 10.838134765625, 11.1885986328125, 11.5390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 3.0, 2.0, 9.0, 10.0, 14.0, 19.0, 16.0, 18.0, 22.0, 14.0, 26.0, 21.0, 37.0, 41.0, 44.0, 35.0, 45.0, 45.0, 39.0, 54.0, 53.0, 38.0, 39.0, 47.0, 37.0, 42.0, 28.0, 25.0, 19.0, 30.0, 20.0, 22.0, 17.0, 7.0, 10.0, 15.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6796875, -13.281005859375, -12.88232421875, -12.483642578125, -12.0849609375, -11.686279296875, -11.28759765625, -10.888916015625, -10.490234375, -10.091552734375, -9.69287109375, -9.294189453125, -8.8955078125, -8.496826171875, -8.09814453125, -7.699462890625, -7.30078125, -6.902099609375, -6.50341796875, -6.104736328125, -5.7060546875, -5.307373046875, -4.90869140625, -4.510009765625, -4.111328125, -3.712646484375, -3.31396484375, -2.915283203125, -2.5166015625, -2.117919921875, -1.71923828125, -1.320556640625, -0.921875, -0.523193359375, -0.12451171875, 0.274169921875, 0.6728515625, 1.071533203125, 1.47021484375, 1.868896484375, 2.267578125, 2.666259765625, 3.06494140625, 3.463623046875, 3.8623046875, 4.260986328125, 4.65966796875, 5.058349609375, 5.45703125, 5.855712890625, 6.25439453125, 6.653076171875, 7.0517578125, 7.450439453125, 7.84912109375, 8.247802734375, 8.646484375, 9.045166015625, 9.44384765625, 9.842529296875, 10.2412109375, 10.639892578125, 11.03857421875, 11.437255859375, 11.8359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 18.0, 15.0, 23.0, 52.0, 44.0, 104.0, 136.0, 244.0, 338.0, 618.0, 833.0, 1367.0, 2199.0, 3440.0, 5735.0, 9116.0, 14049.0, 22041.0, 33555.0, 48482.0, 67041.0, 86951.0, 105636.0, 115984.0, 116154.0, 106819.0, 89759.0, 69219.0, 50522.0, 34577.0, 23068.0, 14910.0, 9398.0, 6006.0, 3675.0, 2363.0, 1431.0, 957.0, 609.0, 389.0, 226.0, 156.0, 99.0, 76.0, 48.0, 25.0, 21.0, 11.0, 7.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.654296875, -3.53662109375, -3.4189453125, -3.30126953125, -3.18359375, -3.06591796875, -2.9482421875, -2.83056640625, -2.712890625, -2.59521484375, -2.4775390625, -2.35986328125, -2.2421875, -2.12451171875, -2.0068359375, -1.88916015625, -1.771484375, -1.65380859375, -1.5361328125, -1.41845703125, -1.30078125, -1.18310546875, -1.0654296875, -0.94775390625, -0.830078125, -0.71240234375, -0.5947265625, -0.47705078125, -0.359375, -0.24169921875, -0.1240234375, -0.00634765625, 0.111328125, 0.22900390625, 0.3466796875, 0.46435546875, 0.58203125, 0.69970703125, 0.8173828125, 0.93505859375, 1.052734375, 1.17041015625, 1.2880859375, 1.40576171875, 1.5234375, 1.64111328125, 1.7587890625, 1.87646484375, 1.994140625, 2.11181640625, 2.2294921875, 2.34716796875, 2.46484375, 2.58251953125, 2.7001953125, 2.81787109375, 2.935546875, 3.05322265625, 3.1708984375, 3.28857421875, 3.40625, 3.52392578125, 3.6416015625, 3.75927734375, 3.876953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 4.0, 11.0, 8.0, 12.0, 14.0, 19.0, 22.0, 13.0, 23.0, 30.0, 31.0, 46.0, 43.0, 43.0, 38.0, 46.0, 36.0, 51.0, 54.0, 45.0, 40.0, 43.0, 44.0, 28.0, 40.0, 32.0, 21.0, 16.0, 22.0, 19.0, 19.0, 10.0, 11.0, 18.0, 10.0, 5.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00039696693420410156, -0.00038512423634529114, -0.0003732815384864807, -0.0003614388406276703, -0.00034959614276885986, -0.00033775344491004944, -0.000325910747051239, -0.0003140680491924286, -0.00030222535133361816, -0.00029038265347480774, -0.0002785399556159973, -0.0002666972577571869, -0.00025485455989837646, -0.00024301186203956604, -0.00023116916418075562, -0.0002193264663219452, -0.00020748376846313477, -0.00019564107060432434, -0.00018379837274551392, -0.0001719556748867035, -0.00016011297702789307, -0.00014827027916908264, -0.00013642758131027222, -0.0001245848834514618, -0.00011274218559265137, -0.00010089948773384094, -8.905678987503052e-05, -7.721409201622009e-05, -6.537139415740967e-05, -5.352869629859924e-05, -4.168599843978882e-05, -2.9843300580978394e-05, -1.800060272216797e-05, -6.157904863357544e-06, 5.684792995452881e-06, 1.7527490854263306e-05, 2.937018871307373e-05, 4.1212886571884155e-05, 5.305558443069458e-05, 6.4898282289505e-05, 7.674098014831543e-05, 8.858367800712585e-05, 0.00010042637586593628, 0.0001122690737247467, 0.00012411177158355713, 0.00013595446944236755, 0.00014779716730117798, 0.0001596398651599884, 0.00017148256301879883, 0.00018332526087760925, 0.00019516795873641968, 0.0002070106565952301, 0.00021885335445404053, 0.00023069605231285095, 0.00024253875017166138, 0.0002543814480304718, 0.0002662241458892822, 0.00027806684374809265, 0.0002899095416069031, 0.0003017522394657135, 0.0003135949373245239, 0.00032543763518333435, 0.0003372803330421448, 0.0003491230309009552, 0.0003609657287597656]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 4.0, 9.0, 5.0, 16.0, 14.0, 25.0, 34.0, 39.0, 73.0, 106.0, 167.0, 288.0, 416.0, 644.0, 1002.0, 1558.0, 2432.0, 3955.0, 6185.0, 10067.0, 15953.0, 24990.0, 38612.0, 56680.0, 78908.0, 101523.0, 120318.0, 126441.0, 119438.0, 100976.0, 77707.0, 55967.0, 37396.0, 24392.0, 15616.0, 9923.0, 6211.0, 3850.0, 2404.0, 1507.0, 944.0, 609.0, 407.0, 253.0, 167.0, 117.0, 74.0, 53.0, 29.0, 22.0, 16.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.3359375, -4.19818115234375, -4.0604248046875, -3.92266845703125, -3.784912109375, -3.64715576171875, -3.5093994140625, -3.37164306640625, -3.23388671875, -3.09613037109375, -2.9583740234375, -2.82061767578125, -2.682861328125, -2.54510498046875, -2.4073486328125, -2.26959228515625, -2.1318359375, -1.99407958984375, -1.8563232421875, -1.71856689453125, -1.580810546875, -1.44305419921875, -1.3052978515625, -1.16754150390625, -1.02978515625, -0.89202880859375, -0.7542724609375, -0.61651611328125, -0.478759765625, -0.34100341796875, -0.2032470703125, -0.06549072265625, 0.072265625, 0.21002197265625, 0.3477783203125, 0.48553466796875, 0.623291015625, 0.76104736328125, 0.8988037109375, 1.03656005859375, 1.17431640625, 1.31207275390625, 1.4498291015625, 1.58758544921875, 1.725341796875, 1.86309814453125, 2.0008544921875, 2.13861083984375, 2.2763671875, 2.41412353515625, 2.5518798828125, 2.68963623046875, 2.827392578125, 2.96514892578125, 3.1029052734375, 3.24066162109375, 3.37841796875, 3.51617431640625, 3.6539306640625, 3.79168701171875, 3.929443359375, 4.06719970703125, 4.2049560546875, 4.34271240234375, 4.48046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 10.0, 4.0, 8.0, 9.0, 9.0, 25.0, 22.0, 28.0, 33.0, 22.0, 47.0, 37.0, 42.0, 60.0, 62.0, 61.0, 48.0, 55.0, 49.0, 60.0, 45.0, 44.0, 38.0, 32.0, 34.0, 23.0, 18.0, 14.0, 12.0, 12.0, 11.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.37890625, -2.310211181640625, -2.24151611328125, -2.172821044921875, -2.1041259765625, -2.035430908203125, -1.96673583984375, -1.898040771484375, -1.829345703125, -1.760650634765625, -1.69195556640625, -1.623260498046875, -1.5545654296875, -1.485870361328125, -1.41717529296875, -1.348480224609375, -1.27978515625, -1.211090087890625, -1.14239501953125, -1.073699951171875, -1.0050048828125, -0.936309814453125, -0.86761474609375, -0.798919677734375, -0.730224609375, -0.661529541015625, -0.59283447265625, -0.524139404296875, -0.4554443359375, -0.386749267578125, -0.31805419921875, -0.249359130859375, -0.1806640625, -0.111968994140625, -0.04327392578125, 0.025421142578125, 0.0941162109375, 0.162811279296875, 0.23150634765625, 0.300201416015625, 0.368896484375, 0.437591552734375, 0.50628662109375, 0.574981689453125, 0.6436767578125, 0.712371826171875, 0.78106689453125, 0.849761962890625, 0.91845703125, 0.987152099609375, 1.05584716796875, 1.124542236328125, 1.1932373046875, 1.261932373046875, 1.33062744140625, 1.399322509765625, 1.468017578125, 1.536712646484375, 1.60540771484375, 1.674102783203125, 1.7427978515625, 1.811492919921875, 1.88018798828125, 1.948883056640625, 2.017578125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 3.0, 11.0, 6.0, 10.0, 12.0, 9.0, 14.0, 22.0, 19.0, 27.0, 21.0, 31.0, 29.0, 48.0, 39.0, 38.0, 45.0, 36.0, 53.0, 48.0, 42.0, 41.0, 49.0, 41.0, 33.0, 42.0, 32.0, 31.0, 25.0, 29.0, 13.0, 20.0, 17.0, 10.0, 11.0, 7.0, 9.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.244462966918945, -14.705984115600586, -14.167505264282227, -13.62902545928955, -13.090546607971191, -12.552067756652832, -12.013587951660156, -11.475109100341797, -10.936630249023438, -10.398151397705078, -9.859672546386719, -9.321192741394043, -8.782713890075684, -8.244235038757324, -7.705755710601807, -7.167276382446289, -6.62879753112793, -6.09031867980957, -5.551839351654053, -5.013360023498535, -4.474881172180176, -3.9364020824432373, -3.397922992706299, -2.8594439029693604, -2.320964813232422, -1.7824857234954834, -1.244006633758545, -0.7055275440216064, -0.16704845428466797, 0.3714306354522705, 0.909909725189209, 1.4483888149261475, 1.986867904663086, 2.5253469944000244, 3.063826084136963, 3.6023051738739014, 4.14078426361084, 4.679263114929199, 5.217742443084717, 5.756221771240234, 6.294700622558594, 6.833179473876953, 7.371658802032471, 7.910138130187988, 8.448616981506348, 8.987095832824707, 9.525575637817383, 10.064054489135742, 10.602533340454102, 11.141012191772461, 11.67949104309082, 12.217970848083496, 12.756449699401855, 13.294928550720215, 13.83340835571289, 14.37188720703125, 14.91036605834961, 15.448844909667969, 15.987323760986328, 16.525802612304688, 17.064281463623047, 17.60276222229004, 18.1412410736084, 18.679719924926758, 19.218198776245117]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 6.0, 7.0, 5.0, 11.0, 7.0, 13.0, 14.0, 23.0, 21.0, 25.0, 28.0, 15.0, 29.0, 27.0, 38.0, 41.0, 46.0, 46.0, 40.0, 42.0, 41.0, 37.0, 41.0, 54.0, 37.0, 36.0, 39.0, 36.0, 31.0, 28.0, 22.0, 21.0, 20.0, 17.0, 22.0, 7.0, 5.0, 10.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.634889602661133, -21.970996856689453, -21.30710220336914, -20.643207550048828, -19.97931480407715, -19.31542205810547, -18.651527404785156, -17.987632751464844, -17.323740005493164, -16.659847259521484, -15.995952606201172, -15.332058906555176, -14.66816520690918, -14.004271507263184, -13.340377807617188, -12.676484107971191, -12.012590408325195, -11.3486967086792, -10.684803009033203, -10.020909309387207, -9.357015609741211, -8.693121910095215, -8.029228210449219, -7.365334510803223, -6.701440811157227, -6.0375471115112305, -5.373653411865234, -4.709759712219238, -4.045866012573242, -3.381972312927246, -2.71807861328125, -2.054184913635254, -1.390289306640625, -0.7263956069946289, -0.06250190734863281, 0.6013917922973633, 1.2652854919433594, 1.9291791915893555, 2.5930728912353516, 3.2569665908813477, 3.9208602905273438, 4.58475399017334, 5.248647689819336, 5.912541389465332, 6.576435089111328, 7.240328788757324, 7.90422248840332, 8.568116188049316, 9.232009887695312, 9.895903587341309, 10.559797286987305, 11.2236909866333, 11.887584686279297, 12.551478385925293, 13.215372085571289, 13.879265785217285, 14.543159484863281, 15.207053184509277, 15.870946884155273, 16.534839630126953, 17.198734283447266, 17.862628936767578, 18.526521682739258, 19.190414428710938, 19.85430908203125]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 40.0, 47.0, 75.0, 134.0, 206.0, 386.0, 576.0, 868.0, 1528.0, 2435.0, 3759.0, 6041.0, 9615.0, 15290.0, 23750.0, 36583.0, 55290.0, 81602.0, 117833.0, 165207.0, 223705.0, 285516.0, 349491.0, 397795.0, 421182.0, 414169.0, 377503.0, 321978.0, 257659.0, 195204.0, 141761.0, 98806.0, 66757.0, 44333.0, 28713.0, 18281.0, 11604.0, 7250.0, 4475.0, 2713.0, 1663.0, 944.0, 617.0, 361.0, 218.0, 145.0, 71.0, 41.0, 29.0, 11.0, 5.0, 2.0, 4.0, 1.0, 1.0], "bins": [-13.0546875, -12.66796875, -12.28125, -11.89453125, -11.5078125, -11.12109375, -10.734375, -10.34765625, -9.9609375, -9.57421875, -9.1875, -8.80078125, -8.4140625, -8.02734375, -7.640625, -7.25390625, -6.8671875, -6.48046875, -6.09375, -5.70703125, -5.3203125, -4.93359375, -4.546875, -4.16015625, -3.7734375, -3.38671875, -3.0, -2.61328125, -2.2265625, -1.83984375, -1.453125, -1.06640625, -0.6796875, -0.29296875, 0.09375, 0.48046875, 0.8671875, 1.25390625, 1.640625, 2.02734375, 2.4140625, 2.80078125, 3.1875, 3.57421875, 3.9609375, 4.34765625, 4.734375, 5.12109375, 5.5078125, 5.89453125, 6.28125, 6.66796875, 7.0546875, 7.44140625, 7.828125, 8.21484375, 8.6015625, 8.98828125, 9.375, 9.76171875, 10.1484375, 10.53515625, 10.921875, 11.30859375, 11.6953125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 8.0, 5.0, 8.0, 13.0, 16.0, 9.0, 16.0, 24.0, 19.0, 12.0, 18.0, 33.0, 23.0, 31.0, 35.0, 23.0, 37.0, 45.0, 32.0, 38.0, 43.0, 29.0, 28.0, 39.0, 47.0, 38.0, 35.0, 36.0, 25.0, 35.0, 35.0, 24.0, 30.0, 19.0, 13.0, 16.0, 13.0, 9.0, 8.0, 6.0, 5.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.9609375, -14.4927978515625, -14.024658203125, -13.5565185546875, -13.08837890625, -12.6202392578125, -12.152099609375, -11.6839599609375, -11.2158203125, -10.7476806640625, -10.279541015625, -9.8114013671875, -9.34326171875, -8.8751220703125, -8.406982421875, -7.9388427734375, -7.470703125, -7.0025634765625, -6.534423828125, -6.0662841796875, -5.59814453125, -5.1300048828125, -4.661865234375, -4.1937255859375, -3.7255859375, -3.2574462890625, -2.789306640625, -2.3211669921875, -1.85302734375, -1.3848876953125, -0.916748046875, -0.4486083984375, 0.01953125, 0.4876708984375, 0.955810546875, 1.4239501953125, 1.89208984375, 2.3602294921875, 2.828369140625, 3.2965087890625, 3.7646484375, 4.2327880859375, 4.700927734375, 5.1690673828125, 5.63720703125, 6.1053466796875, 6.573486328125, 7.0416259765625, 7.509765625, 7.9779052734375, 8.446044921875, 8.9141845703125, 9.38232421875, 9.8504638671875, 10.318603515625, 10.7867431640625, 11.2548828125, 11.7230224609375, 12.191162109375, 12.6593017578125, 13.12744140625, 13.5955810546875, 14.063720703125, 14.5318603515625, 15.0]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 17.0, 41.0, 43.0, 102.0, 160.0, 247.0, 485.0, 868.0, 1538.0, 2555.0, 4383.0, 7003.0, 11993.0, 19081.0, 30158.0, 46320.0, 69790.0, 101207.0, 143130.0, 193001.0, 247751.0, 303707.0, 349493.0, 382319.0, 393751.0, 380742.0, 348079.0, 298285.0, 243771.0, 188703.0, 138647.0, 99157.0, 67552.0, 44577.0, 29094.0, 18356.0, 11289.0, 6843.0, 4172.0, 2422.0, 1463.0, 882.0, 485.0, 246.0, 164.0, 88.0, 53.0, 35.0, 17.0, 8.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.40625, -12.0240478515625, -11.641845703125, -11.2596435546875, -10.87744140625, -10.4952392578125, -10.113037109375, -9.7308349609375, -9.3486328125, -8.9664306640625, -8.584228515625, -8.2020263671875, -7.81982421875, -7.4376220703125, -7.055419921875, -6.6732177734375, -6.291015625, -5.9088134765625, -5.526611328125, -5.1444091796875, -4.76220703125, -4.3800048828125, -3.997802734375, -3.6156005859375, -3.2333984375, -2.8511962890625, -2.468994140625, -2.0867919921875, -1.70458984375, -1.3223876953125, -0.940185546875, -0.5579833984375, -0.17578125, 0.2064208984375, 0.588623046875, 0.9708251953125, 1.35302734375, 1.7352294921875, 2.117431640625, 2.4996337890625, 2.8818359375, 3.2640380859375, 3.646240234375, 4.0284423828125, 4.41064453125, 4.7928466796875, 5.175048828125, 5.5572509765625, 5.939453125, 6.3216552734375, 6.703857421875, 7.0860595703125, 7.46826171875, 7.8504638671875, 8.232666015625, 8.6148681640625, 8.9970703125, 9.3792724609375, 9.761474609375, 10.1436767578125, 10.52587890625, 10.9080810546875, 11.290283203125, 11.6724853515625, 12.0546875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 2.0, 10.0, 10.0, 3.0, 13.0, 18.0, 19.0, 35.0, 37.0, 57.0, 72.0, 82.0, 107.0, 131.0, 124.0, 155.0, 169.0, 187.0, 179.0, 218.0, 226.0, 218.0, 207.0, 215.0, 202.0, 194.0, 175.0, 146.0, 131.0, 110.0, 109.0, 96.0, 81.0, 62.0, 72.0, 46.0, 36.0, 36.0, 23.0, 14.0, 12.0, 6.0, 10.0, 3.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59375, -7.3466796875, -7.099609375, -6.8525390625, -6.60546875, -6.3583984375, -6.111328125, -5.8642578125, -5.6171875, -5.3701171875, -5.123046875, -4.8759765625, -4.62890625, -4.3818359375, -4.134765625, -3.8876953125, -3.640625, -3.3935546875, -3.146484375, -2.8994140625, -2.65234375, -2.4052734375, -2.158203125, -1.9111328125, -1.6640625, -1.4169921875, -1.169921875, -0.9228515625, -0.67578125, -0.4287109375, -0.181640625, 0.0654296875, 0.3125, 0.5595703125, 0.806640625, 1.0537109375, 1.30078125, 1.5478515625, 1.794921875, 2.0419921875, 2.2890625, 2.5361328125, 2.783203125, 3.0302734375, 3.27734375, 3.5244140625, 3.771484375, 4.0185546875, 4.265625, 4.5126953125, 4.759765625, 5.0068359375, 5.25390625, 5.5009765625, 5.748046875, 5.9951171875, 6.2421875, 6.4892578125, 6.736328125, 6.9833984375, 7.23046875, 7.4775390625, 7.724609375, 7.9716796875, 8.21875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 6.0, 5.0, 6.0, 17.0, 16.0, 24.0, 27.0, 18.0, 32.0, 42.0, 41.0, 47.0, 48.0, 54.0, 52.0, 41.0, 59.0, 37.0, 48.0, 37.0, 38.0, 49.0, 40.0, 26.0, 32.0, 22.0, 23.0, 20.0, 13.0, 10.0, 9.0, 8.0, 7.0, 6.0, 4.0, 4.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.639983177185059, -14.0423002243042, -13.444618225097656, -12.846935272216797, -12.249252319335938, -11.651569366455078, -11.053886413574219, -10.456204414367676, -9.858521461486816, -9.260838508605957, -8.663156509399414, -8.065473556518555, -7.467790603637695, -6.870107650756836, -6.272425174713135, -5.674742698669434, -5.077059745788574, -4.479376792907715, -3.8816943168640137, -3.2840116024017334, -2.686328887939453, -2.088646173477173, -1.4909634590148926, -0.8932809829711914, -0.29559803009033203, 0.30208468437194824, 0.8997673988342285, 1.4974501132965088, 2.095132827758789, 2.6928155422210693, 3.2904982566833496, 3.888180732727051, 4.485864639282227, 5.083547592163086, 5.681230068206787, 6.278912544250488, 6.876595497131348, 7.474278450012207, 8.07196044921875, 8.66964340209961, 9.267326354980469, 9.865009307861328, 10.462692260742188, 11.06037425994873, 11.65805721282959, 12.25574016571045, 12.853422164916992, 13.451105117797852, 14.048788070678711, 14.64647102355957, 15.24415397644043, 15.841835975646973, 16.439517974853516, 17.037200927734375, 17.634883880615234, 18.232566833496094, 18.830249786376953, 19.427932739257812, 20.025615692138672, 20.62329864501953, 21.22098159790039, 21.818662643432617, 22.416345596313477, 23.014028549194336, 23.611711502075195]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 6.0, 4.0, 13.0, 5.0, 5.0, 8.0, 7.0, 15.0, 8.0, 20.0, 17.0, 24.0, 28.0, 18.0, 22.0, 33.0, 38.0, 31.0, 29.0, 37.0, 45.0, 38.0, 38.0, 39.0, 36.0, 39.0, 44.0, 39.0, 36.0, 28.0, 32.0, 27.0, 26.0, 17.0, 17.0, 17.0, 17.0, 17.0, 13.0, 15.0, 13.0, 9.0, 10.0, 12.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.830968856811523, -18.26372528076172, -17.696483612060547, -17.129240036010742, -16.561996459960938, -15.994754791259766, -15.427511215209961, -14.860268592834473, -14.293025970458984, -13.725783348083496, -13.158540725708008, -12.591297149658203, -12.024054527282715, -11.456811904907227, -10.889568328857422, -10.322325706481934, -9.755083084106445, -9.187840461730957, -8.620597839355469, -8.053354263305664, -7.486111640930176, -6.9188690185546875, -6.351625919342041, -5.7843828201293945, -5.217140197753906, -4.649897575378418, -4.0826544761657715, -3.515411615371704, -2.9481687545776367, -2.3809258937835693, -1.813683032989502, -1.2464401721954346, -0.67919921875, -0.11195635795593262, 0.45528650283813477, 1.0225293636322021, 1.5897722244262695, 2.157015085220337, 2.7242579460144043, 3.2915008068084717, 3.858743667602539, 4.425986289978027, 4.993229389190674, 5.56047248840332, 6.127715110778809, 6.694957733154297, 7.262200832366943, 7.82944393157959, 8.396686553955078, 8.963929176330566, 9.531171798706055, 10.09841537475586, 10.665657997131348, 11.232900619506836, 11.80014419555664, 12.367386817932129, 12.934629440307617, 13.501872062683105, 14.069114685058594, 14.636358261108398, 15.203600883483887, 15.770843505859375, 16.33808708190918, 16.90532875061035, 17.472572326660156]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 2.0, 9.0, 13.0, 19.0, 18.0, 38.0, 50.0, 115.0, 142.0, 181.0, 275.0, 432.0, 553.0, 826.0, 1231.0, 1843.0, 2679.0, 3838.0, 5760.0, 8342.0, 12625.0, 19039.0, 29194.0, 44586.0, 68218.0, 105220.0, 157498.0, 183381.0, 138893.0, 90996.0, 59324.0, 38161.0, 24632.0, 16477.0, 10743.0, 7351.0, 4982.0, 3485.0, 2310.0, 1588.0, 1122.0, 745.0, 522.0, 351.0, 252.0, 171.0, 103.0, 94.0, 48.0, 27.0, 20.0, 17.0, 10.0, 9.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.3125, -2.238677978515625, -2.16485595703125, -2.091033935546875, -2.0172119140625, -1.943389892578125, -1.86956787109375, -1.795745849609375, -1.721923828125, -1.648101806640625, -1.57427978515625, -1.500457763671875, -1.4266357421875, -1.352813720703125, -1.27899169921875, -1.205169677734375, -1.13134765625, -1.057525634765625, -0.98370361328125, -0.909881591796875, -0.8360595703125, -0.762237548828125, -0.68841552734375, -0.614593505859375, -0.540771484375, -0.466949462890625, -0.39312744140625, -0.319305419921875, -0.2454833984375, -0.171661376953125, -0.09783935546875, -0.024017333984375, 0.0498046875, 0.123626708984375, 0.19744873046875, 0.271270751953125, 0.3450927734375, 0.418914794921875, 0.49273681640625, 0.566558837890625, 0.640380859375, 0.714202880859375, 0.78802490234375, 0.861846923828125, 0.9356689453125, 1.009490966796875, 1.08331298828125, 1.157135009765625, 1.23095703125, 1.304779052734375, 1.37860107421875, 1.452423095703125, 1.5262451171875, 1.600067138671875, 1.67388916015625, 1.747711181640625, 1.821533203125, 1.895355224609375, 1.96917724609375, 2.042999267578125, 2.1168212890625, 2.190643310546875, 2.26446533203125, 2.338287353515625, 2.412109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 4.0, 12.0, 8.0, 16.0, 17.0, 16.0, 21.0, 18.0, 21.0, 20.0, 20.0, 33.0, 37.0, 30.0, 39.0, 26.0, 37.0, 44.0, 56.0, 39.0, 44.0, 41.0, 38.0, 32.0, 37.0, 37.0, 23.0, 38.0, 14.0, 16.0, 22.0, 22.0, 20.0, 22.0, 13.0, 10.0, 9.0, 13.0, 5.0, 6.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.046875, -20.431396484375, -19.81591796875, -19.200439453125, -18.5849609375, -17.969482421875, -17.35400390625, -16.738525390625, -16.123046875, -15.507568359375, -14.89208984375, -14.276611328125, -13.6611328125, -13.045654296875, -12.43017578125, -11.814697265625, -11.19921875, -10.583740234375, -9.96826171875, -9.352783203125, -8.7373046875, -8.121826171875, -7.50634765625, -6.890869140625, -6.275390625, -5.659912109375, -5.04443359375, -4.428955078125, -3.8134765625, -3.197998046875, -2.58251953125, -1.967041015625, -1.3515625, -0.736083984375, -0.12060546875, 0.494873046875, 1.1103515625, 1.725830078125, 2.34130859375, 2.956787109375, 3.572265625, 4.187744140625, 4.80322265625, 5.418701171875, 6.0341796875, 6.649658203125, 7.26513671875, 7.880615234375, 8.49609375, 9.111572265625, 9.72705078125, 10.342529296875, 10.9580078125, 11.573486328125, 12.18896484375, 12.804443359375, 13.419921875, 14.035400390625, 14.65087890625, 15.266357421875, 15.8818359375, 16.497314453125, 17.11279296875, 17.728271484375, 18.34375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 9.0, 13.0, 28.0, 42.0, 51.0, 63.0, 113.0, 164.0, 225.0, 352.0, 607.0, 920.0, 1338.0, 2110.0, 3433.0, 5519.0, 9040.0, 14921.0, 25574.0, 43618.0, 76024.0, 137393.0, 232075.0, 212982.0, 120347.0, 66572.0, 38359.0, 22126.0, 13249.0, 8160.0, 4809.0, 3019.0, 1899.0, 1142.0, 750.0, 543.0, 333.0, 206.0, 128.0, 94.0, 67.0, 40.0, 28.0, 22.0, 21.0, 6.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-3.181640625, -3.08489990234375, -2.9881591796875, -2.89141845703125, -2.794677734375, -2.69793701171875, -2.6011962890625, -2.50445556640625, -2.40771484375, -2.31097412109375, -2.2142333984375, -2.11749267578125, -2.020751953125, -1.92401123046875, -1.8272705078125, -1.73052978515625, -1.6337890625, -1.53704833984375, -1.4403076171875, -1.34356689453125, -1.246826171875, -1.15008544921875, -1.0533447265625, -0.95660400390625, -0.85986328125, -0.76312255859375, -0.6663818359375, -0.56964111328125, -0.472900390625, -0.37615966796875, -0.2794189453125, -0.18267822265625, -0.0859375, 0.01080322265625, 0.1075439453125, 0.20428466796875, 0.301025390625, 0.39776611328125, 0.4945068359375, 0.59124755859375, 0.68798828125, 0.78472900390625, 0.8814697265625, 0.97821044921875, 1.074951171875, 1.17169189453125, 1.2684326171875, 1.36517333984375, 1.4619140625, 1.55865478515625, 1.6553955078125, 1.75213623046875, 1.848876953125, 1.94561767578125, 2.0423583984375, 2.13909912109375, 2.23583984375, 2.33258056640625, 2.4293212890625, 2.52606201171875, 2.622802734375, 2.71954345703125, 2.8162841796875, 2.91302490234375, 3.009765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 10.0, 5.0, 12.0, 12.0, 16.0, 12.0, 14.0, 16.0, 21.0, 20.0, 20.0, 27.0, 31.0, 20.0, 38.0, 33.0, 41.0, 33.0, 41.0, 28.0, 35.0, 48.0, 40.0, 29.0, 30.0, 35.0, 37.0, 32.0, 29.0, 21.0, 31.0, 27.0, 22.0, 26.0, 18.0, 21.0, 12.0, 8.0, 13.0, 10.0, 5.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6015625, -10.2242431640625, -9.846923828125, -9.4696044921875, -9.09228515625, -8.7149658203125, -8.337646484375, -7.9603271484375, -7.5830078125, -7.2056884765625, -6.828369140625, -6.4510498046875, -6.07373046875, -5.6964111328125, -5.319091796875, -4.9417724609375, -4.564453125, -4.1871337890625, -3.809814453125, -3.4324951171875, -3.05517578125, -2.6778564453125, -2.300537109375, -1.9232177734375, -1.5458984375, -1.1685791015625, -0.791259765625, -0.4139404296875, -0.03662109375, 0.3406982421875, 0.718017578125, 1.0953369140625, 1.47265625, 1.8499755859375, 2.227294921875, 2.6046142578125, 2.98193359375, 3.3592529296875, 3.736572265625, 4.1138916015625, 4.4912109375, 4.8685302734375, 5.245849609375, 5.6231689453125, 6.00048828125, 6.3778076171875, 6.755126953125, 7.1324462890625, 7.509765625, 7.8870849609375, 8.264404296875, 8.6417236328125, 9.01904296875, 9.3963623046875, 9.773681640625, 10.1510009765625, 10.5283203125, 10.9056396484375, 11.282958984375, 11.6602783203125, 12.03759765625, 12.4149169921875, 12.792236328125, 13.1695556640625, 13.546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 9.0, 15.0, 21.0, 24.0, 60.0, 55.0, 98.0, 144.0, 211.0, 330.0, 422.0, 668.0, 935.0, 1532.0, 2300.0, 3428.0, 5389.0, 8404.0, 13644.0, 22396.0, 38778.0, 69390.0, 138046.0, 267301.0, 224461.0, 109483.0, 57047.0, 31986.0, 19200.0, 11887.0, 7275.0, 4595.0, 3012.0, 1953.0, 1354.0, 823.0, 565.0, 420.0, 254.0, 198.0, 148.0, 96.0, 58.0, 37.0, 21.0, 19.0, 16.0, 17.0, 9.0, 10.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.08367919921875, -0.08105087280273438, -0.07842254638671875, -0.07579421997070312, -0.0731658935546875, -0.07053756713867188, -0.06790924072265625, -0.06528091430664062, -0.062652587890625, -0.060024261474609375, -0.05739593505859375, -0.054767608642578125, -0.0521392822265625, -0.049510955810546875, -0.04688262939453125, -0.044254302978515625, -0.0416259765625, -0.038997650146484375, -0.03636932373046875, -0.033740997314453125, -0.0311126708984375, -0.028484344482421875, -0.02585601806640625, -0.023227691650390625, -0.020599365234375, -0.017971038818359375, -0.01534271240234375, -0.012714385986328125, -0.0100860595703125, -0.007457733154296875, -0.00482940673828125, -0.002201080322265625, 0.00042724609375, 0.003055572509765625, 0.00568389892578125, 0.008312225341796875, 0.0109405517578125, 0.013568878173828125, 0.01619720458984375, 0.018825531005859375, 0.021453857421875, 0.024082183837890625, 0.02671051025390625, 0.029338836669921875, 0.0319671630859375, 0.034595489501953125, 0.03722381591796875, 0.039852142333984375, 0.04248046875, 0.045108795166015625, 0.04773712158203125, 0.050365447998046875, 0.0529937744140625, 0.055622100830078125, 0.05825042724609375, 0.060878753662109375, 0.063507080078125, 0.06613540649414062, 0.06876373291015625, 0.07139205932617188, 0.0740203857421875, 0.07664871215820312, 0.07927703857421875, 0.08190536499023438, 0.08453369140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 6.0, 8.0, 9.0, 9.0, 17.0, 19.0, 21.0, 14.0, 19.0, 23.0, 39.0, 22.0, 32.0, 38.0, 46.0, 36.0, 40.0, 37.0, 43.0, 42.0, 50.0, 53.0, 35.0, 25.0, 41.0, 34.0, 26.0, 27.0, 24.0, 31.0, 22.0, 17.0, 18.0, 18.0, 15.0, 10.0, 8.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4781951904296875e-05, -1.4321878552436829e-05, -1.3861805200576782e-05, -1.3401731848716736e-05, -1.294165849685669e-05, -1.2481585144996643e-05, -1.2021511793136597e-05, -1.156143844127655e-05, -1.1101365089416504e-05, -1.0641291737556458e-05, -1.0181218385696411e-05, -9.721145033836365e-06, -9.261071681976318e-06, -8.800998330116272e-06, -8.340924978256226e-06, -7.88085162639618e-06, -7.420778274536133e-06, -6.9607049226760864e-06, -6.50063157081604e-06, -6.040558218955994e-06, -5.580484867095947e-06, -5.120411515235901e-06, -4.6603381633758545e-06, -4.200264811515808e-06, -3.7401914596557617e-06, -3.2801181077957153e-06, -2.820044755935669e-06, -2.3599714040756226e-06, -1.8998980522155762e-06, -1.4398247003555298e-06, -9.797513484954834e-07, -5.19677996635437e-07, -5.960464477539063e-08, 4.0046870708465576e-07, 8.605420589447021e-07, 1.3206154108047485e-06, 1.780688762664795e-06, 2.2407621145248413e-06, 2.7008354663848877e-06, 3.160908818244934e-06, 3.6209821701049805e-06, 4.081055521965027e-06, 4.541128873825073e-06, 5.00120222568512e-06, 5.461275577545166e-06, 5.921348929405212e-06, 6.381422281265259e-06, 6.841495633125305e-06, 7.3015689849853516e-06, 7.761642336845398e-06, 8.221715688705444e-06, 8.68178904056549e-06, 9.141862392425537e-06, 9.601935744285583e-06, 1.006200909614563e-05, 1.0522082448005676e-05, 1.0982155799865723e-05, 1.1442229151725769e-05, 1.1902302503585815e-05, 1.2362375855445862e-05, 1.2822449207305908e-05, 1.3282522559165955e-05, 1.3742595911026001e-05, 1.4202669262886047e-05, 1.4662742614746094e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 9.0, 5.0, 13.0, 28.0, 40.0, 64.0, 75.0, 121.0, 201.0, 338.0, 383.0, 696.0, 921.0, 1449.0, 2229.0, 3361.0, 5106.0, 7990.0, 12269.0, 19521.0, 32115.0, 54967.0, 100658.0, 207228.0, 279572.0, 138500.0, 72217.0, 40975.0, 24204.0, 15258.0, 9773.0, 6184.0, 4137.0, 2635.0, 1813.0, 1174.0, 718.0, 550.0, 347.0, 247.0, 145.0, 116.0, 65.0, 44.0, 33.0, 21.0, 12.0, 12.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0], "bins": [-0.203369140625, -0.19705963134765625, -0.1907501220703125, -0.18444061279296875, -0.178131103515625, -0.17182159423828125, -0.1655120849609375, -0.15920257568359375, -0.15289306640625, -0.14658355712890625, -0.1402740478515625, -0.13396453857421875, -0.127655029296875, -0.12134552001953125, -0.1150360107421875, -0.10872650146484375, -0.1024169921875, -0.09610748291015625, -0.0897979736328125, -0.08348846435546875, -0.077178955078125, -0.07086944580078125, -0.0645599365234375, -0.05825042724609375, -0.05194091796875, -0.04563140869140625, -0.0393218994140625, -0.03301239013671875, -0.026702880859375, -0.02039337158203125, -0.0140838623046875, -0.00777435302734375, -0.00146484375, 0.00484466552734375, 0.0111541748046875, 0.01746368408203125, 0.023773193359375, 0.03008270263671875, 0.0363922119140625, 0.04270172119140625, 0.04901123046875, 0.05532073974609375, 0.0616302490234375, 0.06793975830078125, 0.074249267578125, 0.08055877685546875, 0.0868682861328125, 0.09317779541015625, 0.0994873046875, 0.10579681396484375, 0.1121063232421875, 0.11841583251953125, 0.124725341796875, 0.13103485107421875, 0.1373443603515625, 0.14365386962890625, 0.14996337890625, 0.15627288818359375, 0.1625823974609375, 0.16889190673828125, 0.175201416015625, 0.18151092529296875, 0.1878204345703125, 0.19412994384765625, 0.200439453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 13.0, 25.0, 19.0, 28.0, 43.0, 50.0, 73.0, 145.0, 216.0, 113.0, 93.0, 59.0, 35.0, 19.0, 21.0, 13.0, 11.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11419677734375, -0.1098623275756836, -0.10552787780761719, -0.10119342803955078, -0.09685897827148438, -0.09252452850341797, -0.08819007873535156, -0.08385562896728516, -0.07952117919921875, -0.07518672943115234, -0.07085227966308594, -0.06651782989501953, -0.062183380126953125, -0.05784893035888672, -0.05351448059082031, -0.049180030822753906, -0.0448455810546875, -0.040511131286621094, -0.03617668151855469, -0.03184223175048828, -0.027507781982421875, -0.02317333221435547, -0.018838882446289062, -0.014504432678222656, -0.01016998291015625, -0.005835533142089844, -0.0015010833740234375, 0.0028333663940429688, 0.007167816162109375, 0.011502265930175781, 0.015836715698242188, 0.020171165466308594, 0.024505615234375, 0.028840065002441406, 0.03317451477050781, 0.03750896453857422, 0.041843414306640625, 0.04617786407470703, 0.05051231384277344, 0.054846763610839844, 0.05918121337890625, 0.06351566314697266, 0.06785011291503906, 0.07218456268310547, 0.07651901245117188, 0.08085346221923828, 0.08518791198730469, 0.0895223617553711, 0.0938568115234375, 0.0981912612915039, 0.10252571105957031, 0.10686016082763672, 0.11119461059570312, 0.11552906036376953, 0.11986351013183594, 0.12419795989990234, 0.12853240966796875, 0.13286685943603516, 0.13720130920410156, 0.14153575897216797, 0.14587020874023438, 0.15020465850830078, 0.1545391082763672, 0.1588735580444336, 0.1632080078125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 10.0, 5.0, 7.0, 12.0, 14.0, 25.0, 14.0, 25.0, 20.0, 32.0, 38.0, 46.0, 43.0, 55.0, 57.0, 48.0, 52.0, 40.0, 42.0, 46.0, 36.0, 44.0, 46.0, 33.0, 33.0, 26.0, 24.0, 26.0, 17.0, 12.0, 13.0, 9.0, 6.0, 8.0, 7.0, 4.0, 2.0, 11.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.52010726928711, -13.925849914550781, -13.331592559814453, -12.737336158752441, -12.143078804016113, -11.548821449279785, -10.954565048217773, -10.360307693481445, -9.766050338745117, -9.171792984008789, -8.577535629272461, -7.983279228210449, -7.389021873474121, -6.794764518737793, -6.200507640838623, -5.606250762939453, -5.011993408203125, -4.417736053466797, -3.823479175567627, -3.229222059249878, -2.634964942932129, -2.04070782661438, -1.4464507102966309, -0.8521938323974609, -0.2579364776611328, 0.3363206386566162, 0.9305777549743652, 1.5248348712921143, 2.1190919876098633, 2.7133491039276123, 3.3076062202453613, 3.9018630981445312, 4.496120452880859, 5.0903778076171875, 5.684634685516357, 6.278891563415527, 6.8731489181518555, 7.467406272888184, 8.061662673950195, 8.655920028686523, 9.250177383422852, 9.84443473815918, 10.438692092895508, 11.03294849395752, 11.627205848693848, 12.221463203430176, 12.815719604492188, 13.409976959228516, 14.004234313964844, 14.598491668701172, 15.1927490234375, 15.787005424499512, 16.381263732910156, 16.97551918029785, 17.56977653503418, 18.164033889770508, 18.758291244506836, 19.352548599243164, 19.946805953979492, 20.54106330871582, 21.135318756103516, 21.729576110839844, 22.323833465576172, 22.9180908203125, 23.512348175048828]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 6.0, 6.0, 13.0, 3.0, 5.0, 8.0, 9.0, 14.0, 7.0, 23.0, 16.0, 26.0, 27.0, 20.0, 18.0, 36.0, 39.0, 27.0, 33.0, 35.0, 44.0, 39.0, 40.0, 36.0, 39.0, 35.0, 47.0, 36.0, 37.0, 27.0, 32.0, 25.0, 29.0, 15.0, 18.0, 17.0, 17.0, 16.0, 13.0, 15.0, 13.0, 9.0, 10.0, 12.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.767269134521484, -18.201866149902344, -17.636463165283203, -17.071060180664062, -16.505657196044922, -15.940254211425781, -15.37485122680664, -14.8094482421875, -14.24404525756836, -13.678642272949219, -13.113239288330078, -12.547836303710938, -11.982433319091797, -11.417030334472656, -10.851627349853516, -10.286224365234375, -9.720821380615234, -9.155418395996094, -8.590015411376953, -8.024612426757812, -7.459209442138672, -6.893806457519531, -6.328403472900391, -5.76300048828125, -5.197597503662109, -4.632194519042969, -4.066791534423828, -3.5013885498046875, -2.935985565185547, -2.3705825805664062, -1.8051795959472656, -1.239776611328125, -0.6743717193603516, -0.10896873474121094, 0.4564342498779297, 1.0218372344970703, 1.587240219116211, 2.1526432037353516, 2.718046188354492, 3.283449172973633, 3.8488521575927734, 4.414255142211914, 4.979658126831055, 5.545061111450195, 6.110464096069336, 6.675867080688477, 7.241270065307617, 7.806673049926758, 8.372076034545898, 8.937479019165039, 9.50288200378418, 10.06828498840332, 10.633687973022461, 11.199090957641602, 11.764493942260742, 12.329896926879883, 12.895299911499023, 13.460702896118164, 14.026105880737305, 14.591508865356445, 15.156911849975586, 15.722314834594727, 16.287717819213867, 16.853120803833008, 17.41852378845215]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 2.0, 13.0, 20.0, 20.0, 63.0, 81.0, 126.0, 201.0, 291.0, 451.0, 730.0, 1119.0, 1842.0, 2843.0, 4440.0, 6764.0, 10286.0, 15381.0, 21942.0, 30911.0, 42621.0, 55021.0, 70343.0, 83260.0, 93571.0, 98372.0, 98063.0, 90277.0, 78822.0, 65236.0, 51410.0, 38328.0, 27369.0, 19691.0, 13159.0, 9023.0, 5951.0, 3802.0, 2446.0, 1540.0, 970.0, 621.0, 400.0, 269.0, 153.0, 119.0, 78.0, 35.0, 30.0, 17.0, 16.0, 11.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-10.484375, -10.1650390625, -9.845703125, -9.5263671875, -9.20703125, -8.8876953125, -8.568359375, -8.2490234375, -7.9296875, -7.6103515625, -7.291015625, -6.9716796875, -6.65234375, -6.3330078125, -6.013671875, -5.6943359375, -5.375, -5.0556640625, -4.736328125, -4.4169921875, -4.09765625, -3.7783203125, -3.458984375, -3.1396484375, -2.8203125, -2.5009765625, -2.181640625, -1.8623046875, -1.54296875, -1.2236328125, -0.904296875, -0.5849609375, -0.265625, 0.0537109375, 0.373046875, 0.6923828125, 1.01171875, 1.3310546875, 1.650390625, 1.9697265625, 2.2890625, 2.6083984375, 2.927734375, 3.2470703125, 3.56640625, 3.8857421875, 4.205078125, 4.5244140625, 4.84375, 5.1630859375, 5.482421875, 5.8017578125, 6.12109375, 6.4404296875, 6.759765625, 7.0791015625, 7.3984375, 7.7177734375, 8.037109375, 8.3564453125, 8.67578125, 8.9951171875, 9.314453125, 9.6337890625, 9.953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 11.0, 6.0, 8.0, 8.0, 5.0, 11.0, 15.0, 17.0, 14.0, 22.0, 25.0, 20.0, 22.0, 20.0, 29.0, 36.0, 34.0, 41.0, 32.0, 46.0, 42.0, 40.0, 32.0, 30.0, 32.0, 32.0, 38.0, 43.0, 34.0, 21.0, 24.0, 23.0, 22.0, 22.0, 18.0, 20.0, 16.0, 9.0, 17.0, 11.0, 6.0, 9.0, 9.0, 5.0, 2.0, 7.0, 3.0, 5.0, 1.0, 0.0, 2.0, 3.0], "bins": [-18.390625, -17.84912109375, -17.3076171875, -16.76611328125, -16.224609375, -15.68310546875, -15.1416015625, -14.60009765625, -14.05859375, -13.51708984375, -12.9755859375, -12.43408203125, -11.892578125, -11.35107421875, -10.8095703125, -10.26806640625, -9.7265625, -9.18505859375, -8.6435546875, -8.10205078125, -7.560546875, -7.01904296875, -6.4775390625, -5.93603515625, -5.39453125, -4.85302734375, -4.3115234375, -3.77001953125, -3.228515625, -2.68701171875, -2.1455078125, -1.60400390625, -1.0625, -0.52099609375, 0.0205078125, 0.56201171875, 1.103515625, 1.64501953125, 2.1865234375, 2.72802734375, 3.26953125, 3.81103515625, 4.3525390625, 4.89404296875, 5.435546875, 5.97705078125, 6.5185546875, 7.06005859375, 7.6015625, 8.14306640625, 8.6845703125, 9.22607421875, 9.767578125, 10.30908203125, 10.8505859375, 11.39208984375, 11.93359375, 12.47509765625, 13.0166015625, 13.55810546875, 14.099609375, 14.64111328125, 15.1826171875, 15.72412109375, 16.265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 18.0, 27.0, 39.0, 58.0, 101.0, 173.0, 310.0, 490.0, 686.0, 1150.0, 1822.0, 3035.0, 4596.0, 7157.0, 10822.0, 16594.0, 23969.0, 34041.0, 46287.0, 60896.0, 75471.0, 88809.0, 98227.0, 101202.0, 98220.0, 88569.0, 75385.0, 59985.0, 46066.0, 34056.0, 23658.0, 16248.0, 10994.0, 7110.0, 4550.0, 2907.0, 1829.0, 1124.0, 738.0, 419.0, 273.0, 177.0, 95.0, 75.0, 30.0, 22.0, 17.0, 13.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-10.6640625, -10.3358154296875, -10.007568359375, -9.6793212890625, -9.35107421875, -9.0228271484375, -8.694580078125, -8.3663330078125, -8.0380859375, -7.7098388671875, -7.381591796875, -7.0533447265625, -6.72509765625, -6.3968505859375, -6.068603515625, -5.7403564453125, -5.412109375, -5.0838623046875, -4.755615234375, -4.4273681640625, -4.09912109375, -3.7708740234375, -3.442626953125, -3.1143798828125, -2.7861328125, -2.4578857421875, -2.129638671875, -1.8013916015625, -1.47314453125, -1.1448974609375, -0.816650390625, -0.4884033203125, -0.16015625, 0.1680908203125, 0.496337890625, 0.8245849609375, 1.15283203125, 1.4810791015625, 1.809326171875, 2.1375732421875, 2.4658203125, 2.7940673828125, 3.122314453125, 3.4505615234375, 3.77880859375, 4.1070556640625, 4.435302734375, 4.7635498046875, 5.091796875, 5.4200439453125, 5.748291015625, 6.0765380859375, 6.40478515625, 6.7330322265625, 7.061279296875, 7.3895263671875, 7.7177734375, 8.0460205078125, 8.374267578125, 8.7025146484375, 9.03076171875, 9.3590087890625, 9.687255859375, 10.0155029296875, 10.34375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 8.0, 13.0, 11.0, 3.0, 11.0, 12.0, 16.0, 13.0, 20.0, 34.0, 27.0, 27.0, 33.0, 27.0, 30.0, 25.0, 41.0, 53.0, 40.0, 30.0, 51.0, 33.0, 34.0, 44.0, 30.0, 32.0, 36.0, 31.0, 29.0, 25.0, 28.0, 29.0, 22.0, 21.0, 17.0, 13.0, 6.0, 12.0, 3.0, 2.0, 6.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8671875, -11.5081787109375, -11.149169921875, -10.7901611328125, -10.43115234375, -10.0721435546875, -9.713134765625, -9.3541259765625, -8.9951171875, -8.6361083984375, -8.277099609375, -7.9180908203125, -7.55908203125, -7.2000732421875, -6.841064453125, -6.4820556640625, -6.123046875, -5.7640380859375, -5.405029296875, -5.0460205078125, -4.68701171875, -4.3280029296875, -3.968994140625, -3.6099853515625, -3.2509765625, -2.8919677734375, -2.532958984375, -2.1739501953125, -1.81494140625, -1.4559326171875, -1.096923828125, -0.7379150390625, -0.37890625, -0.0198974609375, 0.339111328125, 0.6981201171875, 1.05712890625, 1.4161376953125, 1.775146484375, 2.1341552734375, 2.4931640625, 2.8521728515625, 3.211181640625, 3.5701904296875, 3.92919921875, 4.2882080078125, 4.647216796875, 5.0062255859375, 5.365234375, 5.7242431640625, 6.083251953125, 6.4422607421875, 6.80126953125, 7.1602783203125, 7.519287109375, 7.8782958984375, 8.2373046875, 8.5963134765625, 8.955322265625, 9.3143310546875, 9.67333984375, 10.0323486328125, 10.391357421875, 10.7503662109375, 11.109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 8.0, 14.0, 23.0, 31.0, 55.0, 88.0, 155.0, 226.0, 344.0, 621.0, 931.0, 1542.0, 2459.0, 3972.0, 6268.0, 9960.0, 15486.0, 23603.0, 35334.0, 49379.0, 67093.0, 86047.0, 101193.0, 110376.0, 111759.0, 102912.0, 88361.0, 70206.0, 52255.0, 37143.0, 25219.0, 16900.0, 10592.0, 6730.0, 4268.0, 2620.0, 1637.0, 1024.0, 675.0, 421.0, 232.0, 151.0, 96.0, 60.0, 31.0, 14.0, 14.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.572265625, -3.460906982421875, -3.34954833984375, -3.238189697265625, -3.1268310546875, -3.015472412109375, -2.90411376953125, -2.792755126953125, -2.681396484375, -2.570037841796875, -2.45867919921875, -2.347320556640625, -2.2359619140625, -2.124603271484375, -2.01324462890625, -1.901885986328125, -1.79052734375, -1.679168701171875, -1.56781005859375, -1.456451416015625, -1.3450927734375, -1.233734130859375, -1.12237548828125, -1.011016845703125, -0.899658203125, -0.788299560546875, -0.67694091796875, -0.565582275390625, -0.4542236328125, -0.342864990234375, -0.23150634765625, -0.120147705078125, -0.0087890625, 0.102569580078125, 0.21392822265625, 0.325286865234375, 0.4366455078125, 0.548004150390625, 0.65936279296875, 0.770721435546875, 0.882080078125, 0.993438720703125, 1.10479736328125, 1.216156005859375, 1.3275146484375, 1.438873291015625, 1.55023193359375, 1.661590576171875, 1.77294921875, 1.884307861328125, 1.99566650390625, 2.107025146484375, 2.2183837890625, 2.329742431640625, 2.44110107421875, 2.552459716796875, 2.663818359375, 2.775177001953125, 2.88653564453125, 2.997894287109375, 3.1092529296875, 3.220611572265625, 3.33197021484375, 3.443328857421875, 3.5546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 10.0, 10.0, 16.0, 16.0, 20.0, 26.0, 23.0, 39.0, 28.0, 37.0, 35.0, 40.0, 39.0, 49.0, 51.0, 47.0, 45.0, 48.0, 59.0, 51.0, 36.0, 35.0, 37.0, 29.0, 23.0, 26.0, 24.0, 16.0, 16.0, 12.0, 9.0, 11.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003979206085205078, -0.00038371607661247253, -0.00036951154470443726, -0.000355307012796402, -0.0003411024808883667, -0.0003268979489803314, -0.00031269341707229614, -0.00029848888516426086, -0.0002842843532562256, -0.0002700798213481903, -0.00025587528944015503, -0.00024167075753211975, -0.00022746622562408447, -0.0002132616937160492, -0.00019905716180801392, -0.00018485262989997864, -0.00017064809799194336, -0.00015644356608390808, -0.0001422390341758728, -0.00012803450226783752, -0.00011382997035980225, -9.962543845176697e-05, -8.542090654373169e-05, -7.121637463569641e-05, -5.701184272766113e-05, -4.2807310819625854e-05, -2.8602778911590576e-05, -1.4398247003555298e-05, -1.9371509552001953e-07, 1.4010816812515259e-05, 2.8215348720550537e-05, 4.2419880628585815e-05, 5.6624412536621094e-05, 7.082894444465637e-05, 8.503347635269165e-05, 9.923800826072693e-05, 0.00011344254016876221, 0.00012764707207679749, 0.00014185160398483276, 0.00015605613589286804, 0.00017026066780090332, 0.0001844651997089386, 0.00019866973161697388, 0.00021287426352500916, 0.00022707879543304443, 0.0002412833273410797, 0.000255487859249115, 0.00026969239115715027, 0.00028389692306518555, 0.0002981014549732208, 0.0003123059868812561, 0.0003265105187892914, 0.00034071505069732666, 0.00035491958260536194, 0.0003691241145133972, 0.0003833286464214325, 0.0003975331783294678, 0.00041173771023750305, 0.00042594224214553833, 0.0004401467740535736, 0.0004543513059616089, 0.00046855583786964417, 0.00048276036977767944, 0.0004969649016857147, 0.00051116943359375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 13.0, 16.0, 27.0, 33.0, 48.0, 91.0, 128.0, 222.0, 372.0, 573.0, 986.0, 1723.0, 2696.0, 4637.0, 7698.0, 12472.0, 20458.0, 32586.0, 49202.0, 70533.0, 94589.0, 115004.0, 126618.0, 124788.0, 110599.0, 88685.0, 64330.0, 44211.0, 29014.0, 18370.0, 11150.0, 6649.0, 3982.0, 2328.0, 1483.0, 871.0, 535.0, 324.0, 220.0, 101.0, 67.0, 47.0, 28.0, 21.0, 6.0, 4.0, 6.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.33984375, -4.20367431640625, -4.0675048828125, -3.93133544921875, -3.795166015625, -3.65899658203125, -3.5228271484375, -3.38665771484375, -3.25048828125, -3.11431884765625, -2.9781494140625, -2.84197998046875, -2.705810546875, -2.56964111328125, -2.4334716796875, -2.29730224609375, -2.1611328125, -2.02496337890625, -1.8887939453125, -1.75262451171875, -1.616455078125, -1.48028564453125, -1.3441162109375, -1.20794677734375, -1.07177734375, -0.93560791015625, -0.7994384765625, -0.66326904296875, -0.527099609375, -0.39093017578125, -0.2547607421875, -0.11859130859375, 0.017578125, 0.15374755859375, 0.2899169921875, 0.42608642578125, 0.562255859375, 0.69842529296875, 0.8345947265625, 0.97076416015625, 1.10693359375, 1.24310302734375, 1.3792724609375, 1.51544189453125, 1.651611328125, 1.78778076171875, 1.9239501953125, 2.06011962890625, 2.1962890625, 2.33245849609375, 2.4686279296875, 2.60479736328125, 2.740966796875, 2.87713623046875, 3.0133056640625, 3.14947509765625, 3.28564453125, 3.42181396484375, 3.5579833984375, 3.69415283203125, 3.830322265625, 3.96649169921875, 4.1026611328125, 4.23883056640625, 4.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 7.0, 2.0, 9.0, 12.0, 11.0, 13.0, 12.0, 23.0, 32.0, 31.0, 49.0, 32.0, 27.0, 38.0, 52.0, 44.0, 56.0, 55.0, 47.0, 47.0, 31.0, 44.0, 41.0, 39.0, 28.0, 28.0, 38.0, 26.0, 27.0, 10.0, 14.0, 11.0, 13.0, 9.0, 8.0, 5.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8212890625, -1.7668914794921875, -1.712493896484375, -1.6580963134765625, -1.60369873046875, -1.5493011474609375, -1.494903564453125, -1.4405059814453125, -1.3861083984375, -1.3317108154296875, -1.277313232421875, -1.2229156494140625, -1.16851806640625, -1.1141204833984375, -1.059722900390625, -1.0053253173828125, -0.950927734375, -0.8965301513671875, -0.842132568359375, -0.7877349853515625, -0.73333740234375, -0.6789398193359375, -0.624542236328125, -0.5701446533203125, -0.5157470703125, -0.4613494873046875, -0.406951904296875, -0.3525543212890625, -0.29815673828125, -0.2437591552734375, -0.189361572265625, -0.1349639892578125, -0.08056640625, -0.0261688232421875, 0.028228759765625, 0.0826263427734375, 0.13702392578125, 0.1914215087890625, 0.245819091796875, 0.3002166748046875, 0.3546142578125, 0.4090118408203125, 0.463409423828125, 0.5178070068359375, 0.57220458984375, 0.6266021728515625, 0.680999755859375, 0.7353973388671875, 0.789794921875, 0.8441925048828125, 0.898590087890625, 0.9529876708984375, 1.00738525390625, 1.0617828369140625, 1.116180419921875, 1.1705780029296875, 1.2249755859375, 1.2793731689453125, 1.333770751953125, 1.3881683349609375, 1.44256591796875, 1.4969635009765625, 1.551361083984375, 1.6057586669921875, 1.66015625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 1.0, 7.0, 3.0, 5.0, 7.0, 10.0, 17.0, 14.0, 28.0, 22.0, 26.0, 20.0, 32.0, 34.0, 59.0, 47.0, 49.0, 49.0, 38.0, 52.0, 34.0, 50.0, 46.0, 48.0, 45.0, 41.0, 24.0, 24.0, 36.0, 22.0, 19.0, 16.0, 11.0, 14.0, 16.0, 5.0, 7.0, 6.0, 2.0, 4.0, 8.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.756897926330566, -13.184160232543945, -12.61142349243164, -12.03868579864502, -11.465949058532715, -10.893211364746094, -10.320474624633789, -9.747736930847168, -9.174999237060547, -8.602261543273926, -8.029524803161621, -7.456787109375, -6.884050369262695, -6.311312675476074, -5.738575458526611, -5.165838241577148, -4.593101501464844, -4.020364284515381, -3.447627067565918, -2.874889612197876, -2.302152395248413, -1.7294151782989502, -1.1566777229309082, -0.5839405059814453, -0.011203289031982422, 0.5615339875221252, 1.134271264076233, 1.7070086002349854, 2.2797458171844482, 2.852483034133911, 3.425220489501953, 3.997957706451416, 4.570695877075195, 5.143433094024658, 5.716170310974121, 6.288908004760742, 6.861644744873047, 7.434382438659668, 8.007120132446289, 8.579856872558594, 9.152593612670898, 9.72533130645752, 10.298068046569824, 10.870805740356445, 11.44354248046875, 12.016280174255371, 12.589017868041992, 13.161754608154297, 13.734492301940918, 14.307229995727539, 14.879966735839844, 15.452704429626465, 16.025442123413086, 16.59817886352539, 17.170915603637695, 17.74365234375, 18.316390991210938, 18.889127731323242, 19.46186637878418, 20.034603118896484, 20.60733985900879, 21.180076599121094, 21.75281524658203, 22.325551986694336, 22.89828872680664]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 9.0, 13.0, 7.0, 11.0, 16.0, 13.0, 25.0, 21.0, 33.0, 28.0, 37.0, 48.0, 41.0, 43.0, 42.0, 39.0, 46.0, 44.0, 53.0, 50.0, 32.0, 39.0, 45.0, 21.0, 41.0, 29.0, 28.0, 22.0, 14.0, 15.0, 16.0, 15.0, 7.0, 8.0, 9.0, 4.0, 7.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40592384338379, -21.72707176208496, -21.048219680786133, -20.369367599487305, -19.690515518188477, -19.01166343688965, -18.33281135559082, -17.653959274291992, -16.975107192993164, -16.296255111694336, -15.617403030395508, -14.93855094909668, -14.259698867797852, -13.580846786499023, -12.901994705200195, -12.223142623901367, -11.544291496276855, -10.865439414978027, -10.1865873336792, -9.507735252380371, -8.828883171081543, -8.150031089782715, -7.471179485321045, -6.792327404022217, -6.113475322723389, -5.4346232414245605, -4.755771160125732, -4.0769195556640625, -3.3980672359466553, -2.719215154647827, -2.040363311767578, -1.36151123046875, -0.6826591491699219, -0.0038071274757385254, 0.6750448942184448, 1.3538968563079834, 2.0327489376068115, 2.7116010189056396, 3.3904528617858887, 4.069304943084717, 4.748157024383545, 5.427009105682373, 6.105861186981201, 6.784712791442871, 7.463564872741699, 8.142416954040527, 8.821269035339355, 9.500121116638184, 10.178973197937012, 10.85782527923584, 11.536677360534668, 12.215529441833496, 12.894381523132324, 13.573233604431152, 14.252084732055664, 14.930936813354492, 15.60978889465332, 16.28864097595215, 16.967493057250977, 17.646345138549805, 18.325197219848633, 19.00404930114746, 19.68290138244629, 20.361753463745117, 21.040605545043945]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 10.0, 12.0, 25.0, 37.0, 77.0, 107.0, 133.0, 256.0, 444.0, 697.0, 1116.0, 1762.0, 2828.0, 4540.0, 6871.0, 10968.0, 16674.0, 25120.0, 37819.0, 54640.0, 79577.0, 111668.0, 151646.0, 200545.0, 253125.0, 305414.0, 349525.0, 376537.0, 384452.0, 366839.0, 330109.0, 281540.0, 228147.0, 177269.0, 132956.0, 95805.0, 67636.0, 46852.0, 31462.0, 20872.0, 13715.0, 8933.0, 5744.0, 3638.0, 2323.0, 1458.0, 867.0, 608.0, 349.0, 220.0, 129.0, 82.0, 55.0, 29.0, 16.0, 9.0, 4.0], "bins": [-13.0859375, -12.7149658203125, -12.343994140625, -11.9730224609375, -11.60205078125, -11.2310791015625, -10.860107421875, -10.4891357421875, -10.1181640625, -9.7471923828125, -9.376220703125, -9.0052490234375, -8.63427734375, -8.2633056640625, -7.892333984375, -7.5213623046875, -7.150390625, -6.7794189453125, -6.408447265625, -6.0374755859375, -5.66650390625, -5.2955322265625, -4.924560546875, -4.5535888671875, -4.1826171875, -3.8116455078125, -3.440673828125, -3.0697021484375, -2.69873046875, -2.3277587890625, -1.956787109375, -1.5858154296875, -1.21484375, -0.8438720703125, -0.472900390625, -0.1019287109375, 0.26904296875, 0.6400146484375, 1.010986328125, 1.3819580078125, 1.7529296875, 2.1239013671875, 2.494873046875, 2.8658447265625, 3.23681640625, 3.6077880859375, 3.978759765625, 4.3497314453125, 4.720703125, 5.0916748046875, 5.462646484375, 5.8336181640625, 6.20458984375, 6.5755615234375, 6.946533203125, 7.3175048828125, 7.6884765625, 8.0594482421875, 8.430419921875, 8.8013916015625, 9.17236328125, 9.5433349609375, 9.914306640625, 10.2852783203125, 10.65625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 3.0, 4.0, 3.0, 6.0, 11.0, 9.0, 16.0, 19.0, 12.0, 18.0, 32.0, 20.0, 35.0, 34.0, 44.0, 33.0, 38.0, 43.0, 41.0, 45.0, 52.0, 41.0, 48.0, 32.0, 45.0, 38.0, 38.0, 33.0, 28.0, 22.0, 23.0, 20.0, 27.0, 16.0, 12.0, 9.0, 7.0, 8.0, 9.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.28125, -16.734375, -16.1875, -15.640625, -15.09375, -14.546875, -14.0, -13.453125, -12.90625, -12.359375, -11.8125, -11.265625, -10.71875, -10.171875, -9.625, -9.078125, -8.53125, -7.984375, -7.4375, -6.890625, -6.34375, -5.796875, -5.25, -4.703125, -4.15625, -3.609375, -3.0625, -2.515625, -1.96875, -1.421875, -0.875, -0.328125, 0.21875, 0.765625, 1.3125, 1.859375, 2.40625, 2.953125, 3.5, 4.046875, 4.59375, 5.140625, 5.6875, 6.234375, 6.78125, 7.328125, 7.875, 8.421875, 8.96875, 9.515625, 10.0625, 10.609375, 11.15625, 11.703125, 12.25, 12.796875, 13.34375, 13.890625, 14.4375, 14.984375, 15.53125, 16.078125, 16.625, 17.171875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 13.0, 13.0, 27.0, 65.0, 98.0, 134.0, 214.0, 422.0, 704.0, 1183.0, 2008.0, 3194.0, 5396.0, 8759.0, 13732.0, 21321.0, 33049.0, 48799.0, 71728.0, 101932.0, 138403.0, 182221.0, 230167.0, 279200.0, 320240.0, 352131.0, 365669.0, 361344.0, 338999.0, 303003.0, 256339.0, 208729.0, 161680.0, 120417.0, 87688.0, 60326.0, 41221.0, 27302.0, 17760.0, 10985.0, 7088.0, 4237.0, 2591.0, 1565.0, 957.0, 483.0, 315.0, 201.0, 104.0, 58.0, 31.0, 17.0, 10.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.75, -11.3681640625, -10.986328125, -10.6044921875, -10.22265625, -9.8408203125, -9.458984375, -9.0771484375, -8.6953125, -8.3134765625, -7.931640625, -7.5498046875, -7.16796875, -6.7861328125, -6.404296875, -6.0224609375, -5.640625, -5.2587890625, -4.876953125, -4.4951171875, -4.11328125, -3.7314453125, -3.349609375, -2.9677734375, -2.5859375, -2.2041015625, -1.822265625, -1.4404296875, -1.05859375, -0.6767578125, -0.294921875, 0.0869140625, 0.46875, 0.8505859375, 1.232421875, 1.6142578125, 1.99609375, 2.3779296875, 2.759765625, 3.1416015625, 3.5234375, 3.9052734375, 4.287109375, 4.6689453125, 5.05078125, 5.4326171875, 5.814453125, 6.1962890625, 6.578125, 6.9599609375, 7.341796875, 7.7236328125, 8.10546875, 8.4873046875, 8.869140625, 9.2509765625, 9.6328125, 10.0146484375, 10.396484375, 10.7783203125, 11.16015625, 11.5419921875, 11.923828125, 12.3056640625, 12.6875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 8.0, 9.0, 22.0, 12.0, 22.0, 31.0, 21.0, 43.0, 66.0, 64.0, 84.0, 91.0, 87.0, 123.0, 147.0, 144.0, 200.0, 174.0, 198.0, 223.0, 196.0, 186.0, 221.0, 187.0, 167.0, 172.0, 167.0, 160.0, 109.0, 123.0, 103.0, 105.0, 82.0, 58.0, 47.0, 57.0, 49.0, 20.0, 25.0, 17.0, 15.0, 13.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.109375, -7.8592529296875, -7.609130859375, -7.3590087890625, -7.10888671875, -6.8587646484375, -6.608642578125, -6.3585205078125, -6.1083984375, -5.8582763671875, -5.608154296875, -5.3580322265625, -5.10791015625, -4.8577880859375, -4.607666015625, -4.3575439453125, -4.107421875, -3.8572998046875, -3.607177734375, -3.3570556640625, -3.10693359375, -2.8568115234375, -2.606689453125, -2.3565673828125, -2.1064453125, -1.8563232421875, -1.606201171875, -1.3560791015625, -1.10595703125, -0.8558349609375, -0.605712890625, -0.3555908203125, -0.10546875, 0.1446533203125, 0.394775390625, 0.6448974609375, 0.89501953125, 1.1451416015625, 1.395263671875, 1.6453857421875, 1.8955078125, 2.1456298828125, 2.395751953125, 2.6458740234375, 2.89599609375, 3.1461181640625, 3.396240234375, 3.6463623046875, 3.896484375, 4.1466064453125, 4.396728515625, 4.6468505859375, 4.89697265625, 5.1470947265625, 5.397216796875, 5.6473388671875, 5.8974609375, 6.1475830078125, 6.397705078125, 6.6478271484375, 6.89794921875, 7.1480712890625, 7.398193359375, 7.6483154296875, 7.8984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 6.0, 8.0, 17.0, 15.0, 30.0, 23.0, 27.0, 27.0, 41.0, 38.0, 51.0, 43.0, 41.0, 37.0, 54.0, 52.0, 46.0, 47.0, 58.0, 42.0, 43.0, 29.0, 37.0, 33.0, 28.0, 23.0, 16.0, 12.0, 11.0, 8.0, 7.0, 9.0, 7.0, 12.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.6616153717041, -20.02762222290039, -19.39362907409668, -18.75963592529297, -18.125642776489258, -17.491649627685547, -16.857656478881836, -16.223663330078125, -15.589670181274414, -14.955677032470703, -14.321683883666992, -13.687690734863281, -13.05369758605957, -12.41970443725586, -11.785711288452148, -11.151718139648438, -10.517724990844727, -9.883731842041016, -9.249738693237305, -8.615745544433594, -7.981752395629883, -7.347759246826172, -6.713766098022461, -6.07977294921875, -5.445779800415039, -4.811786651611328, -4.177793502807617, -3.5438003540039062, -2.9098072052001953, -2.2758140563964844, -1.6418209075927734, -1.0078277587890625, -0.37383270263671875, 0.2601604461669922, 0.8941535949707031, 1.528146743774414, 2.162139892578125, 2.796133041381836, 3.430126190185547, 4.064119338989258, 4.698112487792969, 5.33210563659668, 5.966098785400391, 6.600091934204102, 7.2340850830078125, 7.868078231811523, 8.502071380615234, 9.136064529418945, 9.770057678222656, 10.404050827026367, 11.038043975830078, 11.672037124633789, 12.3060302734375, 12.940023422241211, 13.574016571044922, 14.208009719848633, 14.842002868652344, 15.475996017456055, 16.109989166259766, 16.743982315063477, 17.377975463867188, 18.0119686126709, 18.64596176147461, 19.27995491027832, 19.91394805908203]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 9.0, 12.0, 10.0, 12.0, 8.0, 17.0, 18.0, 24.0, 25.0, 24.0, 20.0, 31.0, 33.0, 34.0, 37.0, 27.0, 47.0, 31.0, 48.0, 48.0, 43.0, 48.0, 37.0, 30.0, 25.0, 22.0, 24.0, 36.0, 29.0, 23.0, 23.0, 16.0, 18.0, 17.0, 10.0, 10.0, 5.0, 11.0, 10.0, 7.0, 6.0, 6.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-18.28009605407715, -17.677419662475586, -17.074743270874023, -16.47206687927246, -15.869390487670898, -15.266714096069336, -14.664037704467773, -14.061361312866211, -13.458684921264648, -12.856008529663086, -12.253332138061523, -11.650655746459961, -11.047979354858398, -10.445302963256836, -9.842626571655273, -9.239950180053711, -8.637274742126465, -8.034598350524902, -7.43192195892334, -6.829245567321777, -6.226569175720215, -5.623892784118652, -5.021216869354248, -4.4185404777526855, -3.815864086151123, -3.2131876945495605, -2.610511302947998, -2.0078351497650146, -1.4051587581634521, -0.8024823665618896, -0.19980621337890625, 0.40287017822265625, 1.0055465698242188, 1.6082229614257812, 2.2108993530273438, 2.813575506210327, 3.4162518978118896, 4.018928527832031, 4.6216044425964355, 5.224280834197998, 5.8269572257995605, 6.429633617401123, 7.0323100090026855, 7.63498592376709, 8.237662315368652, 8.840338706970215, 9.443015098571777, 10.04569149017334, 10.648367881774902, 11.251044273376465, 11.853720664978027, 12.45639705657959, 13.059073448181152, 13.661749839782715, 14.264425277709961, 14.867101669311523, 15.469778060913086, 16.07245445251465, 16.67513084411621, 17.277807235717773, 17.880483627319336, 18.4831600189209, 19.08583641052246, 19.688512802124023, 20.291189193725586]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 11.0, 9.0, 29.0, 29.0, 30.0, 66.0, 107.0, 139.0, 238.0, 350.0, 522.0, 807.0, 1267.0, 2079.0, 3406.0, 5578.0, 9311.0, 15761.0, 28103.0, 49531.0, 89016.0, 162415.0, 246329.0, 188899.0, 106563.0, 58960.0, 32806.0, 18489.0, 10789.0, 6459.0, 3886.0, 2442.0, 1422.0, 947.0, 593.0, 373.0, 263.0, 183.0, 96.0, 84.0, 63.0, 39.0, 22.0, 12.0, 13.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.048828125, -2.94598388671875, -2.8431396484375, -2.74029541015625, -2.637451171875, -2.53460693359375, -2.4317626953125, -2.32891845703125, -2.22607421875, -2.12322998046875, -2.0203857421875, -1.91754150390625, -1.814697265625, -1.71185302734375, -1.6090087890625, -1.50616455078125, -1.4033203125, -1.30047607421875, -1.1976318359375, -1.09478759765625, -0.991943359375, -0.88909912109375, -0.7862548828125, -0.68341064453125, -0.58056640625, -0.47772216796875, -0.3748779296875, -0.27203369140625, -0.169189453125, -0.06634521484375, 0.0364990234375, 0.13934326171875, 0.2421875, 0.34503173828125, 0.4478759765625, 0.55072021484375, 0.653564453125, 0.75640869140625, 0.8592529296875, 0.96209716796875, 1.06494140625, 1.16778564453125, 1.2706298828125, 1.37347412109375, 1.476318359375, 1.57916259765625, 1.6820068359375, 1.78485107421875, 1.8876953125, 1.99053955078125, 2.0933837890625, 2.19622802734375, 2.299072265625, 2.40191650390625, 2.5047607421875, 2.60760498046875, 2.71044921875, 2.81329345703125, 2.9161376953125, 3.01898193359375, 3.121826171875, 3.22467041015625, 3.3275146484375, 3.43035888671875, 3.533203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 3.0, 8.0, 6.0, 6.0, 16.0, 9.0, 11.0, 20.0, 11.0, 20.0, 15.0, 32.0, 24.0, 23.0, 39.0, 30.0, 29.0, 31.0, 41.0, 35.0, 45.0, 51.0, 34.0, 41.0, 35.0, 37.0, 30.0, 36.0, 27.0, 27.0, 27.0, 21.0, 25.0, 24.0, 16.0, 15.0, 15.0, 19.0, 8.0, 6.0, 19.0, 5.0, 6.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.671875, -19.039306640625, -18.40673828125, -17.774169921875, -17.1416015625, -16.509033203125, -15.87646484375, -15.243896484375, -14.611328125, -13.978759765625, -13.34619140625, -12.713623046875, -12.0810546875, -11.448486328125, -10.81591796875, -10.183349609375, -9.55078125, -8.918212890625, -8.28564453125, -7.653076171875, -7.0205078125, -6.387939453125, -5.75537109375, -5.122802734375, -4.490234375, -3.857666015625, -3.22509765625, -2.592529296875, -1.9599609375, -1.327392578125, -0.69482421875, -0.062255859375, 0.5703125, 1.202880859375, 1.83544921875, 2.468017578125, 3.1005859375, 3.733154296875, 4.36572265625, 4.998291015625, 5.630859375, 6.263427734375, 6.89599609375, 7.528564453125, 8.1611328125, 8.793701171875, 9.42626953125, 10.058837890625, 10.69140625, 11.323974609375, 11.95654296875, 12.589111328125, 13.2216796875, 13.854248046875, 14.48681640625, 15.119384765625, 15.751953125, 16.384521484375, 17.01708984375, 17.649658203125, 18.2822265625, 18.914794921875, 19.54736328125, 20.179931640625, 20.8125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 13.0, 9.0, 12.0, 29.0, 29.0, 44.0, 79.0, 112.0, 173.0, 228.0, 356.0, 487.0, 723.0, 1048.0, 1637.0, 2393.0, 3605.0, 5652.0, 8464.0, 13095.0, 20512.0, 32873.0, 53630.0, 89556.0, 151963.0, 219360.0, 173313.0, 103649.0, 61781.0, 37456.0, 23162.0, 14989.0, 9522.0, 6128.0, 4119.0, 2734.0, 1840.0, 1240.0, 786.0, 557.0, 376.0, 253.0, 180.0, 125.0, 80.0, 67.0, 43.0, 21.0, 16.0, 19.0, 5.0, 6.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.857421875, -2.76708984375, -2.6767578125, -2.58642578125, -2.49609375, -2.40576171875, -2.3154296875, -2.22509765625, -2.134765625, -2.04443359375, -1.9541015625, -1.86376953125, -1.7734375, -1.68310546875, -1.5927734375, -1.50244140625, -1.412109375, -1.32177734375, -1.2314453125, -1.14111328125, -1.05078125, -0.96044921875, -0.8701171875, -0.77978515625, -0.689453125, -0.59912109375, -0.5087890625, -0.41845703125, -0.328125, -0.23779296875, -0.1474609375, -0.05712890625, 0.033203125, 0.12353515625, 0.2138671875, 0.30419921875, 0.39453125, 0.48486328125, 0.5751953125, 0.66552734375, 0.755859375, 0.84619140625, 0.9365234375, 1.02685546875, 1.1171875, 1.20751953125, 1.2978515625, 1.38818359375, 1.478515625, 1.56884765625, 1.6591796875, 1.74951171875, 1.83984375, 1.93017578125, 2.0205078125, 2.11083984375, 2.201171875, 2.29150390625, 2.3818359375, 2.47216796875, 2.5625, 2.65283203125, 2.7431640625, 2.83349609375, 2.923828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 11.0, 14.0, 16.0, 6.0, 15.0, 16.0, 19.0, 11.0, 23.0, 20.0, 27.0, 25.0, 29.0, 37.0, 31.0, 47.0, 40.0, 28.0, 49.0, 42.0, 46.0, 34.0, 32.0, 25.0, 29.0, 34.0, 34.0, 21.0, 28.0, 25.0, 23.0, 21.0, 21.0, 20.0, 14.0, 11.0, 9.0, 7.0, 11.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.109375, -12.7166748046875, -12.323974609375, -11.9312744140625, -11.53857421875, -11.1458740234375, -10.753173828125, -10.3604736328125, -9.9677734375, -9.5750732421875, -9.182373046875, -8.7896728515625, -8.39697265625, -8.0042724609375, -7.611572265625, -7.2188720703125, -6.826171875, -6.4334716796875, -6.040771484375, -5.6480712890625, -5.25537109375, -4.8626708984375, -4.469970703125, -4.0772705078125, -3.6845703125, -3.2918701171875, -2.899169921875, -2.5064697265625, -2.11376953125, -1.7210693359375, -1.328369140625, -0.9356689453125, -0.54296875, -0.1502685546875, 0.242431640625, 0.6351318359375, 1.02783203125, 1.4205322265625, 1.813232421875, 2.2059326171875, 2.5986328125, 2.9913330078125, 3.384033203125, 3.7767333984375, 4.16943359375, 4.5621337890625, 4.954833984375, 5.3475341796875, 5.740234375, 6.1329345703125, 6.525634765625, 6.9183349609375, 7.31103515625, 7.7037353515625, 8.096435546875, 8.4891357421875, 8.8818359375, 9.2745361328125, 9.667236328125, 10.0599365234375, 10.45263671875, 10.8453369140625, 11.238037109375, 11.6307373046875, 12.0234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 11.0, 21.0, 36.0, 48.0, 82.0, 96.0, 184.0, 319.0, 589.0, 968.0, 1602.0, 2937.0, 5198.0, 9718.0, 18285.0, 36801.0, 81277.0, 215560.0, 377296.0, 167179.0, 65386.0, 30757.0, 15470.0, 8298.0, 4449.0, 2482.0, 1443.0, 844.0, 475.0, 289.0, 158.0, 101.0, 54.0, 35.0, 27.0, 23.0, 15.0, 7.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1182861328125, -0.11463260650634766, -0.11097908020019531, -0.10732555389404297, -0.10367202758789062, -0.10001850128173828, -0.09636497497558594, -0.0927114486694336, -0.08905792236328125, -0.0854043960571289, -0.08175086975097656, -0.07809734344482422, -0.07444381713867188, -0.07079029083251953, -0.06713676452636719, -0.06348323822021484, -0.0598297119140625, -0.056176185607910156, -0.05252265930175781, -0.04886913299560547, -0.045215606689453125, -0.04156208038330078, -0.03790855407714844, -0.034255027770996094, -0.03060150146484375, -0.026947975158691406, -0.023294448852539062, -0.01964092254638672, -0.015987396240234375, -0.012333869934082031, -0.008680343627929688, -0.005026817321777344, -0.001373291015625, 0.0022802352905273438, 0.0059337615966796875, 0.009587287902832031, 0.013240814208984375, 0.01689434051513672, 0.020547866821289062, 0.024201393127441406, 0.02785491943359375, 0.031508445739746094, 0.03516197204589844, 0.03881549835205078, 0.042469024658203125, 0.04612255096435547, 0.04977607727050781, 0.053429603576660156, 0.0570831298828125, 0.060736656188964844, 0.06439018249511719, 0.06804370880126953, 0.07169723510742188, 0.07535076141357422, 0.07900428771972656, 0.0826578140258789, 0.08631134033203125, 0.0899648666381836, 0.09361839294433594, 0.09727191925048828, 0.10092544555664062, 0.10457897186279297, 0.10823249816894531, 0.11188602447509766, 0.11553955078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 6.0, 9.0, 12.0, 17.0, 27.0, 20.0, 26.0, 20.0, 27.0, 36.0, 16.0, 40.0, 41.0, 32.0, 41.0, 58.0, 49.0, 39.0, 54.0, 38.0, 49.0, 31.0, 48.0, 32.0, 33.0, 27.0, 25.0, 17.0, 23.0, 15.0, 14.0, 14.0, 7.0, 7.0, 5.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4543533325195312e-05, -1.407042145729065e-05, -1.3597309589385986e-05, -1.3124197721481323e-05, -1.265108585357666e-05, -1.2177973985671997e-05, -1.1704862117767334e-05, -1.1231750249862671e-05, -1.0758638381958008e-05, -1.0285526514053345e-05, -9.812414646148682e-06, -9.339302778244019e-06, -8.866190910339355e-06, -8.393079042434692e-06, -7.91996717453003e-06, -7.446855306625366e-06, -6.973743438720703e-06, -6.50063157081604e-06, -6.027519702911377e-06, -5.554407835006714e-06, -5.081295967102051e-06, -4.608184099197388e-06, -4.135072231292725e-06, -3.6619603633880615e-06, -3.1888484954833984e-06, -2.7157366275787354e-06, -2.2426247596740723e-06, -1.7695128917694092e-06, -1.296401023864746e-06, -8.23289155960083e-07, -3.501772880554199e-07, 1.2293457984924316e-07, 5.960464477539062e-07, 1.0691583156585693e-06, 1.5422701835632324e-06, 2.0153820514678955e-06, 2.4884939193725586e-06, 2.9616057872772217e-06, 3.4347176551818848e-06, 3.907829523086548e-06, 4.380941390991211e-06, 4.854053258895874e-06, 5.327165126800537e-06, 5.8002769947052e-06, 6.273388862609863e-06, 6.746500730514526e-06, 7.2196125984191895e-06, 7.692724466323853e-06, 8.165836334228516e-06, 8.638948202133179e-06, 9.112060070037842e-06, 9.585171937942505e-06, 1.0058283805847168e-05, 1.0531395673751831e-05, 1.1004507541656494e-05, 1.1477619409561157e-05, 1.195073127746582e-05, 1.2423843145370483e-05, 1.2896955013275146e-05, 1.337006688117981e-05, 1.3843178749084473e-05, 1.4316290616989136e-05, 1.4789402484893799e-05, 1.5262514352798462e-05, 1.5735626220703125e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 11.0, 10.0, 14.0, 9.0, 32.0, 24.0, 33.0, 53.0, 82.0, 124.0, 187.0, 303.0, 411.0, 603.0, 924.0, 1337.0, 2085.0, 3218.0, 4944.0, 7723.0, 11815.0, 18429.0, 29428.0, 48457.0, 85628.0, 164317.0, 288222.0, 164875.0, 84852.0, 48510.0, 29335.0, 18523.0, 11870.0, 7689.0, 4946.0, 3310.0, 2136.0, 1330.0, 889.0, 617.0, 409.0, 295.0, 157.0, 119.0, 91.0, 62.0, 27.0, 30.0, 15.0, 12.0, 8.0, 9.0, 9.0, 6.0, 1.0, 1.0, 2.0, 5.0], "bins": [-0.218505859375, -0.21178245544433594, -0.20505905151367188, -0.1983356475830078, -0.19161224365234375, -0.1848888397216797, -0.17816543579101562, -0.17144203186035156, -0.1647186279296875, -0.15799522399902344, -0.15127182006835938, -0.1445484161376953, -0.13782501220703125, -0.1311016082763672, -0.12437820434570312, -0.11765480041503906, -0.110931396484375, -0.10420799255371094, -0.09748458862304688, -0.09076118469238281, -0.08403778076171875, -0.07731437683105469, -0.07059097290039062, -0.06386756896972656, -0.0571441650390625, -0.05042076110839844, -0.043697357177734375, -0.03697395324707031, -0.03025054931640625, -0.023527145385742188, -0.016803741455078125, -0.010080337524414062, -0.00335693359375, 0.0033664703369140625, 0.010089874267578125, 0.016813278198242188, 0.02353668212890625, 0.030260086059570312, 0.036983489990234375, 0.04370689392089844, 0.0504302978515625, 0.05715370178222656, 0.06387710571289062, 0.07060050964355469, 0.07732391357421875, 0.08404731750488281, 0.09077072143554688, 0.09749412536621094, 0.104217529296875, 0.11094093322753906, 0.11766433715820312, 0.12438774108886719, 0.13111114501953125, 0.1378345489501953, 0.14455795288085938, 0.15128135681152344, 0.1580047607421875, 0.16472816467285156, 0.17145156860351562, 0.1781749725341797, 0.18489837646484375, 0.1916217803955078, 0.19834518432617188, 0.20506858825683594, 0.2117919921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 9.0, 19.0, 17.0, 40.0, 49.0, 79.0, 88.0, 105.0, 132.0, 114.0, 89.0, 58.0, 54.0, 36.0, 20.0, 17.0, 14.0, 6.0, 5.0, 5.0, 5.0, 8.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08135986328125, -0.07859420776367188, -0.07582855224609375, -0.07306289672851562, -0.0702972412109375, -0.06753158569335938, -0.06476593017578125, -0.062000274658203125, -0.059234619140625, -0.056468963623046875, -0.05370330810546875, -0.050937652587890625, -0.0481719970703125, -0.045406341552734375, -0.04264068603515625, -0.039875030517578125, -0.037109375, -0.034343719482421875, -0.03157806396484375, -0.028812408447265625, -0.0260467529296875, -0.023281097412109375, -0.02051544189453125, -0.017749786376953125, -0.014984130859375, -0.012218475341796875, -0.00945281982421875, -0.006687164306640625, -0.0039215087890625, -0.001155853271484375, 0.00160980224609375, 0.004375457763671875, 0.00714111328125, 0.009906768798828125, 0.01267242431640625, 0.015438079833984375, 0.0182037353515625, 0.020969390869140625, 0.02373504638671875, 0.026500701904296875, 0.029266357421875, 0.032032012939453125, 0.03479766845703125, 0.037563323974609375, 0.0403289794921875, 0.043094635009765625, 0.04586029052734375, 0.048625946044921875, 0.0513916015625, 0.054157257080078125, 0.05692291259765625, 0.059688568115234375, 0.0624542236328125, 0.06521987915039062, 0.06798553466796875, 0.07075119018554688, 0.073516845703125, 0.07628250122070312, 0.07904815673828125, 0.08181381225585938, 0.0845794677734375, 0.08734512329101562, 0.09011077880859375, 0.09287643432617188, 0.09564208984375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 8.0, 8.0, 6.0, 12.0, 16.0, 21.0, 30.0, 19.0, 27.0, 29.0, 49.0, 39.0, 47.0, 48.0, 32.0, 43.0, 52.0, 55.0, 51.0, 44.0, 54.0, 41.0, 43.0, 37.0, 28.0, 28.0, 28.0, 25.0, 10.0, 8.0, 15.0, 5.0, 10.0, 8.0, 10.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.452543258666992, -19.818645477294922, -19.18474578857422, -18.55084800720215, -17.916948318481445, -17.283050537109375, -16.649150848388672, -16.0152530670166, -15.381355285644531, -14.747456550598145, -14.113557815551758, -13.479660034179688, -12.8457612991333, -12.211862564086914, -11.577963829040527, -10.94406509399414, -10.310166358947754, -9.676267623901367, -9.04236888885498, -8.408470153808594, -7.774572372436523, -7.140673637390137, -6.50677490234375, -5.8728766441345215, -5.238977909088135, -4.605079174041748, -3.9711809158325195, -3.337282180786133, -2.703383684158325, -2.0694851875305176, -1.4355864524841309, -0.8016881942749023, -0.16778945922851562, 0.46610909700393677, 1.1000076532363892, 1.7339062690734863, 2.367804765701294, 3.0017032623291016, 3.6356019973754883, 4.269500255584717, 4.9033989906311035, 5.53729772567749, 6.171195983886719, 6.8050947189331055, 7.438993453979492, 8.072891235351562, 8.706790924072266, 9.340688705444336, 9.974587440490723, 10.60848617553711, 11.242384910583496, 11.876283645629883, 12.510181427001953, 13.14408016204834, 13.777978897094727, 14.411876678466797, 15.0457763671875, 15.679675102233887, 16.313573837280273, 16.947471618652344, 17.581371307373047, 18.215269088745117, 18.849166870117188, 19.48306655883789, 20.11696434020996]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 13.0, 10.0, 11.0, 8.0, 16.0, 21.0, 22.0, 26.0, 23.0, 19.0, 32.0, 34.0, 34.0, 36.0, 28.0, 47.0, 32.0, 46.0, 48.0, 45.0, 47.0, 37.0, 30.0, 26.0, 22.0, 24.0, 34.0, 29.0, 24.0, 23.0, 16.0, 17.0, 17.0, 11.0, 9.0, 5.0, 11.0, 10.0, 7.0, 7.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-18.260574340820312, -17.657394409179688, -17.054214477539062, -16.451034545898438, -15.847855567932129, -15.244675636291504, -14.641495704650879, -14.03831672668457, -13.435136795043945, -12.83195686340332, -12.228776931762695, -11.62559700012207, -11.022418022155762, -10.419238090515137, -9.816058158874512, -9.212879180908203, -8.609698295593262, -8.006518363952637, -7.40333890914917, -6.800158977508545, -6.196979522705078, -5.593799591064453, -4.990619659423828, -4.387440204620361, -3.7842602729797363, -3.1810805797576904, -2.5779008865356445, -1.9747209548950195, -1.3715412616729736, -0.7683615684509277, -0.16518163681030273, 0.43799781799316406, 1.041177749633789, 1.644357442855835, 2.247537136077881, 2.850717067718506, 3.4538967609405518, 4.057076454162598, 4.660256385803223, 5.2634358406066895, 5.8666157722473145, 6.4697957038879395, 7.072975158691406, 7.676155090332031, 8.279335021972656, 8.882514953613281, 9.485694885253906, 10.088873863220215, 10.69205379486084, 11.295233726501465, 11.89841365814209, 12.501592636108398, 13.104772567749023, 13.707952499389648, 14.311132431030273, 14.914312362670898, 15.517492294311523, 16.12067222595215, 16.723852157592773, 17.3270320892334, 17.930212020874023, 18.533390045166016, 19.13656997680664, 19.739749908447266, 20.34292984008789]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 8.0, 9.0, 10.0, 23.0, 34.0, 50.0, 69.0, 151.0, 181.0, 261.0, 459.0, 749.0, 1154.0, 1836.0, 2975.0, 4421.0, 6723.0, 10272.0, 15429.0, 22216.0, 31648.0, 43565.0, 57349.0, 71097.0, 84104.0, 93599.0, 98772.0, 97561.0, 89496.0, 78820.0, 64298.0, 50429.0, 37436.0, 27157.0, 18979.0, 12986.0, 8648.0, 5563.0, 3619.0, 2285.0, 1487.0, 994.0, 589.0, 396.0, 263.0, 157.0, 88.0, 53.0, 37.0, 28.0, 13.0, 8.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6484375, -9.3243408203125, -9.000244140625, -8.6761474609375, -8.35205078125, -8.0279541015625, -7.703857421875, -7.3797607421875, -7.0556640625, -6.7315673828125, -6.407470703125, -6.0833740234375, -5.75927734375, -5.4351806640625, -5.111083984375, -4.7869873046875, -4.462890625, -4.1387939453125, -3.814697265625, -3.4906005859375, -3.16650390625, -2.8424072265625, -2.518310546875, -2.1942138671875, -1.8701171875, -1.5460205078125, -1.221923828125, -0.8978271484375, -0.57373046875, -0.2496337890625, 0.074462890625, 0.3985595703125, 0.72265625, 1.0467529296875, 1.370849609375, 1.6949462890625, 2.01904296875, 2.3431396484375, 2.667236328125, 2.9913330078125, 3.3154296875, 3.6395263671875, 3.963623046875, 4.2877197265625, 4.61181640625, 4.9359130859375, 5.260009765625, 5.5841064453125, 5.908203125, 6.2322998046875, 6.556396484375, 6.8804931640625, 7.20458984375, 7.5286865234375, 7.852783203125, 8.1768798828125, 8.5009765625, 8.8250732421875, 9.149169921875, 9.4732666015625, 9.79736328125, 10.1214599609375, 10.445556640625, 10.7696533203125, 11.09375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 8.0, 2.0, 3.0, 5.0, 9.0, 12.0, 10.0, 11.0, 16.0, 11.0, 20.0, 19.0, 27.0, 22.0, 33.0, 19.0, 25.0, 50.0, 34.0, 42.0, 38.0, 40.0, 50.0, 49.0, 40.0, 45.0, 40.0, 31.0, 32.0, 38.0, 28.0, 24.0, 24.0, 23.0, 22.0, 18.0, 11.0, 9.0, 15.0, 10.0, 5.0, 10.0, 6.0, 5.0, 7.0, 5.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-19.390625, -18.7421875, -18.09375, -17.4453125, -16.796875, -16.1484375, -15.5, -14.8515625, -14.203125, -13.5546875, -12.90625, -12.2578125, -11.609375, -10.9609375, -10.3125, -9.6640625, -9.015625, -8.3671875, -7.71875, -7.0703125, -6.421875, -5.7734375, -5.125, -4.4765625, -3.828125, -3.1796875, -2.53125, -1.8828125, -1.234375, -0.5859375, 0.0625, 0.7109375, 1.359375, 2.0078125, 2.65625, 3.3046875, 3.953125, 4.6015625, 5.25, 5.8984375, 6.546875, 7.1953125, 7.84375, 8.4921875, 9.140625, 9.7890625, 10.4375, 11.0859375, 11.734375, 12.3828125, 13.03125, 13.6796875, 14.328125, 14.9765625, 15.625, 16.2734375, 16.921875, 17.5703125, 18.21875, 18.8671875, 19.515625, 20.1640625, 20.8125, 21.4609375, 22.109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 10.0, 22.0, 34.0, 50.0, 77.0, 135.0, 203.0, 334.0, 491.0, 755.0, 1236.0, 1889.0, 3075.0, 4719.0, 7170.0, 10596.0, 15605.0, 22155.0, 31162.0, 41546.0, 54069.0, 66906.0, 78954.0, 88064.0, 93815.0, 93835.0, 88793.0, 78993.0, 67329.0, 54220.0, 41852.0, 31104.0, 22717.0, 15488.0, 10787.0, 7211.0, 4784.0, 3022.0, 1988.0, 1214.0, 806.0, 517.0, 308.0, 189.0, 123.0, 83.0, 48.0, 27.0, 22.0, 12.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0], "bins": [-10.2109375, -9.901611328125, -9.59228515625, -9.282958984375, -8.9736328125, -8.664306640625, -8.35498046875, -8.045654296875, -7.736328125, -7.427001953125, -7.11767578125, -6.808349609375, -6.4990234375, -6.189697265625, -5.88037109375, -5.571044921875, -5.26171875, -4.952392578125, -4.64306640625, -4.333740234375, -4.0244140625, -3.715087890625, -3.40576171875, -3.096435546875, -2.787109375, -2.477783203125, -2.16845703125, -1.859130859375, -1.5498046875, -1.240478515625, -0.93115234375, -0.621826171875, -0.3125, -0.003173828125, 0.30615234375, 0.615478515625, 0.9248046875, 1.234130859375, 1.54345703125, 1.852783203125, 2.162109375, 2.471435546875, 2.78076171875, 3.090087890625, 3.3994140625, 3.708740234375, 4.01806640625, 4.327392578125, 4.63671875, 4.946044921875, 5.25537109375, 5.564697265625, 5.8740234375, 6.183349609375, 6.49267578125, 6.802001953125, 7.111328125, 7.420654296875, 7.72998046875, 8.039306640625, 8.3486328125, 8.657958984375, 8.96728515625, 9.276611328125, 9.5859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 7.0, 5.0, 8.0, 4.0, 6.0, 8.0, 10.0, 7.0, 14.0, 11.0, 20.0, 22.0, 17.0, 19.0, 33.0, 29.0, 31.0, 30.0, 28.0, 29.0, 34.0, 48.0, 35.0, 42.0, 38.0, 32.0, 36.0, 40.0, 36.0, 40.0, 25.0, 33.0, 27.0, 30.0, 19.0, 22.0, 10.0, 16.0, 15.0, 21.0, 17.0, 7.0, 9.0, 11.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -11.03564453125, -10.6572265625, -10.27880859375, -9.900390625, -9.52197265625, -9.1435546875, -8.76513671875, -8.38671875, -8.00830078125, -7.6298828125, -7.25146484375, -6.873046875, -6.49462890625, -6.1162109375, -5.73779296875, -5.359375, -4.98095703125, -4.6025390625, -4.22412109375, -3.845703125, -3.46728515625, -3.0888671875, -2.71044921875, -2.33203125, -1.95361328125, -1.5751953125, -1.19677734375, -0.818359375, -0.43994140625, -0.0615234375, 0.31689453125, 0.6953125, 1.07373046875, 1.4521484375, 1.83056640625, 2.208984375, 2.58740234375, 2.9658203125, 3.34423828125, 3.72265625, 4.10107421875, 4.4794921875, 4.85791015625, 5.236328125, 5.61474609375, 5.9931640625, 6.37158203125, 6.75, 7.12841796875, 7.5068359375, 7.88525390625, 8.263671875, 8.64208984375, 9.0205078125, 9.39892578125, 9.77734375, 10.15576171875, 10.5341796875, 10.91259765625, 11.291015625, 11.66943359375, 12.0478515625, 12.42626953125, 12.8046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 7.0, 7.0, 21.0, 31.0, 51.0, 97.0, 129.0, 222.0, 350.0, 540.0, 892.0, 1386.0, 2241.0, 3389.0, 5337.0, 8265.0, 12513.0, 18603.0, 26320.0, 36942.0, 48931.0, 62793.0, 76785.0, 87791.0, 95433.0, 97824.0, 93812.0, 85673.0, 72217.0, 58953.0, 45534.0, 33434.0, 23947.0, 16579.0, 11119.0, 7270.0, 4772.0, 3095.0, 1999.0, 1161.0, 759.0, 499.0, 301.0, 176.0, 144.0, 79.0, 47.0, 40.0, 22.0, 10.0, 8.0, 8.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.751007080078125, -2.65045166015625, -2.549896240234375, -2.4493408203125, -2.348785400390625, -2.24822998046875, -2.147674560546875, -2.047119140625, -1.946563720703125, -1.84600830078125, -1.745452880859375, -1.6448974609375, -1.544342041015625, -1.44378662109375, -1.343231201171875, -1.24267578125, -1.142120361328125, -1.04156494140625, -0.941009521484375, -0.8404541015625, -0.739898681640625, -0.63934326171875, -0.538787841796875, -0.438232421875, -0.337677001953125, -0.23712158203125, -0.136566162109375, -0.0360107421875, 0.064544677734375, 0.16510009765625, 0.265655517578125, 0.3662109375, 0.466766357421875, 0.56732177734375, 0.667877197265625, 0.7684326171875, 0.868988037109375, 0.96954345703125, 1.070098876953125, 1.170654296875, 1.271209716796875, 1.37176513671875, 1.472320556640625, 1.5728759765625, 1.673431396484375, 1.77398681640625, 1.874542236328125, 1.97509765625, 2.075653076171875, 2.17620849609375, 2.276763916015625, 2.3773193359375, 2.477874755859375, 2.57843017578125, 2.678985595703125, 2.779541015625, 2.880096435546875, 2.98065185546875, 3.081207275390625, 3.1817626953125, 3.282318115234375, 3.38287353515625, 3.483428955078125, 3.583984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 10.0, 5.0, 13.0, 8.0, 15.0, 9.0, 11.0, 17.0, 23.0, 31.0, 28.0, 25.0, 30.0, 41.0, 38.0, 69.0, 42.0, 52.0, 52.0, 41.0, 45.0, 47.0, 66.0, 41.0, 46.0, 42.0, 25.0, 19.0, 27.0, 18.0, 12.0, 13.0, 7.0, 4.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.0005736351013183594, -0.0005589835345745087, -0.000544331967830658, -0.0005296804010868073, -0.0005150288343429565, -0.0005003772675991058, -0.0004857257008552551, -0.0004710741341114044, -0.0004564225673675537, -0.000441771000623703, -0.0004271194338798523, -0.0004124678671360016, -0.0003978163003921509, -0.00038316473364830017, -0.00036851316690444946, -0.00035386160016059875, -0.00033921003341674805, -0.00032455846667289734, -0.00030990689992904663, -0.0002952553331851959, -0.0002806037664413452, -0.0002659521996974945, -0.0002513006329536438, -0.0002366490662097931, -0.00022199749946594238, -0.00020734593272209167, -0.00019269436597824097, -0.00017804279923439026, -0.00016339123249053955, -0.00014873966574668884, -0.00013408809900283813, -0.00011943653225898743, -0.00010478496551513672, -9.013339877128601e-05, -7.54818320274353e-05, -6.0830265283584595e-05, -4.617869853973389e-05, -3.152713179588318e-05, -1.687556505203247e-05, -2.2239983081817627e-06, 1.2427568435668945e-05, 2.7079135179519653e-05, 4.173070192337036e-05, 5.638226866722107e-05, 7.103383541107178e-05, 8.568540215492249e-05, 0.0001003369688987732, 0.0001149885356426239, 0.0001296401023864746, 0.00014429166913032532, 0.00015894323587417603, 0.00017359480261802673, 0.00018824636936187744, 0.00020289793610572815, 0.00021754950284957886, 0.00023220106959342957, 0.0002468526363372803, 0.000261504203081131, 0.0002761557698249817, 0.0002908073365688324, 0.0003054589033126831, 0.0003201104700565338, 0.0003347620368003845, 0.00034941360354423523, 0.00036406517028808594]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 10.0, 8.0, 34.0, 35.0, 62.0, 97.0, 136.0, 255.0, 421.0, 738.0, 1168.0, 1957.0, 3258.0, 5579.0, 9241.0, 15333.0, 24277.0, 37354.0, 55042.0, 75309.0, 96372.0, 113244.0, 120981.0, 118026.0, 104004.0, 83965.0, 62529.0, 44054.0, 28697.0, 18169.0, 11338.0, 6751.0, 3977.0, 2452.0, 1496.0, 863.0, 494.0, 322.0, 219.0, 108.0, 73.0, 44.0, 30.0, 16.0, 8.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31640625, -4.18438720703125, -4.0523681640625, -3.92034912109375, -3.788330078125, -3.65631103515625, -3.5242919921875, -3.39227294921875, -3.26025390625, -3.12823486328125, -2.9962158203125, -2.86419677734375, -2.732177734375, -2.60015869140625, -2.4681396484375, -2.33612060546875, -2.2041015625, -2.07208251953125, -1.9400634765625, -1.80804443359375, -1.676025390625, -1.54400634765625, -1.4119873046875, -1.27996826171875, -1.14794921875, -1.01593017578125, -0.8839111328125, -0.75189208984375, -0.619873046875, -0.48785400390625, -0.3558349609375, -0.22381591796875, -0.091796875, 0.04022216796875, 0.1722412109375, 0.30426025390625, 0.436279296875, 0.56829833984375, 0.7003173828125, 0.83233642578125, 0.96435546875, 1.09637451171875, 1.2283935546875, 1.36041259765625, 1.492431640625, 1.62445068359375, 1.7564697265625, 1.88848876953125, 2.0205078125, 2.15252685546875, 2.2845458984375, 2.41656494140625, 2.548583984375, 2.68060302734375, 2.8126220703125, 2.94464111328125, 3.07666015625, 3.20867919921875, 3.3406982421875, 3.47271728515625, 3.604736328125, 3.73675537109375, 3.8687744140625, 4.00079345703125, 4.1328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 11.0, 6.0, 7.0, 11.0, 17.0, 19.0, 16.0, 22.0, 23.0, 35.0, 34.0, 33.0, 46.0, 53.0, 39.0, 48.0, 47.0, 44.0, 64.0, 49.0, 49.0, 48.0, 41.0, 44.0, 35.0, 33.0, 22.0, 28.0, 17.0, 19.0, 15.0, 4.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.8157958984375, -1.752685546875, -1.6895751953125, -1.62646484375, -1.5633544921875, -1.500244140625, -1.4371337890625, -1.3740234375, -1.3109130859375, -1.247802734375, -1.1846923828125, -1.12158203125, -1.0584716796875, -0.995361328125, -0.9322509765625, -0.869140625, -0.8060302734375, -0.742919921875, -0.6798095703125, -0.61669921875, -0.5535888671875, -0.490478515625, -0.4273681640625, -0.3642578125, -0.3011474609375, -0.238037109375, -0.1749267578125, -0.11181640625, -0.0487060546875, 0.014404296875, 0.0775146484375, 0.140625, 0.2037353515625, 0.266845703125, 0.3299560546875, 0.39306640625, 0.4561767578125, 0.519287109375, 0.5823974609375, 0.6455078125, 0.7086181640625, 0.771728515625, 0.8348388671875, 0.89794921875, 0.9610595703125, 1.024169921875, 1.0872802734375, 1.150390625, 1.2135009765625, 1.276611328125, 1.3397216796875, 1.40283203125, 1.4659423828125, 1.529052734375, 1.5921630859375, 1.6552734375, 1.7183837890625, 1.781494140625, 1.8446044921875, 1.90771484375, 1.9708251953125, 2.033935546875, 2.0970458984375, 2.16015625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 4.0, 10.0, 5.0, 12.0, 15.0, 18.0, 27.0, 26.0, 44.0, 40.0, 25.0, 33.0, 48.0, 47.0, 48.0, 51.0, 49.0, 47.0, 61.0, 45.0, 36.0, 49.0, 32.0, 31.0, 31.0, 31.0, 32.0, 21.0, 9.0, 10.0, 19.0, 12.0, 6.0, 7.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.989988327026367, -19.344646453857422, -18.699304580688477, -18.05396270751953, -17.408620834350586, -16.76327896118164, -16.117937088012695, -15.472594261169434, -14.827252388000488, -14.181910514831543, -13.536568641662598, -12.891226768493652, -12.24588394165039, -11.600542068481445, -10.9552001953125, -10.309858322143555, -9.66451644897461, -9.019174575805664, -8.373832702636719, -7.728490352630615, -7.08314847946167, -6.437806606292725, -5.792464256286621, -5.147122383117676, -4.5017805099487305, -3.856438636779785, -3.2110965251922607, -2.5657544136047363, -1.920412540435791, -1.2750706672668457, -0.6297285556793213, 0.015613555908203125, 0.6609535217285156, 1.3062955141067505, 1.9516375064849854, 2.5969796180725098, 3.242321491241455, 3.8876633644104004, 4.533005714416504, 5.178347587585449, 5.8236894607543945, 6.46903133392334, 7.114373207092285, 7.759715557098389, 8.405057907104492, 9.050399780273438, 9.695741653442383, 10.341083526611328, 10.986425399780273, 11.631767272949219, 12.277109146118164, 12.92245101928711, 13.567792892456055, 14.213134765625, 14.858477592468262, 15.503819465637207, 16.14916229248047, 16.794504165649414, 17.43984603881836, 18.085187911987305, 18.73052978515625, 19.375871658325195, 20.02121353149414, 20.66655731201172, 21.31189727783203]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 12.0, 11.0, 14.0, 9.0, 12.0, 15.0, 17.0, 18.0, 20.0, 14.0, 32.0, 30.0, 29.0, 47.0, 43.0, 47.0, 32.0, 35.0, 41.0, 48.0, 29.0, 48.0, 40.0, 26.0, 35.0, 37.0, 27.0, 34.0, 17.0, 20.0, 21.0, 16.0, 16.0, 17.0, 11.0, 25.0, 14.0, 7.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.22197151184082, -19.555076599121094, -18.88818359375, -18.221288681030273, -17.554393768310547, -16.887500762939453, -16.220605850219727, -15.553711891174316, -14.886817932128906, -14.219923973083496, -13.553030014038086, -12.88613510131836, -12.21924114227295, -11.552347183227539, -10.885452270507812, -10.218558311462402, -9.551664352416992, -8.884770393371582, -8.217876434326172, -7.550981521606445, -6.884087562561035, -6.217193603515625, -5.550299167633057, -4.883404731750488, -4.216510772705078, -3.549616575241089, -2.8827223777770996, -2.2158281803131104, -1.548933982849121, -0.8820397853851318, -0.21514558792114258, 0.4517488479614258, 1.1186408996582031, 1.7855350971221924, 2.4524292945861816, 3.119323492050171, 3.78621768951416, 4.45311164855957, 5.120006084442139, 5.786900520324707, 6.453794479370117, 7.120688438415527, 7.787582874298096, 8.454477310180664, 9.121371269226074, 9.788265228271484, 10.455160140991211, 11.122054100036621, 11.788948059082031, 12.455842018127441, 13.122735977172852, 13.789630889892578, 14.456524848937988, 15.123418807983398, 15.790313720703125, 16.45720672607422, 17.124101638793945, 17.790996551513672, 18.457889556884766, 19.124784469604492, 19.79167938232422, 20.458572387695312, 21.12546730041504, 21.792362213134766, 22.45925521850586]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 15.0, 16.0, 46.0, 56.0, 110.0, 188.0, 366.0, 596.0, 952.0, 1572.0, 2625.0, 4359.0, 7012.0, 11319.0, 17769.0, 28193.0, 42912.0, 64469.0, 94063.0, 132491.0, 180098.0, 235211.0, 293162.0, 344353.0, 381701.0, 397313.0, 388896.0, 357033.0, 306639.0, 251062.0, 195067.0, 144705.0, 103399.0, 71660.0, 48613.0, 32050.0, 20479.0, 12857.0, 8134.0, 4933.0, 3115.0, 1851.0, 1170.0, 652.0, 390.0, 246.0, 161.0, 82.0, 47.0, 36.0, 25.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.25, -13.8131103515625, -13.376220703125, -12.9393310546875, -12.50244140625, -12.0655517578125, -11.628662109375, -11.1917724609375, -10.7548828125, -10.3179931640625, -9.881103515625, -9.4442138671875, -9.00732421875, -8.5704345703125, -8.133544921875, -7.6966552734375, -7.259765625, -6.8228759765625, -6.385986328125, -5.9490966796875, -5.51220703125, -5.0753173828125, -4.638427734375, -4.2015380859375, -3.7646484375, -3.3277587890625, -2.890869140625, -2.4539794921875, -2.01708984375, -1.5802001953125, -1.143310546875, -0.7064208984375, -0.26953125, 0.1673583984375, 0.604248046875, 1.0411376953125, 1.47802734375, 1.9149169921875, 2.351806640625, 2.7886962890625, 3.2255859375, 3.6624755859375, 4.099365234375, 4.5362548828125, 4.97314453125, 5.4100341796875, 5.846923828125, 6.2838134765625, 6.720703125, 7.1575927734375, 7.594482421875, 8.0313720703125, 8.46826171875, 8.9051513671875, 9.342041015625, 9.7789306640625, 10.2158203125, 10.6527099609375, 11.089599609375, 11.5264892578125, 11.96337890625, 12.4002685546875, 12.837158203125, 13.2740478515625, 13.7109375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 4.0, 5.0, 5.0, 13.0, 19.0, 10.0, 15.0, 20.0, 14.0, 21.0, 37.0, 23.0, 31.0, 34.0, 42.0, 40.0, 49.0, 46.0, 42.0, 40.0, 43.0, 44.0, 43.0, 35.0, 36.0, 32.0, 24.0, 23.0, 28.0, 18.0, 26.0, 16.0, 15.0, 19.0, 22.0, 9.0, 15.0, 7.0, 9.0, 11.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.890625, -18.296875, -17.703125, -17.109375, -16.515625, -15.921875, -15.328125, -14.734375, -14.140625, -13.546875, -12.953125, -12.359375, -11.765625, -11.171875, -10.578125, -9.984375, -9.390625, -8.796875, -8.203125, -7.609375, -7.015625, -6.421875, -5.828125, -5.234375, -4.640625, -4.046875, -3.453125, -2.859375, -2.265625, -1.671875, -1.078125, -0.484375, 0.109375, 0.703125, 1.296875, 1.890625, 2.484375, 3.078125, 3.671875, 4.265625, 4.859375, 5.453125, 6.046875, 6.640625, 7.234375, 7.828125, 8.421875, 9.015625, 9.609375, 10.203125, 10.796875, 11.390625, 11.984375, 12.578125, 13.171875, 13.765625, 14.359375, 14.953125, 15.546875, 16.140625, 16.734375, 17.328125, 17.921875, 18.515625, 19.109375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 20.0, 40.0, 46.0, 90.0, 158.0, 263.0, 440.0, 827.0, 1429.0, 2386.0, 4064.0, 6565.0, 10685.0, 17287.0, 27561.0, 42406.0, 63990.0, 91809.0, 127833.0, 173735.0, 224113.0, 275350.0, 322707.0, 358214.0, 378509.0, 375501.0, 353580.0, 315210.0, 266247.0, 214497.0, 165281.0, 120972.0, 86945.0, 59416.0, 39239.0, 25756.0, 15999.0, 10050.0, 6170.0, 3643.0, 2207.0, 1301.0, 754.0, 405.0, 281.0, 132.0, 78.0, 36.0, 26.0, 13.0, 8.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.7734375, -14.3245849609375, -13.875732421875, -13.4268798828125, -12.97802734375, -12.5291748046875, -12.080322265625, -11.6314697265625, -11.1826171875, -10.7337646484375, -10.284912109375, -9.8360595703125, -9.38720703125, -8.9383544921875, -8.489501953125, -8.0406494140625, -7.591796875, -7.1429443359375, -6.694091796875, -6.2452392578125, -5.79638671875, -5.3475341796875, -4.898681640625, -4.4498291015625, -4.0009765625, -3.5521240234375, -3.103271484375, -2.6544189453125, -2.20556640625, -1.7567138671875, -1.307861328125, -0.8590087890625, -0.41015625, 0.0386962890625, 0.487548828125, 0.9364013671875, 1.38525390625, 1.8341064453125, 2.282958984375, 2.7318115234375, 3.1806640625, 3.6295166015625, 4.078369140625, 4.5272216796875, 4.97607421875, 5.4249267578125, 5.873779296875, 6.3226318359375, 6.771484375, 7.2203369140625, 7.669189453125, 8.1180419921875, 8.56689453125, 9.0157470703125, 9.464599609375, 9.9134521484375, 10.3623046875, 10.8111572265625, 11.260009765625, 11.7088623046875, 12.15771484375, 12.6065673828125, 13.055419921875, 13.5042724609375, 13.953125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 9.0, 9.0, 3.0, 12.0, 12.0, 19.0, 21.0, 41.0, 50.0, 51.0, 73.0, 88.0, 91.0, 110.0, 110.0, 157.0, 165.0, 185.0, 203.0, 212.0, 225.0, 212.0, 214.0, 222.0, 192.0, 181.0, 178.0, 160.0, 152.0, 122.0, 114.0, 85.0, 79.0, 75.0, 55.0, 48.0, 40.0, 31.0, 22.0, 19.0, 12.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5546875, -8.2589111328125, -7.963134765625, -7.6673583984375, -7.37158203125, -7.0758056640625, -6.780029296875, -6.4842529296875, -6.1884765625, -5.8927001953125, -5.596923828125, -5.3011474609375, -5.00537109375, -4.7095947265625, -4.413818359375, -4.1180419921875, -3.822265625, -3.5264892578125, -3.230712890625, -2.9349365234375, -2.63916015625, -2.3433837890625, -2.047607421875, -1.7518310546875, -1.4560546875, -1.1602783203125, -0.864501953125, -0.5687255859375, -0.27294921875, 0.0228271484375, 0.318603515625, 0.6143798828125, 0.91015625, 1.2059326171875, 1.501708984375, 1.7974853515625, 2.09326171875, 2.3890380859375, 2.684814453125, 2.9805908203125, 3.2763671875, 3.5721435546875, 3.867919921875, 4.1636962890625, 4.45947265625, 4.7552490234375, 5.051025390625, 5.3468017578125, 5.642578125, 5.9383544921875, 6.234130859375, 6.5299072265625, 6.82568359375, 7.1214599609375, 7.417236328125, 7.7130126953125, 8.0087890625, 8.3045654296875, 8.600341796875, 8.8961181640625, 9.19189453125, 9.4876708984375, 9.783447265625, 10.0792236328125, 10.375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 4.0, 12.0, 9.0, 13.0, 20.0, 27.0, 37.0, 18.0, 42.0, 35.0, 35.0, 37.0, 44.0, 54.0, 40.0, 43.0, 50.0, 47.0, 58.0, 45.0, 31.0, 31.0, 35.0, 27.0, 25.0, 23.0, 29.0, 24.0, 21.0, 12.0, 18.0, 13.0, 7.0, 10.0, 1.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.590007781982422, -18.876171112060547, -18.162334442138672, -17.448497772216797, -16.734661102294922, -16.020822525024414, -15.306985855102539, -14.593149185180664, -13.879312515258789, -13.165475845336914, -12.451639175415039, -11.737801551818848, -11.023964881896973, -10.310128211975098, -9.596290588378906, -8.882453918457031, -8.168617248535156, -7.454780578613281, -6.740943431854248, -6.027106285095215, -5.31326961517334, -4.599432945251465, -3.8855957984924316, -3.1717586517333984, -2.4579219818115234, -1.7440850734710693, -1.0302481651306152, -0.31641125679016113, 0.39742565155029297, 1.111262559890747, 1.8250994682312012, 2.5389366149902344, 3.2527732849121094, 3.9666101932525635, 4.680447101593018, 5.394284248352051, 6.108120918273926, 6.821957588195801, 7.535794734954834, 8.249631881713867, 8.963468551635742, 9.677305221557617, 10.391141891479492, 11.104979515075684, 11.818816184997559, 12.532652854919434, 13.246490478515625, 13.9603271484375, 14.674163818359375, 15.38800048828125, 16.101837158203125, 16.815673828125, 17.529510498046875, 18.243349075317383, 18.957185745239258, 19.671022415161133, 20.384859085083008, 21.098695755004883, 21.812532424926758, 22.526369094848633, 23.24020767211914, 23.954044342041016, 24.66788101196289, 25.381717681884766, 26.09555435180664]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 6.0, 2.0, 4.0, 2.0, 6.0, 9.0, 10.0, 13.0, 13.0, 10.0, 15.0, 22.0, 22.0, 27.0, 28.0, 22.0, 41.0, 28.0, 55.0, 41.0, 45.0, 46.0, 43.0, 41.0, 52.0, 38.0, 41.0, 42.0, 32.0, 26.0, 22.0, 22.0, 29.0, 27.0, 16.0, 14.0, 20.0, 13.0, 10.0, 12.0, 6.0, 12.0, 9.0, 1.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.28847312927246, -21.549365997314453, -20.810258865356445, -20.071151733398438, -19.33204460144043, -18.592937469482422, -17.853830337524414, -17.114723205566406, -16.3756160736084, -15.63650894165039, -14.897401809692383, -14.158294677734375, -13.419187545776367, -12.68008041381836, -11.940973281860352, -11.201866149902344, -10.46275806427002, -9.723650932312012, -8.984543800354004, -8.245436668395996, -7.506329536437988, -6.7672224044799805, -6.0281147956848145, -5.289007663726807, -4.549900531768799, -3.810793399810791, -3.071686267852783, -2.3325788974761963, -1.5934717655181885, -0.8543646335601807, -0.11525726318359375, 0.6238498687744141, 1.3629570007324219, 2.1020641326904297, 2.8411712646484375, 3.5802786350250244, 4.319385528564453, 5.058492660522461, 5.797600269317627, 6.536707401275635, 7.275814533233643, 8.014922142028809, 8.754029273986816, 9.493136405944824, 10.232243537902832, 10.97135066986084, 11.710457801818848, 12.449564933776855, 13.188672065734863, 13.927779197692871, 14.666886329650879, 15.405993461608887, 16.14510154724121, 16.88420867919922, 17.623315811157227, 18.362422943115234, 19.101530075073242, 19.84063720703125, 20.579744338989258, 21.318851470947266, 22.057958602905273, 22.79706573486328, 23.53617286682129, 24.275279998779297, 25.014387130737305]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 8.0, 15.0, 18.0, 27.0, 34.0, 45.0, 71.0, 108.0, 147.0, 212.0, 245.0, 447.0, 613.0, 931.0, 1247.0, 1954.0, 2591.0, 3904.0, 5790.0, 8406.0, 12391.0, 19033.0, 29377.0, 46311.0, 74246.0, 118934.0, 176743.0, 186000.0, 130437.0, 81535.0, 51017.0, 31895.0, 21077.0, 13825.0, 9105.0, 6336.0, 4155.0, 2867.0, 1944.0, 1356.0, 977.0, 662.0, 489.0, 315.0, 210.0, 162.0, 119.0, 74.0, 41.0, 39.0, 22.0, 20.0, 16.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.60546875, -2.521697998046875, -2.43792724609375, -2.354156494140625, -2.2703857421875, -2.186614990234375, -2.10284423828125, -2.019073486328125, -1.935302734375, -1.851531982421875, -1.76776123046875, -1.683990478515625, -1.6002197265625, -1.516448974609375, -1.43267822265625, -1.348907470703125, -1.26513671875, -1.181365966796875, -1.09759521484375, -1.013824462890625, -0.9300537109375, -0.846282958984375, -0.76251220703125, -0.678741455078125, -0.594970703125, -0.511199951171875, -0.42742919921875, -0.343658447265625, -0.2598876953125, -0.176116943359375, -0.09234619140625, -0.008575439453125, 0.0751953125, 0.158966064453125, 0.24273681640625, 0.326507568359375, 0.4102783203125, 0.494049072265625, 0.57781982421875, 0.661590576171875, 0.745361328125, 0.829132080078125, 0.91290283203125, 0.996673583984375, 1.0804443359375, 1.164215087890625, 1.24798583984375, 1.331756591796875, 1.41552734375, 1.499298095703125, 1.58306884765625, 1.666839599609375, 1.7506103515625, 1.834381103515625, 1.91815185546875, 2.001922607421875, 2.085693359375, 2.169464111328125, 2.25323486328125, 2.337005615234375, 2.4207763671875, 2.504547119140625, 2.58831787109375, 2.672088623046875, 2.755859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 3.0, 10.0, 13.0, 14.0, 8.0, 9.0, 20.0, 22.0, 27.0, 22.0, 14.0, 23.0, 38.0, 35.0, 44.0, 45.0, 38.0, 34.0, 47.0, 45.0, 45.0, 44.0, 34.0, 45.0, 29.0, 34.0, 27.0, 30.0, 34.0, 13.0, 24.0, 22.0, 14.0, 13.0, 13.0, 15.0, 6.0, 14.0, 7.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.21875, -20.475341796875, -19.73193359375, -18.988525390625, -18.2451171875, -17.501708984375, -16.75830078125, -16.014892578125, -15.271484375, -14.528076171875, -13.78466796875, -13.041259765625, -12.2978515625, -11.554443359375, -10.81103515625, -10.067626953125, -9.32421875, -8.580810546875, -7.83740234375, -7.093994140625, -6.3505859375, -5.607177734375, -4.86376953125, -4.120361328125, -3.376953125, -2.633544921875, -1.89013671875, -1.146728515625, -0.4033203125, 0.340087890625, 1.08349609375, 1.826904296875, 2.5703125, 3.313720703125, 4.05712890625, 4.800537109375, 5.5439453125, 6.287353515625, 7.03076171875, 7.774169921875, 8.517578125, 9.260986328125, 10.00439453125, 10.747802734375, 11.4912109375, 12.234619140625, 12.97802734375, 13.721435546875, 14.46484375, 15.208251953125, 15.95166015625, 16.695068359375, 17.4384765625, 18.181884765625, 18.92529296875, 19.668701171875, 20.412109375, 21.155517578125, 21.89892578125, 22.642333984375, 23.3857421875, 24.129150390625, 24.87255859375, 25.615966796875, 26.359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 4.0, 7.0, 10.0, 13.0, 13.0, 19.0, 30.0, 48.0, 81.0, 132.0, 155.0, 240.0, 346.0, 454.0, 726.0, 1085.0, 1655.0, 2320.0, 3721.0, 5524.0, 8723.0, 13824.0, 21598.0, 34891.0, 58063.0, 99014.0, 170657.0, 230253.0, 159601.0, 91282.0, 54080.0, 32858.0, 20258.0, 12959.0, 8172.0, 5308.0, 3401.0, 2301.0, 1511.0, 1024.0, 665.0, 484.0, 338.0, 205.0, 165.0, 116.0, 67.0, 43.0, 41.0, 17.0, 22.0, 11.0, 8.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-3.302734375, -3.197662353515625, -3.09259033203125, -2.987518310546875, -2.8824462890625, -2.777374267578125, -2.67230224609375, -2.567230224609375, -2.462158203125, -2.357086181640625, -2.25201416015625, -2.146942138671875, -2.0418701171875, -1.936798095703125, -1.83172607421875, -1.726654052734375, -1.62158203125, -1.516510009765625, -1.41143798828125, -1.306365966796875, -1.2012939453125, -1.096221923828125, -0.99114990234375, -0.886077880859375, -0.781005859375, -0.675933837890625, -0.57086181640625, -0.465789794921875, -0.3607177734375, -0.255645751953125, -0.15057373046875, -0.045501708984375, 0.0595703125, 0.164642333984375, 0.26971435546875, 0.374786376953125, 0.4798583984375, 0.584930419921875, 0.69000244140625, 0.795074462890625, 0.900146484375, 1.005218505859375, 1.11029052734375, 1.215362548828125, 1.3204345703125, 1.425506591796875, 1.53057861328125, 1.635650634765625, 1.74072265625, 1.845794677734375, 1.95086669921875, 2.055938720703125, 2.1610107421875, 2.266082763671875, 2.37115478515625, 2.476226806640625, 2.581298828125, 2.686370849609375, 2.79144287109375, 2.896514892578125, 3.0015869140625, 3.106658935546875, 3.21173095703125, 3.316802978515625, 3.421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 5.0, 14.0, 11.0, 4.0, 16.0, 19.0, 18.0, 20.0, 27.0, 19.0, 25.0, 23.0, 30.0, 35.0, 27.0, 41.0, 34.0, 35.0, 53.0, 29.0, 48.0, 41.0, 38.0, 26.0, 33.0, 33.0, 31.0, 31.0, 26.0, 35.0, 14.0, 20.0, 21.0, 16.0, 11.0, 8.0, 11.0, 12.0, 5.0, 8.0, 8.0, 8.0, 7.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.125, -13.695556640625, -13.26611328125, -12.836669921875, -12.4072265625, -11.977783203125, -11.54833984375, -11.118896484375, -10.689453125, -10.260009765625, -9.83056640625, -9.401123046875, -8.9716796875, -8.542236328125, -8.11279296875, -7.683349609375, -7.25390625, -6.824462890625, -6.39501953125, -5.965576171875, -5.5361328125, -5.106689453125, -4.67724609375, -4.247802734375, -3.818359375, -3.388916015625, -2.95947265625, -2.530029296875, -2.1005859375, -1.671142578125, -1.24169921875, -0.812255859375, -0.3828125, 0.046630859375, 0.47607421875, 0.905517578125, 1.3349609375, 1.764404296875, 2.19384765625, 2.623291015625, 3.052734375, 3.482177734375, 3.91162109375, 4.341064453125, 4.7705078125, 5.199951171875, 5.62939453125, 6.058837890625, 6.48828125, 6.917724609375, 7.34716796875, 7.776611328125, 8.2060546875, 8.635498046875, 9.06494140625, 9.494384765625, 9.923828125, 10.353271484375, 10.78271484375, 11.212158203125, 11.6416015625, 12.071044921875, 12.50048828125, 12.929931640625, 13.359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 11.0, 11.0, 22.0, 23.0, 34.0, 46.0, 70.0, 97.0, 139.0, 213.0, 280.0, 385.0, 614.0, 865.0, 1332.0, 1921.0, 2871.0, 4410.0, 6969.0, 11026.0, 17740.0, 29094.0, 49672.0, 89861.0, 177785.0, 262300.0, 175076.0, 89554.0, 48744.0, 28882.0, 17623.0, 10672.0, 6842.0, 4462.0, 2849.0, 1988.0, 1238.0, 873.0, 612.0, 430.0, 272.0, 189.0, 125.0, 98.0, 53.0, 69.0, 37.0, 18.0, 16.0, 10.0, 10.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.0770263671875, -0.07458019256591797, -0.07213401794433594, -0.0696878433227539, -0.06724166870117188, -0.06479549407958984, -0.06234931945800781, -0.05990314483642578, -0.05745697021484375, -0.05501079559326172, -0.05256462097167969, -0.050118446350097656, -0.047672271728515625, -0.045226097106933594, -0.04277992248535156, -0.04033374786376953, -0.0378875732421875, -0.03544139862060547, -0.03299522399902344, -0.030549049377441406, -0.028102874755859375, -0.025656700134277344, -0.023210525512695312, -0.02076435089111328, -0.01831817626953125, -0.01587200164794922, -0.013425827026367188, -0.010979652404785156, -0.008533477783203125, -0.006087303161621094, -0.0036411285400390625, -0.0011949539184570312, 0.001251220703125, 0.0036973953247070312, 0.0061435699462890625, 0.008589744567871094, 0.011035919189453125, 0.013482093811035156, 0.015928268432617188, 0.01837444305419922, 0.02082061767578125, 0.02326679229736328, 0.025712966918945312, 0.028159141540527344, 0.030605316162109375, 0.033051490783691406, 0.03549766540527344, 0.03794384002685547, 0.0403900146484375, 0.04283618927001953, 0.04528236389160156, 0.047728538513183594, 0.050174713134765625, 0.052620887756347656, 0.05506706237792969, 0.05751323699951172, 0.05995941162109375, 0.06240558624267578, 0.06485176086425781, 0.06729793548583984, 0.06974411010742188, 0.0721902847290039, 0.07463645935058594, 0.07708263397216797, 0.07952880859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 7.0, 10.0, 3.0, 17.0, 14.0, 19.0, 14.0, 26.0, 24.0, 31.0, 29.0, 43.0, 29.0, 47.0, 46.0, 46.0, 50.0, 35.0, 38.0, 41.0, 48.0, 36.0, 37.0, 45.0, 33.0, 27.0, 16.0, 31.0, 14.0, 22.0, 16.0, 23.0, 9.0, 7.0, 8.0, 11.0, 7.0, 10.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4424324035644531e-05, -1.3940967619419098e-05, -1.3457611203193665e-05, -1.2974254786968231e-05, -1.2490898370742798e-05, -1.2007541954517365e-05, -1.1524185538291931e-05, -1.1040829122066498e-05, -1.0557472705841064e-05, -1.0074116289615631e-05, -9.590759873390198e-06, -9.107403457164764e-06, -8.624047040939331e-06, -8.140690624713898e-06, -7.657334208488464e-06, -7.173977792263031e-06, -6.690621376037598e-06, -6.207264959812164e-06, -5.723908543586731e-06, -5.240552127361298e-06, -4.757195711135864e-06, -4.273839294910431e-06, -3.7904828786849976e-06, -3.307126462459564e-06, -2.823770046234131e-06, -2.3404136300086975e-06, -1.8570572137832642e-06, -1.3737007975578308e-06, -8.903443813323975e-07, -4.069879651069641e-07, 7.636845111846924e-08, 5.597248673439026e-07, 1.043081283569336e-06, 1.5264376997947693e-06, 2.0097941160202026e-06, 2.493150532245636e-06, 2.9765069484710693e-06, 3.4598633646965027e-06, 3.943219780921936e-06, 4.426576197147369e-06, 4.909932613372803e-06, 5.393289029598236e-06, 5.8766454458236694e-06, 6.360001862049103e-06, 6.843358278274536e-06, 7.3267146944999695e-06, 7.810071110725403e-06, 8.293427526950836e-06, 8.77678394317627e-06, 9.260140359401703e-06, 9.743496775627136e-06, 1.022685319185257e-05, 1.0710209608078003e-05, 1.1193566024303436e-05, 1.167692244052887e-05, 1.2160278856754303e-05, 1.2643635272979736e-05, 1.312699168920517e-05, 1.3610348105430603e-05, 1.4093704521656036e-05, 1.457706093788147e-05, 1.5060417354106903e-05, 1.5543773770332336e-05, 1.602713018655777e-05, 1.6510486602783203e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 13.0, 27.0, 20.0, 37.0, 52.0, 81.0, 143.0, 198.0, 294.0, 442.0, 725.0, 1058.0, 1592.0, 2426.0, 3573.0, 5215.0, 7941.0, 12221.0, 18810.0, 28798.0, 46825.0, 76914.0, 139697.0, 262414.0, 185715.0, 96349.0, 56844.0, 35226.0, 22391.0, 14451.0, 9378.0, 6246.0, 4219.0, 2651.0, 1863.0, 1243.0, 822.0, 560.0, 386.0, 257.0, 155.0, 98.0, 66.0, 41.0, 38.0, 18.0, 15.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1578369140625, -0.15252304077148438, -0.14720916748046875, -0.14189529418945312, -0.1365814208984375, -0.13126754760742188, -0.12595367431640625, -0.12063980102539062, -0.115325927734375, -0.11001205444335938, -0.10469818115234375, -0.09938430786132812, -0.0940704345703125, -0.08875656127929688, -0.08344268798828125, -0.07812881469726562, -0.07281494140625, -0.06750106811523438, -0.06218719482421875, -0.056873321533203125, -0.0515594482421875, -0.046245574951171875, -0.04093170166015625, -0.035617828369140625, -0.030303955078125, -0.024990081787109375, -0.01967620849609375, -0.014362335205078125, -0.0090484619140625, -0.003734588623046875, 0.00157928466796875, 0.006893157958984375, 0.01220703125, 0.017520904541015625, 0.02283477783203125, 0.028148651123046875, 0.0334625244140625, 0.038776397705078125, 0.04409027099609375, 0.049404144287109375, 0.054718017578125, 0.060031890869140625, 0.06534576416015625, 0.07065963745117188, 0.0759735107421875, 0.08128738403320312, 0.08660125732421875, 0.09191513061523438, 0.09722900390625, 0.10254287719726562, 0.10785675048828125, 0.11317062377929688, 0.1184844970703125, 0.12379837036132812, 0.12911224365234375, 0.13442611694335938, 0.139739990234375, 0.14505386352539062, 0.15036773681640625, 0.15568161010742188, 0.1609954833984375, 0.16630935668945312, 0.17162322998046875, 0.17693710327148438, 0.1822509765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 7.0, 4.0, 9.0, 11.0, 9.0, 11.0, 10.0, 20.0, 19.0, 15.0, 23.0, 25.0, 28.0, 39.0, 56.0, 72.0, 71.0, 70.0, 62.0, 68.0, 53.0, 45.0, 43.0, 25.0, 28.0, 21.0, 22.0, 22.0, 13.0, 11.0, 12.0, 2.0, 12.0, 7.0, 11.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.06622314453125, -0.06420516967773438, -0.06218719482421875, -0.060169219970703125, -0.0581512451171875, -0.056133270263671875, -0.05411529541015625, -0.052097320556640625, -0.050079345703125, -0.048061370849609375, -0.04604339599609375, -0.044025421142578125, -0.0420074462890625, -0.039989471435546875, -0.03797149658203125, -0.035953521728515625, -0.033935546875, -0.031917572021484375, -0.02989959716796875, -0.027881622314453125, -0.0258636474609375, -0.023845672607421875, -0.02182769775390625, -0.019809722900390625, -0.017791748046875, -0.015773773193359375, -0.01375579833984375, -0.011737823486328125, -0.0097198486328125, -0.007701873779296875, -0.00568389892578125, -0.003665924072265625, -0.00164794921875, 0.000370025634765625, 0.00238800048828125, 0.004405975341796875, 0.0064239501953125, 0.008441925048828125, 0.01045989990234375, 0.012477874755859375, 0.014495849609375, 0.016513824462890625, 0.01853179931640625, 0.020549774169921875, 0.0225677490234375, 0.024585723876953125, 0.02660369873046875, 0.028621673583984375, 0.0306396484375, 0.032657623291015625, 0.03467559814453125, 0.036693572998046875, 0.0387115478515625, 0.040729522705078125, 0.04274749755859375, 0.044765472412109375, 0.046783447265625, 0.048801422119140625, 0.05081939697265625, 0.052837371826171875, 0.0548553466796875, 0.056873321533203125, 0.05889129638671875, 0.060909271240234375, 0.06292724609375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 7.0, 3.0, 3.0, 10.0, 6.0, 13.0, 18.0, 23.0, 31.0, 29.0, 41.0, 37.0, 29.0, 40.0, 44.0, 45.0, 49.0, 42.0, 50.0, 35.0, 65.0, 51.0, 34.0, 30.0, 38.0, 30.0, 21.0, 25.0, 33.0, 20.0, 18.0, 20.0, 14.0, 14.0, 9.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.10551643371582, -19.38246726989746, -18.6594181060791, -17.936370849609375, -17.213321685791016, -16.490272521972656, -15.767223358154297, -15.044174194335938, -14.321125030517578, -13.598075866699219, -12.875027656555176, -12.151978492736816, -11.428929328918457, -10.705881118774414, -9.982831954956055, -9.259782791137695, -8.536734580993652, -7.813685894012451, -7.090636730194092, -6.367588043212891, -5.644538879394531, -4.92149019241333, -4.198441505432129, -3.4753923416137695, -2.7523436546325684, -2.029294729232788, -1.3062459230422974, -0.5831971168518066, 0.13985180854797363, 0.8629007339477539, 1.585949420928955, 2.3089985847473145, 3.0320472717285156, 3.755096197128296, 4.478145122528076, 5.201193809509277, 5.924242973327637, 6.647291660308838, 7.370340347290039, 8.093389511108398, 8.816438674926758, 9.539487838745117, 10.26253604888916, 10.98558521270752, 11.708634376525879, 12.431682586669922, 13.154731750488281, 13.87778091430664, 14.600829124450684, 15.323878288269043, 16.046926498413086, 16.769975662231445, 17.493024826049805, 18.216073989868164, 18.93912124633789, 19.66217041015625, 20.38521957397461, 21.10826873779297, 21.831317901611328, 22.554367065429688, 23.277414321899414, 24.000463485717773, 24.723512649536133, 25.446561813354492, 26.16961097717285]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 6.0, 2.0, 4.0, 2.0, 6.0, 9.0, 10.0, 12.0, 14.0, 10.0, 15.0, 22.0, 23.0, 25.0, 29.0, 23.0, 39.0, 30.0, 54.0, 40.0, 47.0, 43.0, 43.0, 40.0, 54.0, 39.0, 41.0, 40.0, 34.0, 26.0, 24.0, 20.0, 30.0, 26.0, 16.0, 13.0, 23.0, 11.0, 10.0, 12.0, 6.0, 12.0, 9.0, 1.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.158723831176758, -21.42060089111328, -20.682476043701172, -19.944353103637695, -19.20623016357422, -18.468107223510742, -17.729984283447266, -16.991859436035156, -16.25373649597168, -15.515613555908203, -14.77748966217041, -14.039365768432617, -13.30124282836914, -12.563119888305664, -11.824995994567871, -11.086872100830078, -10.348749160766602, -9.610626220703125, -8.872502326965332, -8.134378433227539, -7.3962554931640625, -6.658132076263428, -5.920008659362793, -5.181885242462158, -4.443761825561523, -3.7056384086608887, -2.967514991760254, -2.229391574859619, -1.4912681579589844, -0.7531447410583496, -0.015021324157714844, 0.7231020927429199, 1.4612255096435547, 2.1993489265441895, 2.937472343444824, 3.675595760345459, 4.413719177246094, 5.1518425941467285, 5.889966011047363, 6.628089427947998, 7.366212844848633, 8.10433578491211, 8.842459678649902, 9.580583572387695, 10.318706512451172, 11.056829452514648, 11.794953346252441, 12.533077239990234, 13.271200180053711, 14.009323120117188, 14.74744701385498, 15.485570907592773, 16.22369384765625, 16.961816787719727, 17.699939727783203, 18.438064575195312, 19.17618751525879, 19.914310455322266, 20.652435302734375, 21.39055824279785, 22.128681182861328, 22.866804122924805, 23.60492706298828, 24.34305191040039, 25.081174850463867]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 10.0, 15.0, 31.0, 46.0, 79.0, 100.0, 176.0, 275.0, 411.0, 597.0, 916.0, 1393.0, 2175.0, 3399.0, 5116.0, 7483.0, 10902.0, 15609.0, 22301.0, 30108.0, 39969.0, 51153.0, 62981.0, 74414.0, 83290.0, 88463.0, 89884.0, 86221.0, 79110.0, 69167.0, 56856.0, 45747.0, 35079.0, 25935.0, 18854.0, 13153.0, 9047.0, 5989.0, 4114.0, 2729.0, 1808.0, 1176.0, 778.0, 509.0, 354.0, 200.0, 162.0, 98.0, 67.0, 42.0, 22.0, 16.0, 11.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-10.046875, -9.7353515625, -9.423828125, -9.1123046875, -8.80078125, -8.4892578125, -8.177734375, -7.8662109375, -7.5546875, -7.2431640625, -6.931640625, -6.6201171875, -6.30859375, -5.9970703125, -5.685546875, -5.3740234375, -5.0625, -4.7509765625, -4.439453125, -4.1279296875, -3.81640625, -3.5048828125, -3.193359375, -2.8818359375, -2.5703125, -2.2587890625, -1.947265625, -1.6357421875, -1.32421875, -1.0126953125, -0.701171875, -0.3896484375, -0.078125, 0.2333984375, 0.544921875, 0.8564453125, 1.16796875, 1.4794921875, 1.791015625, 2.1025390625, 2.4140625, 2.7255859375, 3.037109375, 3.3486328125, 3.66015625, 3.9716796875, 4.283203125, 4.5947265625, 4.90625, 5.2177734375, 5.529296875, 5.8408203125, 6.15234375, 6.4638671875, 6.775390625, 7.0869140625, 7.3984375, 7.7099609375, 8.021484375, 8.3330078125, 8.64453125, 8.9560546875, 9.267578125, 9.5791015625, 9.890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 5.0, 7.0, 7.0, 13.0, 14.0, 15.0, 16.0, 19.0, 23.0, 25.0, 39.0, 30.0, 43.0, 38.0, 45.0, 35.0, 42.0, 39.0, 45.0, 47.0, 42.0, 36.0, 39.0, 31.0, 35.0, 29.0, 25.0, 27.0, 16.0, 14.0, 25.0, 16.0, 13.0, 15.0, 11.0, 12.0, 14.0, 7.0, 4.0, 4.0, 9.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.125, -20.4111328125, -19.697265625, -18.9833984375, -18.26953125, -17.5556640625, -16.841796875, -16.1279296875, -15.4140625, -14.7001953125, -13.986328125, -13.2724609375, -12.55859375, -11.8447265625, -11.130859375, -10.4169921875, -9.703125, -8.9892578125, -8.275390625, -7.5615234375, -6.84765625, -6.1337890625, -5.419921875, -4.7060546875, -3.9921875, -3.2783203125, -2.564453125, -1.8505859375, -1.13671875, -0.4228515625, 0.291015625, 1.0048828125, 1.71875, 2.4326171875, 3.146484375, 3.8603515625, 4.57421875, 5.2880859375, 6.001953125, 6.7158203125, 7.4296875, 8.1435546875, 8.857421875, 9.5712890625, 10.28515625, 10.9990234375, 11.712890625, 12.4267578125, 13.140625, 13.8544921875, 14.568359375, 15.2822265625, 15.99609375, 16.7099609375, 17.423828125, 18.1376953125, 18.8515625, 19.5654296875, 20.279296875, 20.9931640625, 21.70703125, 22.4208984375, 23.134765625, 23.8486328125, 24.5625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 4.0, 6.0, 8.0, 20.0, 24.0, 47.0, 54.0, 122.0, 164.0, 290.0, 462.0, 651.0, 1026.0, 1613.0, 2617.0, 3843.0, 5898.0, 8552.0, 12361.0, 17456.0, 24564.0, 32697.0, 43540.0, 54014.0, 65667.0, 75435.0, 83939.0, 88095.0, 87830.0, 84123.0, 76186.0, 65817.0, 54223.0, 43426.0, 33667.0, 24565.0, 17656.0, 12363.0, 8650.0, 5820.0, 3925.0, 2584.0, 1623.0, 1069.0, 698.0, 422.0, 299.0, 169.0, 112.0, 63.0, 41.0, 28.0, 17.0, 13.0, 7.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.953125, -9.6422119140625, -9.331298828125, -9.0203857421875, -8.70947265625, -8.3985595703125, -8.087646484375, -7.7767333984375, -7.4658203125, -7.1549072265625, -6.843994140625, -6.5330810546875, -6.22216796875, -5.9112548828125, -5.600341796875, -5.2894287109375, -4.978515625, -4.6676025390625, -4.356689453125, -4.0457763671875, -3.73486328125, -3.4239501953125, -3.113037109375, -2.8021240234375, -2.4912109375, -2.1802978515625, -1.869384765625, -1.5584716796875, -1.24755859375, -0.9366455078125, -0.625732421875, -0.3148193359375, -0.00390625, 0.3070068359375, 0.617919921875, 0.9288330078125, 1.23974609375, 1.5506591796875, 1.861572265625, 2.1724853515625, 2.4833984375, 2.7943115234375, 3.105224609375, 3.4161376953125, 3.72705078125, 4.0379638671875, 4.348876953125, 4.6597900390625, 4.970703125, 5.2816162109375, 5.592529296875, 5.9034423828125, 6.21435546875, 6.5252685546875, 6.836181640625, 7.1470947265625, 7.4580078125, 7.7689208984375, 8.079833984375, 8.3907470703125, 8.70166015625, 9.0125732421875, 9.323486328125, 9.6343994140625, 9.9453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 7.0, 9.0, 13.0, 12.0, 14.0, 12.0, 21.0, 27.0, 31.0, 21.0, 30.0, 32.0, 31.0, 34.0, 42.0, 27.0, 51.0, 40.0, 39.0, 43.0, 38.0, 43.0, 31.0, 38.0, 39.0, 41.0, 46.0, 33.0, 15.0, 23.0, 17.0, 16.0, 13.0, 9.0, 15.0, 9.0, 6.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.7421875, -14.2747802734375, -13.807373046875, -13.3399658203125, -12.87255859375, -12.4051513671875, -11.937744140625, -11.4703369140625, -11.0029296875, -10.5355224609375, -10.068115234375, -9.6007080078125, -9.13330078125, -8.6658935546875, -8.198486328125, -7.7310791015625, -7.263671875, -6.7962646484375, -6.328857421875, -5.8614501953125, -5.39404296875, -4.9266357421875, -4.459228515625, -3.9918212890625, -3.5244140625, -3.0570068359375, -2.589599609375, -2.1221923828125, -1.65478515625, -1.1873779296875, -0.719970703125, -0.2525634765625, 0.21484375, 0.6822509765625, 1.149658203125, 1.6170654296875, 2.08447265625, 2.5518798828125, 3.019287109375, 3.4866943359375, 3.9541015625, 4.4215087890625, 4.888916015625, 5.3563232421875, 5.82373046875, 6.2911376953125, 6.758544921875, 7.2259521484375, 7.693359375, 8.1607666015625, 8.628173828125, 9.0955810546875, 9.56298828125, 10.0303955078125, 10.497802734375, 10.9652099609375, 11.4326171875, 11.9000244140625, 12.367431640625, 12.8348388671875, 13.30224609375, 13.7696533203125, 14.237060546875, 14.7044677734375, 15.171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 14.0, 24.0, 25.0, 44.0, 86.0, 122.0, 215.0, 290.0, 461.0, 716.0, 1074.0, 1619.0, 2473.0, 3763.0, 5699.0, 8408.0, 12067.0, 17170.0, 24080.0, 32373.0, 42910.0, 54419.0, 66560.0, 77498.0, 85459.0, 89858.0, 89547.0, 85013.0, 76595.0, 65909.0, 53675.0, 42497.0, 32089.0, 23264.0, 16877.0, 11540.0, 8063.0, 5500.0, 3532.0, 2377.0, 1579.0, 1096.0, 709.0, 437.0, 301.0, 186.0, 120.0, 89.0, 62.0, 31.0, 15.0, 11.0, 11.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -3.00390625, -2.896484375, -2.7890625, -2.681640625, -2.57421875, -2.466796875, -2.359375, -2.251953125, -2.14453125, -2.037109375, -1.9296875, -1.822265625, -1.71484375, -1.607421875, -1.5, -1.392578125, -1.28515625, -1.177734375, -1.0703125, -0.962890625, -0.85546875, -0.748046875, -0.640625, -0.533203125, -0.42578125, -0.318359375, -0.2109375, -0.103515625, 0.00390625, 0.111328125, 0.21875, 0.326171875, 0.43359375, 0.541015625, 0.6484375, 0.755859375, 0.86328125, 0.970703125, 1.078125, 1.185546875, 1.29296875, 1.400390625, 1.5078125, 1.615234375, 1.72265625, 1.830078125, 1.9375, 2.044921875, 2.15234375, 2.259765625, 2.3671875, 2.474609375, 2.58203125, 2.689453125, 2.796875, 2.904296875, 3.01171875, 3.119140625, 3.2265625, 3.333984375, 3.44140625, 3.548828125, 3.65625, 3.763671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 6.0, 8.0, 7.0, 13.0, 15.0, 14.0, 25.0, 26.0, 25.0, 33.0, 34.0, 45.0, 35.0, 43.0, 26.0, 51.0, 47.0, 48.0, 47.0, 38.0, 42.0, 44.0, 38.0, 41.0, 48.0, 23.0, 26.0, 21.0, 19.0, 18.0, 16.0, 14.0, 10.0, 7.0, 10.0, 4.0, 4.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004868507385253906, -0.0004713982343673706, -0.0004559457302093506, -0.00044049322605133057, -0.00042504072189331055, -0.00040958821773529053, -0.0003941357135772705, -0.0003786832094192505, -0.00036323070526123047, -0.00034777820110321045, -0.00033232569694519043, -0.0003168731927871704, -0.0003014206886291504, -0.00028596818447113037, -0.00027051568031311035, -0.00025506317615509033, -0.0002396106719970703, -0.0002241581678390503, -0.00020870566368103027, -0.00019325315952301025, -0.00017780065536499023, -0.00016234815120697021, -0.0001468956470489502, -0.00013144314289093018, -0.00011599063873291016, -0.00010053813457489014, -8.508563041687012e-05, -6.96331262588501e-05, -5.418062210083008e-05, -3.872811794281006e-05, -2.327561378479004e-05, -7.82310962677002e-06, 7.62939453125e-06, 2.308189868927002e-05, 3.853440284729004e-05, 5.398690700531006e-05, 6.943941116333008e-05, 8.48919153213501e-05, 0.00010034441947937012, 0.00011579692363739014, 0.00013124942779541016, 0.00014670193195343018, 0.0001621544361114502, 0.00017760694026947021, 0.00019305944442749023, 0.00020851194858551025, 0.00022396445274353027, 0.0002394169569015503, 0.0002548694610595703, 0.00027032196521759033, 0.00028577446937561035, 0.00030122697353363037, 0.0003166794776916504, 0.0003321319818496704, 0.00034758448600769043, 0.00036303699016571045, 0.00037848949432373047, 0.0003939419984817505, 0.0004093945026397705, 0.00042484700679779053, 0.00044029951095581055, 0.00045575201511383057, 0.0004712045192718506, 0.0004866570234298706, 0.0005021095275878906]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 10.0, 11.0, 17.0, 34.0, 52.0, 76.0, 101.0, 161.0, 302.0, 479.0, 832.0, 1381.0, 2392.0, 4307.0, 7805.0, 13999.0, 24599.0, 41411.0, 65032.0, 93728.0, 122966.0, 140101.0, 140356.0, 123849.0, 96135.0, 66904.0, 42881.0, 25460.0, 14630.0, 8067.0, 4425.0, 2544.0, 1383.0, 837.0, 474.0, 307.0, 188.0, 115.0, 63.0, 40.0, 34.0, 16.0, 15.0, 11.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.73828125, -5.55914306640625, -5.3800048828125, -5.20086669921875, -5.021728515625, -4.84259033203125, -4.6634521484375, -4.48431396484375, -4.30517578125, -4.12603759765625, -3.9468994140625, -3.76776123046875, -3.588623046875, -3.40948486328125, -3.2303466796875, -3.05120849609375, -2.8720703125, -2.69293212890625, -2.5137939453125, -2.33465576171875, -2.155517578125, -1.97637939453125, -1.7972412109375, -1.61810302734375, -1.43896484375, -1.25982666015625, -1.0806884765625, -0.90155029296875, -0.722412109375, -0.54327392578125, -0.3641357421875, -0.18499755859375, -0.005859375, 0.17327880859375, 0.3524169921875, 0.53155517578125, 0.710693359375, 0.88983154296875, 1.0689697265625, 1.24810791015625, 1.42724609375, 1.60638427734375, 1.7855224609375, 1.96466064453125, 2.143798828125, 2.32293701171875, 2.5020751953125, 2.68121337890625, 2.8603515625, 3.03948974609375, 3.2186279296875, 3.39776611328125, 3.576904296875, 3.75604248046875, 3.9351806640625, 4.11431884765625, 4.29345703125, 4.47259521484375, 4.6517333984375, 4.83087158203125, 5.010009765625, 5.18914794921875, 5.3682861328125, 5.54742431640625, 5.7265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 11.0, 12.0, 16.0, 28.0, 35.0, 52.0, 50.0, 73.0, 66.0, 77.0, 71.0, 86.0, 79.0, 57.0, 53.0, 50.0, 39.0, 34.0, 18.0, 21.0, 14.0, 9.0, 7.0, 10.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6484375, -2.54962158203125, -2.4508056640625, -2.35198974609375, -2.253173828125, -2.15435791015625, -2.0555419921875, -1.95672607421875, -1.85791015625, -1.75909423828125, -1.6602783203125, -1.56146240234375, -1.462646484375, -1.36383056640625, -1.2650146484375, -1.16619873046875, -1.0673828125, -0.96856689453125, -0.8697509765625, -0.77093505859375, -0.672119140625, -0.57330322265625, -0.4744873046875, -0.37567138671875, -0.27685546875, -0.17803955078125, -0.0792236328125, 0.01959228515625, 0.118408203125, 0.21722412109375, 0.3160400390625, 0.41485595703125, 0.513671875, 0.61248779296875, 0.7113037109375, 0.81011962890625, 0.908935546875, 1.00775146484375, 1.1065673828125, 1.20538330078125, 1.30419921875, 1.40301513671875, 1.5018310546875, 1.60064697265625, 1.699462890625, 1.79827880859375, 1.8970947265625, 1.99591064453125, 2.0947265625, 2.19354248046875, 2.2923583984375, 2.39117431640625, 2.489990234375, 2.58880615234375, 2.6876220703125, 2.78643798828125, 2.88525390625, 2.98406982421875, 3.0828857421875, 3.18170166015625, 3.280517578125, 3.37933349609375, 3.4781494140625, 3.57696533203125, 3.67578125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 3.0, 10.0, 4.0, 8.0, 15.0, 14.0, 16.0, 20.0, 24.0, 31.0, 31.0, 34.0, 38.0, 49.0, 44.0, 34.0, 50.0, 46.0, 43.0, 60.0, 50.0, 54.0, 34.0, 34.0, 29.0, 38.0, 25.0, 35.0, 26.0, 16.0, 18.0, 17.0, 13.0, 11.0, 4.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.055950164794922, -20.318437576293945, -19.580923080444336, -18.84341049194336, -18.10589599609375, -17.368383407592773, -16.630870819091797, -15.893357276916504, -15.155843734741211, -14.418330192565918, -13.680816650390625, -12.943304061889648, -12.205790519714355, -11.468276977539062, -10.730764389038086, -9.993250846862793, -9.2557373046875, -8.518223762512207, -7.780710697174072, -7.0431976318359375, -6.3056840896606445, -5.568170547485352, -4.830657482147217, -4.093144416809082, -3.355630874633789, -2.618117570877075, -1.8806042671203613, -1.1430909633636475, -0.4055776596069336, 0.3319356441497803, 1.0694489479064941, 1.806962013244629, 2.544473648071289, 3.281986951828003, 4.019500255584717, 4.757013320922852, 5.4945268630981445, 6.2320404052734375, 6.969553470611572, 7.707066535949707, 8.444580078125, 9.182093620300293, 9.919607162475586, 10.657119750976562, 11.394633293151855, 12.132146835327148, 12.869659423828125, 13.607172966003418, 14.344686508178711, 15.082200050354004, 15.819713592529297, 16.557226181030273, 17.29473876953125, 18.03225326538086, 18.769765853881836, 19.507278442382812, 20.244792938232422, 20.9823055267334, 21.719820022583008, 22.457332611083984, 23.194847106933594, 23.93235969543457, 24.669872283935547, 25.407386779785156, 26.144899368286133]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 5.0, 11.0, 15.0, 12.0, 17.0, 19.0, 17.0, 19.0, 16.0, 20.0, 20.0, 26.0, 41.0, 33.0, 42.0, 37.0, 33.0, 41.0, 41.0, 29.0, 42.0, 27.0, 30.0, 36.0, 31.0, 28.0, 32.0, 36.0, 33.0, 23.0, 20.0, 17.0, 18.0, 12.0, 14.0, 14.0, 14.0, 10.0, 7.0, 8.0, 5.0, 2.0, 1.0, 6.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.244949340820312, -20.54758644104004, -19.8502254486084, -19.152862548828125, -18.455501556396484, -17.75813865661621, -17.060775756835938, -16.363414764404297, -15.666051864624023, -14.968689918518066, -14.27132797241211, -13.573965072631836, -12.876603126525879, -12.179241180419922, -11.481878280639648, -10.784516334533691, -10.087154388427734, -9.389792442321777, -8.69243049621582, -7.995067596435547, -7.29770565032959, -6.600343704223633, -5.902981281280518, -5.205618858337402, -4.508256912231445, -3.810894727706909, -3.113532543182373, -2.416170358657837, -1.7188081741333008, -1.0214459896087646, -0.3240838050842285, 0.3732786178588867, 1.0706405639648438, 1.7680027484893799, 2.465364933013916, 3.162727117538452, 3.8600893020629883, 4.557451248168945, 5.2548136711120605, 5.952176094055176, 6.649538040161133, 7.34689998626709, 8.044261932373047, 8.74162483215332, 9.438986778259277, 10.136348724365234, 10.833711624145508, 11.531073570251465, 12.228435516357422, 12.925797462463379, 13.623159408569336, 14.32052230834961, 15.017884254455566, 15.715246200561523, 16.412609100341797, 17.109970092773438, 17.80733299255371, 18.504695892333984, 19.202056884765625, 19.8994197845459, 20.596782684326172, 21.294143676757812, 21.991506576538086, 22.68886947631836, 23.38623046875]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 9.0, 13.0, 25.0, 32.0, 61.0, 85.0, 150.0, 231.0, 388.0, 637.0, 1021.0, 1711.0, 2809.0, 4456.0, 7241.0, 11192.0, 17135.0, 26202.0, 40102.0, 57452.0, 82096.0, 114521.0, 154157.0, 200747.0, 249627.0, 299891.0, 339749.0, 364447.0, 371885.0, 359539.0, 328077.0, 283398.0, 233772.0, 183669.0, 139324.0, 101167.0, 72459.0, 49494.0, 33328.0, 22198.0, 14603.0, 9298.0, 5978.0, 3786.0, 2335.0, 1468.0, 981.0, 565.0, 341.0, 177.0, 100.0, 65.0, 36.0, 29.0, 10.0, 13.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-15.3203125, -14.8309326171875, -14.341552734375, -13.8521728515625, -13.36279296875, -12.8734130859375, -12.384033203125, -11.8946533203125, -11.4052734375, -10.9158935546875, -10.426513671875, -9.9371337890625, -9.44775390625, -8.9583740234375, -8.468994140625, -7.9796142578125, -7.490234375, -7.0008544921875, -6.511474609375, -6.0220947265625, -5.53271484375, -5.0433349609375, -4.553955078125, -4.0645751953125, -3.5751953125, -3.0858154296875, -2.596435546875, -2.1070556640625, -1.61767578125, -1.1282958984375, -0.638916015625, -0.1495361328125, 0.33984375, 0.8292236328125, 1.318603515625, 1.8079833984375, 2.29736328125, 2.7867431640625, 3.276123046875, 3.7655029296875, 4.2548828125, 4.7442626953125, 5.233642578125, 5.7230224609375, 6.21240234375, 6.7017822265625, 7.191162109375, 7.6805419921875, 8.169921875, 8.6593017578125, 9.148681640625, 9.6380615234375, 10.12744140625, 10.6168212890625, 11.106201171875, 11.5955810546875, 12.0849609375, 12.5743408203125, 13.063720703125, 13.5531005859375, 14.04248046875, 14.5318603515625, 15.021240234375, 15.5106201171875, 16.0]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 6.0, 8.0, 11.0, 8.0, 11.0, 14.0, 25.0, 16.0, 14.0, 17.0, 23.0, 23.0, 33.0, 25.0, 31.0, 29.0, 41.0, 32.0, 34.0, 34.0, 36.0, 32.0, 42.0, 38.0, 30.0, 28.0, 38.0, 36.0, 29.0, 34.0, 22.0, 25.0, 17.0, 17.0, 16.0, 18.0, 17.0, 20.0, 12.0, 9.0, 5.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0], "bins": [-19.265625, -18.6513671875, -18.037109375, -17.4228515625, -16.80859375, -16.1943359375, -15.580078125, -14.9658203125, -14.3515625, -13.7373046875, -13.123046875, -12.5087890625, -11.89453125, -11.2802734375, -10.666015625, -10.0517578125, -9.4375, -8.8232421875, -8.208984375, -7.5947265625, -6.98046875, -6.3662109375, -5.751953125, -5.1376953125, -4.5234375, -3.9091796875, -3.294921875, -2.6806640625, -2.06640625, -1.4521484375, -0.837890625, -0.2236328125, 0.390625, 1.0048828125, 1.619140625, 2.2333984375, 2.84765625, 3.4619140625, 4.076171875, 4.6904296875, 5.3046875, 5.9189453125, 6.533203125, 7.1474609375, 7.76171875, 8.3759765625, 8.990234375, 9.6044921875, 10.21875, 10.8330078125, 11.447265625, 12.0615234375, 12.67578125, 13.2900390625, 13.904296875, 14.5185546875, 15.1328125, 15.7470703125, 16.361328125, 16.9755859375, 17.58984375, 18.2041015625, 18.818359375, 19.4326171875, 20.046875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 9.0, 28.0, 44.0, 71.0, 115.0, 284.0, 406.0, 759.0, 1326.0, 2446.0, 4342.0, 7719.0, 13263.0, 22447.0, 37630.0, 60941.0, 95656.0, 142795.0, 201659.0, 270704.0, 341678.0, 401014.0, 437632.0, 440497.0, 411464.0, 357677.0, 289614.0, 219212.0, 155765.0, 105152.0, 68496.0, 42410.0, 25610.0, 15166.0, 8918.0, 5138.0, 2782.0, 1523.0, 822.0, 478.0, 267.0, 132.0, 80.0, 44.0, 32.0, 14.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-21.21875, -20.578125, -19.9375, -19.296875, -18.65625, -18.015625, -17.375, -16.734375, -16.09375, -15.453125, -14.8125, -14.171875, -13.53125, -12.890625, -12.25, -11.609375, -10.96875, -10.328125, -9.6875, -9.046875, -8.40625, -7.765625, -7.125, -6.484375, -5.84375, -5.203125, -4.5625, -3.921875, -3.28125, -2.640625, -2.0, -1.359375, -0.71875, -0.078125, 0.5625, 1.203125, 1.84375, 2.484375, 3.125, 3.765625, 4.40625, 5.046875, 5.6875, 6.328125, 6.96875, 7.609375, 8.25, 8.890625, 9.53125, 10.171875, 10.8125, 11.453125, 12.09375, 12.734375, 13.375, 14.015625, 14.65625, 15.296875, 15.9375, 16.578125, 17.21875, 17.859375, 18.5, 19.140625, 19.78125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 9.0, 12.0, 10.0, 21.0, 25.0, 37.0, 36.0, 49.0, 47.0, 62.0, 94.0, 71.0, 101.0, 105.0, 109.0, 140.0, 137.0, 158.0, 161.0, 179.0, 191.0, 194.0, 193.0, 186.0, 172.0, 169.0, 166.0, 170.0, 157.0, 129.0, 117.0, 103.0, 105.0, 70.0, 64.0, 63.0, 50.0, 52.0, 27.0, 33.0, 27.0, 16.0, 13.0, 13.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.484375, -9.1710205078125, -8.857666015625, -8.5443115234375, -8.23095703125, -7.9176025390625, -7.604248046875, -7.2908935546875, -6.9775390625, -6.6641845703125, -6.350830078125, -6.0374755859375, -5.72412109375, -5.4107666015625, -5.097412109375, -4.7840576171875, -4.470703125, -4.1573486328125, -3.843994140625, -3.5306396484375, -3.21728515625, -2.9039306640625, -2.590576171875, -2.2772216796875, -1.9638671875, -1.6505126953125, -1.337158203125, -1.0238037109375, -0.71044921875, -0.3970947265625, -0.083740234375, 0.2296142578125, 0.54296875, 0.8563232421875, 1.169677734375, 1.4830322265625, 1.79638671875, 2.1097412109375, 2.423095703125, 2.7364501953125, 3.0498046875, 3.3631591796875, 3.676513671875, 3.9898681640625, 4.30322265625, 4.6165771484375, 4.929931640625, 5.2432861328125, 5.556640625, 5.8699951171875, 6.183349609375, 6.4967041015625, 6.81005859375, 7.1234130859375, 7.436767578125, 7.7501220703125, 8.0634765625, 8.3768310546875, 8.690185546875, 9.0035400390625, 9.31689453125, 9.6302490234375, 9.943603515625, 10.2569580078125, 10.5703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 8.0, 7.0, 8.0, 17.0, 13.0, 26.0, 22.0, 33.0, 38.0, 30.0, 39.0, 45.0, 38.0, 61.0, 57.0, 51.0, 58.0, 46.0, 38.0, 52.0, 42.0, 33.0, 56.0, 32.0, 19.0, 24.0, 26.0, 16.0, 13.0, 18.0, 8.0, 11.0, 5.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.26637840270996, -27.259370803833008, -26.252361297607422, -25.24535369873047, -24.238344192504883, -23.23133659362793, -22.224327087402344, -21.21731948852539, -20.210311889648438, -19.203304290771484, -18.1962947845459, -17.189287185668945, -16.18227767944336, -15.175270080566406, -14.168261528015137, -13.161252975463867, -12.154243469238281, -11.147234916687012, -10.140226364135742, -9.133218765258789, -8.126209259033203, -7.119201183319092, -6.1121931076049805, -5.105184555053711, -4.098176002502441, -3.091167449951172, -2.0841591358184814, -1.077150821685791, -0.07014226913452148, 0.936866283416748, 1.9438743591308594, 2.950882911682129, 3.9578933715820312, 4.964901924133301, 5.97191047668457, 6.978918552398682, 7.985927104949951, 8.992935180664062, 9.999943733215332, 11.006952285766602, 12.013960838317871, 13.02096939086914, 14.02797794342041, 15.03498649597168, 16.041994094848633, 17.04900360107422, 18.056011199951172, 19.063018798828125, 20.07002830505371, 21.077035903930664, 22.08404541015625, 23.091053009033203, 24.09806251525879, 25.105070114135742, 26.112079620361328, 27.11908721923828, 28.126094818115234, 29.133102416992188, 30.140111923217773, 31.147119522094727, 32.15412902832031, 33.161136627197266, 34.16814422607422, 35.17515563964844, 36.18216323852539]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 7.0, 5.0, 4.0, 11.0, 15.0, 13.0, 14.0, 25.0, 19.0, 21.0, 18.0, 12.0, 30.0, 35.0, 31.0, 44.0, 31.0, 38.0, 35.0, 40.0, 40.0, 39.0, 44.0, 41.0, 50.0, 32.0, 26.0, 31.0, 36.0, 18.0, 25.0, 32.0, 18.0, 19.0, 17.0, 11.0, 9.0, 13.0, 5.0, 13.0, 3.0, 5.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-28.070402145385742, -27.211172103881836, -26.35194206237793, -25.492712020874023, -24.633481979370117, -23.77425193786621, -22.915021896362305, -22.0557918548584, -21.196561813354492, -20.337331771850586, -19.47810173034668, -18.618871688842773, -17.759641647338867, -16.90041160583496, -16.041181564331055, -15.181951522827148, -14.322720527648926, -13.46349048614502, -12.604260444641113, -11.745030403137207, -10.8858003616333, -10.026569366455078, -9.167339324951172, -8.308109283447266, -7.448879718780518, -6.589649677276611, -5.730419635772705, -4.871189117431641, -4.011959075927734, -3.152729034423828, -2.293498992919922, -1.4342689514160156, -0.5750389099121094, 0.28419119119644165, 1.1434212923049927, 2.0026514530181885, 2.8618814945220947, 3.72111177444458, 4.580341815948486, 5.439571857452393, 6.298801898956299, 7.158031940460205, 8.01726245880127, 8.876492500305176, 9.735722541809082, 10.594952583312988, 11.454182624816895, 12.3134126663208, 13.172642707824707, 14.031872749328613, 14.89110279083252, 15.750332832336426, 16.60956382751465, 17.468793869018555, 18.32802391052246, 19.187253952026367, 20.046483993530273, 20.90571403503418, 21.764944076538086, 22.624174118041992, 23.4834041595459, 24.342634201049805, 25.20186424255371, 26.061094284057617, 26.920324325561523]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 20.0, 21.0, 56.0, 66.0, 86.0, 126.0, 204.0, 356.0, 576.0, 954.0, 1395.0, 2301.0, 3779.0, 6312.0, 10820.0, 18362.0, 31755.0, 58266.0, 108795.0, 204253.0, 257945.0, 155121.0, 82188.0, 44520.0, 24596.0, 14141.0, 8419.0, 5016.0, 3109.0, 1855.0, 1136.0, 682.0, 468.0, 316.0, 200.0, 118.0, 60.0, 52.0, 32.0, 20.0, 12.0, 11.0, 9.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.91241455078125, -3.7740478515625, -3.63568115234375, -3.497314453125, -3.35894775390625, -3.2205810546875, -3.08221435546875, -2.94384765625, -2.80548095703125, -2.6671142578125, -2.52874755859375, -2.390380859375, -2.25201416015625, -2.1136474609375, -1.97528076171875, -1.8369140625, -1.69854736328125, -1.5601806640625, -1.42181396484375, -1.283447265625, -1.14508056640625, -1.0067138671875, -0.86834716796875, -0.72998046875, -0.59161376953125, -0.4532470703125, -0.31488037109375, -0.176513671875, -0.03814697265625, 0.1002197265625, 0.23858642578125, 0.376953125, 0.51531982421875, 0.6536865234375, 0.79205322265625, 0.930419921875, 1.06878662109375, 1.2071533203125, 1.34552001953125, 1.48388671875, 1.62225341796875, 1.7606201171875, 1.89898681640625, 2.037353515625, 2.17572021484375, 2.3140869140625, 2.45245361328125, 2.5908203125, 2.72918701171875, 2.8675537109375, 3.00592041015625, 3.144287109375, 3.28265380859375, 3.4210205078125, 3.55938720703125, 3.69775390625, 3.83612060546875, 3.9744873046875, 4.11285400390625, 4.251220703125, 4.38958740234375, 4.5279541015625, 4.66632080078125, 4.8046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 4.0, 8.0, 13.0, 8.0, 19.0, 15.0, 24.0, 18.0, 19.0, 18.0, 28.0, 44.0, 30.0, 39.0, 38.0, 54.0, 53.0, 41.0, 37.0, 40.0, 45.0, 46.0, 49.0, 37.0, 27.0, 38.0, 26.0, 30.0, 22.0, 19.0, 15.0, 17.0, 18.0, 10.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-34.6875, -33.70654296875, -32.7255859375, -31.74462890625, -30.763671875, -29.78271484375, -28.8017578125, -27.82080078125, -26.83984375, -25.85888671875, -24.8779296875, -23.89697265625, -22.916015625, -21.93505859375, -20.9541015625, -19.97314453125, -18.9921875, -18.01123046875, -17.0302734375, -16.04931640625, -15.068359375, -14.08740234375, -13.1064453125, -12.12548828125, -11.14453125, -10.16357421875, -9.1826171875, -8.20166015625, -7.220703125, -6.23974609375, -5.2587890625, -4.27783203125, -3.296875, -2.31591796875, -1.3349609375, -0.35400390625, 0.626953125, 1.60791015625, 2.5888671875, 3.56982421875, 4.55078125, 5.53173828125, 6.5126953125, 7.49365234375, 8.474609375, 9.45556640625, 10.4365234375, 11.41748046875, 12.3984375, 13.37939453125, 14.3603515625, 15.34130859375, 16.322265625, 17.30322265625, 18.2841796875, 19.26513671875, 20.24609375, 21.22705078125, 22.2080078125, 23.18896484375, 24.169921875, 25.15087890625, 26.1318359375, 27.11279296875, 28.09375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 17.0, 21.0, 16.0, 27.0, 38.0, 71.0, 95.0, 110.0, 171.0, 259.0, 344.0, 465.0, 699.0, 961.0, 1470.0, 2173.0, 3041.0, 4595.0, 6919.0, 10136.0, 15297.0, 23584.0, 36700.0, 58502.0, 96715.0, 158424.0, 209388.0, 157166.0, 95521.0, 58112.0, 37101.0, 23659.0, 15355.0, 10170.0, 6702.0, 4554.0, 3019.0, 2141.0, 1491.0, 1005.0, 707.0, 478.0, 365.0, 221.0, 169.0, 129.0, 77.0, 53.0, 34.0, 22.0, 26.0, 12.0, 8.0, 7.0, 9.0, 1.0, 1.0, 3.0], "bins": [-3.857421875, -3.73870849609375, -3.6199951171875, -3.50128173828125, -3.382568359375, -3.26385498046875, -3.1451416015625, -3.02642822265625, -2.90771484375, -2.78900146484375, -2.6702880859375, -2.55157470703125, -2.432861328125, -2.31414794921875, -2.1954345703125, -2.07672119140625, -1.9580078125, -1.83929443359375, -1.7205810546875, -1.60186767578125, -1.483154296875, -1.36444091796875, -1.2457275390625, -1.12701416015625, -1.00830078125, -0.88958740234375, -0.7708740234375, -0.65216064453125, -0.533447265625, -0.41473388671875, -0.2960205078125, -0.17730712890625, -0.05859375, 0.06011962890625, 0.1788330078125, 0.29754638671875, 0.416259765625, 0.53497314453125, 0.6536865234375, 0.77239990234375, 0.89111328125, 1.00982666015625, 1.1285400390625, 1.24725341796875, 1.365966796875, 1.48468017578125, 1.6033935546875, 1.72210693359375, 1.8408203125, 1.95953369140625, 2.0782470703125, 2.19696044921875, 2.315673828125, 2.43438720703125, 2.5531005859375, 2.67181396484375, 2.79052734375, 2.90924072265625, 3.0279541015625, 3.14666748046875, 3.265380859375, 3.38409423828125, 3.5028076171875, 3.62152099609375, 3.740234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 5.0, 9.0, 6.0, 9.0, 19.0, 8.0, 18.0, 18.0, 23.0, 19.0, 22.0, 22.0, 27.0, 34.0, 29.0, 34.0, 35.0, 44.0, 32.0, 32.0, 46.0, 40.0, 28.0, 41.0, 39.0, 37.0, 28.0, 29.0, 27.0, 29.0, 29.0, 27.0, 18.0, 26.0, 10.0, 17.0, 15.0, 15.0, 7.0, 11.0, 6.0, 1.0, 6.0, 3.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.328125, -17.8021240234375, -17.276123046875, -16.7501220703125, -16.22412109375, -15.6981201171875, -15.172119140625, -14.6461181640625, -14.1201171875, -13.5941162109375, -13.068115234375, -12.5421142578125, -12.01611328125, -11.4901123046875, -10.964111328125, -10.4381103515625, -9.912109375, -9.3861083984375, -8.860107421875, -8.3341064453125, -7.80810546875, -7.2821044921875, -6.756103515625, -6.2301025390625, -5.7041015625, -5.1781005859375, -4.652099609375, -4.1260986328125, -3.60009765625, -3.0740966796875, -2.548095703125, -2.0220947265625, -1.49609375, -0.9700927734375, -0.444091796875, 0.0819091796875, 0.60791015625, 1.1339111328125, 1.659912109375, 2.1859130859375, 2.7119140625, 3.2379150390625, 3.763916015625, 4.2899169921875, 4.81591796875, 5.3419189453125, 5.867919921875, 6.3939208984375, 6.919921875, 7.4459228515625, 7.971923828125, 8.4979248046875, 9.02392578125, 9.5499267578125, 10.075927734375, 10.6019287109375, 11.1279296875, 11.6539306640625, 12.179931640625, 12.7059326171875, 13.23193359375, 13.7579345703125, 14.283935546875, 14.8099365234375, 15.3359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 7.0, 7.0, 6.0, 8.0, 5.0, 21.0, 24.0, 26.0, 53.0, 66.0, 97.0, 116.0, 162.0, 241.0, 345.0, 452.0, 676.0, 979.0, 1433.0, 2041.0, 3064.0, 4681.0, 7105.0, 11019.0, 17985.0, 29494.0, 51211.0, 95765.0, 186598.0, 260988.0, 167439.0, 85691.0, 46642.0, 27348.0, 16501.0, 10103.0, 6595.0, 4355.0, 2807.0, 1953.0, 1325.0, 919.0, 624.0, 441.0, 307.0, 252.0, 177.0, 113.0, 87.0, 59.0, 37.0, 29.0, 25.0, 18.0, 12.0, 9.0, 5.0, 11.0, 1.0, 2.0, 5.0], "bins": [-0.09564208984375, -0.09269142150878906, -0.08974075317382812, -0.08679008483886719, -0.08383941650390625, -0.08088874816894531, -0.07793807983398438, -0.07498741149902344, -0.0720367431640625, -0.06908607482910156, -0.06613540649414062, -0.06318473815917969, -0.06023406982421875, -0.05728340148925781, -0.054332733154296875, -0.05138206481933594, -0.048431396484375, -0.04548072814941406, -0.042530059814453125, -0.03957939147949219, -0.03662872314453125, -0.03367805480957031, -0.030727386474609375, -0.027776718139648438, -0.0248260498046875, -0.021875381469726562, -0.018924713134765625, -0.015974044799804688, -0.01302337646484375, -0.010072708129882812, -0.007122039794921875, -0.0041713714599609375, -0.001220703125, 0.0017299652099609375, 0.004680633544921875, 0.0076313018798828125, 0.01058197021484375, 0.013532638549804688, 0.016483306884765625, 0.019433975219726562, 0.0223846435546875, 0.025335311889648438, 0.028285980224609375, 0.031236648559570312, 0.03418731689453125, 0.03713798522949219, 0.040088653564453125, 0.04303932189941406, 0.045989990234375, 0.04894065856933594, 0.051891326904296875, 0.05484199523925781, 0.05779266357421875, 0.06074333190917969, 0.06369400024414062, 0.06664466857910156, 0.0695953369140625, 0.07254600524902344, 0.07549667358398438, 0.07844734191894531, 0.08139801025390625, 0.08434867858886719, 0.08729934692382812, 0.09025001525878906, 0.09320068359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 9.0, 1.0, 8.0, 10.0, 14.0, 14.0, 10.0, 14.0, 22.0, 17.0, 33.0, 22.0, 26.0, 39.0, 24.0, 42.0, 31.0, 41.0, 38.0, 44.0, 41.0, 50.0, 46.0, 34.0, 40.0, 36.0, 33.0, 43.0, 30.0, 20.0, 25.0, 19.0, 13.0, 24.0, 18.0, 12.0, 18.0, 9.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8298625946044922e-05, -1.7726793885231018e-05, -1.7154961824417114e-05, -1.658312976360321e-05, -1.6011297702789307e-05, -1.5439465641975403e-05, -1.4867633581161499e-05, -1.4295801520347595e-05, -1.3723969459533691e-05, -1.3152137398719788e-05, -1.2580305337905884e-05, -1.200847327709198e-05, -1.1436641216278076e-05, -1.0864809155464172e-05, -1.0292977094650269e-05, -9.721145033836365e-06, -9.149312973022461e-06, -8.577480912208557e-06, -8.005648851394653e-06, -7.4338167905807495e-06, -6.861984729766846e-06, -6.290152668952942e-06, -5.718320608139038e-06, -5.146488547325134e-06, -4.5746564865112305e-06, -4.002824425697327e-06, -3.430992364883423e-06, -2.859160304069519e-06, -2.2873282432556152e-06, -1.7154961824417114e-06, -1.1436641216278076e-06, -5.718320608139038e-07, 0.0, 5.718320608139038e-07, 1.1436641216278076e-06, 1.7154961824417114e-06, 2.2873282432556152e-06, 2.859160304069519e-06, 3.430992364883423e-06, 4.002824425697327e-06, 4.5746564865112305e-06, 5.146488547325134e-06, 5.718320608139038e-06, 6.290152668952942e-06, 6.861984729766846e-06, 7.4338167905807495e-06, 8.005648851394653e-06, 8.577480912208557e-06, 9.149312973022461e-06, 9.721145033836365e-06, 1.0292977094650269e-05, 1.0864809155464172e-05, 1.1436641216278076e-05, 1.200847327709198e-05, 1.2580305337905884e-05, 1.3152137398719788e-05, 1.3723969459533691e-05, 1.4295801520347595e-05, 1.4867633581161499e-05, 1.5439465641975403e-05, 1.6011297702789307e-05, 1.658312976360321e-05, 1.7154961824417114e-05, 1.7726793885231018e-05, 1.8298625946044922e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 6.0, 18.0, 17.0, 49.0, 62.0, 79.0, 109.0, 179.0, 271.0, 397.0, 598.0, 868.0, 1358.0, 1848.0, 2811.0, 3928.0, 6028.0, 8896.0, 12914.0, 19369.0, 29786.0, 46232.0, 75647.0, 133030.0, 242290.0, 188768.0, 101790.0, 59434.0, 37352.0, 24237.0, 16120.0, 10996.0, 7430.0, 5004.0, 3379.0, 2377.0, 1610.0, 1043.0, 733.0, 516.0, 362.0, 211.0, 135.0, 78.0, 73.0, 50.0, 27.0, 19.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2054443359375, -0.1991748809814453, -0.19290542602539062, -0.18663597106933594, -0.18036651611328125, -0.17409706115722656, -0.16782760620117188, -0.1615581512451172, -0.1552886962890625, -0.1490192413330078, -0.14274978637695312, -0.13648033142089844, -0.13021087646484375, -0.12394142150878906, -0.11767196655273438, -0.11140251159667969, -0.105133056640625, -0.09886360168457031, -0.09259414672851562, -0.08632469177246094, -0.08005523681640625, -0.07378578186035156, -0.06751632690429688, -0.06124687194824219, -0.0549774169921875, -0.04870796203613281, -0.042438507080078125, -0.03616905212402344, -0.02989959716796875, -0.023630142211914062, -0.017360687255859375, -0.011091232299804688, -0.00482177734375, 0.0014476776123046875, 0.007717132568359375, 0.013986587524414062, 0.02025604248046875, 0.026525497436523438, 0.032794952392578125, 0.03906440734863281, 0.0453338623046875, 0.05160331726074219, 0.057872772216796875, 0.06414222717285156, 0.07041168212890625, 0.07668113708496094, 0.08295059204101562, 0.08922004699707031, 0.095489501953125, 0.10175895690917969, 0.10802841186523438, 0.11429786682128906, 0.12056732177734375, 0.12683677673339844, 0.13310623168945312, 0.1393756866455078, 0.1456451416015625, 0.1519145965576172, 0.15818405151367188, 0.16445350646972656, 0.17072296142578125, 0.17699241638183594, 0.18326187133789062, 0.1895313262939453, 0.19580078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 8.0, 12.0, 8.0, 16.0, 22.0, 38.0, 37.0, 49.0, 61.0, 79.0, 109.0, 102.0, 97.0, 80.0, 63.0, 53.0, 34.0, 25.0, 20.0, 16.0, 10.0, 5.0, 8.0, 4.0, 8.0, 6.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09957218170166016, -0.09617805480957031, -0.09278392791748047, -0.08938980102539062, -0.08599567413330078, -0.08260154724121094, -0.0792074203491211, -0.07581329345703125, -0.0724191665649414, -0.06902503967285156, -0.06563091278076172, -0.062236785888671875, -0.05884265899658203, -0.05544853210449219, -0.052054405212402344, -0.0486602783203125, -0.045266151428222656, -0.04187202453613281, -0.03847789764404297, -0.035083770751953125, -0.03168964385986328, -0.028295516967773438, -0.024901390075683594, -0.02150726318359375, -0.018113136291503906, -0.014719009399414062, -0.011324882507324219, -0.007930755615234375, -0.004536628723144531, -0.0011425018310546875, 0.0022516250610351562, 0.005645751953125, 0.009039878845214844, 0.012434005737304688, 0.01582813262939453, 0.019222259521484375, 0.02261638641357422, 0.026010513305664062, 0.029404640197753906, 0.03279876708984375, 0.036192893981933594, 0.03958702087402344, 0.04298114776611328, 0.046375274658203125, 0.04976940155029297, 0.05316352844238281, 0.056557655334472656, 0.0599517822265625, 0.06334590911865234, 0.06674003601074219, 0.07013416290283203, 0.07352828979492188, 0.07692241668701172, 0.08031654357910156, 0.0837106704711914, 0.08710479736328125, 0.0904989242553711, 0.09389305114746094, 0.09728717803955078, 0.10068130493164062, 0.10407543182373047, 0.10746955871582031, 0.11086368560791016, 0.1142578125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 9.0, 9.0, 18.0, 20.0, 29.0, 29.0, 36.0, 33.0, 41.0, 38.0, 42.0, 60.0, 57.0, 51.0, 52.0, 44.0, 48.0, 51.0, 37.0, 38.0, 45.0, 42.0, 24.0, 21.0, 27.0, 19.0, 12.0, 15.0, 12.0, 11.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.633695602416992, -27.625804901123047, -26.6179141998291, -25.610023498535156, -24.60213279724121, -23.594242095947266, -22.586349487304688, -21.578460693359375, -20.570568084716797, -19.56267738342285, -18.554786682128906, -17.54689598083496, -16.539005279541016, -15.53111457824707, -14.523222923278809, -13.515332221984863, -12.507442474365234, -11.499551773071289, -10.491661071777344, -9.483770370483398, -8.475879669189453, -7.46798849105835, -6.460097312927246, -5.452206611633301, -4.4443159103393555, -3.43642520904541, -2.4285342693328857, -1.4206433296203613, -0.412752628326416, 0.5951380729675293, 1.6030292510986328, 2.610919952392578, 3.6188087463378906, 4.626699447631836, 5.634590148925781, 6.642481327056885, 7.65037202835083, 8.658262252807617, 9.666153907775879, 10.674044609069824, 11.68193531036377, 12.689826011657715, 13.69771671295166, 14.705608367919922, 15.713499069213867, 16.721389770507812, 17.729280471801758, 18.737171173095703, 19.74506187438965, 20.752952575683594, 21.76084327697754, 22.768733978271484, 23.77662467956543, 24.784515380859375, 25.792407989501953, 26.800296783447266, 27.808189392089844, 28.81608009338379, 29.823970794677734, 30.83186149597168, 31.839752197265625, 32.8476448059082, 33.855533599853516, 34.863426208496094, 35.871315002441406]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 9.0, 8.0, 3.0, 5.0, 10.0, 14.0, 12.0, 16.0, 25.0, 17.0, 24.0, 14.0, 15.0, 29.0, 34.0, 29.0, 41.0, 37.0, 37.0, 36.0, 38.0, 36.0, 42.0, 46.0, 43.0, 47.0, 37.0, 23.0, 31.0, 38.0, 17.0, 27.0, 29.0, 19.0, 20.0, 17.0, 12.0, 8.0, 14.0, 5.0, 13.0, 3.0, 4.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-28.29906463623047, -27.437580108642578, -26.576095581054688, -25.714611053466797, -24.85312843322754, -23.99164390563965, -23.130159378051758, -22.268674850463867, -21.407190322875977, -20.545705795288086, -19.684221267700195, -18.822738647460938, -17.961254119873047, -17.099769592285156, -16.238285064697266, -15.376800537109375, -14.5153169631958, -13.65383243560791, -12.792348861694336, -11.930864334106445, -11.069379806518555, -10.207895278930664, -9.34641170501709, -8.4849271774292, -7.623443126678467, -6.761959075927734, -5.900474548339844, -5.038990497589111, -4.177506446838379, -3.3160219192504883, -2.454537868499756, -1.5930533409118652, -0.7315692901611328, 0.12991493940353394, 0.9913991689682007, 1.8528833389282227, 2.714367628097534, 3.5758519172668457, 4.437335968017578, 5.298820495605469, 6.160304546356201, 7.021788597106934, 7.883273124694824, 8.744756698608398, 9.606241226196289, 10.46772575378418, 11.32921028137207, 12.190694808959961, 13.052178382873535, 13.913662910461426, 14.775146484375, 15.63663101196289, 16.49811553955078, 17.359600067138672, 18.221084594726562, 19.082569122314453, 19.94405174255371, 20.8055362701416, 21.667020797729492, 22.52850341796875, 23.38998794555664, 24.25147247314453, 25.112957000732422, 25.974441528320312, 26.835926055908203]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 13.0, 25.0, 38.0, 57.0, 109.0, 170.0, 258.0, 441.0, 590.0, 994.0, 1599.0, 2522.0, 3797.0, 5779.0, 8728.0, 12719.0, 18121.0, 25311.0, 34461.0, 45586.0, 57916.0, 69734.0, 80731.0, 87501.0, 92296.0, 90354.0, 84688.0, 74589.0, 63614.0, 50849.0, 39687.0, 29082.0, 21265.0, 14922.0, 10267.0, 6936.0, 4566.0, 2971.0, 1974.0, 1203.0, 848.0, 502.0, 298.0, 191.0, 104.0, 55.0, 41.0, 30.0, 12.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.1640625, -10.7884521484375, -10.412841796875, -10.0372314453125, -9.66162109375, -9.2860107421875, -8.910400390625, -8.5347900390625, -8.1591796875, -7.7835693359375, -7.407958984375, -7.0323486328125, -6.65673828125, -6.2811279296875, -5.905517578125, -5.5299072265625, -5.154296875, -4.7786865234375, -4.403076171875, -4.0274658203125, -3.65185546875, -3.2762451171875, -2.900634765625, -2.5250244140625, -2.1494140625, -1.7738037109375, -1.398193359375, -1.0225830078125, -0.64697265625, -0.2713623046875, 0.104248046875, 0.4798583984375, 0.85546875, 1.2310791015625, 1.606689453125, 1.9822998046875, 2.35791015625, 2.7335205078125, 3.109130859375, 3.4847412109375, 3.8603515625, 4.2359619140625, 4.611572265625, 4.9871826171875, 5.36279296875, 5.7384033203125, 6.114013671875, 6.4896240234375, 6.865234375, 7.2408447265625, 7.616455078125, 7.9920654296875, 8.36767578125, 8.7432861328125, 9.118896484375, 9.4945068359375, 9.8701171875, 10.2457275390625, 10.621337890625, 10.9969482421875, 11.37255859375, 11.7481689453125, 12.123779296875, 12.4993896484375, 12.875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 7.0, 3.0, 9.0, 4.0, 8.0, 8.0, 7.0, 10.0, 14.0, 26.0, 21.0, 17.0, 20.0, 19.0, 36.0, 42.0, 24.0, 34.0, 45.0, 37.0, 43.0, 40.0, 45.0, 38.0, 43.0, 41.0, 30.0, 34.0, 45.0, 27.0, 19.0, 18.0, 32.0, 21.0, 24.0, 17.0, 15.0, 22.0, 10.0, 10.0, 10.0, 7.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-29.34375, -28.453125, -27.5625, -26.671875, -25.78125, -24.890625, -24.0, -23.109375, -22.21875, -21.328125, -20.4375, -19.546875, -18.65625, -17.765625, -16.875, -15.984375, -15.09375, -14.203125, -13.3125, -12.421875, -11.53125, -10.640625, -9.75, -8.859375, -7.96875, -7.078125, -6.1875, -5.296875, -4.40625, -3.515625, -2.625, -1.734375, -0.84375, 0.046875, 0.9375, 1.828125, 2.71875, 3.609375, 4.5, 5.390625, 6.28125, 7.171875, 8.0625, 8.953125, 9.84375, 10.734375, 11.625, 12.515625, 13.40625, 14.296875, 15.1875, 16.078125, 16.96875, 17.859375, 18.75, 19.640625, 20.53125, 21.421875, 22.3125, 23.203125, 24.09375, 24.984375, 25.875, 26.765625, 27.65625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 22.0, 36.0, 31.0, 42.0, 88.0, 95.0, 199.0, 274.0, 435.0, 626.0, 1042.0, 1472.0, 2335.0, 3635.0, 5457.0, 7933.0, 12018.0, 17351.0, 23914.0, 32922.0, 43761.0, 55470.0, 68137.0, 78875.0, 87156.0, 91882.0, 91311.0, 85479.0, 76497.0, 65190.0, 52594.0, 40918.0, 30787.0, 22418.0, 15833.0, 10819.0, 7382.0, 4814.0, 3277.0, 2113.0, 1370.0, 917.0, 589.0, 358.0, 239.0, 167.0, 87.0, 65.0, 45.0, 21.0, 24.0, 13.0, 4.0, 7.0, 3.0, 1.0, 3.0], "bins": [-12.6953125, -12.3092041015625, -11.923095703125, -11.5369873046875, -11.15087890625, -10.7647705078125, -10.378662109375, -9.9925537109375, -9.6064453125, -9.2203369140625, -8.834228515625, -8.4481201171875, -8.06201171875, -7.6759033203125, -7.289794921875, -6.9036865234375, -6.517578125, -6.1314697265625, -5.745361328125, -5.3592529296875, -4.97314453125, -4.5870361328125, -4.200927734375, -3.8148193359375, -3.4287109375, -3.0426025390625, -2.656494140625, -2.2703857421875, -1.88427734375, -1.4981689453125, -1.112060546875, -0.7259521484375, -0.33984375, 0.0462646484375, 0.432373046875, 0.8184814453125, 1.20458984375, 1.5906982421875, 1.976806640625, 2.3629150390625, 2.7490234375, 3.1351318359375, 3.521240234375, 3.9073486328125, 4.29345703125, 4.6795654296875, 5.065673828125, 5.4517822265625, 5.837890625, 6.2239990234375, 6.610107421875, 6.9962158203125, 7.38232421875, 7.7684326171875, 8.154541015625, 8.5406494140625, 8.9267578125, 9.3128662109375, 9.698974609375, 10.0850830078125, 10.47119140625, 10.8572998046875, 11.243408203125, 11.6295166015625, 12.015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 5.0, 9.0, 13.0, 12.0, 21.0, 19.0, 28.0, 20.0, 26.0, 36.0, 29.0, 34.0, 41.0, 28.0, 41.0, 45.0, 43.0, 53.0, 46.0, 49.0, 43.0, 34.0, 51.0, 31.0, 37.0, 27.0, 30.0, 22.0, 19.0, 12.0, 16.0, 20.0, 13.0, 4.0, 5.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.140625, -19.5078125, -18.875, -18.2421875, -17.609375, -16.9765625, -16.34375, -15.7109375, -15.078125, -14.4453125, -13.8125, -13.1796875, -12.546875, -11.9140625, -11.28125, -10.6484375, -10.015625, -9.3828125, -8.75, -8.1171875, -7.484375, -6.8515625, -6.21875, -5.5859375, -4.953125, -4.3203125, -3.6875, -3.0546875, -2.421875, -1.7890625, -1.15625, -0.5234375, 0.109375, 0.7421875, 1.375, 2.0078125, 2.640625, 3.2734375, 3.90625, 4.5390625, 5.171875, 5.8046875, 6.4375, 7.0703125, 7.703125, 8.3359375, 8.96875, 9.6015625, 10.234375, 10.8671875, 11.5, 12.1328125, 12.765625, 13.3984375, 14.03125, 14.6640625, 15.296875, 15.9296875, 16.5625, 17.1953125, 17.828125, 18.4609375, 19.09375, 19.7265625, 20.359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 18.0, 22.0, 68.0, 67.0, 147.0, 189.0, 344.0, 580.0, 955.0, 1576.0, 2506.0, 4077.0, 6622.0, 10471.0, 15996.0, 24542.0, 35758.0, 49828.0, 66169.0, 81875.0, 94818.0, 103823.0, 104753.0, 99991.0, 88025.0, 73230.0, 56871.0, 41748.0, 29156.0, 20029.0, 12811.0, 8289.0, 5105.0, 3173.0, 1864.0, 1194.0, 713.0, 446.0, 241.0, 155.0, 116.0, 58.0, 40.0, 25.0, 19.0, 20.0, 8.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.4969482421875, -4.337646484375, -4.1783447265625, -4.01904296875, -3.8597412109375, -3.700439453125, -3.5411376953125, -3.3818359375, -3.2225341796875, -3.063232421875, -2.9039306640625, -2.74462890625, -2.5853271484375, -2.426025390625, -2.2667236328125, -2.107421875, -1.9481201171875, -1.788818359375, -1.6295166015625, -1.47021484375, -1.3109130859375, -1.151611328125, -0.9923095703125, -0.8330078125, -0.6737060546875, -0.514404296875, -0.3551025390625, -0.19580078125, -0.0364990234375, 0.122802734375, 0.2821044921875, 0.44140625, 0.6007080078125, 0.760009765625, 0.9193115234375, 1.07861328125, 1.2379150390625, 1.397216796875, 1.5565185546875, 1.7158203125, 1.8751220703125, 2.034423828125, 2.1937255859375, 2.35302734375, 2.5123291015625, 2.671630859375, 2.8309326171875, 2.990234375, 3.1495361328125, 3.308837890625, 3.4681396484375, 3.62744140625, 3.7867431640625, 3.946044921875, 4.1053466796875, 4.2646484375, 4.4239501953125, 4.583251953125, 4.7425537109375, 4.90185546875, 5.0611572265625, 5.220458984375, 5.3797607421875, 5.5390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 3.0, 7.0, 4.0, 8.0, 7.0, 14.0, 19.0, 13.0, 31.0, 11.0, 39.0, 28.0, 33.0, 53.0, 42.0, 41.0, 39.0, 51.0, 56.0, 38.0, 45.0, 43.0, 41.0, 35.0, 29.0, 28.0, 31.0, 35.0, 35.0, 21.0, 17.0, 18.0, 15.0, 18.0, 10.0, 8.0, 6.0, 6.0, 9.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006251335144042969, -0.0006050616502761841, -0.0005849897861480713, -0.0005649179220199585, -0.0005448460578918457, -0.0005247741937637329, -0.0005047023296356201, -0.0004846304655075073, -0.00046455860137939453, -0.00044448673725128174, -0.00042441487312316895, -0.00040434300899505615, -0.00038427114486694336, -0.00036419928073883057, -0.0003441274166107178, -0.000324055552482605, -0.0003039836883544922, -0.0002839118242263794, -0.0002638399600982666, -0.0002437680959701538, -0.00022369623184204102, -0.00020362436771392822, -0.00018355250358581543, -0.00016348063945770264, -0.00014340877532958984, -0.00012333691120147705, -0.00010326504707336426, -8.319318294525146e-05, -6.312131881713867e-05, -4.304945468902588e-05, -2.2977590560913086e-05, -2.905726432800293e-06, 1.71661376953125e-05, 3.723800182342529e-05, 5.7309865951538086e-05, 7.738173007965088e-05, 9.745359420776367e-05, 0.00011752545833587646, 0.00013759732246398926, 0.00015766918659210205, 0.00017774105072021484, 0.00019781291484832764, 0.00021788477897644043, 0.00023795664310455322, 0.000258028507232666, 0.0002781003713607788, 0.0002981722354888916, 0.0003182440996170044, 0.0003383159637451172, 0.00035838782787323, 0.0003784596920013428, 0.00039853155612945557, 0.00041860342025756836, 0.00043867528438568115, 0.00045874714851379395, 0.00047881901264190674, 0.0004988908767700195, 0.0005189627408981323, 0.0005390346050262451, 0.0005591064691543579, 0.0005791783332824707, 0.0005992501974105835, 0.0006193220615386963, 0.0006393939256668091, 0.0006594657897949219]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 4.0, 6.0, 6.0, 19.0, 21.0, 27.0, 47.0, 79.0, 148.0, 208.0, 354.0, 528.0, 926.0, 1456.0, 2433.0, 4226.0, 6729.0, 11386.0, 18063.0, 27982.0, 42246.0, 59558.0, 80044.0, 99224.0, 112139.0, 118207.0, 111845.0, 97762.0, 79215.0, 58755.0, 41604.0, 27771.0, 17612.0, 10927.0, 6787.0, 3950.0, 2524.0, 1472.0, 873.0, 523.0, 310.0, 213.0, 135.0, 76.0, 53.0, 36.0, 15.0, 15.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.58624267578125, -5.4029541015625, -5.21966552734375, -5.036376953125, -4.85308837890625, -4.6697998046875, -4.48651123046875, -4.30322265625, -4.11993408203125, -3.9366455078125, -3.75335693359375, -3.570068359375, -3.38677978515625, -3.2034912109375, -3.02020263671875, -2.8369140625, -2.65362548828125, -2.4703369140625, -2.28704833984375, -2.103759765625, -1.92047119140625, -1.7371826171875, -1.55389404296875, -1.37060546875, -1.18731689453125, -1.0040283203125, -0.82073974609375, -0.637451171875, -0.45416259765625, -0.2708740234375, -0.08758544921875, 0.095703125, 0.27899169921875, 0.4622802734375, 0.64556884765625, 0.828857421875, 1.01214599609375, 1.1954345703125, 1.37872314453125, 1.56201171875, 1.74530029296875, 1.9285888671875, 2.11187744140625, 2.295166015625, 2.47845458984375, 2.6617431640625, 2.84503173828125, 3.0283203125, 3.21160888671875, 3.3948974609375, 3.57818603515625, 3.761474609375, 3.94476318359375, 4.1280517578125, 4.31134033203125, 4.49462890625, 4.67791748046875, 4.8612060546875, 5.04449462890625, 5.227783203125, 5.41107177734375, 5.5943603515625, 5.77764892578125, 5.9609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 8.0, 12.0, 17.0, 24.0, 13.0, 15.0, 20.0, 27.0, 35.0, 33.0, 47.0, 52.0, 57.0, 60.0, 57.0, 52.0, 48.0, 45.0, 52.0, 35.0, 37.0, 47.0, 29.0, 31.0, 22.0, 20.0, 19.0, 19.0, 12.0, 10.0, 7.0, 6.0, 9.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.540985107421875, -2.45111083984375, -2.361236572265625, -2.2713623046875, -2.181488037109375, -2.09161376953125, -2.001739501953125, -1.911865234375, -1.821990966796875, -1.73211669921875, -1.642242431640625, -1.5523681640625, -1.462493896484375, -1.37261962890625, -1.282745361328125, -1.19287109375, -1.102996826171875, -1.01312255859375, -0.923248291015625, -0.8333740234375, -0.743499755859375, -0.65362548828125, -0.563751220703125, -0.473876953125, -0.384002685546875, -0.29412841796875, -0.204254150390625, -0.1143798828125, -0.024505615234375, 0.06536865234375, 0.155242919921875, 0.2451171875, 0.334991455078125, 0.42486572265625, 0.514739990234375, 0.6046142578125, 0.694488525390625, 0.78436279296875, 0.874237060546875, 0.964111328125, 1.053985595703125, 1.14385986328125, 1.233734130859375, 1.3236083984375, 1.413482666015625, 1.50335693359375, 1.593231201171875, 1.68310546875, 1.772979736328125, 1.86285400390625, 1.952728271484375, 2.0426025390625, 2.132476806640625, 2.22235107421875, 2.312225341796875, 2.402099609375, 2.491973876953125, 2.58184814453125, 2.671722412109375, 2.7615966796875, 2.851470947265625, 2.94134521484375, 3.031219482421875, 3.12109375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 7.0, 8.0, 17.0, 20.0, 23.0, 25.0, 29.0, 34.0, 35.0, 44.0, 43.0, 38.0, 65.0, 47.0, 41.0, 51.0, 34.0, 58.0, 45.0, 43.0, 43.0, 35.0, 35.0, 30.0, 24.0, 25.0, 18.0, 17.0, 12.0, 11.0, 7.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-29.038381576538086, -28.069211959838867, -27.10004425048828, -26.130874633789062, -25.161705017089844, -24.192535400390625, -23.223365783691406, -22.25419807434082, -21.2850284576416, -20.315858840942383, -19.346691131591797, -18.377521514892578, -17.40835189819336, -16.43918228149414, -15.470013618469238, -14.500844955444336, -13.531675338745117, -12.562505722045898, -11.593337059020996, -10.624168395996094, -9.654998779296875, -8.685829162597656, -7.716660499572754, -6.747491359710693, -5.778322219848633, -4.809153079986572, -3.8399839401245117, -2.870814800262451, -1.9016456604003906, -0.9324765205383301, 0.03669261932373047, 1.005861759185791, 1.9750328063964844, 2.944201946258545, 3.9133710861206055, 4.882540225982666, 5.851709365844727, 6.820878505706787, 7.790047645568848, 8.75921630859375, 9.728385925292969, 10.697555541992188, 11.66672420501709, 12.635892868041992, 13.605062484741211, 14.57423210144043, 15.543400764465332, 16.512569427490234, 17.481739044189453, 18.450908660888672, 19.42007827758789, 20.389245986938477, 21.358415603637695, 22.327585220336914, 23.2967529296875, 24.26592254638672, 25.235092163085938, 26.204261779785156, 27.173431396484375, 28.14259910583496, 29.11176872253418, 30.0809383392334, 31.050106048583984, 32.0192756652832, 32.98844528198242]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 12.0, 8.0, 16.0, 18.0, 12.0, 11.0, 19.0, 14.0, 23.0, 37.0, 23.0, 30.0, 38.0, 37.0, 34.0, 44.0, 38.0, 50.0, 35.0, 46.0, 43.0, 34.0, 38.0, 40.0, 41.0, 29.0, 33.0, 26.0, 24.0, 24.0, 27.0, 13.0, 11.0, 14.0, 10.0, 13.0, 7.0, 5.0, 4.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-36.32804489135742, -35.28412628173828, -34.24020767211914, -33.196285247802734, -32.152366638183594, -31.108448028564453, -30.064529418945312, -29.02060890197754, -27.976688385009766, -26.932769775390625, -25.88884925842285, -24.84493064880371, -23.801010131835938, -22.757091522216797, -21.713172912597656, -20.669252395629883, -19.625333786010742, -18.5814151763916, -17.537494659423828, -16.493576049804688, -15.449655532836914, -14.405736923217773, -13.361817359924316, -12.31789779663086, -11.273978233337402, -10.230058670043945, -9.186139106750488, -8.142219543457031, -7.098300457000732, -6.054380893707275, -5.010461807250977, -3.9665422439575195, -2.9226226806640625, -1.878703236579895, -0.8347837924957275, 0.2091355323791504, 1.2530550956726074, 2.2969746589660645, 3.3408937454223633, 4.38481330871582, 5.428732872009277, 6.472652435302734, 7.516571998596191, 8.560491561889648, 9.604410171508789, 10.648330688476562, 11.692249298095703, 12.73616886138916, 13.780088424682617, 14.824007987976074, 15.867927551269531, 16.911846160888672, 17.955766677856445, 18.999685287475586, 20.04360580444336, 21.0875244140625, 22.13144302368164, 23.17536163330078, 24.219282150268555, 25.263200759887695, 26.30712127685547, 27.35103988647461, 28.39495849609375, 29.438879013061523, 30.482799530029297]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 22.0, 32.0, 36.0, 83.0, 160.0, 249.0, 369.0, 678.0, 1120.0, 1734.0, 2893.0, 4851.0, 7642.0, 12161.0, 19829.0, 30566.0, 46333.0, 70380.0, 102451.0, 144796.0, 196940.0, 256585.0, 316472.0, 370762.0, 403870.0, 411042.0, 389506.0, 345703.0, 290207.0, 227561.0, 170103.0, 122646.0, 84954.0, 57589.0, 37960.0, 24651.0, 15775.0, 9783.0, 6066.0, 3751.0, 2239.0, 1521.0, 877.0, 573.0, 298.0, 195.0, 113.0, 70.0, 32.0, 26.0, 10.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-22.65625, -21.9541015625, -21.251953125, -20.5498046875, -19.84765625, -19.1455078125, -18.443359375, -17.7412109375, -17.0390625, -16.3369140625, -15.634765625, -14.9326171875, -14.23046875, -13.5283203125, -12.826171875, -12.1240234375, -11.421875, -10.7197265625, -10.017578125, -9.3154296875, -8.61328125, -7.9111328125, -7.208984375, -6.5068359375, -5.8046875, -5.1025390625, -4.400390625, -3.6982421875, -2.99609375, -2.2939453125, -1.591796875, -0.8896484375, -0.1875, 0.5146484375, 1.216796875, 1.9189453125, 2.62109375, 3.3232421875, 4.025390625, 4.7275390625, 5.4296875, 6.1318359375, 6.833984375, 7.5361328125, 8.23828125, 8.9404296875, 9.642578125, 10.3447265625, 11.046875, 11.7490234375, 12.451171875, 13.1533203125, 13.85546875, 14.5576171875, 15.259765625, 15.9619140625, 16.6640625, 17.3662109375, 18.068359375, 18.7705078125, 19.47265625, 20.1748046875, 20.876953125, 21.5791015625, 22.28125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 12.0, 7.0, 9.0, 13.0, 10.0, 11.0, 14.0, 19.0, 25.0, 35.0, 30.0, 37.0, 30.0, 31.0, 40.0, 45.0, 39.0, 49.0, 37.0, 41.0, 37.0, 37.0, 46.0, 33.0, 35.0, 31.0, 32.0, 36.0, 31.0, 21.0, 22.0, 18.0, 15.0, 13.0, 10.0, 5.0, 11.0, 4.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.0, -32.027587890625, -31.05517578125, -30.082763671875, -29.1103515625, -28.137939453125, -27.16552734375, -26.193115234375, -25.220703125, -24.248291015625, -23.27587890625, -22.303466796875, -21.3310546875, -20.358642578125, -19.38623046875, -18.413818359375, -17.44140625, -16.468994140625, -15.49658203125, -14.524169921875, -13.5517578125, -12.579345703125, -11.60693359375, -10.634521484375, -9.662109375, -8.689697265625, -7.71728515625, -6.744873046875, -5.7724609375, -4.800048828125, -3.82763671875, -2.855224609375, -1.8828125, -0.910400390625, 0.06201171875, 1.034423828125, 2.0068359375, 2.979248046875, 3.95166015625, 4.924072265625, 5.896484375, 6.868896484375, 7.84130859375, 8.813720703125, 9.7861328125, 10.758544921875, 11.73095703125, 12.703369140625, 13.67578125, 14.648193359375, 15.62060546875, 16.593017578125, 17.5654296875, 18.537841796875, 19.51025390625, 20.482666015625, 21.455078125, 22.427490234375, 23.39990234375, 24.372314453125, 25.3447265625, 26.317138671875, 27.28955078125, 28.261962890625, 29.234375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 8.0, 14.0, 18.0, 29.0, 46.0, 87.0, 122.0, 202.0, 320.0, 565.0, 845.0, 1269.0, 2259.0, 3583.0, 5981.0, 9259.0, 14895.0, 23113.0, 35322.0, 53428.0, 79082.0, 112495.0, 156054.0, 206316.0, 261005.0, 314570.0, 359178.0, 384947.0, 388824.0, 370778.0, 333052.0, 281312.0, 226414.0, 174213.0, 127608.0, 90093.0, 61735.0, 41263.0, 26717.0, 17652.0, 11074.0, 7156.0, 4447.0, 2619.0, 1670.0, 1079.0, 605.0, 359.0, 236.0, 156.0, 92.0, 56.0, 29.0, 17.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0], "bins": [-24.5625, -23.79931640625, -23.0361328125, -22.27294921875, -21.509765625, -20.74658203125, -19.9833984375, -19.22021484375, -18.45703125, -17.69384765625, -16.9306640625, -16.16748046875, -15.404296875, -14.64111328125, -13.8779296875, -13.11474609375, -12.3515625, -11.58837890625, -10.8251953125, -10.06201171875, -9.298828125, -8.53564453125, -7.7724609375, -7.00927734375, -6.24609375, -5.48291015625, -4.7197265625, -3.95654296875, -3.193359375, -2.43017578125, -1.6669921875, -0.90380859375, -0.140625, 0.62255859375, 1.3857421875, 2.14892578125, 2.912109375, 3.67529296875, 4.4384765625, 5.20166015625, 5.96484375, 6.72802734375, 7.4912109375, 8.25439453125, 9.017578125, 9.78076171875, 10.5439453125, 11.30712890625, 12.0703125, 12.83349609375, 13.5966796875, 14.35986328125, 15.123046875, 15.88623046875, 16.6494140625, 17.41259765625, 18.17578125, 18.93896484375, 19.7021484375, 20.46533203125, 21.228515625, 21.99169921875, 22.7548828125, 23.51806640625, 24.28125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 3.0, 1.0, 5.0, 8.0, 12.0, 18.0, 17.0, 24.0, 23.0, 36.0, 45.0, 37.0, 48.0, 84.0, 64.0, 81.0, 109.0, 108.0, 157.0, 162.0, 166.0, 174.0, 186.0, 191.0, 182.0, 212.0, 196.0, 167.0, 178.0, 176.0, 170.0, 141.0, 137.0, 121.0, 96.0, 88.0, 79.0, 64.0, 60.0, 53.0, 38.0, 46.0, 32.0, 23.0, 16.0, 10.0, 5.0, 7.0, 6.0, 6.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0], "bins": [-14.6875, -14.2421875, -13.796875, -13.3515625, -12.90625, -12.4609375, -12.015625, -11.5703125, -11.125, -10.6796875, -10.234375, -9.7890625, -9.34375, -8.8984375, -8.453125, -8.0078125, -7.5625, -7.1171875, -6.671875, -6.2265625, -5.78125, -5.3359375, -4.890625, -4.4453125, -4.0, -3.5546875, -3.109375, -2.6640625, -2.21875, -1.7734375, -1.328125, -0.8828125, -0.4375, 0.0078125, 0.453125, 0.8984375, 1.34375, 1.7890625, 2.234375, 2.6796875, 3.125, 3.5703125, 4.015625, 4.4609375, 4.90625, 5.3515625, 5.796875, 6.2421875, 6.6875, 7.1328125, 7.578125, 8.0234375, 8.46875, 8.9140625, 9.359375, 9.8046875, 10.25, 10.6953125, 11.140625, 11.5859375, 12.03125, 12.4765625, 12.921875, 13.3671875, 13.8125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 3.0, 10.0, 14.0, 14.0, 16.0, 23.0, 35.0, 23.0, 31.0, 39.0, 46.0, 51.0, 38.0, 43.0, 55.0, 60.0, 65.0, 51.0, 39.0, 49.0, 44.0, 32.0, 38.0, 26.0, 27.0, 24.0, 21.0, 15.0, 12.0, 8.0, 6.0, 6.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-45.22449493408203, -43.83989715576172, -42.455299377441406, -41.07070541381836, -39.68610763549805, -38.301509857177734, -36.91691589355469, -35.532318115234375, -34.14772033691406, -32.76312255859375, -31.37852668762207, -29.99393081665039, -28.609333038330078, -27.224735260009766, -25.840139389038086, -24.455543518066406, -23.070945739746094, -21.68634796142578, -20.3017520904541, -18.917156219482422, -17.53255844116211, -16.147960662841797, -14.763364791870117, -13.378767967224121, -11.994171142578125, -10.609574317932129, -9.224977493286133, -7.840380668640137, -6.455783843994141, -5.0711870193481445, -3.6865901947021484, -2.3019933700561523, -0.9173927307128906, 0.46720409393310547, 1.8518009185791016, 3.2363977432250977, 4.620994567871094, 6.00559139251709, 7.390188217163086, 8.774785041809082, 10.159381866455078, 11.543978691101074, 12.92857551574707, 14.313172340393066, 15.697769165039062, 17.082366943359375, 18.466962814331055, 19.851558685302734, 21.236156463623047, 22.62075424194336, 24.00535011291504, 25.38994598388672, 26.77454376220703, 28.159141540527344, 29.543737411499023, 30.928333282470703, 32.312931060791016, 33.69752883911133, 35.082122802734375, 36.46672058105469, 37.851318359375, 39.23591613769531, 40.620513916015625, 42.00510787963867, 43.389705657958984]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 8.0, 6.0, 8.0, 11.0, 10.0, 14.0, 13.0, 15.0, 16.0, 21.0, 24.0, 21.0, 44.0, 30.0, 25.0, 33.0, 45.0, 37.0, 42.0, 40.0, 49.0, 41.0, 33.0, 43.0, 32.0, 31.0, 32.0, 36.0, 24.0, 31.0, 24.0, 22.0, 31.0, 19.0, 18.0, 17.0, 6.0, 8.0, 6.0, 6.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.9935188293457, -40.708412170410156, -39.42330551147461, -38.13820266723633, -36.85309600830078, -35.567989349365234, -34.28288269042969, -32.99777603149414, -31.712671279907227, -30.42756462097168, -29.142459869384766, -27.85735321044922, -26.572246551513672, -25.287141799926758, -24.00203514099121, -22.716930389404297, -21.43182373046875, -20.146717071533203, -18.86161231994629, -17.576505661010742, -16.291400909423828, -15.006294250488281, -13.721187591552734, -12.436081886291504, -11.150976181030273, -9.865870475769043, -8.580764770507812, -7.295658111572266, -6.010552406311035, -4.725446701049805, -3.440340518951416, -2.1552343368530273, -0.8701324462890625, 0.41497349739074707, 1.7000794410705566, 2.985185384750366, 4.270291328430176, 5.555397033691406, 6.840503215789795, 8.125609397888184, 9.410715103149414, 10.695820808410645, 11.980926513671875, 13.266033172607422, 14.551138877868652, 15.836244583129883, 17.12135124206543, 18.406455993652344, 19.69156265258789, 20.976669311523438, 22.26177406311035, 23.5468807220459, 24.831985473632812, 26.11709213256836, 27.402198791503906, 28.687305450439453, 29.972410202026367, 31.257516860961914, 32.54262161254883, 33.827728271484375, 35.11283493041992, 36.39794158935547, 37.68304443359375, 38.9681510925293, 40.253257751464844]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 9.0, 11.0, 22.0, 27.0, 36.0, 65.0, 83.0, 172.0, 230.0, 356.0, 606.0, 934.0, 1616.0, 2764.0, 4866.0, 8639.0, 16234.0, 31448.0, 62997.0, 130136.0, 251858.0, 259758.0, 137760.0, 66476.0, 32979.0, 16869.0, 9083.0, 5171.0, 2927.0, 1716.0, 1023.0, 630.0, 365.0, 229.0, 150.0, 104.0, 59.0, 59.0, 26.0, 21.0, 18.0, 8.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.90625, -6.690673828125, -6.47509765625, -6.259521484375, -6.0439453125, -5.828369140625, -5.61279296875, -5.397216796875, -5.181640625, -4.966064453125, -4.75048828125, -4.534912109375, -4.3193359375, -4.103759765625, -3.88818359375, -3.672607421875, -3.45703125, -3.241455078125, -3.02587890625, -2.810302734375, -2.5947265625, -2.379150390625, -2.16357421875, -1.947998046875, -1.732421875, -1.516845703125, -1.30126953125, -1.085693359375, -0.8701171875, -0.654541015625, -0.43896484375, -0.223388671875, -0.0078125, 0.207763671875, 0.42333984375, 0.638916015625, 0.8544921875, 1.070068359375, 1.28564453125, 1.501220703125, 1.716796875, 1.932373046875, 2.14794921875, 2.363525390625, 2.5791015625, 2.794677734375, 3.01025390625, 3.225830078125, 3.44140625, 3.656982421875, 3.87255859375, 4.088134765625, 4.3037109375, 4.519287109375, 4.73486328125, 4.950439453125, 5.166015625, 5.381591796875, 5.59716796875, 5.812744140625, 6.0283203125, 6.243896484375, 6.45947265625, 6.675048828125, 6.890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 4.0, 5.0, 3.0, 6.0, 9.0, 13.0, 7.0, 9.0, 18.0, 18.0, 14.0, 23.0, 23.0, 32.0, 21.0, 25.0, 31.0, 34.0, 33.0, 45.0, 44.0, 47.0, 34.0, 41.0, 46.0, 31.0, 34.0, 36.0, 33.0, 37.0, 26.0, 31.0, 26.0, 29.0, 28.0, 19.0, 21.0, 7.0, 15.0, 13.0, 6.0, 5.0, 4.0, 7.0, 1.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-43.09375, -41.74951171875, -40.4052734375, -39.06103515625, -37.716796875, -36.37255859375, -35.0283203125, -33.68408203125, -32.33984375, -30.99560546875, -29.6513671875, -28.30712890625, -26.962890625, -25.61865234375, -24.2744140625, -22.93017578125, -21.5859375, -20.24169921875, -18.8974609375, -17.55322265625, -16.208984375, -14.86474609375, -13.5205078125, -12.17626953125, -10.83203125, -9.48779296875, -8.1435546875, -6.79931640625, -5.455078125, -4.11083984375, -2.7666015625, -1.42236328125, -0.078125, 1.26611328125, 2.6103515625, 3.95458984375, 5.298828125, 6.64306640625, 7.9873046875, 9.33154296875, 10.67578125, 12.02001953125, 13.3642578125, 14.70849609375, 16.052734375, 17.39697265625, 18.7412109375, 20.08544921875, 21.4296875, 22.77392578125, 24.1181640625, 25.46240234375, 26.806640625, 28.15087890625, 29.4951171875, 30.83935546875, 32.18359375, 33.52783203125, 34.8720703125, 36.21630859375, 37.560546875, 38.90478515625, 40.2490234375, 41.59326171875, 42.9375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 2.0, 5.0, 11.0, 25.0, 27.0, 39.0, 42.0, 64.0, 105.0, 167.0, 203.0, 316.0, 429.0, 710.0, 1030.0, 1538.0, 2304.0, 3376.0, 5246.0, 8066.0, 12678.0, 20587.0, 34526.0, 58954.0, 108722.0, 199327.0, 241067.0, 150994.0, 80698.0, 45206.0, 26529.0, 16204.0, 10233.0, 6544.0, 4140.0, 2838.0, 1819.0, 1214.0, 826.0, 558.0, 404.0, 288.0, 170.0, 100.0, 66.0, 52.0, 38.0, 28.0, 14.0, 13.0, 11.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.4609375, -6.26666259765625, -6.0723876953125, -5.87811279296875, -5.683837890625, -5.48956298828125, -5.2952880859375, -5.10101318359375, -4.90673828125, -4.71246337890625, -4.5181884765625, -4.32391357421875, -4.129638671875, -3.93536376953125, -3.7410888671875, -3.54681396484375, -3.3525390625, -3.15826416015625, -2.9639892578125, -2.76971435546875, -2.575439453125, -2.38116455078125, -2.1868896484375, -1.99261474609375, -1.79833984375, -1.60406494140625, -1.4097900390625, -1.21551513671875, -1.021240234375, -0.82696533203125, -0.6326904296875, -0.43841552734375, -0.244140625, -0.04986572265625, 0.1444091796875, 0.33868408203125, 0.532958984375, 0.72723388671875, 0.9215087890625, 1.11578369140625, 1.31005859375, 1.50433349609375, 1.6986083984375, 1.89288330078125, 2.087158203125, 2.28143310546875, 2.4757080078125, 2.66998291015625, 2.8642578125, 3.05853271484375, 3.2528076171875, 3.44708251953125, 3.641357421875, 3.83563232421875, 4.0299072265625, 4.22418212890625, 4.41845703125, 4.61273193359375, 4.8070068359375, 5.00128173828125, 5.195556640625, 5.38983154296875, 5.5841064453125, 5.77838134765625, 5.97265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 7.0, 13.0, 12.0, 13.0, 15.0, 21.0, 21.0, 25.0, 21.0, 23.0, 33.0, 34.0, 41.0, 42.0, 45.0, 39.0, 41.0, 46.0, 45.0, 32.0, 44.0, 50.0, 44.0, 42.0, 35.0, 40.0, 29.0, 33.0, 18.0, 16.0, 17.0, 14.0, 9.0, 16.0, 10.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.96875, -34.03271484375, -33.0966796875, -32.16064453125, -31.224609375, -30.28857421875, -29.3525390625, -28.41650390625, -27.48046875, -26.54443359375, -25.6083984375, -24.67236328125, -23.736328125, -22.80029296875, -21.8642578125, -20.92822265625, -19.9921875, -19.05615234375, -18.1201171875, -17.18408203125, -16.248046875, -15.31201171875, -14.3759765625, -13.43994140625, -12.50390625, -11.56787109375, -10.6318359375, -9.69580078125, -8.759765625, -7.82373046875, -6.8876953125, -5.95166015625, -5.015625, -4.07958984375, -3.1435546875, -2.20751953125, -1.271484375, -0.33544921875, 0.6005859375, 1.53662109375, 2.47265625, 3.40869140625, 4.3447265625, 5.28076171875, 6.216796875, 7.15283203125, 8.0888671875, 9.02490234375, 9.9609375, 10.89697265625, 11.8330078125, 12.76904296875, 13.705078125, 14.64111328125, 15.5771484375, 16.51318359375, 17.44921875, 18.38525390625, 19.3212890625, 20.25732421875, 21.193359375, 22.12939453125, 23.0654296875, 24.00146484375, 24.9375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 5.0, 8.0, 10.0, 12.0, 32.0, 46.0, 41.0, 93.0, 113.0, 174.0, 227.0, 374.0, 517.0, 790.0, 1177.0, 1731.0, 2803.0, 4372.0, 6968.0, 11353.0, 19527.0, 34824.0, 66068.0, 141298.0, 290024.0, 237924.0, 105662.0, 51991.0, 27903.0, 16200.0, 9591.0, 6025.0, 3656.0, 2378.0, 1510.0, 995.0, 665.0, 424.0, 325.0, 221.0, 145.0, 104.0, 72.0, 54.0, 36.0, 26.0, 14.0, 13.0, 9.0, 8.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.163330078125, -0.15819740295410156, -0.15306472778320312, -0.1479320526123047, -0.14279937744140625, -0.1376667022705078, -0.13253402709960938, -0.12740135192871094, -0.1222686767578125, -0.11713600158691406, -0.11200332641601562, -0.10687065124511719, -0.10173797607421875, -0.09660530090332031, -0.09147262573242188, -0.08633995056152344, -0.081207275390625, -0.07607460021972656, -0.07094192504882812, -0.06580924987792969, -0.06067657470703125, -0.05554389953613281, -0.050411224365234375, -0.04527854919433594, -0.0401458740234375, -0.03501319885253906, -0.029880523681640625, -0.024747848510742188, -0.01961517333984375, -0.014482498168945312, -0.009349822998046875, -0.0042171478271484375, 0.00091552734375, 0.0060482025146484375, 0.011180877685546875, 0.016313552856445312, 0.02144622802734375, 0.026578903198242188, 0.031711578369140625, 0.03684425354003906, 0.0419769287109375, 0.04710960388183594, 0.052242279052734375, 0.05737495422363281, 0.06250762939453125, 0.06764030456542969, 0.07277297973632812, 0.07790565490722656, 0.083038330078125, 0.08817100524902344, 0.09330368041992188, 0.09843635559082031, 0.10356903076171875, 0.10870170593261719, 0.11383438110351562, 0.11896705627441406, 0.1240997314453125, 0.12923240661621094, 0.13436508178710938, 0.1394977569580078, 0.14463043212890625, 0.1497631072998047, 0.15489578247070312, 0.16002845764160156, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 14.0, 7.0, 6.0, 15.0, 20.0, 17.0, 19.0, 26.0, 26.0, 42.0, 34.0, 39.0, 52.0, 46.0, 46.0, 49.0, 65.0, 47.0, 42.0, 44.0, 47.0, 36.0, 29.0, 34.0, 32.0, 16.0, 24.0, 16.0, 16.0, 15.0, 12.0, 11.0, 7.0, 9.0, 6.0, 4.0, 9.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.236532211303711e-05, -3.1412579119205475e-05, -3.045983612537384e-05, -2.9507093131542206e-05, -2.855435013771057e-05, -2.7601607143878937e-05, -2.6648864150047302e-05, -2.5696121156215668e-05, -2.4743378162384033e-05, -2.37906351685524e-05, -2.2837892174720764e-05, -2.188514918088913e-05, -2.0932406187057495e-05, -1.997966319322586e-05, -1.9026920199394226e-05, -1.807417720556259e-05, -1.7121434211730957e-05, -1.6168691217899323e-05, -1.5215948224067688e-05, -1.4263205230236053e-05, -1.3310462236404419e-05, -1.2357719242572784e-05, -1.140497624874115e-05, -1.0452233254909515e-05, -9.499490261077881e-06, -8.546747267246246e-06, -7.594004273414612e-06, -6.641261279582977e-06, -5.688518285751343e-06, -4.735775291919708e-06, -3.7830322980880737e-06, -2.830289304256439e-06, -1.8775463104248047e-06, -9.248033165931702e-07, 2.7939677238464355e-08, 9.806826710700989e-07, 1.9334256649017334e-06, 2.886168658733368e-06, 3.8389116525650024e-06, 4.791654646396637e-06, 5.7443976402282715e-06, 6.697140634059906e-06, 7.64988362789154e-06, 8.602626621723175e-06, 9.55536961555481e-06, 1.0508112609386444e-05, 1.1460855603218079e-05, 1.2413598597049713e-05, 1.3366341590881348e-05, 1.4319084584712982e-05, 1.5271827578544617e-05, 1.622457057237625e-05, 1.7177313566207886e-05, 1.813005656003952e-05, 1.9082799553871155e-05, 2.003554254770279e-05, 2.0988285541534424e-05, 2.194102853536606e-05, 2.2893771529197693e-05, 2.3846514523029327e-05, 2.4799257516860962e-05, 2.5752000510692596e-05, 2.670474350452423e-05, 2.7657486498355865e-05, 2.86102294921875e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 8.0, 15.0, 19.0, 28.0, 49.0, 63.0, 113.0, 161.0, 228.0, 321.0, 558.0, 870.0, 1358.0, 2209.0, 3300.0, 5314.0, 8135.0, 13083.0, 21016.0, 33844.0, 59174.0, 112898.0, 258060.0, 261651.0, 114712.0, 59333.0, 34620.0, 21215.0, 13107.0, 8367.0, 5342.0, 3327.0, 2181.0, 1422.0, 857.0, 573.0, 337.0, 228.0, 155.0, 113.0, 64.0, 41.0, 34.0, 19.0, 13.0, 5.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40185546875, -0.3893013000488281, -0.37674713134765625, -0.3641929626464844, -0.3516387939453125, -0.3390846252441406, -0.32653045654296875, -0.3139762878417969, -0.301422119140625, -0.2888679504394531, -0.27631378173828125, -0.2637596130371094, -0.2512054443359375, -0.23865127563476562, -0.22609710693359375, -0.21354293823242188, -0.20098876953125, -0.18843460083007812, -0.17588043212890625, -0.16332626342773438, -0.1507720947265625, -0.13821792602539062, -0.12566375732421875, -0.11310958862304688, -0.100555419921875, -0.08800125122070312, -0.07544708251953125, -0.06289291381835938, -0.0503387451171875, -0.037784576416015625, -0.02523040771484375, -0.012676239013671875, -0.0001220703125, 0.012432098388671875, 0.02498626708984375, 0.037540435791015625, 0.0500946044921875, 0.06264877319335938, 0.07520294189453125, 0.08775711059570312, 0.100311279296875, 0.11286544799804688, 0.12541961669921875, 0.13797378540039062, 0.1505279541015625, 0.16308212280273438, 0.17563629150390625, 0.18819046020507812, 0.20074462890625, 0.21329879760742188, 0.22585296630859375, 0.23840713500976562, 0.2509613037109375, 0.2635154724121094, 0.27606964111328125, 0.2886238098144531, 0.301177978515625, 0.3137321472167969, 0.32628631591796875, 0.3388404846191406, 0.3513946533203125, 0.3639488220214844, 0.37650299072265625, 0.3890571594238281, 0.401611328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 2.0, 9.0, 8.0, 12.0, 15.0, 19.0, 24.0, 55.0, 64.0, 93.0, 138.0, 133.0, 117.0, 75.0, 51.0, 46.0, 24.0, 18.0, 16.0, 19.0, 9.0, 6.0, 8.0, 1.0, 3.0, 6.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.144287109375, -0.13939666748046875, -0.1345062255859375, -0.12961578369140625, -0.124725341796875, -0.11983489990234375, -0.1149444580078125, -0.11005401611328125, -0.10516357421875, -0.10027313232421875, -0.0953826904296875, -0.09049224853515625, -0.085601806640625, -0.08071136474609375, -0.0758209228515625, -0.07093048095703125, -0.0660400390625, -0.06114959716796875, -0.0562591552734375, -0.05136871337890625, -0.046478271484375, -0.04158782958984375, -0.0366973876953125, -0.03180694580078125, -0.02691650390625, -0.02202606201171875, -0.0171356201171875, -0.01224517822265625, -0.007354736328125, -0.00246429443359375, 0.0024261474609375, 0.00731658935546875, 0.01220703125, 0.01709747314453125, 0.0219879150390625, 0.02687835693359375, 0.031768798828125, 0.03665924072265625, 0.0415496826171875, 0.04644012451171875, 0.05133056640625, 0.05622100830078125, 0.0611114501953125, 0.06600189208984375, 0.070892333984375, 0.07578277587890625, 0.0806732177734375, 0.08556365966796875, 0.0904541015625, 0.09534454345703125, 0.1002349853515625, 0.10512542724609375, 0.110015869140625, 0.11490631103515625, 0.1197967529296875, 0.12468719482421875, 0.12957763671875, 0.13446807861328125, 0.1393585205078125, 0.14424896240234375, 0.149139404296875, 0.15402984619140625, 0.1589202880859375, 0.16381072998046875, 0.168701171875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 3.0, 8.0, 12.0, 19.0, 17.0, 24.0, 26.0, 28.0, 31.0, 44.0, 40.0, 52.0, 39.0, 45.0, 53.0, 66.0, 53.0, 49.0, 44.0, 52.0, 38.0, 31.0, 41.0, 30.0, 24.0, 25.0, 20.0, 15.0, 13.0, 7.0, 8.0, 5.0, 7.0, 3.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-45.227149963378906, -43.85004425048828, -42.47293472290039, -41.095829010009766, -39.718719482421875, -38.34161376953125, -36.964508056640625, -35.587398529052734, -34.21029281616211, -32.833187103271484, -31.456077575683594, -30.07897186279297, -28.70186424255371, -27.324756622314453, -25.947649002075195, -24.570541381835938, -23.19343376159668, -21.816326141357422, -20.439218521118164, -19.062110900878906, -17.68500518798828, -16.307897567749023, -14.930789947509766, -13.553683280944824, -12.176575660705566, -10.799468040466309, -9.422361373901367, -8.04525375366211, -6.66814661026001, -5.29103946685791, -3.9139318466186523, -2.536825180053711, -1.1597175598144531, 0.21738970279693604, 1.5944969654083252, 2.971604347229004, 4.3487114906311035, 5.725818634033203, 7.102926254272461, 8.480032920837402, 9.85714054107666, 11.234248161315918, 12.61135482788086, 13.988462448120117, 15.365570068359375, 16.74267578125, 18.11978530883789, 19.496891021728516, 20.873998641967773, 22.25110626220703, 23.62821388244629, 25.005321502685547, 26.382427215576172, 27.75953483581543, 29.136642456054688, 30.513748168945312, 31.890857696533203, 33.26796340942383, 34.64507293701172, 36.022178649902344, 37.399288177490234, 38.77639389038086, 40.15350341796875, 41.530609130859375, 42.90771484375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 8.0, 5.0, 8.0, 11.0, 11.0, 14.0, 13.0, 15.0, 16.0, 22.0, 21.0, 22.0, 42.0, 32.0, 26.0, 33.0, 43.0, 33.0, 47.0, 38.0, 50.0, 42.0, 31.0, 47.0, 31.0, 29.0, 31.0, 39.0, 25.0, 28.0, 25.0, 23.0, 31.0, 17.0, 20.0, 16.0, 6.0, 10.0, 5.0, 5.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.083160400390625, -40.79657745361328, -39.50999450683594, -38.223411560058594, -36.936832427978516, -35.65024948120117, -34.36366653442383, -33.077083587646484, -31.79050064086914, -30.503917694091797, -29.217336654663086, -27.930753707885742, -26.6441707611084, -25.357589721679688, -24.071006774902344, -22.784423828125, -21.49784278869629, -20.211259841918945, -18.924678802490234, -17.63809585571289, -16.351512908935547, -15.06493091583252, -13.778348922729492, -12.491765975952148, -11.205183982849121, -9.918601989746094, -8.63201904296875, -7.345437049865723, -6.058854579925537, -4.772272109985352, -3.485690116882324, -2.1991071701049805, -0.9125251770019531, 0.37405717372894287, 1.6606395244598389, 2.9472217559814453, 4.233804225921631, 5.520386695861816, 6.806968688964844, 8.093551635742188, 9.380133628845215, 10.666715621948242, 11.953298568725586, 13.239880561828613, 14.52646255493164, 15.813045501708984, 17.099628448486328, 18.386211395263672, 19.672792434692383, 20.959375381469727, 22.245956420898438, 23.53253936767578, 24.819122314453125, 26.10570526123047, 27.39228630065918, 28.678869247436523, 29.965450286865234, 31.252033233642578, 32.53861618041992, 33.8251953125, 35.111778259277344, 36.39836120605469, 37.68494415283203, 38.971527099609375, 40.25811004638672]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 14.0, 34.0, 45.0, 65.0, 145.0, 198.0, 300.0, 467.0, 747.0, 1161.0, 1929.0, 3117.0, 4886.0, 7866.0, 12285.0, 18455.0, 28095.0, 40426.0, 55823.0, 72772.0, 90057.0, 104180.0, 110282.0, 108074.0, 97672.0, 81825.0, 63566.0, 47125.0, 33310.0, 22457.0, 14951.0, 9620.0, 6072.0, 3906.0, 2386.0, 1573.0, 934.0, 648.0, 366.0, 259.0, 154.0, 116.0, 65.0, 40.0, 29.0, 14.0, 7.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0], "bins": [-21.390625, -20.756591796875, -20.12255859375, -19.488525390625, -18.8544921875, -18.220458984375, -17.58642578125, -16.952392578125, -16.318359375, -15.684326171875, -15.05029296875, -14.416259765625, -13.7822265625, -13.148193359375, -12.51416015625, -11.880126953125, -11.24609375, -10.612060546875, -9.97802734375, -9.343994140625, -8.7099609375, -8.075927734375, -7.44189453125, -6.807861328125, -6.173828125, -5.539794921875, -4.90576171875, -4.271728515625, -3.6376953125, -3.003662109375, -2.36962890625, -1.735595703125, -1.1015625, -0.467529296875, 0.16650390625, 0.800537109375, 1.4345703125, 2.068603515625, 2.70263671875, 3.336669921875, 3.970703125, 4.604736328125, 5.23876953125, 5.872802734375, 6.5068359375, 7.140869140625, 7.77490234375, 8.408935546875, 9.04296875, 9.677001953125, 10.31103515625, 10.945068359375, 11.5791015625, 12.213134765625, 12.84716796875, 13.481201171875, 14.115234375, 14.749267578125, 15.38330078125, 16.017333984375, 16.6513671875, 17.285400390625, 17.91943359375, 18.553466796875, 19.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 2.0, 3.0, 9.0, 8.0, 11.0, 7.0, 13.0, 11.0, 16.0, 20.0, 13.0, 25.0, 23.0, 24.0, 37.0, 31.0, 25.0, 46.0, 33.0, 38.0, 34.0, 41.0, 34.0, 37.0, 42.0, 40.0, 36.0, 33.0, 33.0, 26.0, 25.0, 25.0, 22.0, 27.0, 30.0, 23.0, 20.0, 11.0, 15.0, 8.0, 9.0, 7.0, 6.0, 4.0, 2.0, 7.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.6875, -36.46533203125, -35.2431640625, -34.02099609375, -32.798828125, -31.57666015625, -30.3544921875, -29.13232421875, -27.91015625, -26.68798828125, -25.4658203125, -24.24365234375, -23.021484375, -21.79931640625, -20.5771484375, -19.35498046875, -18.1328125, -16.91064453125, -15.6884765625, -14.46630859375, -13.244140625, -12.02197265625, -10.7998046875, -9.57763671875, -8.35546875, -7.13330078125, -5.9111328125, -4.68896484375, -3.466796875, -2.24462890625, -1.0224609375, 0.19970703125, 1.421875, 2.64404296875, 3.8662109375, 5.08837890625, 6.310546875, 7.53271484375, 8.7548828125, 9.97705078125, 11.19921875, 12.42138671875, 13.6435546875, 14.86572265625, 16.087890625, 17.31005859375, 18.5322265625, 19.75439453125, 20.9765625, 22.19873046875, 23.4208984375, 24.64306640625, 25.865234375, 27.08740234375, 28.3095703125, 29.53173828125, 30.75390625, 31.97607421875, 33.1982421875, 34.42041015625, 35.642578125, 36.86474609375, 38.0869140625, 39.30908203125, 40.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 13.0, 13.0, 26.0, 41.0, 58.0, 110.0, 135.0, 210.0, 360.0, 542.0, 922.0, 1534.0, 2318.0, 3911.0, 6405.0, 10348.0, 16782.0, 26181.0, 40350.0, 59108.0, 81375.0, 103945.0, 121262.0, 126213.0, 117517.0, 99174.0, 76516.0, 54365.0, 36461.0, 23420.0, 15042.0, 9033.0, 5686.0, 3562.0, 2176.0, 1325.0, 787.0, 504.0, 282.0, 204.0, 141.0, 73.0, 44.0, 31.0, 21.0, 13.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.875, -25.075927734375, -24.27685546875, -23.477783203125, -22.6787109375, -21.879638671875, -21.08056640625, -20.281494140625, -19.482421875, -18.683349609375, -17.88427734375, -17.085205078125, -16.2861328125, -15.487060546875, -14.68798828125, -13.888916015625, -13.08984375, -12.290771484375, -11.49169921875, -10.692626953125, -9.8935546875, -9.094482421875, -8.29541015625, -7.496337890625, -6.697265625, -5.898193359375, -5.09912109375, -4.300048828125, -3.5009765625, -2.701904296875, -1.90283203125, -1.103759765625, -0.3046875, 0.494384765625, 1.29345703125, 2.092529296875, 2.8916015625, 3.690673828125, 4.48974609375, 5.288818359375, 6.087890625, 6.886962890625, 7.68603515625, 8.485107421875, 9.2841796875, 10.083251953125, 10.88232421875, 11.681396484375, 12.48046875, 13.279541015625, 14.07861328125, 14.877685546875, 15.6767578125, 16.475830078125, 17.27490234375, 18.073974609375, 18.873046875, 19.672119140625, 20.47119140625, 21.270263671875, 22.0693359375, 22.868408203125, 23.66748046875, 24.466552734375, 25.265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 8.0, 5.0, 13.0, 19.0, 18.0, 20.0, 20.0, 31.0, 20.0, 36.0, 32.0, 46.0, 49.0, 49.0, 51.0, 44.0, 42.0, 33.0, 46.0, 45.0, 45.0, 45.0, 41.0, 32.0, 24.0, 27.0, 28.0, 17.0, 24.0, 19.0, 18.0, 6.0, 10.0, 4.0, 13.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.772705078125, -29.81103515625, -28.849365234375, -27.8876953125, -26.926025390625, -25.96435546875, -25.002685546875, -24.041015625, -23.079345703125, -22.11767578125, -21.156005859375, -20.1943359375, -19.232666015625, -18.27099609375, -17.309326171875, -16.34765625, -15.385986328125, -14.42431640625, -13.462646484375, -12.5009765625, -11.539306640625, -10.57763671875, -9.615966796875, -8.654296875, -7.692626953125, -6.73095703125, -5.769287109375, -4.8076171875, -3.845947265625, -2.88427734375, -1.922607421875, -0.9609375, 0.000732421875, 0.96240234375, 1.924072265625, 2.8857421875, 3.847412109375, 4.80908203125, 5.770751953125, 6.732421875, 7.694091796875, 8.65576171875, 9.617431640625, 10.5791015625, 11.540771484375, 12.50244140625, 13.464111328125, 14.42578125, 15.387451171875, 16.34912109375, 17.310791015625, 18.2724609375, 19.234130859375, 20.19580078125, 21.157470703125, 22.119140625, 23.080810546875, 24.04248046875, 25.004150390625, 25.9658203125, 26.927490234375, 27.88916015625, 28.850830078125, 29.8125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 11.0, 9.0, 11.0, 23.0, 31.0, 54.0, 69.0, 137.0, 183.0, 341.0, 532.0, 830.0, 1340.0, 2282.0, 3739.0, 5865.0, 9020.0, 13954.0, 21132.0, 30813.0, 42983.0, 56647.0, 72083.0, 84917.0, 95283.0, 100906.0, 99130.0, 92779.0, 80467.0, 65859.0, 51375.0, 37956.0, 26725.0, 18190.0, 12127.0, 7771.0, 4987.0, 3092.0, 1788.0, 1168.0, 731.0, 428.0, 273.0, 200.0, 111.0, 67.0, 48.0, 32.0, 22.0, 17.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0], "bins": [-7.32421875, -7.093994140625, -6.86376953125, -6.633544921875, -6.4033203125, -6.173095703125, -5.94287109375, -5.712646484375, -5.482421875, -5.252197265625, -5.02197265625, -4.791748046875, -4.5615234375, -4.331298828125, -4.10107421875, -3.870849609375, -3.640625, -3.410400390625, -3.18017578125, -2.949951171875, -2.7197265625, -2.489501953125, -2.25927734375, -2.029052734375, -1.798828125, -1.568603515625, -1.33837890625, -1.108154296875, -0.8779296875, -0.647705078125, -0.41748046875, -0.187255859375, 0.04296875, 0.273193359375, 0.50341796875, 0.733642578125, 0.9638671875, 1.194091796875, 1.42431640625, 1.654541015625, 1.884765625, 2.114990234375, 2.34521484375, 2.575439453125, 2.8056640625, 3.035888671875, 3.26611328125, 3.496337890625, 3.7265625, 3.956787109375, 4.18701171875, 4.417236328125, 4.6474609375, 4.877685546875, 5.10791015625, 5.338134765625, 5.568359375, 5.798583984375, 6.02880859375, 6.259033203125, 6.4892578125, 6.719482421875, 6.94970703125, 7.179931640625, 7.41015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 12.0, 9.0, 12.0, 22.0, 12.0, 20.0, 23.0, 27.0, 28.0, 25.0, 46.0, 42.0, 41.0, 45.0, 57.0, 50.0, 47.0, 41.0, 37.0, 44.0, 49.0, 32.0, 37.0, 24.0, 37.0, 30.0, 25.0, 18.0, 13.0, 19.0, 13.0, 12.0, 9.0, 3.0, 6.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009937286376953125, -0.0009638965129852295, -0.0009340643882751465, -0.0009042322635650635, -0.0008744001388549805, -0.0008445680141448975, -0.0008147358894348145, -0.0007849037647247314, -0.0007550716400146484, -0.0007252395153045654, -0.0006954073905944824, -0.0006655752658843994, -0.0006357431411743164, -0.0006059110164642334, -0.0005760788917541504, -0.0005462467670440674, -0.0005164146423339844, -0.00048658251762390137, -0.00045675039291381836, -0.00042691826820373535, -0.00039708614349365234, -0.00036725401878356934, -0.00033742189407348633, -0.0003075897693634033, -0.0002777576446533203, -0.0002479255199432373, -0.0002180933952331543, -0.0001882612705230713, -0.00015842914581298828, -0.00012859702110290527, -9.876489639282227e-05, -6.893277168273926e-05, -3.910064697265625e-05, -9.268522262573242e-06, 2.0563602447509766e-05, 5.0395727157592773e-05, 8.022785186767578e-05, 0.00011005997657775879, 0.0001398921012878418, 0.0001697242259979248, 0.0001995563507080078, 0.00022938847541809082, 0.00025922060012817383, 0.00028905272483825684, 0.00031888484954833984, 0.00034871697425842285, 0.00037854909896850586, 0.00040838122367858887, 0.0004382133483886719, 0.0004680454730987549, 0.0004978775978088379, 0.0005277097225189209, 0.0005575418472290039, 0.0005873739719390869, 0.0006172060966491699, 0.0006470382213592529, 0.0006768703460693359, 0.0007067024707794189, 0.000736534595489502, 0.000766366720199585, 0.000796198844909668, 0.000826030969619751, 0.000855863094329834, 0.000885695219039917, 0.00091552734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 17.0, 34.0, 60.0, 75.0, 122.0, 202.0, 340.0, 614.0, 1033.0, 1958.0, 3367.0, 5888.0, 10587.0, 18266.0, 29873.0, 47009.0, 68841.0, 92840.0, 114779.0, 128422.0, 128186.0, 114211.0, 93827.0, 68804.0, 46731.0, 30006.0, 17863.0, 10673.0, 6067.0, 3324.0, 1961.0, 1065.0, 622.0, 357.0, 195.0, 132.0, 77.0, 36.0, 28.0, 17.0, 16.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.0234375, -9.710205078125, -9.39697265625, -9.083740234375, -8.7705078125, -8.457275390625, -8.14404296875, -7.830810546875, -7.517578125, -7.204345703125, -6.89111328125, -6.577880859375, -6.2646484375, -5.951416015625, -5.63818359375, -5.324951171875, -5.01171875, -4.698486328125, -4.38525390625, -4.072021484375, -3.7587890625, -3.445556640625, -3.13232421875, -2.819091796875, -2.505859375, -2.192626953125, -1.87939453125, -1.566162109375, -1.2529296875, -0.939697265625, -0.62646484375, -0.313232421875, 0.0, 0.313232421875, 0.62646484375, 0.939697265625, 1.2529296875, 1.566162109375, 1.87939453125, 2.192626953125, 2.505859375, 2.819091796875, 3.13232421875, 3.445556640625, 3.7587890625, 4.072021484375, 4.38525390625, 4.698486328125, 5.01171875, 5.324951171875, 5.63818359375, 5.951416015625, 6.2646484375, 6.577880859375, 6.89111328125, 7.204345703125, 7.517578125, 7.830810546875, 8.14404296875, 8.457275390625, 8.7705078125, 9.083740234375, 9.39697265625, 9.710205078125, 10.0234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 7.0, 5.0, 3.0, 1.0, 8.0, 5.0, 7.0, 6.0, 13.0, 15.0, 7.0, 13.0, 17.0, 13.0, 27.0, 28.0, 25.0, 24.0, 32.0, 54.0, 43.0, 35.0, 33.0, 46.0, 38.0, 37.0, 37.0, 34.0, 23.0, 33.0, 47.0, 35.0, 23.0, 24.0, 32.0, 20.0, 22.0, 21.0, 15.0, 14.0, 12.0, 14.0, 14.0, 8.0, 4.0, 7.0, 3.0, 4.0, 5.0, 6.0, 2.0, 4.0, 1.0], "bins": [-3.4296875, -3.334259033203125, -3.23883056640625, -3.143402099609375, -3.0479736328125, -2.952545166015625, -2.85711669921875, -2.761688232421875, -2.666259765625, -2.570831298828125, -2.47540283203125, -2.379974365234375, -2.2845458984375, -2.189117431640625, -2.09368896484375, -1.998260498046875, -1.90283203125, -1.807403564453125, -1.71197509765625, -1.616546630859375, -1.5211181640625, -1.425689697265625, -1.33026123046875, -1.234832763671875, -1.139404296875, -1.043975830078125, -0.94854736328125, -0.853118896484375, -0.7576904296875, -0.662261962890625, -0.56683349609375, -0.471405029296875, -0.3759765625, -0.280548095703125, -0.18511962890625, -0.089691162109375, 0.0057373046875, 0.101165771484375, 0.19659423828125, 0.292022705078125, 0.387451171875, 0.482879638671875, 0.57830810546875, 0.673736572265625, 0.7691650390625, 0.864593505859375, 0.96002197265625, 1.055450439453125, 1.15087890625, 1.246307373046875, 1.34173583984375, 1.437164306640625, 1.5325927734375, 1.628021240234375, 1.72344970703125, 1.818878173828125, 1.914306640625, 2.009735107421875, 2.10516357421875, 2.200592041015625, 2.2960205078125, 2.391448974609375, 2.48687744140625, 2.582305908203125, 2.677734375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 2.0, 4.0, 4.0, 11.0, 11.0, 14.0, 21.0, 28.0, 39.0, 39.0, 32.0, 34.0, 42.0, 42.0, 61.0, 54.0, 71.0, 57.0, 56.0, 46.0, 50.0, 40.0, 37.0, 30.0, 28.0, 37.0, 15.0, 22.0, 11.0, 10.0, 11.0, 6.0, 9.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.339393615722656, -44.845157623291016, -43.350921630859375, -41.856689453125, -40.36245346069336, -38.86821746826172, -37.373985290527344, -35.8797492980957, -34.38551330566406, -32.89127731323242, -31.397043228149414, -29.902809143066406, -28.408573150634766, -26.914337158203125, -25.420103073120117, -23.92586898803711, -22.43163299560547, -20.937397003173828, -19.44316291809082, -17.948928833007812, -16.454692840576172, -14.960457801818848, -13.466222763061523, -11.9719877243042, -10.477752685546875, -8.98351764678955, -7.489282608032227, -5.995047569274902, -4.500812530517578, -3.006577491760254, -1.5123424530029297, -0.01810741424560547, 1.4761276245117188, 2.970362663269043, 4.464597702026367, 5.958832740783691, 7.453067779541016, 8.94730281829834, 10.441537857055664, 11.935772895812988, 13.430007934570312, 14.924242973327637, 16.41847801208496, 17.91271209716797, 19.40694808959961, 20.90118408203125, 22.395418167114258, 23.889652252197266, 25.383888244628906, 26.878124237060547, 28.372358322143555, 29.866592407226562, 31.360828399658203, 32.855064392089844, 34.34929656982422, 35.84353256225586, 37.3377685546875, 38.83200454711914, 40.32624053955078, 41.820472717285156, 43.3147087097168, 44.80894470214844, 46.30317687988281, 47.79741287231445, 49.291648864746094]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 5.0, 5.0, 7.0, 11.0, 14.0, 10.0, 18.0, 19.0, 21.0, 22.0, 25.0, 35.0, 39.0, 49.0, 37.0, 42.0, 25.0, 39.0, 39.0, 36.0, 33.0, 39.0, 38.0, 41.0, 40.0, 33.0, 40.0, 26.0, 22.0, 24.0, 27.0, 21.0, 27.0, 18.0, 13.0, 11.0, 11.0, 8.0, 9.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-48.7633171081543, -47.23638916015625, -45.7094612121582, -44.182533264160156, -42.65560531616211, -41.12867736816406, -39.60174560546875, -38.07482147216797, -36.547889709472656, -35.02096176147461, -33.49403381347656, -31.967105865478516, -30.44017791748047, -28.913249969482422, -27.386320114135742, -25.859392166137695, -24.33246612548828, -22.805538177490234, -21.278610229492188, -19.75168228149414, -18.224754333496094, -16.697826385498047, -15.170896530151367, -13.64396858215332, -12.117040634155273, -10.590112686157227, -9.06318473815918, -7.536255836486816, -6.0093278884887695, -4.482399940490723, -2.9554710388183594, -1.4285430908203125, 0.09838104248046875, 1.6253092288970947, 3.1522374153137207, 4.679165840148926, 6.206093788146973, 7.7330217361450195, 9.259950637817383, 10.78687858581543, 12.313806533813477, 13.840734481811523, 15.36766242980957, 16.89459228515625, 18.421520233154297, 19.948448181152344, 21.47537612915039, 23.002304077148438, 24.529232025146484, 26.05615997314453, 27.583087921142578, 29.110015869140625, 30.636943817138672, 32.16387176513672, 33.69080352783203, 35.21772766113281, 36.744659423828125, 38.27158737182617, 39.79851531982422, 41.325443267822266, 42.85237121582031, 44.37929916381836, 45.906227111816406, 47.43315887451172, 48.9600830078125]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 8.0, 7.0, 15.0, 8.0, 16.0, 30.0, 37.0, 59.0, 99.0, 96.0, 166.0, 230.0, 301.0, 447.0, 567.0, 741.0, 1040.0, 1346.0, 1710.0, 2185.0, 2887.0, 3518.0, 4230.0, 5094.0, 1001540.0, 5034.0, 4219.0, 3486.0, 2780.0, 2117.0, 1637.0, 1288.0, 961.0, 693.0, 537.0, 375.0, 269.0, 221.0, 164.0, 118.0, 93.0, 67.0, 46.0, 35.0, 25.0, 21.0, 18.0, 6.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-338.8955993652344, -328.1161804199219, -317.3367614746094, -306.5573425292969, -295.7779541015625, -284.99853515625, -274.2191162109375, -263.439697265625, -252.6602783203125, -241.880859375, -231.1014404296875, -220.32203674316406, -209.54261779785156, -198.76319885253906, -187.98379516601562, -177.20437622070312, -166.42495727539062, -155.64553833007812, -144.86611938476562, -134.0867156982422, -123.30729675292969, -112.52787780761719, -101.74846649169922, -90.96905517578125, -80.18963623046875, -69.41021728515625, -58.63080596923828, -47.85139083862305, -37.07197570800781, -26.292560577392578, -15.513145446777344, -4.733734130859375, 6.04571533203125, 16.825130462646484, 27.60454559326172, 38.38396072387695, 49.16337585449219, 59.94279098510742, 70.72220611572266, 81.50161743164062, 92.28103637695312, 103.06045532226562, 113.8398666381836, 124.61927795410156, 135.39869689941406, 146.17811584472656, 156.95751953125, 167.7369384765625, 178.516357421875, 189.2957763671875, 200.0751953125, 210.85459899902344, 221.63401794433594, 232.41343688964844, 243.19284057617188, 253.97225952148438, 264.7516784667969, 275.5310974121094, 286.3105163574219, 297.0899353027344, 307.86932373046875, 318.64874267578125, 329.42816162109375, 340.20758056640625, 350.98699951171875]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 14.0, 8.0, 12.0, 14.0, 7.0, 19.0, 19.0, 24.0, 26.0, 24.0, 35.0, 39.0, 48.0, 60.0, 78.0, 117.0, 179.0, 280.0, 570.0, 1124.0, 2216.0, 4607.0, 10240.0, 22296.0, 42994.0, 51226108.0, 95861.0, 33024.0, 16678.0, 7467.0, 3282.0, 1636.0, 842.0, 473.0, 266.0, 148.0, 99.0, 64.0, 59.0, 45.0, 41.0, 42.0, 27.0, 21.0, 23.0, 18.0, 9.0, 14.0, 8.0, 12.0, 2.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-934.5, -905.109375, -875.71875, -846.328125, -816.9375, -787.546875, -758.15625, -728.765625, -699.375, -669.984375, -640.59375, -611.203125, -581.8125, -552.421875, -523.03125, -493.640625, -464.25, -434.859375, -405.46875, -376.078125, -346.6875, -317.296875, -287.90625, -258.515625, -229.125, -199.734375, -170.34375, -140.953125, -111.5625, -82.171875, -52.78125, -23.390625, 6.0, 35.390625, 64.78125, 94.171875, 123.5625, 152.953125, 182.34375, 211.734375, 241.125, 270.515625, 299.90625, 329.296875, 358.6875, 388.078125, 417.46875, 446.859375, 476.25, 505.640625, 535.03125, 564.421875, 593.8125, 623.203125, 652.59375, 681.984375, 711.375, 740.765625, 770.15625, 799.546875, 828.9375, 858.328125, 887.71875, 917.109375, 946.5]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 6.0, 16.0, 19.0, 17.0, 23.0, 27.0, 53.0, 47.0, 60.0, 143.0, 171.0, 248.0, 382.0, 557.0, 750.0, 1029.0, 1463.0, 2337.0, 3524.0, 5503.0, 8557.0, 14017.0, 23501.0, 42019.0, 78435.0, 158892.0, 358761.0, 1391899.0, 3376041.0, 432828.0, 184749.0, 89384.0, 47153.0, 25931.0, 15591.0, 9394.0, 5938.0, 3764.0, 2607.0, 1747.0, 1124.0, 800.0, 569.0, 442.0, 259.0, 215.0, 115.0, 109.0, 78.0, 33.0, 28.0, 26.0, 26.0, 15.0, 7.0, 4.0, 10.0, 2.0, 4.0], "bins": [-8.515625, -8.25836181640625, -8.0010986328125, -7.74383544921875, -7.486572265625, -7.22930908203125, -6.9720458984375, -6.71478271484375, -6.45751953125, -6.20025634765625, -5.9429931640625, -5.68572998046875, -5.428466796875, -5.17120361328125, -4.9139404296875, -4.65667724609375, -4.3994140625, -4.14215087890625, -3.8848876953125, -3.62762451171875, -3.370361328125, -3.11309814453125, -2.8558349609375, -2.59857177734375, -2.34130859375, -2.08404541015625, -1.8267822265625, -1.56951904296875, -1.312255859375, -1.05499267578125, -0.7977294921875, -0.54046630859375, -0.283203125, -0.02593994140625, 0.2313232421875, 0.48858642578125, 0.745849609375, 1.00311279296875, 1.2603759765625, 1.51763916015625, 1.77490234375, 2.03216552734375, 2.2894287109375, 2.54669189453125, 2.803955078125, 3.06121826171875, 3.3184814453125, 3.57574462890625, 3.8330078125, 4.09027099609375, 4.3475341796875, 4.60479736328125, 4.862060546875, 5.11932373046875, 5.3765869140625, 5.63385009765625, 5.89111328125, 6.14837646484375, 6.4056396484375, 6.66290283203125, 6.920166015625, 7.17742919921875, 7.4346923828125, 7.69195556640625, 7.94921875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 11.0, 14.0, 7.0, 12.0, 12.0, 19.0, 21.0, 14.0, 18.0, 26.0, 19.0, 33.0, 29.0, 37.0, 39.0, 29.0, 32.0, 38.0, 65.0, 425.0, 456.0, 171.0, 78.0, 45.0, 43.0, 37.0, 28.0, 25.0, 27.0, 25.0, 27.0, 18.0, 22.0, 16.0, 10.0, 12.0, 14.0, 4.0, 7.0, 6.0, 10.0, 4.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.671875, -20.991943359375, -20.31201171875, -19.632080078125, -18.9521484375, -18.272216796875, -17.59228515625, -16.912353515625, -16.232421875, -15.552490234375, -14.87255859375, -14.192626953125, -13.5126953125, -12.832763671875, -12.15283203125, -11.472900390625, -10.79296875, -10.113037109375, -9.43310546875, -8.753173828125, -8.0732421875, -7.393310546875, -6.71337890625, -6.033447265625, -5.353515625, -4.673583984375, -3.99365234375, -3.313720703125, -2.6337890625, -1.953857421875, -1.27392578125, -0.593994140625, 0.0859375, 0.765869140625, 1.44580078125, 2.125732421875, 2.8056640625, 3.485595703125, 4.16552734375, 4.845458984375, 5.525390625, 6.205322265625, 6.88525390625, 7.565185546875, 8.2451171875, 8.925048828125, 9.60498046875, 10.284912109375, 10.96484375, 11.644775390625, 12.32470703125, 13.004638671875, 13.6845703125, 14.364501953125, 15.04443359375, 15.724365234375, 16.404296875, 17.084228515625, 17.76416015625, 18.444091796875, 19.1240234375, 19.803955078125, 20.48388671875, 21.163818359375, 21.84375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 9.0, 8.0, 12.0, 14.0, 22.0, 35.0, 34.0, 57.0, 62.0, 105.0, 197.0, 231.0, 362.0, 569.0, 954.0, 1500.0, 2759.0, 4552.0, 8159.0, 15161.0, 28617.0, 57942.0, 126658.0, 362904.0, 4103543.0, 1139322.0, 244589.0, 94490.0, 45332.0, 23592.0, 12770.0, 6898.0, 4097.0, 2321.0, 1313.0, 725.0, 504.0, 368.0, 199.0, 128.0, 91.0, 78.0, 42.0, 38.0, 25.0, 13.0, 10.0, 5.0, 4.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.2265625, -13.7933349609375, -13.360107421875, -12.9268798828125, -12.49365234375, -12.0604248046875, -11.627197265625, -11.1939697265625, -10.7607421875, -10.3275146484375, -9.894287109375, -9.4610595703125, -9.02783203125, -8.5946044921875, -8.161376953125, -7.7281494140625, -7.294921875, -6.8616943359375, -6.428466796875, -5.9952392578125, -5.56201171875, -5.1287841796875, -4.695556640625, -4.2623291015625, -3.8291015625, -3.3958740234375, -2.962646484375, -2.5294189453125, -2.09619140625, -1.6629638671875, -1.229736328125, -0.7965087890625, -0.36328125, 0.0699462890625, 0.503173828125, 0.9364013671875, 1.36962890625, 1.8028564453125, 2.236083984375, 2.6693115234375, 3.1025390625, 3.5357666015625, 3.968994140625, 4.4022216796875, 4.83544921875, 5.2686767578125, 5.701904296875, 6.1351318359375, 6.568359375, 7.0015869140625, 7.434814453125, 7.8680419921875, 8.30126953125, 8.7344970703125, 9.167724609375, 9.6009521484375, 10.0341796875, 10.4674072265625, 10.900634765625, 11.3338623046875, 11.76708984375, 12.2003173828125, 12.633544921875, 13.0667724609375, 13.5]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 7.0, 6.0, 8.0, 14.0, 17.0, 21.0, 17.0, 28.0, 20.0, 29.0, 17.0, 31.0, 27.0, 39.0, 35.0, 41.0, 44.0, 59.0, 255.0, 652.0, 155.0, 108.0, 60.0, 42.0, 44.0, 30.0, 31.0, 29.0, 26.0, 32.0, 22.0, 14.0, 11.0, 13.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.046875, -19.33203125, -18.6171875, -17.90234375, -17.1875, -16.47265625, -15.7578125, -15.04296875, -14.328125, -13.61328125, -12.8984375, -12.18359375, -11.46875, -10.75390625, -10.0390625, -9.32421875, -8.609375, -7.89453125, -7.1796875, -6.46484375, -5.75, -5.03515625, -4.3203125, -3.60546875, -2.890625, -2.17578125, -1.4609375, -0.74609375, -0.03125, 0.68359375, 1.3984375, 2.11328125, 2.828125, 3.54296875, 4.2578125, 4.97265625, 5.6875, 6.40234375, 7.1171875, 7.83203125, 8.546875, 9.26171875, 9.9765625, 10.69140625, 11.40625, 12.12109375, 12.8359375, 13.55078125, 14.265625, 14.98046875, 15.6953125, 16.41015625, 17.125, 17.83984375, 18.5546875, 19.26953125, 19.984375, 20.69921875, 21.4140625, 22.12890625, 22.84375, 23.55859375, 24.2734375, 24.98828125, 25.703125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 12.0, 9.0, 9.0, 7.0, 18.0, 35.0, 30.0, 59.0, 65.0, 100.0, 110.0, 130.0, 224.0, 322.0, 479.0, 787.0, 1224.0, 2166.0, 4295.0, 10111.0, 33290.0, 5707690.0, 478841.0, 31677.0, 9832.0, 4116.0, 2193.0, 1295.0, 703.0, 429.0, 346.0, 221.0, 170.0, 125.0, 57.0, 66.0, 42.0, 30.0, 26.0, 16.0, 22.0, 9.0, 10.0, 5.0, 7.0, 8.0, 2.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-81.0625, -78.3583984375, -75.654296875, -72.9501953125, -70.24609375, -67.5419921875, -64.837890625, -62.1337890625, -59.4296875, -56.7255859375, -54.021484375, -51.3173828125, -48.61328125, -45.9091796875, -43.205078125, -40.5009765625, -37.796875, -35.0927734375, -32.388671875, -29.6845703125, -26.98046875, -24.2763671875, -21.572265625, -18.8681640625, -16.1640625, -13.4599609375, -10.755859375, -8.0517578125, -5.34765625, -2.6435546875, 0.060546875, 2.7646484375, 5.46875, 8.1728515625, 10.876953125, 13.5810546875, 16.28515625, 18.9892578125, 21.693359375, 24.3974609375, 27.1015625, 29.8056640625, 32.509765625, 35.2138671875, 37.91796875, 40.6220703125, 43.326171875, 46.0302734375, 48.734375, 51.4384765625, 54.142578125, 56.8466796875, 59.55078125, 62.2548828125, 64.958984375, 67.6630859375, 70.3671875, 73.0712890625, 75.775390625, 78.4794921875, 81.18359375, 83.8876953125, 86.591796875, 89.2958984375, 92.0]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 2.0, 10.0, 10.0, 10.0, 13.0, 17.0, 20.0, 21.0, 38.0, 41.0, 40.0, 62.0, 54.0, 162.0, 790.0, 225.0, 130.0, 75.0, 70.0, 49.0, 37.0, 35.0, 22.0, 20.0, 17.0, 13.0, 8.0, 8.0, 3.0, 4.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.34375, -30.30908203125, -29.2744140625, -28.23974609375, -27.205078125, -26.17041015625, -25.1357421875, -24.10107421875, -23.06640625, -22.03173828125, -20.9970703125, -19.96240234375, -18.927734375, -17.89306640625, -16.8583984375, -15.82373046875, -14.7890625, -13.75439453125, -12.7197265625, -11.68505859375, -10.650390625, -9.61572265625, -8.5810546875, -7.54638671875, -6.51171875, -5.47705078125, -4.4423828125, -3.40771484375, -2.373046875, -1.33837890625, -0.3037109375, 0.73095703125, 1.765625, 2.80029296875, 3.8349609375, 4.86962890625, 5.904296875, 6.93896484375, 7.9736328125, 9.00830078125, 10.04296875, 11.07763671875, 12.1123046875, 13.14697265625, 14.181640625, 15.21630859375, 16.2509765625, 17.28564453125, 18.3203125, 19.35498046875, 20.3896484375, 21.42431640625, 22.458984375, 23.49365234375, 24.5283203125, 25.56298828125, 26.59765625, 27.63232421875, 28.6669921875, 29.70166015625, 30.736328125, 31.77099609375, 32.8056640625, 33.84033203125, 34.875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 73.0, 838.0, 55.0, 16.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.84063720703125, -92.20392608642578, -79.56720733642578, -66.93049621582031, -54.29378128051758, -41.657066345214844, -29.020355224609375, -16.383636474609375, -3.7469253540039062, 8.889788627624512, 21.52650260925293, 34.16321563720703, 46.799930572509766, 59.4366455078125, 72.07335662841797, 84.71007537841797, 97.34678649902344, 109.9834976196289, 122.6202163696289, 135.25692749023438, 147.89364624023438, 160.53036499023438, 173.1670684814453, 185.8037872314453, 198.44049072265625, 211.07720947265625, 223.7139129638672, 236.3506317138672, 248.9873504638672, 261.6240539550781, 274.2607727050781, 286.8974914550781, 299.5342102050781, 312.1709289550781, 324.8076477050781, 337.4443359375, 350.0810546875, 362.7177734375, 375.3544921875, 387.9912109375, 400.6279296875, 413.2646484375, 425.9013671875, 438.5380859375, 451.1747741699219, 463.8114929199219, 476.4482116699219, 489.0849304199219, 501.72161865234375, 514.3583374023438, 526.9950561523438, 539.6317749023438, 552.2684936523438, 564.9052124023438, 577.5418701171875, 590.1785888671875, 602.8153686523438, 615.4520874023438, 628.0888061523438, 640.7255249023438, 653.3622436523438, 665.9989624023438, 678.6356201171875, 691.2723388671875, 703.9090576171875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [7.0, 1.0, 6.0, 6.0, 24.0, 44.0, 154.0, 324.0, 275.0, 89.0, 34.0, 21.0, 15.0, 8.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.29730224609375, -42.16850280761719, -36.039703369140625, -29.91090202331543, -23.782102584838867, -17.653303146362305, -11.52450180053711, -5.395702362060547, 0.7330970764160156, 6.861896991729736, 12.990696907043457, 19.119497299194336, 25.2482967376709, 31.37709617614746, 37.505897521972656, 43.63469696044922, 49.76349639892578, 55.892295837402344, 62.021095275878906, 68.14989471435547, 74.27869415283203, 80.4074935913086, 86.53630065917969, 92.66510009765625, 98.79389953613281, 104.92269897460938, 111.05149841308594, 117.1802978515625, 123.30909729003906, 129.43789672851562, 135.5666961669922, 141.69549560546875, 147.8242950439453, 153.95309448242188, 160.08189392089844, 166.210693359375, 172.33949279785156, 178.46829223632812, 184.5970916748047, 190.72589111328125, 196.8546905517578, 202.98348999023438, 209.11228942871094, 215.2410888671875, 221.36988830566406, 227.49868774414062, 233.6274871826172, 239.75628662109375, 245.88510131835938, 252.01390075683594, 258.1427001953125, 264.2715148925781, 270.4002990722656, 276.52911376953125, 282.65789794921875, 288.7867126464844, 294.9154968261719, 301.0443115234375, 307.173095703125, 313.3019104003906, 319.4306945800781, 325.55950927734375, 331.68829345703125, 337.8171081542969, 343.9458923339844]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 7.0, 6.0, 9.0, 8.0, 14.0, 13.0, 16.0, 24.0, 28.0, 39.0, 63.0, 92.0, 112.0, 170.0, 276.0, 393.0, 614.0, 1018.0, 1756.0, 3191.0, 6666.0, 16799.0, 74917.0, 3971473.0, 85694.0, 16641.0, 6363.0, 3094.0, 1638.0, 1098.0, 632.0, 413.0, 273.0, 198.0, 140.0, 95.0, 79.0, 48.0, 28.0, 28.0, 27.0, 18.0, 12.0, 12.0, 12.0, 9.0, 8.0, 8.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0], "bins": [-1.2822265625, -1.243988037109375, -1.20574951171875, -1.167510986328125, -1.1292724609375, -1.091033935546875, -1.05279541015625, -1.014556884765625, -0.976318359375, -0.938079833984375, -0.89984130859375, -0.861602783203125, -0.8233642578125, -0.785125732421875, -0.74688720703125, -0.708648681640625, -0.67041015625, -0.632171630859375, -0.59393310546875, -0.555694580078125, -0.5174560546875, -0.479217529296875, -0.44097900390625, -0.402740478515625, -0.364501953125, -0.326263427734375, -0.28802490234375, -0.249786376953125, -0.2115478515625, -0.173309326171875, -0.13507080078125, -0.096832275390625, -0.05859375, -0.020355224609375, 0.01788330078125, 0.056121826171875, 0.0943603515625, 0.132598876953125, 0.17083740234375, 0.209075927734375, 0.247314453125, 0.285552978515625, 0.32379150390625, 0.362030029296875, 0.4002685546875, 0.438507080078125, 0.47674560546875, 0.514984130859375, 0.55322265625, 0.591461181640625, 0.62969970703125, 0.667938232421875, 0.7061767578125, 0.744415283203125, 0.78265380859375, 0.820892333984375, 0.859130859375, 0.897369384765625, 0.93560791015625, 0.973846435546875, 1.0120849609375, 1.050323486328125, 1.08856201171875, 1.126800537109375, 1.1650390625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 9.0, 9.0, 7.0, 5.0, 18.0, 20.0, 56.0, 368.0, 374.0, 56.0, 22.0, 13.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.18062591552734375, -0.1749725341796875, -0.16931915283203125, -0.163665771484375, -0.15801239013671875, -0.1523590087890625, -0.14670562744140625, -0.14105224609375, -0.13539886474609375, -0.1297454833984375, -0.12409210205078125, -0.118438720703125, -0.11278533935546875, -0.1071319580078125, -0.10147857666015625, -0.0958251953125, -0.09017181396484375, -0.0845184326171875, -0.07886505126953125, -0.073211669921875, -0.06755828857421875, -0.0619049072265625, -0.05625152587890625, -0.05059814453125, -0.04494476318359375, -0.0392913818359375, -0.03363800048828125, -0.027984619140625, -0.02233123779296875, -0.0166778564453125, -0.01102447509765625, -0.00537109375, 0.00028228759765625, 0.0059356689453125, 0.01158905029296875, 0.017242431640625, 0.02289581298828125, 0.0285491943359375, 0.03420257568359375, 0.03985595703125, 0.04550933837890625, 0.0511627197265625, 0.05681610107421875, 0.062469482421875, 0.06812286376953125, 0.0737762451171875, 0.07942962646484375, 0.0850830078125, 0.09073638916015625, 0.0963897705078125, 0.10204315185546875, 0.107696533203125, 0.11334991455078125, 0.1190032958984375, 0.12465667724609375, 0.13031005859375, 0.13596343994140625, 0.1416168212890625, 0.14727020263671875, 0.152923583984375, 0.15857696533203125, 0.1642303466796875, 0.16988372802734375, 0.175537109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 2.0, 14.0, 15.0, 12.0, 16.0, 23.0, 55.0, 54.0, 92.0, 149.0, 239.0, 440.0, 732.0, 1396.0, 2973.0, 6920.0, 21056.0, 104301.0, 3267454.0, 704266.0, 58243.0, 15228.0, 5479.0, 2328.0, 1189.0, 644.0, 335.0, 198.0, 153.0, 74.0, 63.0, 37.0, 26.0, 16.0, 15.0, 12.0, 12.0, 6.0, 0.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1904296875, -1.1530303955078125, -1.115631103515625, -1.0782318115234375, -1.04083251953125, -1.0034332275390625, -0.966033935546875, -0.9286346435546875, -0.8912353515625, -0.8538360595703125, -0.816436767578125, -0.7790374755859375, -0.74163818359375, -0.7042388916015625, -0.666839599609375, -0.6294403076171875, -0.592041015625, -0.5546417236328125, -0.517242431640625, -0.4798431396484375, -0.44244384765625, -0.4050445556640625, -0.367645263671875, -0.3302459716796875, -0.2928466796875, -0.2554473876953125, -0.218048095703125, -0.1806488037109375, -0.14324951171875, -0.1058502197265625, -0.068450927734375, -0.0310516357421875, 0.00634765625, 0.0437469482421875, 0.081146240234375, 0.1185455322265625, 0.15594482421875, 0.1933441162109375, 0.230743408203125, 0.2681427001953125, 0.3055419921875, 0.3429412841796875, 0.380340576171875, 0.4177398681640625, 0.45513916015625, 0.4925384521484375, 0.529937744140625, 0.5673370361328125, 0.604736328125, 0.6421356201171875, 0.679534912109375, 0.7169342041015625, 0.75433349609375, 0.7917327880859375, 0.829132080078125, 0.8665313720703125, 0.9039306640625, 0.9413299560546875, 0.978729248046875, 1.0161285400390625, 1.05352783203125, 1.0909271240234375, 1.128326416015625, 1.1657257080078125, 1.203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 6.0, 6.0, 10.0, 14.0, 24.0, 20.0, 30.0, 52.0, 63.0, 87.0, 134.0, 215.0, 505.0, 1220.0, 696.0, 330.0, 181.0, 136.0, 91.0, 54.0, 38.0, 44.0, 23.0, 19.0, 12.0, 6.0, 17.0, 5.0, 5.0, 6.0, 3.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25732421875, -0.24895095825195312, -0.24057769775390625, -0.23220443725585938, -0.2238311767578125, -0.21545791625976562, -0.20708465576171875, -0.19871139526367188, -0.190338134765625, -0.18196487426757812, -0.17359161376953125, -0.16521835327148438, -0.1568450927734375, -0.14847183227539062, -0.14009857177734375, -0.13172531127929688, -0.12335205078125, -0.11497879028320312, -0.10660552978515625, -0.09823226928710938, -0.0898590087890625, -0.08148574829101562, -0.07311248779296875, -0.06473922729492188, -0.056365966796875, -0.047992706298828125, -0.03961944580078125, -0.031246185302734375, -0.0228729248046875, -0.014499664306640625, -0.00612640380859375, 0.002246856689453125, 0.0106201171875, 0.018993377685546875, 0.02736663818359375, 0.035739898681640625, 0.0441131591796875, 0.052486419677734375, 0.06085968017578125, 0.06923294067382812, 0.077606201171875, 0.08597946166992188, 0.09435272216796875, 0.10272598266601562, 0.1110992431640625, 0.11947250366210938, 0.12784576416015625, 0.13621902465820312, 0.14459228515625, 0.15296554565429688, 0.16133880615234375, 0.16971206665039062, 0.1780853271484375, 0.18645858764648438, 0.19483184814453125, 0.20320510864257812, 0.211578369140625, 0.21995162963867188, 0.22832489013671875, 0.23669815063476562, 0.2450714111328125, 0.2534446716308594, 0.26181793212890625, 0.2701911926269531, 0.278564453125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 16.0, 44.0, 170.0, 357.0, 248.0, 83.0, 46.0, 12.0, 13.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7438559532165527, -3.5920450687408447, -3.4402341842651367, -3.288423538208008, -3.1366126537323, -2.984801769256592, -2.832991123199463, -2.681180238723755, -2.529369354248047, -2.377558469772339, -2.225747585296631, -2.073936939239502, -1.922126054763794, -1.770315170288086, -1.6185044050216675, -1.466693639755249, -1.314882755279541, -1.163071870803833, -1.0112611055374146, -0.8594502806663513, -0.7076394557952881, -0.5558286309242249, -0.4040178060531616, -0.25220704078674316, -0.10039615631103516, 0.051414668560028076, 0.2032254934310913, 0.35503631830215454, 0.5068471431732178, 0.658657968044281, 0.8104687929153442, 0.9622795581817627, 1.1140904426574707, 1.2659013271331787, 1.4177120923995972, 1.5695228576660156, 1.7213337421417236, 1.8731446266174316, 2.0249552726745605, 2.1767661571502686, 2.3285770416259766, 2.4803879261016846, 2.6321988105773926, 2.7840094566345215, 2.9358203411102295, 3.0876312255859375, 3.2394418716430664, 3.3912527561187744, 3.5430636405944824, 3.6948745250701904, 3.8466854095458984, 3.9984960556030273, 4.150306701660156, 4.302117824554443, 4.453928470611572, 4.605739593505859, 4.757550239562988, 4.909360885620117, 5.061172008514404, 5.212982654571533, 5.36479377746582, 5.516604423522949, 5.668415069580078, 5.820225715637207, 5.972036838531494]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 15.0, 12.0, 15.0, 20.0, 29.0, 36.0, 47.0, 46.0, 44.0, 52.0, 43.0, 50.0, 60.0, 63.0, 62.0, 60.0, 54.0, 46.0, 44.0, 46.0, 34.0, 26.0, 17.0, 19.0, 17.0, 5.0, 5.0, 13.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2556431293487549, -1.2096362113952637, -1.163629174232483, -1.1176222562789917, -1.0716153383255005, -1.0256083011627197, -0.9796013832092285, -0.9335944056510925, -0.8875874280929565, -0.8415804505348206, -0.7955735325813293, -0.7495665550231934, -0.7035595774650574, -0.6575525999069214, -0.6115456819534302, -0.5655387043952942, -0.519531786441803, -0.4735248386859894, -0.4275178611278534, -0.3815109133720398, -0.3355039358139038, -0.2894969880580902, -0.2434900403022766, -0.19748306274414062, -0.15147611498832703, -0.10546915233135223, -0.05946219712495804, -0.013455241918563843, 0.03255172073841095, 0.07855868339538574, 0.12456563115119934, 0.17057260870933533, 0.21657955646514893, 0.2625865042209625, 0.3085934817790985, 0.3546004295349121, 0.4006074070930481, 0.4466143548488617, 0.4926213026046753, 0.5386282801628113, 0.5846352577209473, 0.6306422352790833, 0.6766491532325745, 0.7226561307907104, 0.7686631083488464, 0.8146700859069824, 0.8606770038604736, 0.9066839814186096, 0.9526908993721008, 0.9986978769302368, 1.044704794883728, 1.0907118320465088, 1.13671875, 1.1827256679534912, 1.2287325859069824, 1.2747396230697632, 1.3207465410232544, 1.3667534589767456, 1.4127604961395264, 1.4587674140930176, 1.5047743320465088, 1.5507813692092896, 1.5967882871627808, 1.6427953243255615, 1.6888022422790527]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 6.0, 13.0, 14.0, 18.0, 43.0, 41.0, 74.0, 107.0, 138.0, 223.0, 360.0, 619.0, 1200.0, 2417.0, 6019.0, 19430.0, 386716.0, 597847.0, 21279.0, 6375.0, 2543.0, 1273.0, 691.0, 362.0, 228.0, 163.0, 97.0, 73.0, 57.0, 30.0, 32.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.4500579833984375, -1.400115966796875, -1.3501739501953125, -1.30023193359375, -1.2502899169921875, -1.200347900390625, -1.1504058837890625, -1.1004638671875, -1.0505218505859375, -1.000579833984375, -0.9506378173828125, -0.90069580078125, -0.8507537841796875, -0.800811767578125, -0.7508697509765625, -0.700927734375, -0.6509857177734375, -0.601043701171875, -0.5511016845703125, -0.50115966796875, -0.4512176513671875, -0.401275634765625, -0.3513336181640625, -0.3013916015625, -0.2514495849609375, -0.201507568359375, -0.1515655517578125, -0.10162353515625, -0.0516815185546875, -0.001739501953125, 0.0482025146484375, 0.09814453125, 0.1480865478515625, 0.198028564453125, 0.2479705810546875, 0.29791259765625, 0.3478546142578125, 0.397796630859375, 0.4477386474609375, 0.4976806640625, 0.5476226806640625, 0.597564697265625, 0.6475067138671875, 0.69744873046875, 0.7473907470703125, 0.797332763671875, 0.8472747802734375, 0.897216796875, 0.9471588134765625, 0.997100830078125, 1.0470428466796875, 1.09698486328125, 1.1469268798828125, 1.196868896484375, 1.2468109130859375, 1.2967529296875, 1.3466949462890625, 1.396636962890625, 1.4465789794921875, 1.49652099609375, 1.5464630126953125, 1.596405029296875, 1.6463470458984375, 1.6962890625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 13.0, 11.0, 14.0, 26.0, 77.0, 199.0, 317.0, 201.0, 68.0, 22.0, 11.0, 6.0, 6.0, 2.0, 6.0, 5.0, 2.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.1799640655517578, -0.17364883422851562, -0.16733360290527344, -0.16101837158203125, -0.15470314025878906, -0.14838790893554688, -0.1420726776123047, -0.1357574462890625, -0.1294422149658203, -0.12312698364257812, -0.11681175231933594, -0.11049652099609375, -0.10418128967285156, -0.09786605834960938, -0.09155082702636719, -0.085235595703125, -0.07892036437988281, -0.07260513305664062, -0.06628990173339844, -0.05997467041015625, -0.05365943908691406, -0.047344207763671875, -0.04102897644042969, -0.0347137451171875, -0.028398513793945312, -0.022083282470703125, -0.015768051147460938, -0.00945281982421875, -0.0031375885009765625, 0.003177642822265625, 0.009492874145507812, 0.01580810546875, 0.022123336791992188, 0.028438568115234375, 0.03475379943847656, 0.04106903076171875, 0.04738426208496094, 0.053699493408203125, 0.06001472473144531, 0.0663299560546875, 0.07264518737792969, 0.07896041870117188, 0.08527565002441406, 0.09159088134765625, 0.09790611267089844, 0.10422134399414062, 0.11053657531738281, 0.116851806640625, 0.12316703796386719, 0.12948226928710938, 0.13579750061035156, 0.14211273193359375, 0.14842796325683594, 0.15474319458007812, 0.1610584259033203, 0.1673736572265625, 0.1736888885498047, 0.18000411987304688, 0.18631935119628906, 0.19263458251953125, 0.19894981384277344, 0.20526504516601562, 0.2115802764892578, 0.2178955078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 9.0, 21.0, 27.0, 27.0, 43.0, 79.0, 105.0, 220.0, 409.0, 910.0, 2454.0, 9221.0, 76196.0, 859168.0, 85317.0, 10073.0, 2422.0, 868.0, 420.0, 215.0, 114.0, 62.0, 45.0, 30.0, 22.0, 10.0, 16.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.964691162109375, -1.89813232421875, -1.831573486328125, -1.7650146484375, -1.698455810546875, -1.63189697265625, -1.565338134765625, -1.498779296875, -1.432220458984375, -1.36566162109375, -1.299102783203125, -1.2325439453125, -1.165985107421875, -1.09942626953125, -1.032867431640625, -0.96630859375, -0.899749755859375, -0.83319091796875, -0.766632080078125, -0.7000732421875, -0.633514404296875, -0.56695556640625, -0.500396728515625, -0.433837890625, -0.367279052734375, -0.30072021484375, -0.234161376953125, -0.1676025390625, -0.101043701171875, -0.03448486328125, 0.032073974609375, 0.0986328125, 0.165191650390625, 0.23175048828125, 0.298309326171875, 0.3648681640625, 0.431427001953125, 0.49798583984375, 0.564544677734375, 0.631103515625, 0.697662353515625, 0.76422119140625, 0.830780029296875, 0.8973388671875, 0.963897705078125, 1.03045654296875, 1.097015380859375, 1.16357421875, 1.230133056640625, 1.29669189453125, 1.363250732421875, 1.4298095703125, 1.496368408203125, 1.56292724609375, 1.629486083984375, 1.696044921875, 1.762603759765625, 1.82916259765625, 1.895721435546875, 1.9622802734375, 2.028839111328125, 2.09539794921875, 2.161956787109375, 2.228515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 4.0, 6.0, 14.0, 14.0, 14.0, 19.0, 26.0, 16.0, 31.0, 37.0, 34.0, 28.0, 34.0, 43.0, 33.0, 43.0, 35.0, 33.0, 43.0, 33.0, 47.0, 39.0, 36.0, 40.0, 51.0, 30.0, 26.0, 31.0, 19.0, 27.0, 19.0, 14.0, 17.0, 12.0, 7.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5092697143554688, -0.4921722412109375, -0.47507476806640625, -0.457977294921875, -0.44087982177734375, -0.4237823486328125, -0.40668487548828125, -0.38958740234375, -0.37248992919921875, -0.3553924560546875, -0.33829498291015625, -0.321197509765625, -0.30410003662109375, -0.2870025634765625, -0.26990509033203125, -0.2528076171875, -0.23571014404296875, -0.2186126708984375, -0.20151519775390625, -0.184417724609375, -0.16732025146484375, -0.1502227783203125, -0.13312530517578125, -0.11602783203125, -0.09893035888671875, -0.0818328857421875, -0.06473541259765625, -0.047637939453125, -0.03054046630859375, -0.0134429931640625, 0.00365447998046875, 0.020751953125, 0.03784942626953125, 0.0549468994140625, 0.07204437255859375, 0.089141845703125, 0.10623931884765625, 0.1233367919921875, 0.14043426513671875, 0.15753173828125, 0.17462921142578125, 0.1917266845703125, 0.20882415771484375, 0.225921630859375, 0.24301910400390625, 0.2601165771484375, 0.27721405029296875, 0.2943115234375, 0.31140899658203125, 0.3285064697265625, 0.34560394287109375, 0.362701416015625, 0.37979888916015625, 0.3968963623046875, 0.41399383544921875, 0.43109130859375, 0.44818878173828125, 0.4652862548828125, 0.48238372802734375, 0.499481201171875, 0.5165786743164062, 0.5336761474609375, 0.5507736206054688, 0.56787109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 1.0, 2.0, 1.0, 3.0, 6.0, 15.0, 11.0, 25.0, 30.0, 39.0, 66.0, 93.0, 152.0, 231.0, 423.0, 844.0, 2071.0, 8647.0, 696025.0, 328447.0, 7624.0, 1947.0, 803.0, 374.0, 224.0, 145.0, 93.0, 51.0, 45.0, 32.0, 26.0, 20.0, 9.0, 7.0, 5.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.60546875, -2.505126953125, -2.40478515625, -2.304443359375, -2.2041015625, -2.103759765625, -2.00341796875, -1.903076171875, -1.802734375, -1.702392578125, -1.60205078125, -1.501708984375, -1.4013671875, -1.301025390625, -1.20068359375, -1.100341796875, -1.0, -0.899658203125, -0.79931640625, -0.698974609375, -0.5986328125, -0.498291015625, -0.39794921875, -0.297607421875, -0.197265625, -0.096923828125, 0.00341796875, 0.103759765625, 0.2041015625, 0.304443359375, 0.40478515625, 0.505126953125, 0.60546875, 0.705810546875, 0.80615234375, 0.906494140625, 1.0068359375, 1.107177734375, 1.20751953125, 1.307861328125, 1.408203125, 1.508544921875, 1.60888671875, 1.709228515625, 1.8095703125, 1.909912109375, 2.01025390625, 2.110595703125, 2.2109375, 2.311279296875, 2.41162109375, 2.511962890625, 2.6123046875, 2.712646484375, 2.81298828125, 2.913330078125, 3.013671875, 3.114013671875, 3.21435546875, 3.314697265625, 3.4150390625, 3.515380859375, 3.61572265625, 3.716064453125, 3.81640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 10.0, 5.0, 5.0, 11.0, 13.0, 23.0, 32.0, 34.0, 53.0, 79.0, 149.0, 208.0, 119.0, 58.0, 46.0, 22.0, 27.0, 20.0, 14.0, 9.0, 6.0, 7.0, 6.0, 5.0, 6.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000457763671875, -0.0004362165927886963, -0.0004146695137023926, -0.00039312243461608887, -0.00037157535552978516, -0.00035002827644348145, -0.00032848119735717773, -0.000306934118270874, -0.0002853870391845703, -0.0002638399600982666, -0.0002422928810119629, -0.00022074580192565918, -0.00019919872283935547, -0.00017765164375305176, -0.00015610456466674805, -0.00013455748558044434, -0.00011301040649414062, -9.146332740783691e-05, -6.99162483215332e-05, -4.836916923522949e-05, -2.682209014892578e-05, -5.27501106262207e-06, 1.627206802368164e-05, 3.781914710998535e-05, 5.936622619628906e-05, 8.091330528259277e-05, 0.00010246038436889648, 0.0001240074634552002, 0.0001455545425415039, 0.00016710162162780762, 0.00018864870071411133, 0.00021019577980041504, 0.00023174285888671875, 0.00025328993797302246, 0.00027483701705932617, 0.0002963840961456299, 0.0003179311752319336, 0.0003394782543182373, 0.000361025333404541, 0.0003825724124908447, 0.00040411949157714844, 0.00042566657066345215, 0.00044721364974975586, 0.00046876072883605957, 0.0004903078079223633, 0.000511854887008667, 0.0005334019660949707, 0.0005549490451812744, 0.0005764961242675781, 0.0005980432033538818, 0.0006195902824401855, 0.0006411373615264893, 0.000662684440612793, 0.0006842315196990967, 0.0007057785987854004, 0.0007273256778717041, 0.0007488727569580078, 0.0007704198360443115, 0.0007919669151306152, 0.0008135139942169189, 0.0008350610733032227, 0.0008566081523895264, 0.0008781552314758301, 0.0008997023105621338, 0.0009212493896484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 10.0, 10.0, 19.0, 24.0, 38.0, 58.0, 65.0, 106.0, 174.0, 271.0, 491.0, 826.0, 1593.0, 3587.0, 10628.0, 52261.0, 911997.0, 49037.0, 10243.0, 3539.0, 1551.0, 776.0, 451.0, 256.0, 179.0, 106.0, 71.0, 49.0, 24.0, 30.0, 14.0, 15.0, 8.0, 9.0, 5.0, 2.0, 4.0, 2.0, 8.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.693359375, -2.607818603515625, -2.52227783203125, -2.436737060546875, -2.3511962890625, -2.265655517578125, -2.18011474609375, -2.094573974609375, -2.009033203125, -1.923492431640625, -1.83795166015625, -1.752410888671875, -1.6668701171875, -1.581329345703125, -1.49578857421875, -1.410247802734375, -1.32470703125, -1.239166259765625, -1.15362548828125, -1.068084716796875, -0.9825439453125, -0.897003173828125, -0.81146240234375, -0.725921630859375, -0.640380859375, -0.554840087890625, -0.46929931640625, -0.383758544921875, -0.2982177734375, -0.212677001953125, -0.12713623046875, -0.041595458984375, 0.0439453125, 0.129486083984375, 0.21502685546875, 0.300567626953125, 0.3861083984375, 0.471649169921875, 0.55718994140625, 0.642730712890625, 0.728271484375, 0.813812255859375, 0.89935302734375, 0.984893798828125, 1.0704345703125, 1.155975341796875, 1.24151611328125, 1.327056884765625, 1.41259765625, 1.498138427734375, 1.58367919921875, 1.669219970703125, 1.7547607421875, 1.840301513671875, 1.92584228515625, 2.011383056640625, 2.096923828125, 2.182464599609375, 2.26800537109375, 2.353546142578125, 2.4390869140625, 2.524627685546875, 2.61016845703125, 2.695709228515625, 2.78125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0, 7.0, 23.0, 21.0, 32.0, 77.0, 172.0, 302.0, 186.0, 88.0, 23.0, 16.0, 11.0, 9.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.0160980224609375, -1.954071044921875, -1.8920440673828125, -1.83001708984375, -1.7679901123046875, -1.705963134765625, -1.6439361572265625, -1.5819091796875, -1.5198822021484375, -1.457855224609375, -1.3958282470703125, -1.33380126953125, -1.2717742919921875, -1.209747314453125, -1.1477203369140625, -1.085693359375, -1.0236663818359375, -0.961639404296875, -0.8996124267578125, -0.83758544921875, -0.7755584716796875, -0.713531494140625, -0.6515045166015625, -0.5894775390625, -0.5274505615234375, -0.465423583984375, -0.4033966064453125, -0.34136962890625, -0.2793426513671875, -0.217315673828125, -0.1552886962890625, -0.09326171875, -0.0312347412109375, 0.030792236328125, 0.0928192138671875, 0.15484619140625, 0.2168731689453125, 0.278900146484375, 0.3409271240234375, 0.4029541015625, 0.4649810791015625, 0.527008056640625, 0.5890350341796875, 0.65106201171875, 0.7130889892578125, 0.775115966796875, 0.8371429443359375, 0.899169921875, 0.9611968994140625, 1.023223876953125, 1.0852508544921875, 1.14727783203125, 1.2093048095703125, 1.271331787109375, 1.3333587646484375, 1.3953857421875, 1.4574127197265625, 1.519439697265625, 1.5814666748046875, 1.64349365234375, 1.7055206298828125, 1.767547607421875, 1.8295745849609375, 1.8916015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 19.0, 55.0, 141.0, 361.0, 205.0, 88.0, 56.0, 32.0, 9.0, 12.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.705343246459961, -12.226470947265625, -11.747598648071289, -11.268726348876953, -10.789855003356934, -10.310982704162598, -9.832110404968262, -9.353238105773926, -8.87436580657959, -8.395493507385254, -7.916621685028076, -7.43774938583374, -6.958877086639404, -6.480005264282227, -6.001132965087891, -5.522260665893555, -5.043388843536377, -4.564516544342041, -4.085644721984863, -3.6067724227905273, -3.1279001235961914, -2.6490280628204346, -2.1701560020446777, -1.6912837028503418, -1.212411642074585, -0.7335394620895386, -0.25466734170913696, 0.22420477867126465, 0.703076958656311, 1.1819491386413574, 1.6608211994171143, 2.13969349861145, 2.618565559387207, 3.097437620162964, 3.5763099193573, 4.055181980133057, 4.534054279327393, 5.01292610168457, 5.491798400878906, 5.970670700073242, 6.449542999267578, 6.928415298461914, 7.407287120819092, 7.886159420013428, 8.365031242370605, 8.843903541564941, 9.322775840759277, 9.801648139953613, 10.280519485473633, 10.759391784667969, 11.238264083862305, 11.71713638305664, 12.19600772857666, 12.674880027770996, 13.153752326965332, 13.632624626159668, 14.111496925354004, 14.59036922454834, 15.069241523742676, 15.548112869262695, 16.02698516845703, 16.505857467651367, 16.984729766845703, 17.46360206604004, 17.942474365234375]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 7.0, 3.0, 6.0, 13.0, 12.0, 13.0, 31.0, 32.0, 52.0, 85.0, 108.0, 102.0, 114.0, 105.0, 85.0, 76.0, 36.0, 39.0, 20.0, 15.0, 12.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.027713775634766, -13.679011344909668, -13.330307960510254, -12.981605529785156, -12.632903099060059, -12.284200668334961, -11.935497283935547, -11.58679485321045, -11.238092422485352, -10.889389991760254, -10.54068660736084, -10.191984176635742, -9.843281745910645, -9.494579315185547, -9.145875930786133, -8.797173500061035, -8.448471069335938, -8.09976863861084, -7.751065731048584, -7.402362823486328, -7.0536603927612305, -6.704957485198975, -6.356254577636719, -6.007552146911621, -5.658848762512207, -5.310145854949951, -4.9614434242248535, -4.612740516662598, -4.2640380859375, -3.915335178375244, -3.5666325092315674, -3.2179298400878906, -2.869227409362793, -2.520524740219116, -2.1718220710754395, -1.8231192827224731, -1.4744166135787964, -1.1257139444351196, -0.7770111560821533, -0.42830848693847656, -0.0796058177947998, 0.26909688115119934, 0.6177995800971985, 0.96650230884552, 1.3152049779891968, 1.6639076471328735, 2.01261043548584, 2.3613131046295166, 2.7100157737731934, 3.05871844291687, 3.407421112060547, 3.7561240196228027, 4.1048264503479, 4.453529357910156, 4.802231788635254, 5.15093469619751, 5.499637603759766, 5.8483405113220215, 6.197042942047119, 6.545745849609375, 6.894448280334473, 7.2431511878967285, 7.591854095458984, 7.940556526184082, 8.28925895690918]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 15.0, 22.0, 62.0, 292.0, 153654.0, 4039112.0, 807.0, 180.0, 46.0, 30.0, 14.0, 11.0, 6.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.378662109375, -18.24169921875, -17.104736328125, -15.9677734375, -14.830810546875, -13.69384765625, -12.556884765625, -11.419921875, -10.282958984375, -9.14599609375, -8.009033203125, -6.8720703125, -5.735107421875, -4.59814453125, -3.461181640625, -2.32421875, -1.187255859375, -0.05029296875, 1.086669921875, 2.2236328125, 3.360595703125, 4.49755859375, 5.634521484375, 6.771484375, 7.908447265625, 9.04541015625, 10.182373046875, 11.3193359375, 12.456298828125, 13.59326171875, 14.730224609375, 15.8671875, 17.004150390625, 18.14111328125, 19.278076171875, 20.4150390625, 21.552001953125, 22.68896484375, 23.825927734375, 24.962890625, 26.099853515625, 27.23681640625, 28.373779296875, 29.5107421875, 30.647705078125, 31.78466796875, 32.921630859375, 34.05859375, 35.195556640625, 36.33251953125, 37.469482421875, 38.6064453125, 39.743408203125, 40.88037109375, 42.017333984375, 43.154296875, 44.291259765625, 45.42822265625, 46.565185546875, 47.7021484375, 48.839111328125, 49.97607421875, 51.113037109375, 52.25]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 0.0, 7.0, 10.0, 4.0, 7.0, 5.0, 14.0, 11.0, 25.0, 34.0, 69.0, 100.0, 138.0, 181.0, 143.0, 84.0, 68.0, 32.0, 22.0, 9.0, 13.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16455078125, -0.15960121154785156, -0.15465164184570312, -0.1497020721435547, -0.14475250244140625, -0.1398029327392578, -0.13485336303710938, -0.12990379333496094, -0.1249542236328125, -0.12000465393066406, -0.11505508422851562, -0.11010551452636719, -0.10515594482421875, -0.10020637512207031, -0.09525680541992188, -0.09030723571777344, -0.085357666015625, -0.08040809631347656, -0.07545852661132812, -0.07050895690917969, -0.06555938720703125, -0.06060981750488281, -0.055660247802734375, -0.05071067810058594, -0.0457611083984375, -0.04081153869628906, -0.035861968994140625, -0.030912399291992188, -0.02596282958984375, -0.021013259887695312, -0.016063690185546875, -0.011114120483398438, -0.00616455078125, -0.0012149810791015625, 0.003734588623046875, 0.008684158325195312, 0.01363372802734375, 0.018583297729492188, 0.023532867431640625, 0.028482437133789062, 0.0334320068359375, 0.03838157653808594, 0.043331146240234375, 0.04828071594238281, 0.05323028564453125, 0.05817985534667969, 0.06312942504882812, 0.06807899475097656, 0.073028564453125, 0.07797813415527344, 0.08292770385742188, 0.08787727355957031, 0.09282684326171875, 0.09777641296386719, 0.10272598266601562, 0.10767555236816406, 0.1126251220703125, 0.11757469177246094, 0.12252426147460938, 0.1274738311767578, 0.13242340087890625, 0.1373729705810547, 0.14232254028320312, 0.14727210998535156, 0.1522216796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 19.0, 27.0, 43.0, 54.0, 90.0, 127.0, 210.0, 405.0, 1498.0, 52023.0, 4131180.0, 7771.0, 619.0, 138.0, 44.0, 15.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.546875, -14.26873779296875, -13.9906005859375, -13.71246337890625, -13.434326171875, -13.15618896484375, -12.8780517578125, -12.59991455078125, -12.32177734375, -12.04364013671875, -11.7655029296875, -11.48736572265625, -11.209228515625, -10.93109130859375, -10.6529541015625, -10.37481689453125, -10.0966796875, -9.81854248046875, -9.5404052734375, -9.26226806640625, -8.984130859375, -8.70599365234375, -8.4278564453125, -8.14971923828125, -7.87158203125, -7.59344482421875, -7.3153076171875, -7.03717041015625, -6.759033203125, -6.48089599609375, -6.2027587890625, -5.92462158203125, -5.646484375, -5.36834716796875, -5.0902099609375, -4.81207275390625, -4.533935546875, -4.25579833984375, -3.9776611328125, -3.69952392578125, -3.42138671875, -3.14324951171875, -2.8651123046875, -2.58697509765625, -2.308837890625, -2.03070068359375, -1.7525634765625, -1.47442626953125, -1.1962890625, -0.91815185546875, -0.6400146484375, -0.36187744140625, -0.083740234375, 0.19439697265625, 0.4725341796875, 0.75067138671875, 1.02880859375, 1.30694580078125, 1.5850830078125, 1.86322021484375, 2.141357421875, 2.41949462890625, 2.6976318359375, 2.97576904296875, 3.25390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 5.0, 9.0, 12.0, 19.0, 25.0, 42.0, 69.0, 114.0, 269.0, 586.0, 1502.0, 896.0, 227.0, 89.0, 48.0, 31.0, 27.0, 15.0, 20.0, 17.0, 14.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25, -0.24102783203125, -0.2320556640625, -0.22308349609375, -0.214111328125, -0.20513916015625, -0.1961669921875, -0.18719482421875, -0.17822265625, -0.16925048828125, -0.1602783203125, -0.15130615234375, -0.142333984375, -0.13336181640625, -0.1243896484375, -0.11541748046875, -0.1064453125, -0.09747314453125, -0.0885009765625, -0.07952880859375, -0.070556640625, -0.06158447265625, -0.0526123046875, -0.04364013671875, -0.03466796875, -0.02569580078125, -0.0167236328125, -0.00775146484375, 0.001220703125, 0.01019287109375, 0.0191650390625, 0.02813720703125, 0.037109375, 0.04608154296875, 0.0550537109375, 0.06402587890625, 0.072998046875, 0.08197021484375, 0.0909423828125, 0.09991455078125, 0.10888671875, 0.11785888671875, 0.1268310546875, 0.13580322265625, 0.144775390625, 0.15374755859375, 0.1627197265625, 0.17169189453125, 0.1806640625, 0.18963623046875, 0.1986083984375, 0.20758056640625, 0.216552734375, 0.22552490234375, 0.2344970703125, 0.24346923828125, 0.25244140625, 0.26141357421875, 0.2703857421875, 0.27935791015625, 0.288330078125, 0.29730224609375, 0.3062744140625, 0.31524658203125, 0.32421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 12.0, 64.0, 911.0, 26.0, 5.0], "bins": [-70.32695770263672, -69.18630981445312, -68.045654296875, -66.9050064086914, -65.76435852050781, -64.62370300292969, -63.483055114746094, -62.342403411865234, -61.201751708984375, -60.061100006103516, -58.92045211791992, -57.77980041503906, -56.6391487121582, -55.498497009277344, -54.35784912109375, -53.21719741821289, -52.07654571533203, -50.93589401245117, -49.79524612426758, -48.65459442138672, -47.51394271850586, -46.373291015625, -45.232643127441406, -44.09199142456055, -42.95134353637695, -41.810691833496094, -40.6700439453125, -39.52939224243164, -38.38874053955078, -37.24808883666992, -36.10744094848633, -34.96678924560547, -33.826133728027344, -32.685482025146484, -31.544832229614258, -30.40418243408203, -29.263530731201172, -28.122880935668945, -26.98223114013672, -25.84157943725586, -24.700929641723633, -23.560279846191406, -22.419628143310547, -21.27897834777832, -20.13832664489746, -18.997676849365234, -17.857025146484375, -16.71637535095215, -15.575724601745605, -14.435073852539062, -13.29442310333252, -12.153772354125977, -11.01312255859375, -9.87247085571289, -8.731821060180664, -7.591170310974121, -6.450519561767578, -5.309868812561035, -4.169218063354492, -3.0285677909851074, -1.8879170417785645, -0.7472662925720215, 0.3933839797973633, 1.5340347290039062, 2.67468523979187]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 9.0, 7.0, 24.0, 39.0, 54.0, 83.0, 87.0, 127.0, 128.0, 116.0, 109.0, 74.0, 56.0, 30.0, 20.0, 14.0, 14.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.321140289306641, -7.164836883544922, -7.008533477783203, -6.852229595184326, -6.695926189422607, -6.539622783660889, -6.383318901062012, -6.227015495300293, -6.070712089538574, -5.9144086837768555, -5.758105278015137, -5.60180139541626, -5.445497989654541, -5.289194583892822, -5.132890701293945, -4.976587295532227, -4.820283889770508, -4.663980484008789, -4.50767707824707, -4.351373195648193, -4.195069789886475, -4.038766384124756, -3.882462739944458, -3.72615909576416, -3.5698556900024414, -3.4135522842407227, -3.257248640060425, -3.100944995880127, -2.944641590118408, -2.7883381843566895, -2.6320345401763916, -2.4757308959960938, -2.319427490234375, -2.1631240844726562, -2.0068204402923584, -1.85051691532135, -1.6942133903503418, -1.5379098653793335, -1.3816063404083252, -1.225302815437317, -1.0689992904663086, -0.9126957654953003, -0.756392240524292, -0.6000887155532837, -0.4437851905822754, -0.2874816656112671, -0.1311781406402588, 0.02512538433074951, 0.1814289093017578, 0.3377324342727661, 0.4940359592437744, 0.6503394842147827, 0.806643009185791, 0.9629465341567993, 1.1192500591278076, 1.275553584098816, 1.4318571090698242, 1.5881606340408325, 1.7444641590118408, 1.9007676839828491, 2.0570712089538574, 2.213374614715576, 2.369678258895874, 2.525981903076172, 2.6822853088378906]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 8.0, 9.0, 23.0, 11.0, 24.0, 21.0, 30.0, 38.0, 54.0, 83.0, 180.0, 600.0, 3403.0, 34635.0, 878186.0, 122119.0, 7463.0, 1051.0, 243.0, 96.0, 58.0, 36.0, 37.0, 34.0, 23.0, 21.0, 18.0, 8.0, 9.0, 3.0, 7.0, 7.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.375, -3.2777099609375, -3.180419921875, -3.0831298828125, -2.98583984375, -2.8885498046875, -2.791259765625, -2.6939697265625, -2.5966796875, -2.4993896484375, -2.402099609375, -2.3048095703125, -2.20751953125, -2.1102294921875, -2.012939453125, -1.9156494140625, -1.818359375, -1.7210693359375, -1.623779296875, -1.5264892578125, -1.42919921875, -1.3319091796875, -1.234619140625, -1.1373291015625, -1.0400390625, -0.9427490234375, -0.845458984375, -0.7481689453125, -0.65087890625, -0.5535888671875, -0.456298828125, -0.3590087890625, -0.26171875, -0.1644287109375, -0.067138671875, 0.0301513671875, 0.12744140625, 0.2247314453125, 0.322021484375, 0.4193115234375, 0.5166015625, 0.6138916015625, 0.711181640625, 0.8084716796875, 0.90576171875, 1.0030517578125, 1.100341796875, 1.1976318359375, 1.294921875, 1.3922119140625, 1.489501953125, 1.5867919921875, 1.68408203125, 1.7813720703125, 1.878662109375, 1.9759521484375, 2.0732421875, 2.1705322265625, 2.267822265625, 2.3651123046875, 2.46240234375, 2.5596923828125, 2.656982421875, 2.7542724609375, 2.8515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 8.0, 6.0, 12.0, 40.0, 73.0, 122.0, 198.0, 233.0, 170.0, 74.0, 32.0, 23.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.451416015625, -0.4429044723510742, -0.43439292907714844, -0.42588138580322266, -0.4173698425292969, -0.4088582992553711, -0.4003467559814453, -0.39183521270751953, -0.38332366943359375, -0.37481212615966797, -0.3663005828857422, -0.3577890396118164, -0.3492774963378906, -0.34076595306396484, -0.33225440979003906, -0.3237428665161133, -0.3152313232421875, -0.3067197799682617, -0.29820823669433594, -0.28969669342041016, -0.2811851501464844, -0.2726736068725586, -0.2641620635986328, -0.25565052032470703, -0.24713897705078125, -0.23862743377685547, -0.2301158905029297, -0.2216043472290039, -0.21309280395507812, -0.20458126068115234, -0.19606971740722656, -0.18755817413330078, -0.179046630859375, -0.17053508758544922, -0.16202354431152344, -0.15351200103759766, -0.14500045776367188, -0.1364889144897461, -0.1279773712158203, -0.11946582794189453, -0.11095428466796875, -0.10244274139404297, -0.09393119812011719, -0.0854196548461914, -0.07690811157226562, -0.06839656829833984, -0.05988502502441406, -0.05137348175048828, -0.0428619384765625, -0.03435039520263672, -0.025838851928710938, -0.017327308654785156, -0.008815765380859375, -0.00030422210693359375, 0.008207321166992188, 0.01671886444091797, 0.02523040771484375, 0.03374195098876953, 0.04225349426269531, 0.050765037536621094, 0.059276580810546875, 0.06778812408447266, 0.07629966735839844, 0.08481121063232422, 0.09332275390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 7.0, 6.0, 11.0, 15.0, 31.0, 35.0, 67.0, 112.0, 250.0, 580.0, 1564.0, 5066.0, 18994.0, 91692.0, 594034.0, 278195.0, 42973.0, 10093.0, 2979.0, 1044.0, 420.0, 168.0, 95.0, 41.0, 19.0, 18.0, 11.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2529296875, -1.2108612060546875, -1.168792724609375, -1.1267242431640625, -1.08465576171875, -1.0425872802734375, -1.000518798828125, -0.9584503173828125, -0.9163818359375, -0.8743133544921875, -0.832244873046875, -0.7901763916015625, -0.74810791015625, -0.7060394287109375, -0.663970947265625, -0.6219024658203125, -0.579833984375, -0.5377655029296875, -0.495697021484375, -0.4536285400390625, -0.41156005859375, -0.3694915771484375, -0.327423095703125, -0.2853546142578125, -0.2432861328125, -0.2012176513671875, -0.159149169921875, -0.1170806884765625, -0.07501220703125, -0.0329437255859375, 0.009124755859375, 0.0511932373046875, 0.09326171875, 0.1353302001953125, 0.177398681640625, 0.2194671630859375, 0.26153564453125, 0.3036041259765625, 0.345672607421875, 0.3877410888671875, 0.4298095703125, 0.4718780517578125, 0.513946533203125, 0.5560150146484375, 0.59808349609375, 0.6401519775390625, 0.682220458984375, 0.7242889404296875, 0.766357421875, 0.8084259033203125, 0.850494384765625, 0.8925628662109375, 0.93463134765625, 0.9766998291015625, 1.018768310546875, 1.0608367919921875, 1.1029052734375, 1.1449737548828125, 1.187042236328125, 1.2291107177734375, 1.27117919921875, 1.3132476806640625, 1.355316162109375, 1.3973846435546875, 1.439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 2.0, 9.0, 6.0, 7.0, 13.0, 18.0, 12.0, 20.0, 25.0, 28.0, 21.0, 22.0, 30.0, 23.0, 29.0, 39.0, 41.0, 40.0, 40.0, 38.0, 40.0, 44.0, 35.0, 39.0, 42.0, 40.0, 26.0, 35.0, 33.0, 21.0, 28.0, 26.0, 17.0, 17.0, 22.0, 10.0, 11.0, 6.0, 11.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.385986328125, -0.3734169006347656, -0.36084747314453125, -0.3482780456542969, -0.3357086181640625, -0.3231391906738281, -0.31056976318359375, -0.2980003356933594, -0.285430908203125, -0.2728614807128906, -0.26029205322265625, -0.24772262573242188, -0.2351531982421875, -0.22258377075195312, -0.21001434326171875, -0.19744491577148438, -0.18487548828125, -0.17230606079101562, -0.15973663330078125, -0.14716720581054688, -0.1345977783203125, -0.12202835083007812, -0.10945892333984375, -0.09688949584960938, -0.084320068359375, -0.07175064086914062, -0.05918121337890625, -0.046611785888671875, -0.0340423583984375, -0.021472930908203125, -0.00890350341796875, 0.003665924072265625, 0.0162353515625, 0.028804779052734375, 0.04137420654296875, 0.053943634033203125, 0.0665130615234375, 0.07908248901367188, 0.09165191650390625, 0.10422134399414062, 0.116790771484375, 0.12936019897460938, 0.14192962646484375, 0.15449905395507812, 0.1670684814453125, 0.17963790893554688, 0.19220733642578125, 0.20477676391601562, 0.21734619140625, 0.22991561889648438, 0.24248504638671875, 0.2550544738769531, 0.2676239013671875, 0.2801933288574219, 0.29276275634765625, 0.3053321838378906, 0.317901611328125, 0.3304710388183594, 0.34304046630859375, 0.3556098937988281, 0.3681793212890625, 0.3807487487792969, 0.39331817626953125, 0.4058876037597656, 0.41845703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 8.0, 6.0, 4.0, 10.0, 12.0, 22.0, 23.0, 24.0, 62.0, 91.0, 166.0, 288.0, 529.0, 1107.0, 2810.0, 10186.0, 125511.0, 879993.0, 20091.0, 4253.0, 1622.0, 703.0, 394.0, 239.0, 128.0, 82.0, 58.0, 38.0, 25.0, 13.0, 16.0, 12.0, 2.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.5, -6.33416748046875, -6.1683349609375, -6.00250244140625, -5.836669921875, -5.67083740234375, -5.5050048828125, -5.33917236328125, -5.17333984375, -5.00750732421875, -4.8416748046875, -4.67584228515625, -4.510009765625, -4.34417724609375, -4.1783447265625, -4.01251220703125, -3.8466796875, -3.68084716796875, -3.5150146484375, -3.34918212890625, -3.183349609375, -3.01751708984375, -2.8516845703125, -2.68585205078125, -2.52001953125, -2.35418701171875, -2.1883544921875, -2.02252197265625, -1.856689453125, -1.69085693359375, -1.5250244140625, -1.35919189453125, -1.193359375, -1.02752685546875, -0.8616943359375, -0.69586181640625, -0.530029296875, -0.36419677734375, -0.1983642578125, -0.03253173828125, 0.13330078125, 0.29913330078125, 0.4649658203125, 0.63079833984375, 0.796630859375, 0.96246337890625, 1.1282958984375, 1.29412841796875, 1.4599609375, 1.62579345703125, 1.7916259765625, 1.95745849609375, 2.123291015625, 2.28912353515625, 2.4549560546875, 2.62078857421875, 2.78662109375, 2.95245361328125, 3.1182861328125, 3.28411865234375, 3.449951171875, 3.61578369140625, 3.7816162109375, 3.94744873046875, 4.11328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0, 5.0, 6.0, 5.0, 12.0, 12.0, 31.0, 37.0, 65.0, 86.0, 166.0, 223.0, 133.0, 62.0, 36.0, 28.0, 24.0, 9.0, 12.0, 10.0, 4.0, 11.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006322860717773438, -0.0006138309836387634, -0.0005953758955001831, -0.0005769208073616028, -0.0005584657192230225, -0.0005400106310844421, -0.0005215555429458618, -0.0005031004548072815, -0.00048464536666870117, -0.00046619027853012085, -0.00044773519039154053, -0.0004292801022529602, -0.0004108250141143799, -0.00039236992597579956, -0.00037391483783721924, -0.0003554597496986389, -0.0003370046615600586, -0.00031854957342147827, -0.00030009448528289795, -0.0002816393971443176, -0.0002631843090057373, -0.000244729220867157, -0.00022627413272857666, -0.00020781904458999634, -0.00018936395645141602, -0.0001709088683128357, -0.00015245378017425537, -0.00013399869203567505, -0.00011554360389709473, -9.70885157585144e-05, -7.863342761993408e-05, -6.017833948135376e-05, -4.172325134277344e-05, -2.3268163204193115e-05, -4.813075065612793e-06, 1.364201307296753e-05, 3.209710121154785e-05, 5.0552189350128174e-05, 6.90072774887085e-05, 8.746236562728882e-05, 0.00010591745376586914, 0.00012437254190444946, 0.00014282763004302979, 0.0001612827181816101, 0.00017973780632019043, 0.00019819289445877075, 0.00021664798259735107, 0.0002351030707359314, 0.0002535581588745117, 0.00027201324701309204, 0.00029046833515167236, 0.0003089234232902527, 0.000327378511428833, 0.00034583359956741333, 0.00036428868770599365, 0.000382743775844574, 0.0004011988639831543, 0.0004196539521217346, 0.00043810904026031494, 0.00045656412839889526, 0.0004750192165374756, 0.0004934743046760559, 0.0005119293928146362, 0.0005303844809532166, 0.0005488395690917969]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 8.0, 8.0, 15.0, 16.0, 27.0, 49.0, 85.0, 176.0, 337.0, 822.0, 2122.0, 6915.0, 33008.0, 810810.0, 170826.0, 16253.0, 4365.0, 1460.0, 615.0, 269.0, 114.0, 86.0, 51.0, 46.0, 21.0, 12.0, 8.0, 4.0, 6.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.135772705078125, -3.00396728515625, -2.872161865234375, -2.7403564453125, -2.608551025390625, -2.47674560546875, -2.344940185546875, -2.213134765625, -2.081329345703125, -1.94952392578125, -1.817718505859375, -1.6859130859375, -1.554107666015625, -1.42230224609375, -1.290496826171875, -1.15869140625, -1.026885986328125, -0.89508056640625, -0.763275146484375, -0.6314697265625, -0.499664306640625, -0.36785888671875, -0.236053466796875, -0.104248046875, 0.027557373046875, 0.15936279296875, 0.291168212890625, 0.4229736328125, 0.554779052734375, 0.68658447265625, 0.818389892578125, 0.9501953125, 1.082000732421875, 1.21380615234375, 1.345611572265625, 1.4774169921875, 1.609222412109375, 1.74102783203125, 1.872833251953125, 2.004638671875, 2.136444091796875, 2.26824951171875, 2.400054931640625, 2.5318603515625, 2.663665771484375, 2.79547119140625, 2.927276611328125, 3.05908203125, 3.190887451171875, 3.32269287109375, 3.454498291015625, 3.5863037109375, 3.718109130859375, 3.84991455078125, 3.981719970703125, 4.113525390625, 4.245330810546875, 4.37713623046875, 4.508941650390625, 4.6407470703125, 4.772552490234375, 4.90435791015625, 5.036163330078125, 5.16796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 2.0, 10.0, 14.0, 23.0, 30.0, 47.0, 83.0, 168.0, 226.0, 152.0, 87.0, 48.0, 34.0, 23.0, 16.0, 11.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5732421875, -1.5060272216796875, -1.438812255859375, -1.3715972900390625, -1.30438232421875, -1.2371673583984375, -1.169952392578125, -1.1027374267578125, -1.0355224609375, -0.9683074951171875, -0.901092529296875, -0.8338775634765625, -0.76666259765625, -0.6994476318359375, -0.632232666015625, -0.5650177001953125, -0.497802734375, -0.4305877685546875, -0.363372802734375, -0.2961578369140625, -0.22894287109375, -0.1617279052734375, -0.094512939453125, -0.0272979736328125, 0.0399169921875, 0.1071319580078125, 0.174346923828125, 0.2415618896484375, 0.30877685546875, 0.3759918212890625, 0.443206787109375, 0.5104217529296875, 0.57763671875, 0.6448516845703125, 0.712066650390625, 0.7792816162109375, 0.84649658203125, 0.9137115478515625, 0.980926513671875, 1.0481414794921875, 1.1153564453125, 1.1825714111328125, 1.249786376953125, 1.3170013427734375, 1.38421630859375, 1.4514312744140625, 1.518646240234375, 1.5858612060546875, 1.653076171875, 1.7202911376953125, 1.787506103515625, 1.8547210693359375, 1.92193603515625, 1.9891510009765625, 2.056365966796875, 2.1235809326171875, 2.1907958984375, 2.2580108642578125, 2.325225830078125, 2.3924407958984375, 2.45965576171875, 2.5268707275390625, 2.594085693359375, 2.6613006591796875, 2.728515625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 11.0, 29.0, 64.0, 133.0, 261.0, 227.0, 131.0, 57.0, 36.0, 19.0, 15.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015359878540039, -7.662660598754883, -7.309961318969727, -6.95726203918457, -6.604562759399414, -6.251863479614258, -5.899164199829102, -5.546464920043945, -5.193765640258789, -4.841066360473633, -4.488367080688477, -4.13566780090332, -3.782968521118164, -3.430269241333008, -3.0775701999664307, -2.7248709201812744, -2.3721718788146973, -2.019472599029541, -1.6667733192443848, -1.314074158668518, -0.9613748788833618, -0.6086755990982056, -0.25597643852233887, 0.09672284126281738, 0.44942212104797363, 0.8021214008331299, 1.1548206806182861, 1.5075198411941528, 1.860219120979309, 2.212918281555176, 2.565617561340332, 2.9183168411254883, 3.2710161209106445, 3.623715400695801, 3.976414680480957, 4.329113960266113, 4.6818132400512695, 5.034512519836426, 5.387211799621582, 5.739911079406738, 6.0926103591918945, 6.445309638977051, 6.798008918762207, 7.150708198547363, 7.5034074783325195, 7.856106758117676, 8.208806037902832, 8.561505317687988, 8.914203643798828, 9.266902923583984, 9.61960220336914, 9.972301483154297, 10.325000762939453, 10.67770004272461, 11.030399322509766, 11.383098602294922, 11.735797882080078, 12.088497161865234, 12.44119644165039, 12.793895721435547, 13.146595001220703, 13.49929428100586, 13.851993560791016, 14.204692840576172, 14.557392120361328]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 12.0, 9.0, 14.0, 22.0, 27.0, 39.0, 52.0, 65.0, 91.0, 106.0, 109.0, 108.0, 94.0, 78.0, 51.0, 47.0, 26.0, 18.0, 22.0, 6.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.437831878662109, -4.1784749031066895, -3.9191179275512695, -3.6597609519958496, -3.4004039764404297, -3.1410470008850098, -2.88169002532959, -2.62233304977417, -2.36297607421875, -2.10361909866333, -1.8442621231079102, -1.5849051475524902, -1.3255481719970703, -1.0661911964416504, -0.8068342208862305, -0.5474772453308105, -0.2881202697753906, -0.028763294219970703, 0.23059368133544922, 0.48995065689086914, 0.7493076324462891, 1.008664608001709, 1.268021583557129, 1.5273785591125488, 1.7867355346679688, 2.0460925102233887, 2.3054494857788086, 2.5648064613342285, 2.8241634368896484, 3.0835204124450684, 3.3428773880004883, 3.602234363555908, 3.8615903854370117, 4.120947360992432, 4.380304336547852, 4.6396613121032715, 4.899018287658691, 5.158375263214111, 5.417732238769531, 5.677089214324951, 5.936446189880371, 6.195803165435791, 6.455160140991211, 6.714517116546631, 6.973874092102051, 7.233231067657471, 7.492588043212891, 7.7519450187683105, 8.01130199432373, 8.270658493041992, 8.53001594543457, 8.789373397827148, 9.04872989654541, 9.308086395263672, 9.56744384765625, 9.826801300048828, 10.08615779876709, 10.345514297485352, 10.60487174987793, 10.864229202270508, 11.12358570098877, 11.382942199707031, 11.64229965209961, 11.901657104492188, 12.16101360321045]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 5.0, 7.0, 7.0, 16.0, 9.0, 9.0, 20.0, 9.0, 42.0, 74.0, 349.0, 4069.0, 4100126.0, 87727.0, 1425.0, 191.0, 47.0, 20.0, 20.0, 12.0, 20.0, 9.0, 13.0, 6.0, 2.0, 7.0, 8.0, 6.0, 3.0, 8.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.0546875, -13.6265869140625, -13.198486328125, -12.7703857421875, -12.34228515625, -11.9141845703125, -11.486083984375, -11.0579833984375, -10.6298828125, -10.2017822265625, -9.773681640625, -9.3455810546875, -8.91748046875, -8.4893798828125, -8.061279296875, -7.6331787109375, -7.205078125, -6.7769775390625, -6.348876953125, -5.9207763671875, -5.49267578125, -5.0645751953125, -4.636474609375, -4.2083740234375, -3.7802734375, -3.3521728515625, -2.924072265625, -2.4959716796875, -2.06787109375, -1.6397705078125, -1.211669921875, -0.7835693359375, -0.35546875, 0.0726318359375, 0.500732421875, 0.9288330078125, 1.35693359375, 1.7850341796875, 2.213134765625, 2.6412353515625, 3.0693359375, 3.4974365234375, 3.925537109375, 4.3536376953125, 4.78173828125, 5.2098388671875, 5.637939453125, 6.0660400390625, 6.494140625, 6.9222412109375, 7.350341796875, 7.7784423828125, 8.20654296875, 8.6346435546875, 9.062744140625, 9.4908447265625, 9.9189453125, 10.3470458984375, 10.775146484375, 11.2032470703125, 11.63134765625, 12.0594482421875, 12.487548828125, 12.9156494140625, 13.34375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 10.0, 4.0, 6.0, 10.0, 9.0, 19.0, 19.0, 21.0, 17.0, 23.0, 32.0, 31.0, 41.0, 47.0, 50.0, 52.0, 57.0, 52.0, 56.0, 54.0, 43.0, 52.0, 37.0, 40.0, 30.0, 35.0, 26.0, 24.0, 22.0, 13.0, 10.0, 8.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0797119140625, -0.07734107971191406, -0.07497024536132812, -0.07259941101074219, -0.07022857666015625, -0.06785774230957031, -0.06548690795898438, -0.06311607360839844, -0.0607452392578125, -0.05837440490722656, -0.056003570556640625, -0.05363273620605469, -0.05126190185546875, -0.04889106750488281, -0.046520233154296875, -0.04414939880371094, -0.041778564453125, -0.03940773010253906, -0.037036895751953125, -0.03466606140136719, -0.03229522705078125, -0.029924392700195312, -0.027553558349609375, -0.025182723999023438, -0.0228118896484375, -0.020441055297851562, -0.018070220947265625, -0.015699386596679688, -0.01332855224609375, -0.010957717895507812, -0.008586883544921875, -0.0062160491943359375, -0.00384521484375, -0.0014743804931640625, 0.000896453857421875, 0.0032672882080078125, 0.00563812255859375, 0.008008956909179688, 0.010379791259765625, 0.012750625610351562, 0.0151214599609375, 0.017492294311523438, 0.019863128662109375, 0.022233963012695312, 0.02460479736328125, 0.026975631713867188, 0.029346466064453125, 0.03171730041503906, 0.034088134765625, 0.03645896911621094, 0.038829803466796875, 0.04120063781738281, 0.04357147216796875, 0.04594230651855469, 0.048313140869140625, 0.05068397521972656, 0.0530548095703125, 0.05542564392089844, 0.057796478271484375, 0.06016731262207031, 0.06253814697265625, 0.06490898132324219, 0.06727981567382812, 0.06965065002441406, 0.072021484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 6.0, 14.0, 32.0, 46.0, 170.0, 25568.0, 4167964.0, 364.0, 85.0, 31.0, 12.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.28125, -7.4658203125, -6.650390625, -5.8349609375, -5.01953125, -4.2041015625, -3.388671875, -2.5732421875, -1.7578125, -0.9423828125, -0.126953125, 0.6884765625, 1.50390625, 2.3193359375, 3.134765625, 3.9501953125, 4.765625, 5.5810546875, 6.396484375, 7.2119140625, 8.02734375, 8.8427734375, 9.658203125, 10.4736328125, 11.2890625, 12.1044921875, 12.919921875, 13.7353515625, 14.55078125, 15.3662109375, 16.181640625, 16.9970703125, 17.8125, 18.6279296875, 19.443359375, 20.2587890625, 21.07421875, 21.8896484375, 22.705078125, 23.5205078125, 24.3359375, 25.1513671875, 25.966796875, 26.7822265625, 27.59765625, 28.4130859375, 29.228515625, 30.0439453125, 30.859375, 31.6748046875, 32.490234375, 33.3056640625, 34.12109375, 34.9365234375, 35.751953125, 36.5673828125, 37.3828125, 38.1982421875, 39.013671875, 39.8291015625, 40.64453125, 41.4599609375, 42.275390625, 43.0908203125, 43.90625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 2.0, 10.0, 21.0, 20.0, 16.0, 44.0, 47.0, 90.0, 190.0, 411.0, 1420.0, 1048.0, 313.0, 143.0, 95.0, 56.0, 37.0, 32.0, 20.0, 13.0, 11.0, 9.0, 4.0, 7.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24488449096679688, -0.23464202880859375, -0.22439956665039062, -0.2141571044921875, -0.20391464233398438, -0.19367218017578125, -0.18342971801757812, -0.173187255859375, -0.16294479370117188, -0.15270233154296875, -0.14245986938476562, -0.1322174072265625, -0.12197494506835938, -0.11173248291015625, -0.10149002075195312, -0.09124755859375, -0.08100509643554688, -0.07076263427734375, -0.060520172119140625, -0.0502777099609375, -0.040035247802734375, -0.02979278564453125, -0.019550323486328125, -0.009307861328125, 0.000934600830078125, 0.01117706298828125, 0.021419525146484375, 0.0316619873046875, 0.041904449462890625, 0.05214691162109375, 0.062389373779296875, 0.0726318359375, 0.08287429809570312, 0.09311676025390625, 0.10335922241210938, 0.1136016845703125, 0.12384414672851562, 0.13408660888671875, 0.14432907104492188, 0.154571533203125, 0.16481399536132812, 0.17505645751953125, 0.18529891967773438, 0.1955413818359375, 0.20578384399414062, 0.21602630615234375, 0.22626876831054688, 0.23651123046875, 0.24675369262695312, 0.25699615478515625, 0.2672386169433594, 0.2774810791015625, 0.2877235412597656, 0.29796600341796875, 0.3082084655761719, 0.318450927734375, 0.3286933898925781, 0.33893585205078125, 0.3491783142089844, 0.3594207763671875, 0.3696632385253906, 0.37990570068359375, 0.3901481628417969, 0.400390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 5.0, 862.0, 154.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9658284187316895, -3.255408525466919, -1.5449886322021484, 0.16543149948120117, 1.8758511543273926, 3.586270809173584, 5.296691417694092, 7.007111072540283, 8.717531204223633, 10.427950859069824, 12.138370513916016, 13.848791122436523, 15.559210777282715, 17.269630432128906, 18.980051040649414, 20.690471649169922, 22.400890350341797, 24.111310958862305, 25.82172966003418, 27.532150268554688, 29.242568969726562, 30.95298957824707, 32.66341018676758, 34.37382888793945, 36.08424758911133, 37.7946662902832, 39.505088806152344, 41.21550750732422, 42.925926208496094, 44.63634490966797, 46.34676742553711, 48.057186126708984, 49.767608642578125, 51.47802734375, 53.18844985961914, 54.898868560791016, 56.60928726196289, 58.31970977783203, 60.030128479003906, 61.74054718017578, 63.450965881347656, 65.16138458251953, 66.8718032836914, 68.58222961425781, 70.29264831542969, 72.00306701660156, 73.71348571777344, 75.42390441894531, 77.13432312011719, 78.84474182128906, 80.55516052246094, 82.26557922363281, 83.97600555419922, 85.6864242553711, 87.39684295654297, 89.10726165771484, 90.81768798828125, 92.52810668945312, 94.238525390625, 95.94894409179688, 97.65937042236328, 99.36978912353516, 101.08020782470703, 102.7906265258789, 104.50104522705078]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 15.0, 29.0, 68.0, 117.0, 162.0, 184.0, 209.0, 111.0, 60.0, 33.0, 19.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3870370388031006, -2.258721113204956, -2.1304049491882324, -2.002089023590088, -1.8737730979919434, -1.7454570531845093, -1.6171410083770752, -1.4888250827789307, -1.3605090379714966, -1.2321929931640625, -1.103877067565918, -0.9755610227584839, -0.8472450375556946, -0.7189290523529053, -0.5906130075454712, -0.4622970223426819, -0.3339810371398926, -0.20566503703594208, -0.07734903693199158, 0.05096697807312012, 0.17928296327590942, 0.30759894847869873, 0.4359149932861328, 0.5642309784889221, 0.6925469636917114, 0.8208629488945007, 0.94917893409729, 1.0774949789047241, 1.2058110237121582, 1.3341269493103027, 1.4624429941177368, 1.590759038925171, 1.7190752029418945, 1.8473912477493286, 1.9757071733474731, 2.1040232181549072, 2.2323391437530518, 2.3606553077697754, 2.48897123336792, 2.6172871589660645, 2.745603084564209, 2.8739190101623535, 3.002235174179077, 3.1305510997772217, 3.258867025375366, 3.38718318939209, 3.5154991149902344, 3.643815040588379, 3.7721312046051025, 3.900447130203247, 4.028763294219971, 4.157079219818115, 4.28539514541626, 4.413711071014404, 4.542027473449707, 4.670343399047852, 4.798659324645996, 4.926975250244141, 5.055291175842285, 5.18360710144043, 5.311923503875732, 5.440239429473877, 5.5685553550720215, 5.696871280670166, 5.8251872062683105]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 7.0, 6.0, 3.0, 8.0, 19.0, 16.0, 24.0, 25.0, 28.0, 25.0, 52.0, 55.0, 55.0, 41.0, 63.0, 1206.0, 1041327.0, 5173.0, 64.0, 50.0, 45.0, 41.0, 47.0, 29.0, 23.0, 29.0, 25.0, 13.0, 14.0, 10.0, 7.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.8773193359375, -7.512451171875, -7.1475830078125, -6.78271484375, -6.4178466796875, -6.052978515625, -5.6881103515625, -5.3232421875, -4.9583740234375, -4.593505859375, -4.2286376953125, -3.86376953125, -3.4989013671875, -3.134033203125, -2.7691650390625, -2.404296875, -2.0394287109375, -1.674560546875, -1.3096923828125, -0.94482421875, -0.5799560546875, -0.215087890625, 0.1497802734375, 0.5146484375, 0.8795166015625, 1.244384765625, 1.6092529296875, 1.97412109375, 2.3389892578125, 2.703857421875, 3.0687255859375, 3.43359375, 3.7984619140625, 4.163330078125, 4.5281982421875, 4.89306640625, 5.2579345703125, 5.622802734375, 5.9876708984375, 6.3525390625, 6.7174072265625, 7.082275390625, 7.4471435546875, 7.81201171875, 8.1768798828125, 8.541748046875, 8.9066162109375, 9.271484375, 9.6363525390625, 10.001220703125, 10.3660888671875, 10.73095703125, 11.0958251953125, 11.460693359375, 11.8255615234375, 12.1904296875, 12.5552978515625, 12.920166015625, 13.2850341796875, 13.64990234375, 14.0147705078125, 14.379638671875, 14.7445068359375, 15.109375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 30.0, 124.0, 253.0, 327.0, 209.0, 63.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13720703125, -0.11553192138671875, -0.0938568115234375, -0.07218170166015625, -0.050506591796875, -0.02883148193359375, -0.0071563720703125, 0.01451873779296875, 0.03619384765625, 0.05786895751953125, 0.0795440673828125, 0.10121917724609375, 0.122894287109375, 0.14456939697265625, 0.1662445068359375, 0.18791961669921875, 0.2095947265625, 0.23126983642578125, 0.2529449462890625, 0.27462005615234375, 0.296295166015625, 0.31797027587890625, 0.3396453857421875, 0.36132049560546875, 0.38299560546875, 0.40467071533203125, 0.4263458251953125, 0.44802093505859375, 0.469696044921875, 0.49137115478515625, 0.5130462646484375, 0.5347213745117188, 0.556396484375, 0.5780715942382812, 0.5997467041015625, 0.6214218139648438, 0.643096923828125, 0.6647720336914062, 0.6864471435546875, 0.7081222534179688, 0.72979736328125, 0.7514724731445312, 0.7731475830078125, 0.7948226928710938, 0.816497802734375, 0.8381729125976562, 0.8598480224609375, 0.8815231323242188, 0.9031982421875, 0.9248733520507812, 0.9465484619140625, 0.9682235717773438, 0.989898681640625, 1.0115737915039062, 1.0332489013671875, 1.0549240112304688, 1.07659912109375, 1.0982742309570312, 1.1199493408203125, 1.1416244506835938, 1.163299560546875, 1.1849746704101562, 1.2066497802734375, 1.2283248901367188, 1.25]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 7.0, 7.0, 25.0, 21.0, 26.0, 63.0, 69.0, 126.0, 260.0, 504.0, 1356.0, 4680.0, 25804.0, 227652.0, 669614.0, 99928.0, 13624.0, 2933.0, 915.0, 378.0, 208.0, 114.0, 66.0, 40.0, 20.0, 23.0, 13.0, 14.0, 14.0, 9.0, 9.0, 2.0, 6.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4296875, -3.323577880859375, -3.21746826171875, -3.111358642578125, -3.0052490234375, -2.899139404296875, -2.79302978515625, -2.686920166015625, -2.580810546875, -2.474700927734375, -2.36859130859375, -2.262481689453125, -2.1563720703125, -2.050262451171875, -1.94415283203125, -1.838043212890625, -1.73193359375, -1.625823974609375, -1.51971435546875, -1.413604736328125, -1.3074951171875, -1.201385498046875, -1.09527587890625, -0.989166259765625, -0.883056640625, -0.776947021484375, -0.67083740234375, -0.564727783203125, -0.4586181640625, -0.352508544921875, -0.24639892578125, -0.140289306640625, -0.0341796875, 0.071929931640625, 0.17803955078125, 0.284149169921875, 0.3902587890625, 0.496368408203125, 0.60247802734375, 0.708587646484375, 0.814697265625, 0.920806884765625, 1.02691650390625, 1.133026123046875, 1.2391357421875, 1.345245361328125, 1.45135498046875, 1.557464599609375, 1.66357421875, 1.769683837890625, 1.87579345703125, 1.981903076171875, 2.0880126953125, 2.194122314453125, 2.30023193359375, 2.406341552734375, 2.512451171875, 2.618560791015625, 2.72467041015625, 2.830780029296875, 2.9368896484375, 3.042999267578125, 3.14910888671875, 3.255218505859375, 3.361328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 4.0, 3.0, 8.0, 7.0, 14.0, 22.0, 18.0, 22.0, 20.0, 34.0, 25.0, 30.0, 54.0, 41.0, 52.0, 53.0, 49.0, 51.0, 51.0, 47.0, 48.0, 49.0, 47.0, 43.0, 35.0, 35.0, 27.0, 20.0, 16.0, 13.0, 13.0, 8.0, 12.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.133148193359375, -1.09735107421875, -1.061553955078125, -1.0257568359375, -0.989959716796875, -0.95416259765625, -0.918365478515625, -0.882568359375, -0.846771240234375, -0.81097412109375, -0.775177001953125, -0.7393798828125, -0.703582763671875, -0.66778564453125, -0.631988525390625, -0.59619140625, -0.560394287109375, -0.52459716796875, -0.488800048828125, -0.4530029296875, -0.417205810546875, -0.38140869140625, -0.345611572265625, -0.309814453125, -0.274017333984375, -0.23822021484375, -0.202423095703125, -0.1666259765625, -0.130828857421875, -0.09503173828125, -0.059234619140625, -0.0234375, 0.012359619140625, 0.04815673828125, 0.083953857421875, 0.1197509765625, 0.155548095703125, 0.19134521484375, 0.227142333984375, 0.262939453125, 0.298736572265625, 0.33453369140625, 0.370330810546875, 0.4061279296875, 0.441925048828125, 0.47772216796875, 0.513519287109375, 0.54931640625, 0.585113525390625, 0.62091064453125, 0.656707763671875, 0.6925048828125, 0.728302001953125, 0.76409912109375, 0.799896240234375, 0.835693359375, 0.871490478515625, 0.90728759765625, 0.943084716796875, 0.9788818359375, 1.014678955078125, 1.05047607421875, 1.086273193359375, 1.1220703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 12.0, 11.0, 9.0, 21.0, 24.0, 33.0, 49.0, 92.0, 148.0, 310.0, 914.0, 3000.0, 14311.0, 170372.0, 778015.0, 69400.0, 8487.0, 2031.0, 653.0, 282.0, 144.0, 67.0, 36.0, 29.0, 20.0, 21.0, 8.0, 11.0, 10.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.4296875, -5.2716064453125, -5.113525390625, -4.9554443359375, -4.79736328125, -4.6392822265625, -4.481201171875, -4.3231201171875, -4.1650390625, -4.0069580078125, -3.848876953125, -3.6907958984375, -3.53271484375, -3.3746337890625, -3.216552734375, -3.0584716796875, -2.900390625, -2.7423095703125, -2.584228515625, -2.4261474609375, -2.26806640625, -2.1099853515625, -1.951904296875, -1.7938232421875, -1.6357421875, -1.4776611328125, -1.319580078125, -1.1614990234375, -1.00341796875, -0.8453369140625, -0.687255859375, -0.5291748046875, -0.37109375, -0.2130126953125, -0.054931640625, 0.1031494140625, 0.26123046875, 0.4193115234375, 0.577392578125, 0.7354736328125, 0.8935546875, 1.0516357421875, 1.209716796875, 1.3677978515625, 1.52587890625, 1.6839599609375, 1.842041015625, 2.0001220703125, 2.158203125, 2.3162841796875, 2.474365234375, 2.6324462890625, 2.79052734375, 2.9486083984375, 3.106689453125, 3.2647705078125, 3.4228515625, 3.5809326171875, 3.739013671875, 3.8970947265625, 4.05517578125, 4.2132568359375, 4.371337890625, 4.5294189453125, 4.6875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 11.0, 12.0, 14.0, 14.0, 32.0, 39.0, 47.0, 56.0, 76.0, 121.0, 121.0, 86.0, 90.0, 44.0, 41.0, 36.0, 28.0, 27.0, 17.0, 10.0, 11.0, 12.0, 3.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0004756450653076172, -0.0004621855914592743, -0.0004487261176109314, -0.0004352666437625885, -0.0004218071699142456, -0.0004083476960659027, -0.0003948882222175598, -0.0003814287483692169, -0.000367969274520874, -0.00035450980067253113, -0.00034105032682418823, -0.00032759085297584534, -0.00031413137912750244, -0.00030067190527915955, -0.00028721243143081665, -0.00027375295758247375, -0.00026029348373413086, -0.00024683400988578796, -0.00023337453603744507, -0.00021991506218910217, -0.00020645558834075928, -0.00019299611449241638, -0.00017953664064407349, -0.0001660771667957306, -0.0001526176929473877, -0.0001391582190990448, -0.0001256987452507019, -0.00011223927140235901, -9.877979755401611e-05, -8.532032370567322e-05, -7.186084985733032e-05, -5.840137600898743e-05, -4.494190216064453e-05, -3.1482428312301636e-05, -1.802295446395874e-05, -4.563480615615845e-06, 8.89599323272705e-06, 2.2355467081069946e-05, 3.581494092941284e-05, 4.927441477775574e-05, 6.273388862609863e-05, 7.619336247444153e-05, 8.965283632278442e-05, 0.00010311231017112732, 0.00011657178401947021, 0.0001300312578678131, 0.000143490731716156, 0.0001569502055644989, 0.0001704096794128418, 0.0001838691532611847, 0.0001973286271095276, 0.00021078810095787048, 0.00022424757480621338, 0.00023770704865455627, 0.00025116652250289917, 0.00026462599635124207, 0.00027808547019958496, 0.00029154494404792786, 0.00030500441789627075, 0.00031846389174461365, 0.00033192336559295654, 0.00034538283944129944, 0.00035884231328964233, 0.00037230178713798523, 0.0003857612609863281]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 11.0, 15.0, 18.0, 41.0, 35.0, 86.0, 130.0, 271.0, 659.0, 1833.0, 6844.0, 40326.0, 784787.0, 193897.0, 14473.0, 3224.0, 1059.0, 392.0, 184.0, 107.0, 56.0, 24.0, 15.0, 18.0, 5.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.587890625, -6.38671875, -6.185546875, -5.984375, -5.783203125, -5.58203125, -5.380859375, -5.1796875, -4.978515625, -4.77734375, -4.576171875, -4.375, -4.173828125, -3.97265625, -3.771484375, -3.5703125, -3.369140625, -3.16796875, -2.966796875, -2.765625, -2.564453125, -2.36328125, -2.162109375, -1.9609375, -1.759765625, -1.55859375, -1.357421875, -1.15625, -0.955078125, -0.75390625, -0.552734375, -0.3515625, -0.150390625, 0.05078125, 0.251953125, 0.453125, 0.654296875, 0.85546875, 1.056640625, 1.2578125, 1.458984375, 1.66015625, 1.861328125, 2.0625, 2.263671875, 2.46484375, 2.666015625, 2.8671875, 3.068359375, 3.26953125, 3.470703125, 3.671875, 3.873046875, 4.07421875, 4.275390625, 4.4765625, 4.677734375, 4.87890625, 5.080078125, 5.28125, 5.482421875, 5.68359375, 5.884765625, 6.0859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 2.0, 5.0, 6.0, 8.0, 9.0, 33.0, 46.0, 72.0, 120.0, 146.0, 148.0, 150.0, 87.0, 52.0, 35.0, 18.0, 13.0, 4.0, 5.0, 5.0, 4.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.848602294921875, -3.74798583984375, -3.647369384765625, -3.5467529296875, -3.446136474609375, -3.34552001953125, -3.244903564453125, -3.144287109375, -3.043670654296875, -2.94305419921875, -2.842437744140625, -2.7418212890625, -2.641204833984375, -2.54058837890625, -2.439971923828125, -2.33935546875, -2.238739013671875, -2.13812255859375, -2.037506103515625, -1.9368896484375, -1.836273193359375, -1.73565673828125, -1.635040283203125, -1.534423828125, -1.433807373046875, -1.33319091796875, -1.232574462890625, -1.1319580078125, -1.031341552734375, -0.93072509765625, -0.830108642578125, -0.7294921875, -0.628875732421875, -0.52825927734375, -0.427642822265625, -0.3270263671875, -0.226409912109375, -0.12579345703125, -0.025177001953125, 0.075439453125, 0.176055908203125, 0.27667236328125, 0.377288818359375, 0.4779052734375, 0.578521728515625, 0.67913818359375, 0.779754638671875, 0.88037109375, 0.980987548828125, 1.08160400390625, 1.182220458984375, 1.2828369140625, 1.383453369140625, 1.48406982421875, 1.584686279296875, 1.685302734375, 1.785919189453125, 1.88653564453125, 1.987152099609375, 2.0877685546875, 2.188385009765625, 2.28900146484375, 2.389617919921875, 2.490234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 7.0, 18.0, 982.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.80794143676758, -49.115779876708984, -40.423622131347656, -31.731460571289062, -23.03929901123047, -14.347137451171875, -5.654979705810547, 3.037181854248047, 11.72934341430664, 20.421504974365234, 29.113664627075195, 37.805824279785156, 46.49798583984375, 55.190147399902344, 63.88230514526367, 72.574462890625, 81.26663208007812, 89.95879364013672, 98.65095520019531, 107.34310913085938, 116.0352783203125, 124.72743225097656, 133.41958618164062, 142.11175537109375, 150.8039093017578, 159.49606323242188, 168.188232421875, 176.88038635253906, 185.5725555419922, 194.26470947265625, 202.95687866210938, 211.64903259277344, 220.34121704101562, 229.0333709716797, 237.7255401611328, 246.41769409179688, 255.10986328125, 263.8020324707031, 272.4941711425781, 281.18634033203125, 289.8785095214844, 298.5706787109375, 307.2628173828125, 315.9549865722656, 324.64715576171875, 333.3393249511719, 342.0314636230469, 350.7236328125, 359.415771484375, 368.1079406738281, 376.8000793457031, 385.49224853515625, 394.1844177246094, 402.8765869140625, 411.5687255859375, 420.2608947753906, 428.95306396484375, 437.6452331542969, 446.3373718261719, 455.029541015625, 463.7217102050781, 472.41387939453125, 481.10601806640625, 489.7981872558594, 498.4903564453125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 14.0, 32.0, 46.0, 97.0, 137.0, 156.0, 169.0, 144.0, 101.0, 63.0, 29.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.47555160522461, -12.563921928405762, -11.652291297912598, -10.74066162109375, -9.829030990600586, -8.917401313781738, -8.00577163696289, -7.094141483306885, -6.182511329650879, -5.270881175994873, -4.359251022338867, -3.4476213455200195, -2.5359911918640137, -1.6243610382080078, -0.7127313613891602, 0.1988987922668457, 1.1105289459228516, 2.0221590995788574, 2.933789014816284, 3.845418930053711, 4.757049083709717, 5.668679237365723, 6.58030891418457, 7.491939067840576, 8.403569221496582, 9.31519889831543, 10.226829528808594, 11.138459205627441, 12.050088882446289, 12.961719512939453, 13.8733491897583, 14.784978866577148, 15.696609497070312, 16.608240127563477, 17.519868850708008, 18.431499481201172, 19.343130111694336, 20.2547607421875, 21.16638946533203, 22.078020095825195, 22.98965072631836, 23.901281356811523, 24.812910079956055, 25.72454071044922, 26.636171340942383, 27.547801971435547, 28.459430694580078, 29.371061325073242, 30.282690048217773, 31.194320678710938, 32.10594940185547, 33.017578125, 33.9292106628418, 34.84083938598633, 35.752471923828125, 36.664100646972656, 37.57572937011719, 38.48735809326172, 39.398990631103516, 40.31061935424805, 41.22224807739258, 42.133880615234375, 43.045509338378906, 43.95713806152344, 44.868770599365234]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 4.0, 10.0, 9.0, 29.0, 47.0, 81.0, 145.0, 1149.0, 4172780.0, 19007.0, 586.0, 197.0, 112.0, 58.0, 33.0, 16.0, 13.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.0220947265625, -7.989501953125, -6.9569091796875, -5.92431640625, -4.8917236328125, -3.859130859375, -2.8265380859375, -1.7939453125, -0.7613525390625, 0.271240234375, 1.3038330078125, 2.33642578125, 3.3690185546875, 4.401611328125, 5.4342041015625, 6.466796875, 7.4993896484375, 8.531982421875, 9.5645751953125, 10.59716796875, 11.6297607421875, 12.662353515625, 13.6949462890625, 14.7275390625, 15.7601318359375, 16.792724609375, 17.8253173828125, 18.85791015625, 19.8905029296875, 20.923095703125, 21.9556884765625, 22.98828125, 24.0208740234375, 25.053466796875, 26.0860595703125, 27.11865234375, 28.1512451171875, 29.183837890625, 30.2164306640625, 31.2490234375, 32.2816162109375, 33.314208984375, 34.3468017578125, 35.37939453125, 36.4119873046875, 37.444580078125, 38.4771728515625, 39.509765625, 40.5423583984375, 41.574951171875, 42.6075439453125, 43.64013671875, 44.6727294921875, 45.705322265625, 46.7379150390625, 47.7705078125, 48.8031005859375, 49.835693359375, 50.8682861328125, 51.90087890625, 52.9334716796875, 53.966064453125, 54.9986572265625, 56.03125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 6.0, 6.0, 31.0, 81.0, 190.0, 289.0, 254.0, 118.0, 35.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2225341796875, -0.1893024444580078, -0.15607070922851562, -0.12283897399902344, -0.08960723876953125, -0.05637550354003906, -0.023143768310546875, 0.010087966918945312, 0.0433197021484375, 0.07655143737792969, 0.10978317260742188, 0.14301490783691406, 0.17624664306640625, 0.20947837829589844, 0.24271011352539062, 0.2759418487548828, 0.309173583984375, 0.3424053192138672, 0.3756370544433594, 0.40886878967285156, 0.44210052490234375, 0.47533226013183594, 0.5085639953613281, 0.5417957305908203, 0.5750274658203125, 0.6082592010498047, 0.6414909362792969, 0.6747226715087891, 0.7079544067382812, 0.7411861419677734, 0.7744178771972656, 0.8076496124267578, 0.84088134765625, 0.8741130828857422, 0.9073448181152344, 0.9405765533447266, 0.9738082885742188, 1.007040023803711, 1.0402717590332031, 1.0735034942626953, 1.1067352294921875, 1.1399669647216797, 1.1731986999511719, 1.206430435180664, 1.2396621704101562, 1.2728939056396484, 1.3061256408691406, 1.3393573760986328, 1.372589111328125, 1.4058208465576172, 1.4390525817871094, 1.4722843170166016, 1.5055160522460938, 1.538747787475586, 1.5719795227050781, 1.6052112579345703, 1.6384429931640625, 1.6716747283935547, 1.7049064636230469, 1.738138198852539, 1.7713699340820312, 1.8046016693115234, 1.8378334045410156, 1.8710651397705078, 1.904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 19.0, 59.0, 114.0, 230.0, 2209.0, 4190100.0, 976.0, 299.0, 170.0, 75.0, 28.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.5, -28.224609375, -25.94921875, -23.673828125, -21.3984375, -19.123046875, -16.84765625, -14.572265625, -12.296875, -10.021484375, -7.74609375, -5.470703125, -3.1953125, -0.919921875, 1.35546875, 3.630859375, 5.90625, 8.181640625, 10.45703125, 12.732421875, 15.0078125, 17.283203125, 19.55859375, 21.833984375, 24.109375, 26.384765625, 28.66015625, 30.935546875, 33.2109375, 35.486328125, 37.76171875, 40.037109375, 42.3125, 44.587890625, 46.86328125, 49.138671875, 51.4140625, 53.689453125, 55.96484375, 58.240234375, 60.515625, 62.791015625, 65.06640625, 67.341796875, 69.6171875, 71.892578125, 74.16796875, 76.443359375, 78.71875, 80.994140625, 83.26953125, 85.544921875, 87.8203125, 90.095703125, 92.37109375, 94.646484375, 96.921875, 99.197265625, 101.47265625, 103.748046875, 106.0234375, 108.298828125, 110.57421875, 112.849609375, 115.125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 12.0, 51.0, 1640.0, 2316.0, 55.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.20343017578125, -2.0201416015625, -1.83685302734375, -1.653564453125, -1.47027587890625, -1.2869873046875, -1.10369873046875, -0.92041015625, -0.73712158203125, -0.5538330078125, -0.37054443359375, -0.187255859375, -0.00396728515625, 0.1793212890625, 0.36260986328125, 0.5458984375, 0.72918701171875, 0.9124755859375, 1.09576416015625, 1.279052734375, 1.46234130859375, 1.6456298828125, 1.82891845703125, 2.01220703125, 2.19549560546875, 2.3787841796875, 2.56207275390625, 2.745361328125, 2.92864990234375, 3.1119384765625, 3.29522705078125, 3.478515625, 3.66180419921875, 3.8450927734375, 4.02838134765625, 4.211669921875, 4.39495849609375, 4.5782470703125, 4.76153564453125, 4.94482421875, 5.12811279296875, 5.3114013671875, 5.49468994140625, 5.677978515625, 5.86126708984375, 6.0445556640625, 6.22784423828125, 6.4111328125, 6.59442138671875, 6.7777099609375, 6.96099853515625, 7.144287109375, 7.32757568359375, 7.5108642578125, 7.69415283203125, 7.87744140625, 8.06072998046875, 8.2440185546875, 8.42730712890625, 8.610595703125, 8.79388427734375, 8.9771728515625, 9.16046142578125, 9.34375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 12.0, 591.0, 396.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.34315490722656, -90.70955657958984, -87.0759506225586, -83.44235229492188, -79.80874633789062, -76.1751480102539, -72.54154968261719, -68.90794372558594, -65.27434539794922, -61.640743255615234, -58.00714111328125, -54.37354278564453, -50.73994064331055, -47.10633850097656, -43.472740173339844, -39.83913803100586, -36.205535888671875, -32.57193374633789, -28.93833351135254, -25.304733276367188, -21.671131134033203, -18.03752899169922, -14.403928756713867, -10.770328521728516, -7.136726379394531, -3.5031251907348633, 0.1304759979248047, 3.7640771865844727, 7.397678375244141, 11.031280517578125, 14.664880752563477, 18.298480987548828, 21.932083129882812, 25.565685272216797, 29.19928550720215, 32.8328857421875, 36.466487884521484, 40.10009002685547, 43.73368835449219, 47.36729049682617, 51.000892639160156, 54.63449478149414, 58.268096923828125, 61.901695251464844, 65.53529357910156, 69.16889953613281, 72.80249786376953, 76.43609619140625, 80.0697021484375, 83.70330047607422, 87.33690643310547, 90.97050476074219, 94.60411071777344, 98.23770904541016, 101.87130737304688, 105.50491333007812, 109.13851165771484, 112.77210998535156, 116.40571594238281, 120.03931427001953, 123.67291259765625, 127.3065185546875, 130.94012451171875, 134.57371520996094, 138.2073211669922]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 17.0, 28.0, 53.0, 80.0, 112.0, 148.0, 148.0, 141.0, 119.0, 71.0, 34.0, 27.0, 10.0, 5.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.74961853027344, -32.71575927734375, -31.681903839111328, -30.648046493530273, -29.61418914794922, -28.580331802368164, -27.54647445678711, -26.512615203857422, -25.478759765625, -24.444902420043945, -23.41104507446289, -22.377187728881836, -21.34333038330078, -20.309473037719727, -19.275615692138672, -18.241756439208984, -17.20789909362793, -16.174041748046875, -15.14018440246582, -14.106327056884766, -13.072469711303711, -12.038612365722656, -11.004754066467285, -9.97089672088623, -8.937039375305176, -7.903182029724121, -6.869324684143066, -5.8354668617248535, -4.801609516143799, -3.767752170562744, -2.7338943481445312, -1.7000370025634766, -0.6661796569824219, 0.36767780780792236, 1.4015352725982666, 2.4353928565979004, 3.469250202178955, 4.50310754776001, 5.536965370178223, 6.570822715759277, 7.604680061340332, 8.638537406921387, 9.672394752502441, 10.706253051757812, 11.740110397338867, 12.773967742919922, 13.807825088500977, 14.841682434082031, 15.875539779663086, 16.90939712524414, 17.943254470825195, 18.97711181640625, 20.010969161987305, 21.04482650756836, 22.078685760498047, 23.11254119873047, 24.146400451660156, 25.18025779724121, 26.214115142822266, 27.24797248840332, 28.281829833984375, 29.31568717956543, 30.349544525146484, 31.383403778076172, 32.417259216308594]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 0.0, 6.0, 7.0, 13.0, 20.0, 18.0, 19.0, 34.0, 52.0, 70.0, 119.0, 225.0, 522.0, 1568.0, 8601.0, 253752.0, 762753.0, 17036.0, 2373.0, 664.0, 278.0, 134.0, 77.0, 56.0, 50.0, 23.0, 19.0, 11.0, 18.0, 6.0, 7.0, 7.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.9921875, -13.5823974609375, -13.172607421875, -12.7628173828125, -12.35302734375, -11.9432373046875, -11.533447265625, -11.1236572265625, -10.7138671875, -10.3040771484375, -9.894287109375, -9.4844970703125, -9.07470703125, -8.6649169921875, -8.255126953125, -7.8453369140625, -7.435546875, -7.0257568359375, -6.615966796875, -6.2061767578125, -5.79638671875, -5.3865966796875, -4.976806640625, -4.5670166015625, -4.1572265625, -3.7474365234375, -3.337646484375, -2.9278564453125, -2.51806640625, -2.1082763671875, -1.698486328125, -1.2886962890625, -0.87890625, -0.4691162109375, -0.059326171875, 0.3504638671875, 0.76025390625, 1.1700439453125, 1.579833984375, 1.9896240234375, 2.3994140625, 2.8092041015625, 3.218994140625, 3.6287841796875, 4.03857421875, 4.4483642578125, 4.858154296875, 5.2679443359375, 5.677734375, 6.0875244140625, 6.497314453125, 6.9071044921875, 7.31689453125, 7.7266845703125, 8.136474609375, 8.5462646484375, 8.9560546875, 9.3658447265625, 9.775634765625, 10.1854248046875, 10.59521484375, 11.0050048828125, 11.414794921875, 11.8245849609375, 12.234375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 27.0, 49.0, 65.0, 101.0, 110.0, 140.0, 131.0, 126.0, 100.0, 67.0, 26.0, 27.0, 11.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.0771026611328125, -1.028228759765625, -0.9793548583984375, -0.93048095703125, -0.8816070556640625, -0.832733154296875, -0.7838592529296875, -0.7349853515625, -0.6861114501953125, -0.637237548828125, -0.5883636474609375, -0.53948974609375, -0.4906158447265625, -0.441741943359375, -0.3928680419921875, -0.343994140625, -0.2951202392578125, -0.246246337890625, -0.1973724365234375, -0.14849853515625, -0.0996246337890625, -0.050750732421875, -0.0018768310546875, 0.0469970703125, 0.0958709716796875, 0.144744873046875, 0.1936187744140625, 0.24249267578125, 0.2913665771484375, 0.340240478515625, 0.3891143798828125, 0.43798828125, 0.4868621826171875, 0.535736083984375, 0.5846099853515625, 0.63348388671875, 0.6823577880859375, 0.731231689453125, 0.7801055908203125, 0.8289794921875, 0.8778533935546875, 0.926727294921875, 0.9756011962890625, 1.02447509765625, 1.0733489990234375, 1.122222900390625, 1.1710968017578125, 1.219970703125, 1.2688446044921875, 1.317718505859375, 1.3665924072265625, 1.41546630859375, 1.4643402099609375, 1.513214111328125, 1.5620880126953125, 1.6109619140625, 1.6598358154296875, 1.708709716796875, 1.7575836181640625, 1.80645751953125, 1.8553314208984375, 1.904205322265625, 1.9530792236328125, 2.001953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 4.0, 12.0, 5.0, 10.0, 13.0, 9.0, 14.0, 30.0, 42.0, 88.0, 153.0, 533.0, 3338.0, 75704.0, 933930.0, 31729.0, 2162.0, 423.0, 140.0, 64.0, 32.0, 24.0, 13.0, 16.0, 14.0, 13.0, 9.0, 3.0, 5.0, 2.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.140625, -10.8070068359375, -10.473388671875, -10.1397705078125, -9.80615234375, -9.4725341796875, -9.138916015625, -8.8052978515625, -8.4716796875, -8.1380615234375, -7.804443359375, -7.4708251953125, -7.13720703125, -6.8035888671875, -6.469970703125, -6.1363525390625, -5.802734375, -5.4691162109375, -5.135498046875, -4.8018798828125, -4.46826171875, -4.1346435546875, -3.801025390625, -3.4674072265625, -3.1337890625, -2.8001708984375, -2.466552734375, -2.1329345703125, -1.79931640625, -1.4656982421875, -1.132080078125, -0.7984619140625, -0.46484375, -0.1312255859375, 0.202392578125, 0.5360107421875, 0.86962890625, 1.2032470703125, 1.536865234375, 1.8704833984375, 2.2041015625, 2.5377197265625, 2.871337890625, 3.2049560546875, 3.53857421875, 3.8721923828125, 4.205810546875, 4.5394287109375, 4.873046875, 5.2066650390625, 5.540283203125, 5.8739013671875, 6.20751953125, 6.5411376953125, 6.874755859375, 7.2083740234375, 7.5419921875, 7.8756103515625, 8.209228515625, 8.5428466796875, 8.87646484375, 9.2100830078125, 9.543701171875, 9.8773193359375, 10.2109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 13.0, 18.0, 17.0, 17.0, 30.0, 32.0, 33.0, 42.0, 51.0, 70.0, 44.0, 69.0, 68.0, 56.0, 66.0, 60.0, 68.0, 48.0, 28.0, 34.0, 22.0, 26.0, 13.0, 10.0, 11.0, 10.0, 4.0, 6.0, 1.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-4.01953125, -3.907257080078125, -3.79498291015625, -3.682708740234375, -3.5704345703125, -3.458160400390625, -3.34588623046875, -3.233612060546875, -3.121337890625, -3.009063720703125, -2.89678955078125, -2.784515380859375, -2.6722412109375, -2.559967041015625, -2.44769287109375, -2.335418701171875, -2.22314453125, -2.110870361328125, -1.99859619140625, -1.886322021484375, -1.7740478515625, -1.661773681640625, -1.54949951171875, -1.437225341796875, -1.324951171875, -1.212677001953125, -1.10040283203125, -0.988128662109375, -0.8758544921875, -0.763580322265625, -0.65130615234375, -0.539031982421875, -0.4267578125, -0.314483642578125, -0.20220947265625, -0.089935302734375, 0.0223388671875, 0.134613037109375, 0.24688720703125, 0.359161376953125, 0.471435546875, 0.583709716796875, 0.69598388671875, 0.808258056640625, 0.9205322265625, 1.032806396484375, 1.14508056640625, 1.257354736328125, 1.36962890625, 1.481903076171875, 1.59417724609375, 1.706451416015625, 1.8187255859375, 1.930999755859375, 2.04327392578125, 2.155548095703125, 2.267822265625, 2.380096435546875, 2.49237060546875, 2.604644775390625, 2.7169189453125, 2.829193115234375, 2.94146728515625, 3.053741455078125, 3.166015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 5.0, 2.0, 8.0, 16.0, 12.0, 25.0, 36.0, 66.0, 99.0, 243.0, 477.0, 1438.0, 6175.0, 98703.0, 887463.0, 47421.0, 4371.0, 1137.0, 429.0, 197.0, 88.0, 54.0, 31.0, 22.0, 11.0, 5.0, 5.0, 8.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.0078125, -7.82330322265625, -7.6387939453125, -7.45428466796875, -7.269775390625, -7.08526611328125, -6.9007568359375, -6.71624755859375, -6.53173828125, -6.34722900390625, -6.1627197265625, -5.97821044921875, -5.793701171875, -5.60919189453125, -5.4246826171875, -5.24017333984375, -5.0556640625, -4.87115478515625, -4.6866455078125, -4.50213623046875, -4.317626953125, -4.13311767578125, -3.9486083984375, -3.76409912109375, -3.57958984375, -3.39508056640625, -3.2105712890625, -3.02606201171875, -2.841552734375, -2.65704345703125, -2.4725341796875, -2.28802490234375, -2.103515625, -1.91900634765625, -1.7344970703125, -1.54998779296875, -1.365478515625, -1.18096923828125, -0.9964599609375, -0.81195068359375, -0.62744140625, -0.44293212890625, -0.2584228515625, -0.07391357421875, 0.110595703125, 0.29510498046875, 0.4796142578125, 0.66412353515625, 0.8486328125, 1.03314208984375, 1.2176513671875, 1.40216064453125, 1.586669921875, 1.77117919921875, 1.9556884765625, 2.14019775390625, 2.32470703125, 2.50921630859375, 2.6937255859375, 2.87823486328125, 3.062744140625, 3.24725341796875, 3.4317626953125, 3.61627197265625, 3.80078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 9.0, 12.0, 13.0, 13.0, 17.0, 20.0, 30.0, 47.0, 27.0, 47.0, 52.0, 67.0, 61.0, 65.0, 51.0, 66.0, 64.0, 47.0, 51.0, 41.0, 32.0, 22.0, 17.0, 22.0, 13.0, 15.0, 8.0, 11.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00022935867309570312, -0.00022200867533683777, -0.0002146586775779724, -0.00020730867981910706, -0.0001999586820602417, -0.00019260868430137634, -0.00018525868654251099, -0.00017790868878364563, -0.00017055869102478027, -0.00016320869326591492, -0.00015585869550704956, -0.0001485086977481842, -0.00014115869998931885, -0.0001338087022304535, -0.00012645870447158813, -0.00011910870671272278, -0.00011175870895385742, -0.00010440871119499207, -9.705871343612671e-05, -8.970871567726135e-05, -8.2358717918396e-05, -7.500872015953064e-05, -6.765872240066528e-05, -6.030872464179993e-05, -5.295872688293457e-05, -4.5608729124069214e-05, -3.825873136520386e-05, -3.09087336063385e-05, -2.3558735847473145e-05, -1.6208738088607788e-05, -8.858740329742432e-06, -1.5087425708770752e-06, 5.841255187988281e-06, 1.3191252946853638e-05, 2.0541250705718994e-05, 2.789124846458435e-05, 3.524124622344971e-05, 4.2591243982315063e-05, 4.994124174118042e-05, 5.7291239500045776e-05, 6.464123725891113e-05, 7.199123501777649e-05, 7.934123277664185e-05, 8.66912305355072e-05, 9.404122829437256e-05, 0.00010139122605323792, 0.00010874122381210327, 0.00011609122157096863, 0.00012344121932983398, 0.00013079121708869934, 0.0001381412148475647, 0.00014549121260643005, 0.0001528412103652954, 0.00016019120812416077, 0.00016754120588302612, 0.00017489120364189148, 0.00018224120140075684, 0.0001895911991596222, 0.00019694119691848755, 0.0002042911946773529, 0.00021164119243621826, 0.00021899119019508362, 0.00022634118795394897, 0.00023369118571281433, 0.0002410411834716797]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 8.0, 15.0, 5.0, 15.0, 25.0, 57.0, 110.0, 297.0, 1147.0, 8511.0, 537031.0, 491897.0, 7938.0, 1035.0, 239.0, 97.0, 58.0, 28.0, 15.0, 8.0, 5.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.484375, -10.23468017578125, -9.9849853515625, -9.73529052734375, -9.485595703125, -9.23590087890625, -8.9862060546875, -8.73651123046875, -8.48681640625, -8.23712158203125, -7.9874267578125, -7.73773193359375, -7.488037109375, -7.23834228515625, -6.9886474609375, -6.73895263671875, -6.4892578125, -6.23956298828125, -5.9898681640625, -5.74017333984375, -5.490478515625, -5.24078369140625, -4.9910888671875, -4.74139404296875, -4.49169921875, -4.24200439453125, -3.9923095703125, -3.74261474609375, -3.492919921875, -3.24322509765625, -2.9935302734375, -2.74383544921875, -2.494140625, -2.24444580078125, -1.9947509765625, -1.74505615234375, -1.495361328125, -1.24566650390625, -0.9959716796875, -0.74627685546875, -0.49658203125, -0.24688720703125, 0.0028076171875, 0.25250244140625, 0.502197265625, 0.75189208984375, 1.0015869140625, 1.25128173828125, 1.5009765625, 1.75067138671875, 2.0003662109375, 2.25006103515625, 2.499755859375, 2.74945068359375, 2.9991455078125, 3.24884033203125, 3.49853515625, 3.74822998046875, 3.9979248046875, 4.24761962890625, 4.497314453125, 4.74700927734375, 4.9967041015625, 5.24639892578125, 5.49609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 8.0, 12.0, 17.0, 22.0, 36.0, 44.0, 81.0, 95.0, 120.0, 123.0, 120.0, 107.0, 74.0, 45.0, 21.0, 18.0, 12.0, 14.0, 11.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.615234375, -3.5300140380859375, -3.444793701171875, -3.3595733642578125, -3.27435302734375, -3.1891326904296875, -3.103912353515625, -3.0186920166015625, -2.9334716796875, -2.8482513427734375, -2.763031005859375, -2.6778106689453125, -2.59259033203125, -2.5073699951171875, -2.422149658203125, -2.3369293212890625, -2.251708984375, -2.1664886474609375, -2.081268310546875, -1.9960479736328125, -1.91082763671875, -1.8256072998046875, -1.740386962890625, -1.6551666259765625, -1.5699462890625, -1.4847259521484375, -1.399505615234375, -1.3142852783203125, -1.22906494140625, -1.1438446044921875, -1.058624267578125, -0.9734039306640625, -0.88818359375, -0.8029632568359375, -0.717742919921875, -0.6325225830078125, -0.54730224609375, -0.4620819091796875, -0.376861572265625, -0.2916412353515625, -0.2064208984375, -0.1212005615234375, -0.035980224609375, 0.0492401123046875, 0.13446044921875, 0.2196807861328125, 0.304901123046875, 0.3901214599609375, 0.475341796875, 0.5605621337890625, 0.645782470703125, 0.7310028076171875, 0.81622314453125, 0.9014434814453125, 0.986663818359375, 1.0718841552734375, 1.1571044921875, 1.2423248291015625, 1.327545166015625, 1.4127655029296875, 1.49798583984375, 1.5832061767578125, 1.668426513671875, 1.7536468505859375, 1.8388671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 10.0, 21.0, 87.0, 577.0, 298.0, 16.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.97378540039062, -157.81253051757812, -154.65127563476562, -151.49002075195312, -148.3287811279297, -145.1675262451172, -142.0062713623047, -138.8450164794922, -135.6837615966797, -132.5225067138672, -129.3612518310547, -126.20000457763672, -123.03874969482422, -119.87750244140625, -116.71624755859375, -113.55499267578125, -110.39374542236328, -107.23249053955078, -104.07124328613281, -100.90998840332031, -97.74873352050781, -94.58747863769531, -91.42623138427734, -88.26497650146484, -85.10372924804688, -81.94247436523438, -78.7812271118164, -75.6199722290039, -72.4587173461914, -69.29747009277344, -66.13621520996094, -62.97496032714844, -59.81371307373047, -56.652462005615234, -53.491207122802734, -50.3299560546875, -47.168701171875, -44.007450103759766, -40.84619903564453, -37.68494415283203, -34.5236930847168, -31.36244010925293, -28.201187133789062, -25.039936065673828, -21.87868309020996, -18.717430114746094, -15.55617904663086, -12.394926071166992, -9.233673095703125, -6.072420597076416, -2.911168098449707, 0.25008392333984375, 3.411336898803711, 6.572589874267578, 9.733840942382812, 12.89509391784668, 16.056346893310547, 19.217599868774414, 22.37885284423828, 25.540103912353516, 28.701356887817383, 31.86260986328125, 35.023860931396484, 38.18511199951172, 41.34636688232422]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 10.0, 16.0, 27.0, 28.0, 32.0, 35.0, 49.0, 57.0, 66.0, 71.0, 67.0, 73.0, 70.0, 75.0, 69.0, 50.0, 46.0, 29.0, 32.0, 21.0, 17.0, 5.0, 8.0, 11.0, 5.0, 6.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.6370849609375, -34.68000030517578, -33.7229118347168, -32.76582717895508, -31.808738708496094, -30.851654052734375, -29.894567489624023, -28.937480926513672, -27.98039436340332, -27.02330780029297, -26.066221237182617, -25.109134674072266, -24.152050018310547, -23.194961547851562, -22.237876892089844, -21.280790328979492, -20.32370376586914, -19.36661720275879, -18.409530639648438, -17.452444076538086, -16.495357513427734, -15.5382719039917, -14.581186294555664, -13.624099731445312, -12.667013168334961, -11.70992660522461, -10.752840042114258, -9.795754432678223, -8.838667869567871, -7.8815813064575195, -6.924495220184326, -5.967409133911133, -5.010322570800781, -4.05323600769043, -3.0961499214172363, -2.139063596725464, -1.1819772720336914, -0.22489070892333984, 0.7321953773498535, 1.6892814636230469, 2.6463680267333984, 3.603454351425171, 4.560540676116943, 5.517626762390137, 6.474713325500488, 7.43179988861084, 8.388885498046875, 9.345972061157227, 10.303058624267578, 11.26014518737793, 12.217231750488281, 13.174317359924316, 14.131403923034668, 15.08849048614502, 16.045576095581055, 17.002662658691406, 17.959749221801758, 18.91683578491211, 19.87392234802246, 20.831008911132812, 21.78809356689453, 22.745182037353516, 23.702266693115234, 24.659353256225586, 25.616439819335938]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 1.0, 5.0, 7.0, 13.0, 25.0, 63.0, 115.0, 384.0, 1955.0, 24075.0, 4062819.0, 99153.0, 4136.0, 810.0, 327.0, 141.0, 93.0, 49.0, 37.0, 24.0, 18.0, 9.0, 10.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -7.7989501953125, -7.183837890625, -6.5687255859375, -5.95361328125, -5.3385009765625, -4.723388671875, -4.1082763671875, -3.4931640625, -2.8780517578125, -2.262939453125, -1.6478271484375, -1.03271484375, -0.4176025390625, 0.197509765625, 0.8126220703125, 1.427734375, 2.0428466796875, 2.657958984375, 3.2730712890625, 3.88818359375, 4.5032958984375, 5.118408203125, 5.7335205078125, 6.3486328125, 6.9637451171875, 7.578857421875, 8.1939697265625, 8.80908203125, 9.4241943359375, 10.039306640625, 10.6544189453125, 11.26953125, 11.8846435546875, 12.499755859375, 13.1148681640625, 13.72998046875, 14.3450927734375, 14.960205078125, 15.5753173828125, 16.1904296875, 16.8055419921875, 17.420654296875, 18.0357666015625, 18.65087890625, 19.2659912109375, 19.881103515625, 20.4962158203125, 21.111328125, 21.7264404296875, 22.341552734375, 22.9566650390625, 23.57177734375, 24.1868896484375, 24.802001953125, 25.4171142578125, 26.0322265625, 26.6473388671875, 27.262451171875, 27.8775634765625, 28.49267578125, 29.1077880859375, 29.722900390625, 30.3380126953125, 30.953125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 10.0, 18.0, 22.0, 34.0, 54.0, 75.0, 84.0, 111.0, 116.0, 123.0, 102.0, 69.0, 70.0, 43.0, 26.0, 15.0, 10.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8320388793945312, -0.7876129150390625, -0.7431869506835938, -0.698760986328125, -0.6543350219726562, -0.6099090576171875, -0.5654830932617188, -0.52105712890625, -0.47663116455078125, -0.4322052001953125, -0.38777923583984375, -0.343353271484375, -0.29892730712890625, -0.2545013427734375, -0.21007537841796875, -0.1656494140625, -0.12122344970703125, -0.0767974853515625, -0.03237152099609375, 0.012054443359375, 0.05648040771484375, 0.1009063720703125, 0.14533233642578125, 0.18975830078125, 0.23418426513671875, 0.2786102294921875, 0.32303619384765625, 0.367462158203125, 0.41188812255859375, 0.4563140869140625, 0.5007400512695312, 0.545166015625, 0.5895919799804688, 0.6340179443359375, 0.6784439086914062, 0.722869873046875, 0.7672958374023438, 0.8117218017578125, 0.8561477661132812, 0.90057373046875, 0.9449996948242188, 0.9894256591796875, 1.0338516235351562, 1.078277587890625, 1.1227035522460938, 1.1671295166015625, 1.2115554809570312, 1.2559814453125, 1.3004074096679688, 1.3448333740234375, 1.3892593383789062, 1.433685302734375, 1.4781112670898438, 1.5225372314453125, 1.5669631958007812, 1.61138916015625, 1.6558151245117188, 1.7002410888671875, 1.7446670532226562, 1.789093017578125, 1.8335189819335938, 1.8779449462890625, 1.9223709106445312, 1.966796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 10.0, 21.0, 62.0, 289.0, 7023.0, 4185639.0, 942.0, 192.0, 71.0, 27.0, 11.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.890625, -17.995849609375, -15.10107421875, -12.206298828125, -9.3115234375, -6.416748046875, -3.52197265625, -0.627197265625, 2.267578125, 5.162353515625, 8.05712890625, 10.951904296875, 13.8466796875, 16.741455078125, 19.63623046875, 22.531005859375, 25.42578125, 28.320556640625, 31.21533203125, 34.110107421875, 37.0048828125, 39.899658203125, 42.79443359375, 45.689208984375, 48.583984375, 51.478759765625, 54.37353515625, 57.268310546875, 60.1630859375, 63.057861328125, 65.95263671875, 68.847412109375, 71.7421875, 74.636962890625, 77.53173828125, 80.426513671875, 83.3212890625, 86.216064453125, 89.11083984375, 92.005615234375, 94.900390625, 97.795166015625, 100.68994140625, 103.584716796875, 106.4794921875, 109.374267578125, 112.26904296875, 115.163818359375, 118.05859375, 120.953369140625, 123.84814453125, 126.742919921875, 129.6376953125, 132.532470703125, 135.42724609375, 138.322021484375, 141.216796875, 144.111572265625, 147.00634765625, 149.901123046875, 152.7958984375, 155.690673828125, 158.58544921875, 161.480224609375, 164.375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 8.0, 17.0, 65.0, 454.0, 3355.0, 157.0, 13.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.6173248291015625, -1.360626220703125, -1.1039276123046875, -0.84722900390625, -0.5905303955078125, -0.333831787109375, -0.0771331787109375, 0.1795654296875, 0.4362640380859375, 0.692962646484375, 0.9496612548828125, 1.20635986328125, 1.4630584716796875, 1.719757080078125, 1.9764556884765625, 2.233154296875, 2.4898529052734375, 2.746551513671875, 3.0032501220703125, 3.25994873046875, 3.5166473388671875, 3.773345947265625, 4.0300445556640625, 4.2867431640625, 4.5434417724609375, 4.800140380859375, 5.0568389892578125, 5.31353759765625, 5.5702362060546875, 5.826934814453125, 6.0836334228515625, 6.34033203125, 6.5970306396484375, 6.853729248046875, 7.1104278564453125, 7.36712646484375, 7.6238250732421875, 7.880523681640625, 8.137222290039062, 8.3939208984375, 8.650619506835938, 8.907318115234375, 9.164016723632812, 9.42071533203125, 9.677413940429688, 9.934112548828125, 10.190811157226562, 10.447509765625, 10.704208374023438, 10.960906982421875, 11.217605590820312, 11.47430419921875, 11.731002807617188, 11.987701416015625, 12.244400024414062, 12.5010986328125, 12.757797241210938, 13.014495849609375, 13.271194458007812, 13.52789306640625, 13.784591674804688, 14.041290283203125, 14.297988891601562, 14.5546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 10.0, 110.0, 735.0, 124.0, 21.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.00344848632812, -70.75090789794922, -68.49836730957031, -66.2458267211914, -63.993282318115234, -61.74074172973633, -59.488197326660156, -57.23565673828125, -54.983116149902344, -52.73057556152344, -50.47803497314453, -48.22549057006836, -45.97294998168945, -43.72040939331055, -41.467864990234375, -39.21532440185547, -36.96278381347656, -34.710243225097656, -32.45770263671875, -30.205158233642578, -27.952617645263672, -25.700077056884766, -23.447534561157227, -21.194992065429688, -18.94245147705078, -16.689910888671875, -14.437368392944336, -12.184826850891113, -9.93228530883789, -7.679743766784668, -5.427202224731445, -3.1746606826782227, -0.9221115112304688, 1.330430030822754, 3.5829715728759766, 5.835513114929199, 8.088054656982422, 10.340596199035645, 12.593137741088867, 14.84567928314209, 17.098220825195312, 19.35076141357422, 21.603303909301758, 23.855846405029297, 26.108386993408203, 28.36092758178711, 30.61347007751465, 32.86601257324219, 35.118553161621094, 37.37109375, 39.623634338378906, 41.87617874145508, 44.128719329833984, 46.38125991821289, 48.63380432128906, 50.88634490966797, 53.138885498046875, 55.39142608642578, 57.64396667480469, 59.89651107788086, 62.149051666259766, 64.40159606933594, 66.65413665771484, 68.90667724609375, 71.15921783447266]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 4.0, 13.0, 15.0, 47.0, 51.0, 78.0, 89.0, 95.0, 112.0, 135.0, 112.0, 69.0, 56.0, 49.0, 27.0, 24.0, 6.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.984140396118164, -26.096216201782227, -25.208293914794922, -24.320369720458984, -23.432445526123047, -22.544523239135742, -21.656599044799805, -20.7686767578125, -19.880752563476562, -18.992828369140625, -18.10490608215332, -17.216981887817383, -16.329057693481445, -15.44113540649414, -14.553211212158203, -13.665287971496582, -12.777363777160645, -11.889440536499023, -11.001516342163086, -10.113593101501465, -9.225669860839844, -8.337745666503906, -7.449822425842285, -6.561899185180664, -5.673975467681885, -4.7860517501831055, -3.8981285095214844, -3.010204792022705, -2.122281312942505, -1.2343578338623047, -0.3464341163635254, 0.5414891242980957, 1.429412841796875, 2.317336320877075, 3.2052597999572754, 4.093183517456055, 4.981106758117676, 5.869030475616455, 6.756954193115234, 7.6448774337768555, 8.532800674438477, 9.420723915100098, 10.308648109436035, 11.196571350097656, 12.084494590759277, 12.972417831420898, 13.860342025756836, 14.748265266418457, 15.636189460754395, 16.524112701416016, 17.412036895751953, 18.29996109008789, 19.187883377075195, 20.075807571411133, 20.963729858398438, 21.851654052734375, 22.739578247070312, 23.62750244140625, 24.515424728393555, 25.403348922729492, 26.29127311706543, 27.179195404052734, 28.067119598388672, 28.95504379272461, 29.842966079711914]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 17.0, 14.0, 16.0, 27.0, 26.0, 28.0, 68.0, 89.0, 112.0, 197.0, 388.0, 627.0, 1526.0, 4525.0, 22407.0, 174594.0, 715180.0, 107114.0, 15467.0, 3455.0, 1252.0, 522.0, 308.0, 165.0, 131.0, 69.0, 56.0, 44.0, 38.0, 20.0, 14.0, 9.0, 14.0, 4.0, 10.0, 11.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.60906982421875, -8.3587646484375, -8.10845947265625, -7.858154296875, -7.60784912109375, -7.3575439453125, -7.10723876953125, -6.85693359375, -6.60662841796875, -6.3563232421875, -6.10601806640625, -5.855712890625, -5.60540771484375, -5.3551025390625, -5.10479736328125, -4.8544921875, -4.60418701171875, -4.3538818359375, -4.10357666015625, -3.853271484375, -3.60296630859375, -3.3526611328125, -3.10235595703125, -2.85205078125, -2.60174560546875, -2.3514404296875, -2.10113525390625, -1.850830078125, -1.60052490234375, -1.3502197265625, -1.09991455078125, -0.849609375, -0.59930419921875, -0.3489990234375, -0.09869384765625, 0.151611328125, 0.40191650390625, 0.6522216796875, 0.90252685546875, 1.15283203125, 1.40313720703125, 1.6534423828125, 1.90374755859375, 2.154052734375, 2.40435791015625, 2.6546630859375, 2.90496826171875, 3.1552734375, 3.40557861328125, 3.6558837890625, 3.90618896484375, 4.156494140625, 4.40679931640625, 4.6571044921875, 4.90740966796875, 5.15771484375, 5.40802001953125, 5.6583251953125, 5.90863037109375, 6.158935546875, 6.40924072265625, 6.6595458984375, 6.90985107421875, 7.16015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 16.0, 20.0, 35.0, 54.0, 70.0, 75.0, 68.0, 109.0, 124.0, 91.0, 74.0, 71.0, 59.0, 49.0, 24.0, 19.0, 15.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.210693359375, -1.14794921875, -1.085205078125, -1.0224609375, -0.959716796875, -0.89697265625, -0.834228515625, -0.771484375, -0.708740234375, -0.64599609375, -0.583251953125, -0.5205078125, -0.457763671875, -0.39501953125, -0.332275390625, -0.26953125, -0.206787109375, -0.14404296875, -0.081298828125, -0.0185546875, 0.044189453125, 0.10693359375, 0.169677734375, 0.232421875, 0.295166015625, 0.35791015625, 0.420654296875, 0.4833984375, 0.546142578125, 0.60888671875, 0.671630859375, 0.734375, 0.797119140625, 0.85986328125, 0.922607421875, 0.9853515625, 1.048095703125, 1.11083984375, 1.173583984375, 1.236328125, 1.299072265625, 1.36181640625, 1.424560546875, 1.4873046875, 1.550048828125, 1.61279296875, 1.675537109375, 1.73828125, 1.801025390625, 1.86376953125, 1.926513671875, 1.9892578125, 2.052001953125, 2.11474609375, 2.177490234375, 2.240234375, 2.302978515625, 2.36572265625, 2.428466796875, 2.4912109375, 2.553955078125, 2.61669921875, 2.679443359375, 2.7421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 6.0, 11.0, 10.0, 11.0, 18.0, 19.0, 32.0, 60.0, 108.0, 157.0, 443.0, 1630.0, 8564.0, 92908.0, 827893.0, 104770.0, 9328.0, 1664.0, 494.0, 179.0, 71.0, 44.0, 29.0, 30.0, 19.0, 16.0, 7.0, 11.0, 5.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.7578125, -9.48309326171875, -9.2083740234375, -8.93365478515625, -8.658935546875, -8.38421630859375, -8.1094970703125, -7.83477783203125, -7.56005859375, -7.28533935546875, -7.0106201171875, -6.73590087890625, -6.461181640625, -6.18646240234375, -5.9117431640625, -5.63702392578125, -5.3623046875, -5.08758544921875, -4.8128662109375, -4.53814697265625, -4.263427734375, -3.98870849609375, -3.7139892578125, -3.43927001953125, -3.16455078125, -2.88983154296875, -2.6151123046875, -2.34039306640625, -2.065673828125, -1.79095458984375, -1.5162353515625, -1.24151611328125, -0.966796875, -0.69207763671875, -0.4173583984375, -0.14263916015625, 0.132080078125, 0.40679931640625, 0.6815185546875, 0.95623779296875, 1.23095703125, 1.50567626953125, 1.7803955078125, 2.05511474609375, 2.329833984375, 2.60455322265625, 2.8792724609375, 3.15399169921875, 3.4287109375, 3.70343017578125, 3.9781494140625, 4.25286865234375, 4.527587890625, 4.80230712890625, 5.0770263671875, 5.35174560546875, 5.62646484375, 5.90118408203125, 6.1759033203125, 6.45062255859375, 6.725341796875, 7.00006103515625, 7.2747802734375, 7.54949951171875, 7.82421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 6.0, 5.0, 1.0, 13.0, 11.0, 16.0, 10.0, 18.0, 20.0, 45.0, 48.0, 43.0, 45.0, 47.0, 48.0, 63.0, 67.0, 55.0, 61.0, 59.0, 50.0, 46.0, 30.0, 37.0, 29.0, 20.0, 25.0, 16.0, 15.0, 18.0, 5.0, 3.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-5.99609375, -5.829833984375, -5.66357421875, -5.497314453125, -5.3310546875, -5.164794921875, -4.99853515625, -4.832275390625, -4.666015625, -4.499755859375, -4.33349609375, -4.167236328125, -4.0009765625, -3.834716796875, -3.66845703125, -3.502197265625, -3.3359375, -3.169677734375, -3.00341796875, -2.837158203125, -2.6708984375, -2.504638671875, -2.33837890625, -2.172119140625, -2.005859375, -1.839599609375, -1.67333984375, -1.507080078125, -1.3408203125, -1.174560546875, -1.00830078125, -0.842041015625, -0.67578125, -0.509521484375, -0.34326171875, -0.177001953125, -0.0107421875, 0.155517578125, 0.32177734375, 0.488037109375, 0.654296875, 0.820556640625, 0.98681640625, 1.153076171875, 1.3193359375, 1.485595703125, 1.65185546875, 1.818115234375, 1.984375, 2.150634765625, 2.31689453125, 2.483154296875, 2.6494140625, 2.815673828125, 2.98193359375, 3.148193359375, 3.314453125, 3.480712890625, 3.64697265625, 3.813232421875, 3.9794921875, 4.145751953125, 4.31201171875, 4.478271484375, 4.64453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 4.0, 8.0, 11.0, 12.0, 24.0, 37.0, 55.0, 96.0, 126.0, 249.0, 476.0, 897.0, 1928.0, 4566.0, 12726.0, 45524.0, 206703.0, 508129.0, 201328.0, 44663.0, 12646.0, 4541.0, 1826.0, 875.0, 443.0, 235.0, 157.0, 93.0, 52.0, 34.0, 21.0, 16.0, 9.0, 10.0, 8.0, 4.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8857421875, -1.8310699462890625, -1.776397705078125, -1.7217254638671875, -1.66705322265625, -1.6123809814453125, -1.557708740234375, -1.5030364990234375, -1.4483642578125, -1.3936920166015625, -1.339019775390625, -1.2843475341796875, -1.22967529296875, -1.1750030517578125, -1.120330810546875, -1.0656585693359375, -1.010986328125, -0.9563140869140625, -0.901641845703125, -0.8469696044921875, -0.79229736328125, -0.7376251220703125, -0.682952880859375, -0.6282806396484375, -0.5736083984375, -0.5189361572265625, -0.464263916015625, -0.4095916748046875, -0.35491943359375, -0.3002471923828125, -0.245574951171875, -0.1909027099609375, -0.13623046875, -0.0815582275390625, -0.026885986328125, 0.0277862548828125, 0.08245849609375, 0.1371307373046875, 0.191802978515625, 0.2464752197265625, 0.3011474609375, 0.3558197021484375, 0.410491943359375, 0.4651641845703125, 0.51983642578125, 0.5745086669921875, 0.629180908203125, 0.6838531494140625, 0.738525390625, 0.7931976318359375, 0.847869873046875, 0.9025421142578125, 0.95721435546875, 1.0118865966796875, 1.066558837890625, 1.1212310791015625, 1.1759033203125, 1.2305755615234375, 1.285247802734375, 1.3399200439453125, 1.39459228515625, 1.4492645263671875, 1.503936767578125, 1.5586090087890625, 1.61328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 8.0, 8.0, 15.0, 17.0, 28.0, 39.0, 50.0, 79.0, 119.0, 133.0, 120.0, 109.0, 68.0, 59.0, 38.0, 31.0, 21.0, 20.0, 6.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034117698669433594, -0.0003280453383922577, -0.00031491369009017944, -0.0003017820417881012, -0.00028865039348602295, -0.0002755187451839447, -0.00026238709688186646, -0.0002492554485797882, -0.00023612380027770996, -0.00022299215197563171, -0.00020986050367355347, -0.00019672885537147522, -0.00018359720706939697, -0.00017046555876731873, -0.00015733391046524048, -0.00014420226216316223, -0.00013107061386108398, -0.00011793896555900574, -0.00010480731725692749, -9.167566895484924e-05, -7.8544020652771e-05, -6.541237235069275e-05, -5.22807240486145e-05, -3.9149075746536255e-05, -2.6017427444458008e-05, -1.288577914237976e-05, 2.4586915969848633e-07, 1.3377517461776733e-05, 2.650916576385498e-05, 3.964081406593323e-05, 5.2772462368011475e-05, 6.590411067008972e-05, 7.903575897216797e-05, 9.216740727424622e-05, 0.00010529905557632446, 0.00011843070387840271, 0.00013156235218048096, 0.0001446940004825592, 0.00015782564878463745, 0.0001709572970867157, 0.00018408894538879395, 0.0001972205936908722, 0.00021035224199295044, 0.0002234838902950287, 0.00023661553859710693, 0.0002497471868991852, 0.00026287883520126343, 0.0002760104835033417, 0.0002891421318054199, 0.00030227378010749817, 0.0003154054284095764, 0.00032853707671165466, 0.0003416687250137329, 0.00035480037331581116, 0.0003679320216178894, 0.00038106366991996765, 0.0003941953182220459, 0.00040732696652412415, 0.0004204586148262024, 0.00043359026312828064, 0.0004467219114303589, 0.00045985355973243713, 0.0004729852080345154, 0.00048611685633659363, 0.0004992485046386719]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 8.0, 11.0, 17.0, 17.0, 26.0, 25.0, 51.0, 82.0, 128.0, 222.0, 368.0, 701.0, 1651.0, 4069.0, 11618.0, 40110.0, 163894.0, 482456.0, 253772.0, 62280.0, 17191.0, 5625.0, 2145.0, 973.0, 445.0, 264.0, 137.0, 68.0, 48.0, 42.0, 17.0, 18.0, 22.0, 10.0, 5.0, 7.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4794921875, -1.4239959716796875, -1.368499755859375, -1.3130035400390625, -1.25750732421875, -1.2020111083984375, -1.146514892578125, -1.0910186767578125, -1.0355224609375, -0.9800262451171875, -0.924530029296875, -0.8690338134765625, -0.81353759765625, -0.7580413818359375, -0.702545166015625, -0.6470489501953125, -0.591552734375, -0.5360565185546875, -0.480560302734375, -0.4250640869140625, -0.36956787109375, -0.3140716552734375, -0.258575439453125, -0.2030792236328125, -0.1475830078125, -0.0920867919921875, -0.036590576171875, 0.0189056396484375, 0.07440185546875, 0.1298980712890625, 0.185394287109375, 0.2408905029296875, 0.29638671875, 0.3518829345703125, 0.407379150390625, 0.4628753662109375, 0.51837158203125, 0.5738677978515625, 0.629364013671875, 0.6848602294921875, 0.7403564453125, 0.7958526611328125, 0.851348876953125, 0.9068450927734375, 0.96234130859375, 1.0178375244140625, 1.073333740234375, 1.1288299560546875, 1.184326171875, 1.2398223876953125, 1.295318603515625, 1.3508148193359375, 1.40631103515625, 1.4618072509765625, 1.517303466796875, 1.5727996826171875, 1.6282958984375, 1.6837921142578125, 1.739288330078125, 1.7947845458984375, 1.85028076171875, 1.9057769775390625, 1.961273193359375, 2.0167694091796875, 2.072265625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 12.0, 7.0, 11.0, 8.0, 9.0, 20.0, 24.0, 31.0, 28.0, 50.0, 43.0, 42.0, 50.0, 71.0, 58.0, 84.0, 67.0, 51.0, 47.0, 47.0, 36.0, 38.0, 27.0, 37.0, 17.0, 20.0, 11.0, 13.0, 8.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.25146484375, -1.208984375, -1.16650390625, -1.1240234375, -1.08154296875, -1.0390625, -0.99658203125, -0.9541015625, -0.91162109375, -0.869140625, -0.82666015625, -0.7841796875, -0.74169921875, -0.69921875, -0.65673828125, -0.6142578125, -0.57177734375, -0.529296875, -0.48681640625, -0.4443359375, -0.40185546875, -0.359375, -0.31689453125, -0.2744140625, -0.23193359375, -0.189453125, -0.14697265625, -0.1044921875, -0.06201171875, -0.01953125, 0.02294921875, 0.0654296875, 0.10791015625, 0.150390625, 0.19287109375, 0.2353515625, 0.27783203125, 0.3203125, 0.36279296875, 0.4052734375, 0.44775390625, 0.490234375, 0.53271484375, 0.5751953125, 0.61767578125, 0.66015625, 0.70263671875, 0.7451171875, 0.78759765625, 0.830078125, 0.87255859375, 0.9150390625, 0.95751953125, 1.0, 1.04248046875, 1.0849609375, 1.12744140625, 1.169921875, 1.21240234375, 1.2548828125, 1.29736328125, 1.33984375, 1.38232421875, 1.4248046875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 12.0, 23.0, 27.0, 67.0, 160.0, 290.0, 233.0, 118.0, 44.0, 21.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.26384353637695, -38.91786575317383, -37.5718879699707, -36.225914001464844, -34.87993621826172, -33.533958435058594, -32.18798065185547, -30.842002868652344, -29.49602699279785, -28.150049209594727, -26.804073333740234, -25.45809555053711, -24.112117767333984, -22.766141891479492, -21.420164108276367, -20.074188232421875, -18.72821044921875, -17.382232666015625, -16.036256790161133, -14.690279006958008, -13.3443021774292, -11.99832534790039, -10.652347564697266, -9.306370735168457, -7.960393905639648, -6.61441707611084, -5.268439769744873, -3.9224624633789062, -2.5764856338500977, -1.230508804321289, 0.11546897888183594, 1.4614458084106445, 2.8074188232421875, 4.153395652770996, 5.499372959136963, 6.84535026550293, 8.191327095031738, 9.537303924560547, 10.883281707763672, 12.22925853729248, 13.575235366821289, 14.921212196350098, 16.267189025878906, 17.61316680908203, 18.959144592285156, 20.30512046813965, 21.651098251342773, 22.997074127197266, 24.34305191040039, 25.689029693603516, 27.035005569458008, 28.380983352661133, 29.726959228515625, 31.07293701171875, 32.418914794921875, 33.764892578125, 35.110870361328125, 36.45684814453125, 37.802825927734375, 39.1488037109375, 40.49477767944336, 41.840755462646484, 43.18673324584961, 44.532711029052734, 45.878684997558594]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 7.0, 6.0, 17.0, 11.0, 10.0, 13.0, 22.0, 19.0, 29.0, 32.0, 31.0, 34.0, 40.0, 48.0, 59.0, 47.0, 38.0, 46.0, 41.0, 42.0, 58.0, 43.0, 40.0, 30.0, 29.0, 28.0, 24.0, 28.0, 19.0, 23.0, 24.0, 15.0, 9.0, 6.0, 6.0, 7.0, 3.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.08823013305664, -28.28565216064453, -27.483074188232422, -26.680496215820312, -25.877920150756836, -25.075342178344727, -24.272764205932617, -23.470186233520508, -22.6676082611084, -21.86503028869629, -21.06245231628418, -20.259876251220703, -19.457298278808594, -18.654720306396484, -17.852142333984375, -17.049564361572266, -16.246986389160156, -15.444408416748047, -14.641831398010254, -13.839253425598145, -13.036675453186035, -12.234098434448242, -11.431520462036133, -10.628942489624023, -9.826366424560547, -9.023788452148438, -8.221211433410645, -7.418633460998535, -6.616055488586426, -5.813477993011475, -5.010900497436523, -4.208322525024414, -3.4057445526123047, -2.6031668186187744, -1.8005892038345337, -0.998011589050293, -0.1954338550567627, 0.6071438789367676, 1.4097213745117188, 2.212299346923828, 3.0148768424987793, 3.8174545764923096, 4.62003231048584, 5.422609806060791, 6.225187301635742, 7.027765274047852, 7.830342769622803, 8.63292121887207, 9.435498237609863, 10.238076210021973, 11.040653228759766, 11.843231201171875, 12.645809173583984, 13.448387145996094, 14.250964164733887, 15.053542137145996, 15.856119155883789, 16.6586971282959, 17.461275100708008, 18.263851165771484, 19.066429138183594, 19.869007110595703, 20.671585083007812, 21.474163055419922, 22.27674102783203]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 8.0, 8.0, 27.0, 56.0, 86.0, 170.0, 418.0, 1104.0, 3984.0, 28146.0, 3830764.0, 313114.0, 11711.0, 2659.0, 898.0, 475.0, 252.0, 123.0, 78.0, 49.0, 46.0, 23.0, 27.0, 13.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.2523193359375, -6.793701171875, -6.3350830078125, -5.87646484375, -5.4178466796875, -4.959228515625, -4.5006103515625, -4.0419921875, -3.5833740234375, -3.124755859375, -2.6661376953125, -2.20751953125, -1.7489013671875, -1.290283203125, -0.8316650390625, -0.373046875, 0.0855712890625, 0.544189453125, 1.0028076171875, 1.46142578125, 1.9200439453125, 2.378662109375, 2.8372802734375, 3.2958984375, 3.7545166015625, 4.213134765625, 4.6717529296875, 5.13037109375, 5.5889892578125, 6.047607421875, 6.5062255859375, 6.96484375, 7.4234619140625, 7.882080078125, 8.3406982421875, 8.79931640625, 9.2579345703125, 9.716552734375, 10.1751708984375, 10.6337890625, 11.0924072265625, 11.551025390625, 12.0096435546875, 12.46826171875, 12.9268798828125, 13.385498046875, 13.8441162109375, 14.302734375, 14.7613525390625, 15.219970703125, 15.6785888671875, 16.13720703125, 16.5958251953125, 17.054443359375, 17.5130615234375, 17.9716796875, 18.4302978515625, 18.888916015625, 19.3475341796875, 19.80615234375, 20.2647705078125, 20.723388671875, 21.1820068359375, 21.640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 16.0, 19.0, 43.0, 54.0, 82.0, 100.0, 112.0, 113.0, 123.0, 97.0, 79.0, 58.0, 39.0, 24.0, 14.0, 5.0, 5.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.2762451171875, -1.198974609375, -1.1217041015625, -1.04443359375, -0.9671630859375, -0.889892578125, -0.8126220703125, -0.7353515625, -0.6580810546875, -0.580810546875, -0.5035400390625, -0.42626953125, -0.3489990234375, -0.271728515625, -0.1944580078125, -0.1171875, -0.0399169921875, 0.037353515625, 0.1146240234375, 0.19189453125, 0.2691650390625, 0.346435546875, 0.4237060546875, 0.5009765625, 0.5782470703125, 0.655517578125, 0.7327880859375, 0.81005859375, 0.8873291015625, 0.964599609375, 1.0418701171875, 1.119140625, 1.1964111328125, 1.273681640625, 1.3509521484375, 1.42822265625, 1.5054931640625, 1.582763671875, 1.6600341796875, 1.7373046875, 1.8145751953125, 1.891845703125, 1.9691162109375, 2.04638671875, 2.1236572265625, 2.200927734375, 2.2781982421875, 2.35546875, 2.4327392578125, 2.510009765625, 2.5872802734375, 2.66455078125, 2.7418212890625, 2.819091796875, 2.8963623046875, 2.9736328125, 3.0509033203125, 3.128173828125, 3.2054443359375, 3.28271484375, 3.3599853515625, 3.437255859375, 3.5145263671875, 3.591796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 17.0, 40.0, 65.0, 143.0, 273.0, 2660.0, 4189810.0, 915.0, 219.0, 86.0, 37.0, 14.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.625, -92.39111328125, -90.1572265625, -87.92333984375, -85.689453125, -83.45556640625, -81.2216796875, -78.98779296875, -76.75390625, -74.52001953125, -72.2861328125, -70.05224609375, -67.818359375, -65.58447265625, -63.3505859375, -61.11669921875, -58.8828125, -56.64892578125, -54.4150390625, -52.18115234375, -49.947265625, -47.71337890625, -45.4794921875, -43.24560546875, -41.01171875, -38.77783203125, -36.5439453125, -34.31005859375, -32.076171875, -29.84228515625, -27.6083984375, -25.37451171875, -23.140625, -20.90673828125, -18.6728515625, -16.43896484375, -14.205078125, -11.97119140625, -9.7373046875, -7.50341796875, -5.26953125, -3.03564453125, -0.8017578125, 1.43212890625, 3.666015625, 5.89990234375, 8.1337890625, 10.36767578125, 12.6015625, 14.83544921875, 17.0693359375, 19.30322265625, 21.537109375, 23.77099609375, 26.0048828125, 28.23876953125, 30.47265625, 32.70654296875, 34.9404296875, 37.17431640625, 39.408203125, 41.64208984375, 43.8759765625, 46.10986328125, 48.34375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 10.0, 34.0, 430.0, 3467.0, 126.0, 15.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.84375, -14.4844970703125, -14.125244140625, -13.7659912109375, -13.40673828125, -13.0474853515625, -12.688232421875, -12.3289794921875, -11.9697265625, -11.6104736328125, -11.251220703125, -10.8919677734375, -10.53271484375, -10.1734619140625, -9.814208984375, -9.4549560546875, -9.095703125, -8.7364501953125, -8.377197265625, -8.0179443359375, -7.65869140625, -7.2994384765625, -6.940185546875, -6.5809326171875, -6.2216796875, -5.8624267578125, -5.503173828125, -5.1439208984375, -4.78466796875, -4.4254150390625, -4.066162109375, -3.7069091796875, -3.34765625, -2.9884033203125, -2.629150390625, -2.2698974609375, -1.91064453125, -1.5513916015625, -1.192138671875, -0.8328857421875, -0.4736328125, -0.1143798828125, 0.244873046875, 0.6041259765625, 0.96337890625, 1.3226318359375, 1.681884765625, 2.0411376953125, 2.400390625, 2.7596435546875, 3.118896484375, 3.4781494140625, 3.83740234375, 4.1966552734375, 4.555908203125, 4.9151611328125, 5.2744140625, 5.6336669921875, 5.992919921875, 6.3521728515625, 6.71142578125, 7.0706787109375, 7.429931640625, 7.7891845703125, 8.1484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 516.0, 471.0, 16.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.27314758300781, -65.16852569580078, -62.063899993896484, -58.95927810668945, -55.854652404785156, -52.750030517578125, -49.645408630371094, -46.54078674316406, -43.436161041259766, -40.331539154052734, -37.22691345214844, -34.122291564941406, -31.017667770385742, -27.913043975830078, -24.808422088623047, -21.703798294067383, -18.59917449951172, -15.494550704956055, -12.389927864074707, -9.28530502319336, -6.180681228637695, -3.0760574340820312, 0.028564453125, 3.133188247680664, 6.237812042236328, 9.342435836791992, 12.44705867767334, 15.551681518554688, 18.65630531311035, 21.760929107666016, 24.865550994873047, 27.97017478942871, 31.074798583984375, 34.179420471191406, 37.2840461730957, 40.388668060302734, 43.49329376220703, 46.59791564941406, 49.702537536621094, 52.807159423828125, 55.91178512573242, 59.01640701293945, 62.12103271484375, 65.22565460205078, 68.33027648925781, 71.43490600585938, 74.53952026367188, 77.64414978027344, 80.74877166748047, 83.8533935546875, 86.95801544189453, 90.06263732910156, 93.16726684570312, 96.27188873291016, 99.37651062011719, 102.48113250732422, 105.58575439453125, 108.69037628173828, 111.79499816894531, 114.89962768554688, 118.0042495727539, 121.10887145996094, 124.21349334716797, 127.318115234375, 130.42274475097656]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 10.0, 27.0, 31.0, 44.0, 58.0, 94.0, 107.0, 104.0, 97.0, 101.0, 106.0, 61.0, 62.0, 38.0, 19.0, 14.0, 8.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.749408721923828, -11.235383033752441, -10.721357345581055, -10.207331657409668, -9.693305969238281, -9.179280281066895, -8.665254592895508, -8.151227951049805, -7.637202739715576, -7.1231770515441895, -6.609151363372803, -6.095125198364258, -5.581099510192871, -5.067073822021484, -4.553048133850098, -4.039022445678711, -3.524996757507324, -3.0109710693359375, -2.496945381164551, -1.982919454574585, -1.4688937664031982, -0.9548680782318115, -0.4408421516418457, 0.07318353652954102, 0.5872092247009277, 1.1012349128723145, 1.6152607202529907, 2.129286527633667, 2.6433122158050537, 3.1573379039764404, 3.6713638305664062, 4.185389518737793, 4.69941520690918, 5.213440895080566, 5.727466583251953, 6.24149227142334, 6.755517959594727, 7.269543647766113, 7.783569812774658, 8.297595977783203, 8.811620712280273, 9.32564640045166, 9.839672088623047, 10.353697776794434, 10.86772346496582, 11.381749153137207, 11.895774841308594, 12.409801483154297, 12.923827171325684, 13.43785285949707, 13.951878547668457, 14.465904235839844, 14.97992992401123, 15.493955612182617, 16.00798225402832, 16.52200698852539, 17.036033630371094, 17.550060272216797, 18.064085006713867, 18.57811164855957, 19.09213638305664, 19.606163024902344, 20.120187759399414, 20.634214401245117, 21.148239135742188]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 3.0, 5.0, 9.0, 9.0, 17.0, 20.0, 17.0, 31.0, 46.0, 58.0, 92.0, 128.0, 217.0, 325.0, 552.0, 1108.0, 2494.0, 6804.0, 23769.0, 107021.0, 509476.0, 313602.0, 59767.0, 14573.0, 4510.0, 1798.0, 844.0, 431.0, 254.0, 156.0, 117.0, 85.0, 53.0, 36.0, 30.0, 23.0, 19.0, 16.0, 14.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.7982177734375, -5.615966796875, -5.4337158203125, -5.25146484375, -5.0692138671875, -4.886962890625, -4.7047119140625, -4.5224609375, -4.3402099609375, -4.157958984375, -3.9757080078125, -3.79345703125, -3.6112060546875, -3.428955078125, -3.2467041015625, -3.064453125, -2.8822021484375, -2.699951171875, -2.5177001953125, -2.33544921875, -2.1531982421875, -1.970947265625, -1.7886962890625, -1.6064453125, -1.4241943359375, -1.241943359375, -1.0596923828125, -0.87744140625, -0.6951904296875, -0.512939453125, -0.3306884765625, -0.1484375, 0.0338134765625, 0.216064453125, 0.3983154296875, 0.58056640625, 0.7628173828125, 0.945068359375, 1.1273193359375, 1.3095703125, 1.4918212890625, 1.674072265625, 1.8563232421875, 2.03857421875, 2.2208251953125, 2.403076171875, 2.5853271484375, 2.767578125, 2.9498291015625, 3.132080078125, 3.3143310546875, 3.49658203125, 3.6788330078125, 3.861083984375, 4.0433349609375, 4.2255859375, 4.4078369140625, 4.590087890625, 4.7723388671875, 4.95458984375, 5.1368408203125, 5.319091796875, 5.5013427734375, 5.68359375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 7.0, 19.0, 14.0, 32.0, 38.0, 41.0, 56.0, 76.0, 70.0, 94.0, 91.0, 77.0, 79.0, 60.0, 64.0, 50.0, 45.0, 22.0, 19.0, 13.0, 7.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.646484375, -1.588775634765625, -1.53106689453125, -1.473358154296875, -1.4156494140625, -1.357940673828125, -1.30023193359375, -1.242523193359375, -1.184814453125, -1.127105712890625, -1.06939697265625, -1.011688232421875, -0.9539794921875, -0.896270751953125, -0.83856201171875, -0.780853271484375, -0.72314453125, -0.665435791015625, -0.60772705078125, -0.550018310546875, -0.4923095703125, -0.434600830078125, -0.37689208984375, -0.319183349609375, -0.261474609375, -0.203765869140625, -0.14605712890625, -0.088348388671875, -0.0306396484375, 0.027069091796875, 0.08477783203125, 0.142486572265625, 0.2001953125, 0.257904052734375, 0.31561279296875, 0.373321533203125, 0.4310302734375, 0.488739013671875, 0.54644775390625, 0.604156494140625, 0.661865234375, 0.719573974609375, 0.77728271484375, 0.834991455078125, 0.8927001953125, 0.950408935546875, 1.00811767578125, 1.065826416015625, 1.12353515625, 1.181243896484375, 1.23895263671875, 1.296661376953125, 1.3543701171875, 1.412078857421875, 1.46978759765625, 1.527496337890625, 1.585205078125, 1.642913818359375, 1.70062255859375, 1.758331298828125, 1.8160400390625, 1.873748779296875, 1.93145751953125, 1.989166259765625, 2.046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 8.0, 8.0, 12.0, 16.0, 23.0, 38.0, 57.0, 86.0, 214.0, 446.0, 1178.0, 4499.0, 26593.0, 386221.0, 582293.0, 38437.0, 5958.0, 1434.0, 476.0, 243.0, 123.0, 56.0, 38.0, 21.0, 14.0, 10.0, 15.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.45703125, -6.17730712890625, -5.8975830078125, -5.61785888671875, -5.338134765625, -5.05841064453125, -4.7786865234375, -4.49896240234375, -4.21923828125, -3.93951416015625, -3.6597900390625, -3.38006591796875, -3.100341796875, -2.82061767578125, -2.5408935546875, -2.26116943359375, -1.9814453125, -1.70172119140625, -1.4219970703125, -1.14227294921875, -0.862548828125, -0.58282470703125, -0.3031005859375, -0.02337646484375, 0.25634765625, 0.53607177734375, 0.8157958984375, 1.09552001953125, 1.375244140625, 1.65496826171875, 1.9346923828125, 2.21441650390625, 2.494140625, 2.77386474609375, 3.0535888671875, 3.33331298828125, 3.613037109375, 3.89276123046875, 4.1724853515625, 4.45220947265625, 4.73193359375, 5.01165771484375, 5.2913818359375, 5.57110595703125, 5.850830078125, 6.13055419921875, 6.4102783203125, 6.69000244140625, 6.9697265625, 7.24945068359375, 7.5291748046875, 7.80889892578125, 8.088623046875, 8.36834716796875, 8.6480712890625, 8.92779541015625, 9.20751953125, 9.48724365234375, 9.7669677734375, 10.04669189453125, 10.326416015625, 10.60614013671875, 10.8858642578125, 11.16558837890625, 11.4453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 1.0, 13.0, 7.0, 14.0, 23.0, 23.0, 31.0, 37.0, 37.0, 54.0, 54.0, 66.0, 68.0, 77.0, 72.0, 64.0, 65.0, 59.0, 47.0, 44.0, 32.0, 24.0, 12.0, 13.0, 12.0, 16.0, 6.0, 5.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.890625, -4.6749267578125, -4.459228515625, -4.2435302734375, -4.02783203125, -3.8121337890625, -3.596435546875, -3.3807373046875, -3.1650390625, -2.9493408203125, -2.733642578125, -2.5179443359375, -2.30224609375, -2.0865478515625, -1.870849609375, -1.6551513671875, -1.439453125, -1.2237548828125, -1.008056640625, -0.7923583984375, -0.57666015625, -0.3609619140625, -0.145263671875, 0.0704345703125, 0.2861328125, 0.5018310546875, 0.717529296875, 0.9332275390625, 1.14892578125, 1.3646240234375, 1.580322265625, 1.7960205078125, 2.01171875, 2.2274169921875, 2.443115234375, 2.6588134765625, 2.87451171875, 3.0902099609375, 3.305908203125, 3.5216064453125, 3.7373046875, 3.9530029296875, 4.168701171875, 4.3843994140625, 4.60009765625, 4.8157958984375, 5.031494140625, 5.2471923828125, 5.462890625, 5.6785888671875, 5.894287109375, 6.1099853515625, 6.32568359375, 6.5413818359375, 6.757080078125, 6.9727783203125, 7.1884765625, 7.4041748046875, 7.619873046875, 7.8355712890625, 8.05126953125, 8.2669677734375, 8.482666015625, 8.6983642578125, 8.9140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 3.0, 13.0, 11.0, 19.0, 15.0, 33.0, 48.0, 85.0, 122.0, 299.0, 651.0, 1725.0, 6770.0, 52796.0, 664322.0, 294190.0, 21487.0, 3797.0, 1170.0, 477.0, 216.0, 118.0, 66.0, 44.0, 16.0, 16.0, 7.0, 2.0, 9.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.935546875, -2.829986572265625, -2.72442626953125, -2.618865966796875, -2.5133056640625, -2.407745361328125, -2.30218505859375, -2.196624755859375, -2.091064453125, -1.985504150390625, -1.87994384765625, -1.774383544921875, -1.6688232421875, -1.563262939453125, -1.45770263671875, -1.352142333984375, -1.24658203125, -1.141021728515625, -1.03546142578125, -0.929901123046875, -0.8243408203125, -0.718780517578125, -0.61322021484375, -0.507659912109375, -0.402099609375, -0.296539306640625, -0.19097900390625, -0.085418701171875, 0.0201416015625, 0.125701904296875, 0.23126220703125, 0.336822509765625, 0.4423828125, 0.547943115234375, 0.65350341796875, 0.759063720703125, 0.8646240234375, 0.970184326171875, 1.07574462890625, 1.181304931640625, 1.286865234375, 1.392425537109375, 1.49798583984375, 1.603546142578125, 1.7091064453125, 1.814666748046875, 1.92022705078125, 2.025787353515625, 2.13134765625, 2.236907958984375, 2.34246826171875, 2.448028564453125, 2.5535888671875, 2.659149169921875, 2.76470947265625, 2.870269775390625, 2.975830078125, 3.081390380859375, 3.18695068359375, 3.292510986328125, 3.3980712890625, 3.503631591796875, 3.60919189453125, 3.714752197265625, 3.8203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 1.0, 3.0, 6.0, 8.0, 7.0, 15.0, 16.0, 26.0, 28.0, 43.0, 53.0, 51.0, 83.0, 96.0, 112.0, 82.0, 67.0, 52.0, 47.0, 46.0, 32.0, 31.0, 15.0, 8.0, 14.0, 10.0, 10.0, 3.0, 4.0, 4.0, 10.0, 6.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027871131896972656, -0.00027015432715415955, -0.00026159733533859253, -0.0002530403435230255, -0.0002444833517074585, -0.00023592635989189148, -0.00022736936807632446, -0.00021881237626075745, -0.00021025538444519043, -0.0002016983926296234, -0.0001931414008140564, -0.00018458440899848938, -0.00017602741718292236, -0.00016747042536735535, -0.00015891343355178833, -0.0001503564417362213, -0.0001417994499206543, -0.00013324245810508728, -0.00012468546628952026, -0.00011612847447395325, -0.00010757148265838623, -9.901449084281921e-05, -9.04574990272522e-05, -8.190050721168518e-05, -7.334351539611816e-05, -6.478652358055115e-05, -5.622953176498413e-05, -4.7672539949417114e-05, -3.91155481338501e-05, -3.055855631828308e-05, -2.2001564502716064e-05, -1.3444572687149048e-05, -4.887580871582031e-06, 3.6694109439849854e-06, 1.2226402759552002e-05, 2.078339457511902e-05, 2.9340386390686035e-05, 3.789737820625305e-05, 4.645437002182007e-05, 5.5011361837387085e-05, 6.35683536529541e-05, 7.212534546852112e-05, 8.068233728408813e-05, 8.923932909965515e-05, 9.779632091522217e-05, 0.00010635331273078918, 0.0001149103045463562, 0.00012346729636192322, 0.00013202428817749023, 0.00014058127999305725, 0.00014913827180862427, 0.00015769526362419128, 0.0001662522554397583, 0.00017480924725532532, 0.00018336623907089233, 0.00019192323088645935, 0.00020048022270202637, 0.00020903721451759338, 0.0002175942063331604, 0.00022615119814872742, 0.00023470818996429443, 0.00024326518177986145, 0.00025182217359542847, 0.0002603791654109955, 0.0002689361572265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 9.0, 6.0, 7.0, 9.0, 18.0, 22.0, 37.0, 57.0, 112.0, 224.0, 469.0, 1154.0, 3191.0, 12462.0, 93765.0, 692161.0, 214477.0, 22596.0, 4897.0, 1545.0, 668.0, 298.0, 162.0, 80.0, 40.0, 25.0, 23.0, 5.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.87109375, -2.774322509765625, -2.67755126953125, -2.580780029296875, -2.4840087890625, -2.387237548828125, -2.29046630859375, -2.193695068359375, -2.096923828125, -2.000152587890625, -1.90338134765625, -1.806610107421875, -1.7098388671875, -1.613067626953125, -1.51629638671875, -1.419525146484375, -1.32275390625, -1.225982666015625, -1.12921142578125, -1.032440185546875, -0.9356689453125, -0.838897705078125, -0.74212646484375, -0.645355224609375, -0.548583984375, -0.451812744140625, -0.35504150390625, -0.258270263671875, -0.1614990234375, -0.064727783203125, 0.03204345703125, 0.128814697265625, 0.2255859375, 0.322357177734375, 0.41912841796875, 0.515899658203125, 0.6126708984375, 0.709442138671875, 0.80621337890625, 0.902984619140625, 0.999755859375, 1.096527099609375, 1.19329833984375, 1.290069580078125, 1.3868408203125, 1.483612060546875, 1.58038330078125, 1.677154541015625, 1.77392578125, 1.870697021484375, 1.96746826171875, 2.064239501953125, 2.1610107421875, 2.257781982421875, 2.35455322265625, 2.451324462890625, 2.548095703125, 2.644866943359375, 2.74163818359375, 2.838409423828125, 2.9351806640625, 3.031951904296875, 3.12872314453125, 3.225494384765625, 3.322265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 14.0, 20.0, 31.0, 36.0, 65.0, 81.0, 125.0, 119.0, 110.0, 93.0, 78.0, 52.0, 43.0, 33.0, 19.0, 9.0, 10.0, 12.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.291015625, -2.2142333984375, -2.137451171875, -2.0606689453125, -1.98388671875, -1.9071044921875, -1.830322265625, -1.7535400390625, -1.6767578125, -1.5999755859375, -1.523193359375, -1.4464111328125, -1.36962890625, -1.2928466796875, -1.216064453125, -1.1392822265625, -1.0625, -0.9857177734375, -0.908935546875, -0.8321533203125, -0.75537109375, -0.6785888671875, -0.601806640625, -0.5250244140625, -0.4482421875, -0.3714599609375, -0.294677734375, -0.2178955078125, -0.14111328125, -0.0643310546875, 0.012451171875, 0.0892333984375, 0.166015625, 0.2427978515625, 0.319580078125, 0.3963623046875, 0.47314453125, 0.5499267578125, 0.626708984375, 0.7034912109375, 0.7802734375, 0.8570556640625, 0.933837890625, 1.0106201171875, 1.08740234375, 1.1641845703125, 1.240966796875, 1.3177490234375, 1.39453125, 1.4713134765625, 1.548095703125, 1.6248779296875, 1.70166015625, 1.7784423828125, 1.855224609375, 1.9320068359375, 2.0087890625, 2.0855712890625, 2.162353515625, 2.2391357421875, 2.31591796875, 2.3927001953125, 2.469482421875, 2.5462646484375, 2.623046875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 15.0, 39.0, 111.0, 308.0, 307.0, 123.0, 57.0, 13.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.99281311035156, -69.01544952392578, -67.03807830810547, -65.06071472167969, -63.083351135253906, -61.10598373413086, -59.12861633300781, -57.15125274658203, -55.17388916015625, -53.1965217590332, -51.21915817260742, -49.241790771484375, -47.264427185058594, -45.28705978393555, -43.3096923828125, -41.33232879638672, -39.35496139526367, -37.377593994140625, -35.400230407714844, -33.4228630065918, -31.445499420166016, -29.46813201904297, -27.490766525268555, -25.51340103149414, -23.536035537719727, -21.558670043945312, -19.5813045501709, -17.603939056396484, -15.626572608947754, -13.64920711517334, -11.67184066772461, -9.694475173950195, -7.717113494873047, -5.739748001098633, -3.7623820304870605, -1.7850160598754883, 0.19234943389892578, 2.16971492767334, 4.14708137512207, 6.124446868896484, 8.101812362670898, 10.079177856445312, 12.056543350219727, 14.033909797668457, 16.011276245117188, 17.98863983154297, 19.966007232666016, 21.94337272644043, 23.920738220214844, 25.898103713989258, 27.875469207763672, 29.85283660888672, 31.8302001953125, 33.80756759643555, 35.784934997558594, 37.762298583984375, 39.739662170410156, 41.7170295715332, 43.694393157958984, 45.67176055908203, 47.64912414550781, 49.62649154663086, 51.603858947753906, 53.58122253417969, 55.558589935302734]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 10.0, 11.0, 21.0, 15.0, 25.0, 25.0, 31.0, 36.0, 53.0, 54.0, 60.0, 62.0, 72.0, 69.0, 56.0, 69.0, 61.0, 44.0, 40.0, 36.0, 34.0, 27.0, 16.0, 14.0, 16.0, 11.0, 7.0, 2.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.55316925048828, -43.291900634765625, -42.030635833740234, -40.76936721801758, -39.50809860229492, -38.24683380126953, -36.985565185546875, -35.72429656982422, -34.46302795410156, -33.201759338378906, -31.940492630004883, -30.67922592163086, -29.417957305908203, -28.15669059753418, -26.895423889160156, -25.6341552734375, -24.37289047241211, -23.111623764038086, -21.85035514831543, -20.589088439941406, -19.32781982421875, -18.066553115844727, -16.805286407470703, -15.544018745422363, -14.282751083374023, -13.021483421325684, -11.760215759277344, -10.49894905090332, -9.23768138885498, -7.976413726806641, -6.715146541595459, -5.453879356384277, -4.1926116943359375, -2.9313442707061768, -1.670076847076416, -0.4088094234466553, 0.8524580001831055, 2.1137256622314453, 3.374992847442627, 4.636260032653809, 5.897527694702148, 7.158795356750488, 8.420063018798828, 9.681329727172852, 10.942597389221191, 12.203865051269531, 13.465131759643555, 14.726399421691895, 15.987667083740234, 17.248933792114258, 18.510202407836914, 19.771469116210938, 21.032737731933594, 22.294004440307617, 23.55527114868164, 24.816539764404297, 26.07780647277832, 27.339073181152344, 28.600341796875, 29.861608505249023, 31.122875213623047, 32.3841438293457, 33.64541244506836, 34.90667724609375, 36.167945861816406]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 1.0, 8.0, 10.0, 23.0, 28.0, 49.0, 83.0, 154.0, 254.0, 510.0, 1096.0, 2936.0, 10050.0, 57775.0, 3494350.0, 583693.0, 31355.0, 7114.0, 2436.0, 1046.0, 484.0, 305.0, 165.0, 99.0, 82.0, 56.0, 19.0, 25.0, 24.0, 22.0, 8.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.2734375, -7.926513671875, -7.57958984375, -7.232666015625, -6.8857421875, -6.538818359375, -6.19189453125, -5.844970703125, -5.498046875, -5.151123046875, -4.80419921875, -4.457275390625, -4.1103515625, -3.763427734375, -3.41650390625, -3.069580078125, -2.72265625, -2.375732421875, -2.02880859375, -1.681884765625, -1.3349609375, -0.988037109375, -0.64111328125, -0.294189453125, 0.052734375, 0.399658203125, 0.74658203125, 1.093505859375, 1.4404296875, 1.787353515625, 2.13427734375, 2.481201171875, 2.828125, 3.175048828125, 3.52197265625, 3.868896484375, 4.2158203125, 4.562744140625, 4.90966796875, 5.256591796875, 5.603515625, 5.950439453125, 6.29736328125, 6.644287109375, 6.9912109375, 7.338134765625, 7.68505859375, 8.031982421875, 8.37890625, 8.725830078125, 9.07275390625, 9.419677734375, 9.7666015625, 10.113525390625, 10.46044921875, 10.807373046875, 11.154296875, 11.501220703125, 11.84814453125, 12.195068359375, 12.5419921875, 12.888916015625, 13.23583984375, 13.582763671875, 13.9296875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 10.0, 10.0, 17.0, 34.0, 24.0, 33.0, 49.0, 70.0, 75.0, 78.0, 80.0, 88.0, 71.0, 84.0, 58.0, 51.0, 50.0, 32.0, 28.0, 20.0, 14.0, 8.0, 10.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7607421875, -1.7005767822265625, -1.640411376953125, -1.5802459716796875, -1.52008056640625, -1.4599151611328125, -1.399749755859375, -1.3395843505859375, -1.2794189453125, -1.2192535400390625, -1.159088134765625, -1.0989227294921875, -1.03875732421875, -0.9785919189453125, -0.918426513671875, -0.8582611083984375, -0.798095703125, -0.7379302978515625, -0.677764892578125, -0.6175994873046875, -0.55743408203125, -0.4972686767578125, -0.437103271484375, -0.3769378662109375, -0.3167724609375, -0.2566070556640625, -0.196441650390625, -0.1362762451171875, -0.07611083984375, -0.0159454345703125, 0.044219970703125, 0.1043853759765625, 0.16455078125, 0.2247161865234375, 0.284881591796875, 0.3450469970703125, 0.40521240234375, 0.4653778076171875, 0.525543212890625, 0.5857086181640625, 0.6458740234375, 0.7060394287109375, 0.766204833984375, 0.8263702392578125, 0.88653564453125, 0.9467010498046875, 1.006866455078125, 1.0670318603515625, 1.127197265625, 1.1873626708984375, 1.247528076171875, 1.3076934814453125, 1.36785888671875, 1.4280242919921875, 1.488189697265625, 1.5483551025390625, 1.6085205078125, 1.6686859130859375, 1.728851318359375, 1.7890167236328125, 1.84918212890625, 1.9093475341796875, 1.969512939453125, 2.0296783447265625, 2.08984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 16.0, 28.0, 40.0, 49.0, 62.0, 118.0, 196.0, 396.0, 947.0, 2645.0, 10187.0, 229105.0, 3916403.0, 26730.0, 4670.0, 1456.0, 537.0, 254.0, 145.0, 89.0, 70.0, 36.0, 26.0, 20.0, 19.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.0390625, -14.5416259765625, -14.044189453125, -13.5467529296875, -13.04931640625, -12.5518798828125, -12.054443359375, -11.5570068359375, -11.0595703125, -10.5621337890625, -10.064697265625, -9.5672607421875, -9.06982421875, -8.5723876953125, -8.074951171875, -7.5775146484375, -7.080078125, -6.5826416015625, -6.085205078125, -5.5877685546875, -5.09033203125, -4.5928955078125, -4.095458984375, -3.5980224609375, -3.1005859375, -2.6031494140625, -2.105712890625, -1.6082763671875, -1.11083984375, -0.6134033203125, -0.115966796875, 0.3814697265625, 0.87890625, 1.3763427734375, 1.873779296875, 2.3712158203125, 2.86865234375, 3.3660888671875, 3.863525390625, 4.3609619140625, 4.8583984375, 5.3558349609375, 5.853271484375, 6.3507080078125, 6.84814453125, 7.3455810546875, 7.843017578125, 8.3404541015625, 8.837890625, 9.3353271484375, 9.832763671875, 10.3302001953125, 10.82763671875, 11.3250732421875, 11.822509765625, 12.3199462890625, 12.8173828125, 13.3148193359375, 13.812255859375, 14.3096923828125, 14.80712890625, 15.3045654296875, 15.802001953125, 16.2994384765625, 16.796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 13.0, 16.0, 46.0, 97.0, 450.0, 2773.0, 510.0, 86.0, 41.0, 17.0, 7.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.049072265625, -7.78564453125, -7.522216796875, -7.2587890625, -6.995361328125, -6.73193359375, -6.468505859375, -6.205078125, -5.941650390625, -5.67822265625, -5.414794921875, -5.1513671875, -4.887939453125, -4.62451171875, -4.361083984375, -4.09765625, -3.834228515625, -3.57080078125, -3.307373046875, -3.0439453125, -2.780517578125, -2.51708984375, -2.253662109375, -1.990234375, -1.726806640625, -1.46337890625, -1.199951171875, -0.9365234375, -0.673095703125, -0.40966796875, -0.146240234375, 0.1171875, 0.380615234375, 0.64404296875, 0.907470703125, 1.1708984375, 1.434326171875, 1.69775390625, 1.961181640625, 2.224609375, 2.488037109375, 2.75146484375, 3.014892578125, 3.2783203125, 3.541748046875, 3.80517578125, 4.068603515625, 4.33203125, 4.595458984375, 4.85888671875, 5.122314453125, 5.3857421875, 5.649169921875, 5.91259765625, 6.176025390625, 6.439453125, 6.702880859375, 6.96630859375, 7.229736328125, 7.4931640625, 7.756591796875, 8.02001953125, 8.283447265625, 8.546875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 39.0, 78.0, 211.0, 319.0, 189.0, 102.0, 33.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.20782470703125, -22.139741897583008, -21.071659088134766, -20.00357437133789, -18.93549156188965, -17.867408752441406, -16.79932403564453, -15.731241226196289, -14.663158416748047, -13.595075607299805, -12.526991844177246, -11.458908081054688, -10.390825271606445, -9.322742462158203, -8.254658699035645, -7.186575412750244, -6.118492126464844, -5.050408840179443, -3.982325553894043, -2.9142422676086426, -1.8461589813232422, -0.7780756950378418, 0.2900075912475586, 1.358090877532959, 2.4261741638183594, 3.4942574501037598, 4.56234073638916, 5.6304240226745605, 6.698507308959961, 7.766590595245361, 8.834673881530762, 9.90275764465332, 10.970840454101562, 12.038923263549805, 13.107007026672363, 14.175090789794922, 15.243173599243164, 16.311256408691406, 17.37934112548828, 18.447423934936523, 19.515506744384766, 20.583589553833008, 21.65167236328125, 22.719757080078125, 23.787839889526367, 24.85592269897461, 25.924007415771484, 26.992090225219727, 28.06017303466797, 29.12825584411621, 30.196338653564453, 31.264423370361328, 32.33250427246094, 33.40058898925781, 34.46867370605469, 35.5367546081543, 36.60483932495117, 37.67292404174805, 38.741004943847656, 39.80908966064453, 40.877174377441406, 41.945255279541016, 43.01333999633789, 44.0814208984375, 45.149505615234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 14.0, 25.0, 19.0, 20.0, 29.0, 38.0, 39.0, 35.0, 55.0, 58.0, 72.0, 80.0, 66.0, 63.0, 72.0, 58.0, 54.0, 34.0, 29.0, 28.0, 32.0, 17.0, 18.0, 10.0, 9.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.771625518798828, -19.298376083374023, -18.82512664794922, -18.35187530517578, -17.878625869750977, -17.405376434326172, -16.932126998901367, -16.458877563476562, -15.985628128051758, -15.512378692626953, -15.039128303527832, -14.565878868103027, -14.092629432678223, -13.619379043579102, -13.146129608154297, -12.672880172729492, -12.199629783630371, -11.726380348205566, -11.253129959106445, -10.77988052368164, -10.306631088256836, -9.833381652832031, -9.36013126373291, -8.886881828308105, -8.413631439208984, -7.9403815269470215, -7.467132091522217, -6.993882179260254, -6.520632743835449, -6.047382831573486, -5.574132919311523, -5.100883483886719, -4.627634048461914, -4.154384136199951, -3.6811347007751465, -3.2078847885131836, -2.7346351146698, -2.261385440826416, -1.7881355285644531, -1.3148858547210693, -0.8416361808776855, -0.368386447429657, 0.10486328601837158, 0.5781130790710449, 1.0513627529144287, 1.5246124267578125, 1.9978623390197754, 2.471112012863159, 2.944361686706543, 3.4176113605499268, 3.8908610343933105, 4.364110946655273, 4.837360382080078, 5.310610294342041, 5.783860206604004, 6.257109642028809, 6.7303595542907715, 7.203609466552734, 7.676858901977539, 8.150108337402344, 8.623358726501465, 9.09660816192627, 9.56985855102539, 10.043107986450195, 10.516357421875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 15.0, 15.0, 38.0, 54.0, 112.0, 152.0, 268.0, 543.0, 1215.0, 3142.0, 12384.0, 82274.0, 629027.0, 277814.0, 31618.0, 6111.0, 1997.0, 814.0, 403.0, 209.0, 128.0, 77.0, 44.0, 23.0, 26.0, 11.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.8973388671875, -7.622802734375, -7.3482666015625, -7.07373046875, -6.7991943359375, -6.524658203125, -6.2501220703125, -5.9755859375, -5.7010498046875, -5.426513671875, -5.1519775390625, -4.87744140625, -4.6029052734375, -4.328369140625, -4.0538330078125, -3.779296875, -3.5047607421875, -3.230224609375, -2.9556884765625, -2.68115234375, -2.4066162109375, -2.132080078125, -1.8575439453125, -1.5830078125, -1.3084716796875, -1.033935546875, -0.7593994140625, -0.48486328125, -0.2103271484375, 0.064208984375, 0.3387451171875, 0.61328125, 0.8878173828125, 1.162353515625, 1.4368896484375, 1.71142578125, 1.9859619140625, 2.260498046875, 2.5350341796875, 2.8095703125, 3.0841064453125, 3.358642578125, 3.6331787109375, 3.90771484375, 4.1822509765625, 4.456787109375, 4.7313232421875, 5.005859375, 5.2803955078125, 5.554931640625, 5.8294677734375, 6.10400390625, 6.3785400390625, 6.653076171875, 6.9276123046875, 7.2021484375, 7.4766845703125, 7.751220703125, 8.0257568359375, 8.30029296875, 8.5748291015625, 8.849365234375, 9.1239013671875, 9.3984375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 14.0, 23.0, 26.0, 48.0, 73.0, 65.0, 73.0, 107.0, 106.0, 101.0, 85.0, 81.0, 63.0, 45.0, 37.0, 15.0, 11.0, 10.0, 10.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.482421875, -2.41070556640625, -2.3389892578125, -2.26727294921875, -2.195556640625, -2.12384033203125, -2.0521240234375, -1.98040771484375, -1.90869140625, -1.83697509765625, -1.7652587890625, -1.69354248046875, -1.621826171875, -1.55010986328125, -1.4783935546875, -1.40667724609375, -1.3349609375, -1.26324462890625, -1.1915283203125, -1.11981201171875, -1.048095703125, -0.97637939453125, -0.9046630859375, -0.83294677734375, -0.76123046875, -0.68951416015625, -0.6177978515625, -0.54608154296875, -0.474365234375, -0.40264892578125, -0.3309326171875, -0.25921630859375, -0.1875, -0.11578369140625, -0.0440673828125, 0.02764892578125, 0.099365234375, 0.17108154296875, 0.2427978515625, 0.31451416015625, 0.38623046875, 0.45794677734375, 0.5296630859375, 0.60137939453125, 0.673095703125, 0.74481201171875, 0.8165283203125, 0.88824462890625, 0.9599609375, 1.03167724609375, 1.1033935546875, 1.17510986328125, 1.246826171875, 1.31854248046875, 1.3902587890625, 1.46197509765625, 1.53369140625, 1.60540771484375, 1.6771240234375, 1.74884033203125, 1.820556640625, 1.89227294921875, 1.9639892578125, 2.03570556640625, 2.107421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 4.0, 11.0, 15.0, 16.0, 33.0, 46.0, 70.0, 120.0, 177.0, 282.0, 524.0, 944.0, 1944.0, 3684.0, 8137.0, 18565.0, 48224.0, 140090.0, 360766.0, 297383.0, 103045.0, 36744.0, 14810.0, 6583.0, 2995.0, 1531.0, 733.0, 450.0, 225.0, 133.0, 80.0, 61.0, 32.0, 27.0, 23.0, 5.0, 17.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.771484375, -3.663299560546875, -3.55511474609375, -3.446929931640625, -3.3387451171875, -3.230560302734375, -3.12237548828125, -3.014190673828125, -2.906005859375, -2.797821044921875, -2.68963623046875, -2.581451416015625, -2.4732666015625, -2.365081787109375, -2.25689697265625, -2.148712158203125, -2.04052734375, -1.932342529296875, -1.82415771484375, -1.715972900390625, -1.6077880859375, -1.499603271484375, -1.39141845703125, -1.283233642578125, -1.175048828125, -1.066864013671875, -0.95867919921875, -0.850494384765625, -0.7423095703125, -0.634124755859375, -0.52593994140625, -0.417755126953125, -0.3095703125, -0.201385498046875, -0.09320068359375, 0.014984130859375, 0.1231689453125, 0.231353759765625, 0.33953857421875, 0.447723388671875, 0.555908203125, 0.664093017578125, 0.77227783203125, 0.880462646484375, 0.9886474609375, 1.096832275390625, 1.20501708984375, 1.313201904296875, 1.42138671875, 1.529571533203125, 1.63775634765625, 1.745941162109375, 1.8541259765625, 1.962310791015625, 2.07049560546875, 2.178680419921875, 2.286865234375, 2.395050048828125, 2.50323486328125, 2.611419677734375, 2.7196044921875, 2.827789306640625, 2.93597412109375, 3.044158935546875, 3.15234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 4.0, 12.0, 14.0, 7.0, 9.0, 9.0, 14.0, 17.0, 20.0, 21.0, 28.0, 37.0, 33.0, 39.0, 48.0, 37.0, 52.0, 47.0, 36.0, 56.0, 28.0, 33.0, 47.0, 43.0, 44.0, 30.0, 29.0, 31.0, 20.0, 23.0, 19.0, 21.0, 14.0, 17.0, 10.0, 9.0, 8.0, 12.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-4.765625, -4.6239013671875, -4.482177734375, -4.3404541015625, -4.19873046875, -4.0570068359375, -3.915283203125, -3.7735595703125, -3.6318359375, -3.4901123046875, -3.348388671875, -3.2066650390625, -3.06494140625, -2.9232177734375, -2.781494140625, -2.6397705078125, -2.498046875, -2.3563232421875, -2.214599609375, -2.0728759765625, -1.93115234375, -1.7894287109375, -1.647705078125, -1.5059814453125, -1.3642578125, -1.2225341796875, -1.080810546875, -0.9390869140625, -0.79736328125, -0.6556396484375, -0.513916015625, -0.3721923828125, -0.23046875, -0.0887451171875, 0.052978515625, 0.1947021484375, 0.33642578125, 0.4781494140625, 0.619873046875, 0.7615966796875, 0.9033203125, 1.0450439453125, 1.186767578125, 1.3284912109375, 1.47021484375, 1.6119384765625, 1.753662109375, 1.8953857421875, 2.037109375, 2.1788330078125, 2.320556640625, 2.4622802734375, 2.60400390625, 2.7457275390625, 2.887451171875, 3.0291748046875, 3.1708984375, 3.3126220703125, 3.454345703125, 3.5960693359375, 3.73779296875, 3.8795166015625, 4.021240234375, 4.1629638671875, 4.3046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 6.0, 4.0, 2.0, 3.0, 6.0, 9.0, 14.0, 10.0, 24.0, 26.0, 61.0, 98.0, 187.0, 397.0, 1093.0, 3624.0, 15678.0, 91649.0, 539043.0, 333790.0, 49651.0, 9181.0, 2468.0, 839.0, 316.0, 157.0, 85.0, 42.0, 27.0, 19.0, 16.0, 11.0, 5.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.012847900390625, -1.94757080078125, -1.882293701171875, -1.8170166015625, -1.751739501953125, -1.68646240234375, -1.621185302734375, -1.555908203125, -1.490631103515625, -1.42535400390625, -1.360076904296875, -1.2947998046875, -1.229522705078125, -1.16424560546875, -1.098968505859375, -1.03369140625, -0.968414306640625, -0.90313720703125, -0.837860107421875, -0.7725830078125, -0.707305908203125, -0.64202880859375, -0.576751708984375, -0.511474609375, -0.446197509765625, -0.38092041015625, -0.315643310546875, -0.2503662109375, -0.185089111328125, -0.11981201171875, -0.054534912109375, 0.0107421875, 0.076019287109375, 0.14129638671875, 0.206573486328125, 0.2718505859375, 0.337127685546875, 0.40240478515625, 0.467681884765625, 0.532958984375, 0.598236083984375, 0.66351318359375, 0.728790283203125, 0.7940673828125, 0.859344482421875, 0.92462158203125, 0.989898681640625, 1.05517578125, 1.120452880859375, 1.18572998046875, 1.251007080078125, 1.3162841796875, 1.381561279296875, 1.44683837890625, 1.512115478515625, 1.577392578125, 1.642669677734375, 1.70794677734375, 1.773223876953125, 1.8385009765625, 1.903778076171875, 1.96905517578125, 2.034332275390625, 2.099609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 3.0, 8.0, 9.0, 8.0, 7.0, 17.0, 15.0, 25.0, 33.0, 33.0, 41.0, 64.0, 101.0, 95.0, 124.0, 95.0, 74.0, 71.0, 50.0, 25.0, 23.0, 18.0, 9.0, 12.0, 7.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003345012664794922, -0.0003255307674407959, -0.0003165602684020996, -0.0003075897693634033, -0.00029861927032470703, -0.00028964877128601074, -0.00028067827224731445, -0.00027170777320861816, -0.0002627372741699219, -0.0002537667751312256, -0.0002447962760925293, -0.000235825777053833, -0.00022685527801513672, -0.00021788477897644043, -0.00020891427993774414, -0.00019994378089904785, -0.00019097328186035156, -0.00018200278282165527, -0.00017303228378295898, -0.0001640617847442627, -0.0001550912857055664, -0.00014612078666687012, -0.00013715028762817383, -0.00012817978858947754, -0.00011920928955078125, -0.00011023879051208496, -0.00010126829147338867, -9.229779243469238e-05, -8.33272933959961e-05, -7.43567943572998e-05, -6.538629531860352e-05, -5.6415796279907227e-05, -4.744529724121094e-05, -3.847479820251465e-05, -2.950429916381836e-05, -2.053380012512207e-05, -1.1563301086425781e-05, -2.592802047729492e-06, 6.377696990966797e-06, 1.5348196029663086e-05, 2.4318695068359375e-05, 3.3289194107055664e-05, 4.225969314575195e-05, 5.123019218444824e-05, 6.020069122314453e-05, 6.917119026184082e-05, 7.814168930053711e-05, 8.71121883392334e-05, 9.608268737792969e-05, 0.00010505318641662598, 0.00011402368545532227, 0.00012299418449401855, 0.00013196468353271484, 0.00014093518257141113, 0.00014990568161010742, 0.0001588761806488037, 0.0001678466796875, 0.0001768171787261963, 0.00018578767776489258, 0.00019475817680358887, 0.00020372867584228516, 0.00021269917488098145, 0.00022166967391967773, 0.00023064017295837402, 0.0002396106719970703]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 5.0, 9.0, 12.0, 22.0, 25.0, 41.0, 70.0, 83.0, 129.0, 223.0, 329.0, 589.0, 1045.0, 2161.0, 4914.0, 12564.0, 36366.0, 113364.0, 373484.0, 345562.0, 103185.0, 33399.0, 11664.0, 4587.0, 2074.0, 1005.0, 607.0, 347.0, 230.0, 142.0, 106.0, 62.0, 41.0, 24.0, 24.0, 12.0, 18.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-1.5791015625, -1.535186767578125, -1.49127197265625, -1.447357177734375, -1.4034423828125, -1.359527587890625, -1.31561279296875, -1.271697998046875, -1.227783203125, -1.183868408203125, -1.13995361328125, -1.096038818359375, -1.0521240234375, -1.008209228515625, -0.96429443359375, -0.920379638671875, -0.87646484375, -0.832550048828125, -0.78863525390625, -0.744720458984375, -0.7008056640625, -0.656890869140625, -0.61297607421875, -0.569061279296875, -0.525146484375, -0.481231689453125, -0.43731689453125, -0.393402099609375, -0.3494873046875, -0.305572509765625, -0.26165771484375, -0.217742919921875, -0.173828125, -0.129913330078125, -0.08599853515625, -0.042083740234375, 0.0018310546875, 0.045745849609375, 0.08966064453125, 0.133575439453125, 0.177490234375, 0.221405029296875, 0.26531982421875, 0.309234619140625, 0.3531494140625, 0.397064208984375, 0.44097900390625, 0.484893798828125, 0.52880859375, 0.572723388671875, 0.61663818359375, 0.660552978515625, 0.7044677734375, 0.748382568359375, 0.79229736328125, 0.836212158203125, 0.880126953125, 0.924041748046875, 0.96795654296875, 1.011871337890625, 1.0557861328125, 1.099700927734375, 1.14361572265625, 1.187530517578125, 1.2314453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 2.0, 8.0, 7.0, 14.0, 17.0, 22.0, 28.0, 30.0, 40.0, 49.0, 61.0, 80.0, 85.0, 96.0, 82.0, 66.0, 59.0, 49.0, 39.0, 36.0, 21.0, 25.0, 15.0, 16.0, 7.0, 6.0, 3.0, 8.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.482421875, -1.4353485107421875, -1.388275146484375, -1.3412017822265625, -1.29412841796875, -1.2470550537109375, -1.199981689453125, -1.1529083251953125, -1.1058349609375, -1.0587615966796875, -1.011688232421875, -0.9646148681640625, -0.91754150390625, -0.8704681396484375, -0.823394775390625, -0.7763214111328125, -0.729248046875, -0.6821746826171875, -0.635101318359375, -0.5880279541015625, -0.54095458984375, -0.4938812255859375, -0.446807861328125, -0.3997344970703125, -0.3526611328125, -0.3055877685546875, -0.258514404296875, -0.2114410400390625, -0.16436767578125, -0.1172943115234375, -0.070220947265625, -0.0231475830078125, 0.02392578125, 0.0709991455078125, 0.118072509765625, 0.1651458740234375, 0.21221923828125, 0.2592926025390625, 0.306365966796875, 0.3534393310546875, 0.4005126953125, 0.4475860595703125, 0.494659423828125, 0.5417327880859375, 0.58880615234375, 0.6358795166015625, 0.682952880859375, 0.7300262451171875, 0.777099609375, 0.8241729736328125, 0.871246337890625, 0.9183197021484375, 0.96539306640625, 1.0124664306640625, 1.059539794921875, 1.1066131591796875, 1.1536865234375, 1.2007598876953125, 1.247833251953125, 1.2949066162109375, 1.34197998046875, 1.3890533447265625, 1.436126708984375, 1.4832000732421875, 1.5302734375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 9.0, 18.0, 23.0, 49.0, 126.0, 168.0, 226.0, 181.0, 94.0, 44.0, 30.0, 12.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.797157287597656, -20.552026748657227, -19.30689811706543, -18.061767578125, -16.81663703918457, -15.571507453918457, -14.326377868652344, -13.081247329711914, -11.8361177444458, -10.590988159179688, -9.345857620239258, -8.100728034973145, -6.855597972869873, -5.610467910766602, -4.365338325500488, -3.1202077865600586, -1.8750782012939453, -0.6299482583999634, 0.6151816844940186, 1.860311508178711, 3.1054415702819824, 4.350571632385254, 5.595701217651367, 6.840831756591797, 8.08596134185791, 9.331090927124023, 10.576221466064453, 11.821351051330566, 13.06648063659668, 14.31161117553711, 15.556740760803223, 16.80187225341797, 18.047000885009766, 19.292131423950195, 20.537260055541992, 21.782390594482422, 23.02752113342285, 24.27265167236328, 25.517780303955078, 26.762910842895508, 28.008041381835938, 29.253171920776367, 30.498300552368164, 31.743431091308594, 32.98855972290039, 34.23369216918945, 35.47882080078125, 36.72395324707031, 37.969078063964844, 39.21420669555664, 40.4593391418457, 41.7044677734375, 42.9495964050293, 44.19472885131836, 45.439857482910156, 46.68498992919922, 47.930118560791016, 49.17524719238281, 50.420379638671875, 51.66550827026367, 52.91063690185547, 54.15576934814453, 55.40089797973633, 56.646026611328125, 57.89115905761719]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 14.0, 9.0, 12.0, 13.0, 14.0, 17.0, 19.0, 27.0, 37.0, 30.0, 34.0, 53.0, 43.0, 39.0, 45.0, 51.0, 49.0, 43.0, 50.0, 59.0, 46.0, 43.0, 37.0, 26.0, 29.0, 22.0, 30.0, 23.0, 16.0, 14.0, 16.0, 11.0, 1.0, 9.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.802770614624023, -24.875926971435547, -23.94908332824707, -23.022239685058594, -22.095394134521484, -21.16855239868164, -20.24170684814453, -19.314863204956055, -18.388019561767578, -17.4611759185791, -16.534332275390625, -15.607487678527832, -14.680644035339355, -13.753800392150879, -12.826955795288086, -11.90011215209961, -10.973268508911133, -10.046424865722656, -9.11958122253418, -8.192736625671387, -7.26589298248291, -6.339049339294434, -5.412205219268799, -4.485361099243164, -3.5585174560546875, -2.631673574447632, -1.7048296928405762, -0.7779858112335205, 0.14885807037353516, 1.0757017135620117, 2.0025458335876465, 2.9293899536132812, 3.856231689453125, 4.783075332641602, 5.709919452667236, 6.636763572692871, 7.563607215881348, 8.490450859069824, 9.417295455932617, 10.344139099121094, 11.27098274230957, 12.197826385498047, 13.124670028686523, 14.051514625549316, 14.978358268737793, 15.90520191192627, 16.832046508789062, 17.75889015197754, 18.685733795166016, 19.612577438354492, 20.53942108154297, 21.466264724731445, 22.393108367919922, 23.31995391845703, 24.246797561645508, 25.173641204833984, 26.10048484802246, 27.027328491210938, 27.954172134399414, 28.88101577758789, 29.807861328125, 30.734703063964844, 31.661548614501953, 32.58839416503906, 33.515235900878906]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 10.0, 7.0, 14.0, 20.0, 19.0, 27.0, 35.0, 54.0, 89.0, 125.0, 239.0, 420.0, 783.0, 1585.0, 3856.0, 11317.0, 55469.0, 3283588.0, 783783.0, 37709.0, 8968.0, 3134.0, 1341.0, 665.0, 373.0, 228.0, 138.0, 96.0, 46.0, 38.0, 29.0, 18.0, 15.0, 12.0, 11.0, 5.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.562744140625, -5.35595703125, -5.149169921875, -4.9423828125, -4.735595703125, -4.52880859375, -4.322021484375, -4.115234375, -3.908447265625, -3.70166015625, -3.494873046875, -3.2880859375, -3.081298828125, -2.87451171875, -2.667724609375, -2.4609375, -2.254150390625, -2.04736328125, -1.840576171875, -1.6337890625, -1.427001953125, -1.22021484375, -1.013427734375, -0.806640625, -0.599853515625, -0.39306640625, -0.186279296875, 0.0205078125, 0.227294921875, 0.43408203125, 0.640869140625, 0.84765625, 1.054443359375, 1.26123046875, 1.468017578125, 1.6748046875, 1.881591796875, 2.08837890625, 2.295166015625, 2.501953125, 2.708740234375, 2.91552734375, 3.122314453125, 3.3291015625, 3.535888671875, 3.74267578125, 3.949462890625, 4.15625, 4.363037109375, 4.56982421875, 4.776611328125, 4.9833984375, 5.190185546875, 5.39697265625, 5.603759765625, 5.810546875, 6.017333984375, 6.22412109375, 6.430908203125, 6.6376953125, 6.844482421875, 7.05126953125, 7.258056640625, 7.46484375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 8.0, 10.0, 12.0, 30.0, 33.0, 41.0, 53.0, 55.0, 75.0, 79.0, 96.0, 79.0, 74.0, 77.0, 58.0, 61.0, 41.0, 34.0, 19.0, 15.0, 16.0, 13.0, 4.0, 2.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1015625, -2.03985595703125, -1.9781494140625, -1.91644287109375, -1.854736328125, -1.79302978515625, -1.7313232421875, -1.66961669921875, -1.60791015625, -1.54620361328125, -1.4844970703125, -1.42279052734375, -1.361083984375, -1.29937744140625, -1.2376708984375, -1.17596435546875, -1.1142578125, -1.05255126953125, -0.9908447265625, -0.92913818359375, -0.867431640625, -0.80572509765625, -0.7440185546875, -0.68231201171875, -0.62060546875, -0.55889892578125, -0.4971923828125, -0.43548583984375, -0.373779296875, -0.31207275390625, -0.2503662109375, -0.18865966796875, -0.126953125, -0.06524658203125, -0.0035400390625, 0.05816650390625, 0.119873046875, 0.18157958984375, 0.2432861328125, 0.30499267578125, 0.36669921875, 0.42840576171875, 0.4901123046875, 0.55181884765625, 0.613525390625, 0.67523193359375, 0.7369384765625, 0.79864501953125, 0.8603515625, 0.92205810546875, 0.9837646484375, 1.04547119140625, 1.107177734375, 1.16888427734375, 1.2305908203125, 1.29229736328125, 1.35400390625, 1.41571044921875, 1.4774169921875, 1.53912353515625, 1.600830078125, 1.66253662109375, 1.7242431640625, 1.78594970703125, 1.84765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 9.0, 9.0, 8.0, 20.0, 18.0, 24.0, 35.0, 61.0, 77.0, 115.0, 127.0, 221.0, 363.0, 583.0, 1064.0, 2943.0, 18163.0, 521911.0, 3598056.0, 42909.0, 4671.0, 1281.0, 602.0, 323.0, 221.0, 128.0, 91.0, 62.0, 37.0, 43.0, 17.0, 19.0, 15.0, 10.0, 13.0, 10.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2891845703125, -8.039306640625, -7.7894287109375, -7.53955078125, -7.2896728515625, -7.039794921875, -6.7899169921875, -6.5400390625, -6.2901611328125, -6.040283203125, -5.7904052734375, -5.54052734375, -5.2906494140625, -5.040771484375, -4.7908935546875, -4.541015625, -4.2911376953125, -4.041259765625, -3.7913818359375, -3.54150390625, -3.2916259765625, -3.041748046875, -2.7918701171875, -2.5419921875, -2.2921142578125, -2.042236328125, -1.7923583984375, -1.54248046875, -1.2926025390625, -1.042724609375, -0.7928466796875, -0.54296875, -0.2930908203125, -0.043212890625, 0.2066650390625, 0.45654296875, 0.7064208984375, 0.956298828125, 1.2061767578125, 1.4560546875, 1.7059326171875, 1.955810546875, 2.2056884765625, 2.45556640625, 2.7054443359375, 2.955322265625, 3.2052001953125, 3.455078125, 3.7049560546875, 3.954833984375, 4.2047119140625, 4.45458984375, 4.7044677734375, 4.954345703125, 5.2042236328125, 5.4541015625, 5.7039794921875, 5.953857421875, 6.2037353515625, 6.45361328125, 6.7034912109375, 6.953369140625, 7.2032470703125, 7.453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 8.0, 6.0, 4.0, 18.0, 30.0, 63.0, 111.0, 263.0, 954.0, 1987.0, 361.0, 134.0, 58.0, 34.0, 16.0, 8.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.2890625, -4.200164794921875, -4.11126708984375, -4.022369384765625, -3.9334716796875, -3.844573974609375, -3.75567626953125, -3.666778564453125, -3.577880859375, -3.488983154296875, -3.40008544921875, -3.311187744140625, -3.2222900390625, -3.133392333984375, -3.04449462890625, -2.955596923828125, -2.86669921875, -2.777801513671875, -2.68890380859375, -2.600006103515625, -2.5111083984375, -2.422210693359375, -2.33331298828125, -2.244415283203125, -2.155517578125, -2.066619873046875, -1.97772216796875, -1.888824462890625, -1.7999267578125, -1.711029052734375, -1.62213134765625, -1.533233642578125, -1.4443359375, -1.355438232421875, -1.26654052734375, -1.177642822265625, -1.0887451171875, -0.999847412109375, -0.91094970703125, -0.822052001953125, -0.733154296875, -0.644256591796875, -0.55535888671875, -0.466461181640625, -0.3775634765625, -0.288665771484375, -0.19976806640625, -0.110870361328125, -0.02197265625, 0.066925048828125, 0.15582275390625, 0.244720458984375, 0.3336181640625, 0.422515869140625, 0.51141357421875, 0.600311279296875, 0.689208984375, 0.778106689453125, 0.86700439453125, 0.955902099609375, 1.0447998046875, 1.133697509765625, 1.22259521484375, 1.311492919921875, 1.400390625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 16.0, 36.0, 119.0, 339.0, 328.0, 118.0, 29.0, 10.0, 6.0, 1.0, 1.0], "bins": [-54.2608528137207, -53.31338882446289, -52.36592483520508, -51.418460845947266, -50.47099685668945, -49.52353286743164, -48.57606506347656, -47.62860107421875, -46.68113708496094, -45.733673095703125, -44.78620910644531, -43.8387451171875, -42.89128112792969, -41.943817138671875, -40.99635314941406, -40.04888916015625, -39.10142517089844, -38.153961181640625, -37.20649719238281, -36.259033203125, -35.31156921386719, -34.364105224609375, -33.41664123535156, -32.46917724609375, -31.521709442138672, -30.57424545288086, -29.626781463623047, -28.679317474365234, -27.73185157775879, -26.784387588500977, -25.836923599243164, -24.88945960998535, -23.94199562072754, -22.994531631469727, -22.047067642211914, -21.09960174560547, -20.152137756347656, -19.204673767089844, -18.25720977783203, -17.30974578857422, -16.362281799316406, -15.414817810058594, -14.467352867126465, -13.519888877868652, -12.57242488861084, -11.624959945678711, -10.677495956420898, -9.730031967163086, -8.78256607055664, -7.83510160446167, -6.887637615203857, -5.940173149108887, -4.992709159851074, -4.0452446937561035, -3.097780227661133, -2.1503162384033203, -1.2028522491455078, -0.25538796186447144, 0.6920763254165649, 1.639540672302246, 2.5870048999786377, 3.5344691276550293, 4.48193359375, 5.4293975830078125, 6.376862049102783]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 11.0, 14.0, 18.0, 38.0, 48.0, 49.0, 67.0, 64.0, 77.0, 73.0, 76.0, 104.0, 70.0, 59.0, 66.0, 32.0, 38.0, 35.0, 19.0, 13.0, 6.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.274557113647461, -13.862266540527344, -13.449975967407227, -13.03768539428711, -12.625394821166992, -12.213104248046875, -11.800812721252441, -11.388522148132324, -10.976231575012207, -10.56394100189209, -10.151650428771973, -9.739359855651855, -9.327068328857422, -8.914777755737305, -8.502487182617188, -8.09019660949707, -7.677906036376953, -7.265615463256836, -6.853324890136719, -6.441033840179443, -6.028743267059326, -5.616452693939209, -5.204161643981934, -4.791871070861816, -4.379580497741699, -3.967289924621582, -3.5549991130828857, -3.1427083015441895, -2.7304177284240723, -2.318127155303955, -1.9058363437652588, -1.4935455322265625, -1.0812559127807617, -0.668965220451355, -0.25667452812194824, 0.1556161642074585, 0.5679068565368652, 0.9801974296569824, 1.3924882411956787, 1.804779052734375, 2.217069625854492, 2.6293601989746094, 3.0416510105133057, 3.453941822052002, 3.866232395172119, 4.278522968292236, 4.690814018249512, 5.103104591369629, 5.515395164489746, 5.927685737609863, 6.3399763107299805, 6.752267360687256, 7.164557933807373, 7.57684850692749, 7.989139556884766, 8.401430130004883, 8.813720703125, 9.226011276245117, 9.638301849365234, 10.050592422485352, 10.462882995605469, 10.875173568725586, 11.28746509552002, 11.699755668640137, 12.112046241760254]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 7.0, 7.0, 8.0, 17.0, 26.0, 27.0, 34.0, 44.0, 83.0, 123.0, 184.0, 315.0, 537.0, 999.0, 2079.0, 4905.0, 13045.0, 39534.0, 153508.0, 489857.0, 251630.0, 60609.0, 18575.0, 6690.0, 2742.0, 1287.0, 600.0, 407.0, 207.0, 154.0, 94.0, 70.0, 31.0, 31.0, 21.0, 21.0, 13.0, 14.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.897216796875, -4.72021484375, -4.543212890625, -4.3662109375, -4.189208984375, -4.01220703125, -3.835205078125, -3.658203125, -3.481201171875, -3.30419921875, -3.127197265625, -2.9501953125, -2.773193359375, -2.59619140625, -2.419189453125, -2.2421875, -2.065185546875, -1.88818359375, -1.711181640625, -1.5341796875, -1.357177734375, -1.18017578125, -1.003173828125, -0.826171875, -0.649169921875, -0.47216796875, -0.295166015625, -0.1181640625, 0.058837890625, 0.23583984375, 0.412841796875, 0.58984375, 0.766845703125, 0.94384765625, 1.120849609375, 1.2978515625, 1.474853515625, 1.65185546875, 1.828857421875, 2.005859375, 2.182861328125, 2.35986328125, 2.536865234375, 2.7138671875, 2.890869140625, 3.06787109375, 3.244873046875, 3.421875, 3.598876953125, 3.77587890625, 3.952880859375, 4.1298828125, 4.306884765625, 4.48388671875, 4.660888671875, 4.837890625, 5.014892578125, 5.19189453125, 5.368896484375, 5.5458984375, 5.722900390625, 5.89990234375, 6.076904296875, 6.25390625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 3.0, 3.0, 18.0, 15.0, 23.0, 25.0, 42.0, 48.0, 68.0, 66.0, 67.0, 85.0, 78.0, 81.0, 62.0, 73.0, 59.0, 44.0, 33.0, 33.0, 18.0, 11.0, 12.0, 14.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.68359375, -1.624359130859375, -1.56512451171875, -1.505889892578125, -1.4466552734375, -1.387420654296875, -1.32818603515625, -1.268951416015625, -1.209716796875, -1.150482177734375, -1.09124755859375, -1.032012939453125, -0.9727783203125, -0.913543701171875, -0.85430908203125, -0.795074462890625, -0.73583984375, -0.676605224609375, -0.61737060546875, -0.558135986328125, -0.4989013671875, -0.439666748046875, -0.38043212890625, -0.321197509765625, -0.261962890625, -0.202728271484375, -0.14349365234375, -0.084259033203125, -0.0250244140625, 0.034210205078125, 0.09344482421875, 0.152679443359375, 0.2119140625, 0.271148681640625, 0.33038330078125, 0.389617919921875, 0.4488525390625, 0.508087158203125, 0.56732177734375, 0.626556396484375, 0.685791015625, 0.745025634765625, 0.80426025390625, 0.863494873046875, 0.9227294921875, 0.981964111328125, 1.04119873046875, 1.100433349609375, 1.15966796875, 1.218902587890625, 1.27813720703125, 1.337371826171875, 1.3966064453125, 1.455841064453125, 1.51507568359375, 1.574310302734375, 1.633544921875, 1.692779541015625, 1.75201416015625, 1.811248779296875, 1.8704833984375, 1.929718017578125, 1.98895263671875, 2.048187255859375, 2.107421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 11.0, 12.0, 21.0, 25.0, 36.0, 59.0, 98.0, 147.0, 220.0, 315.0, 484.0, 752.0, 1233.0, 2076.0, 3723.0, 6551.0, 12704.0, 26187.0, 57174.0, 137230.0, 291038.0, 277140.0, 126935.0, 53440.0, 24193.0, 11849.0, 6262.0, 3462.0, 1951.0, 1149.0, 748.0, 462.0, 275.0, 195.0, 143.0, 68.0, 55.0, 38.0, 32.0, 20.0, 17.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.626953125, -2.5472412109375, -2.467529296875, -2.3878173828125, -2.30810546875, -2.2283935546875, -2.148681640625, -2.0689697265625, -1.9892578125, -1.9095458984375, -1.829833984375, -1.7501220703125, -1.67041015625, -1.5906982421875, -1.510986328125, -1.4312744140625, -1.3515625, -1.2718505859375, -1.192138671875, -1.1124267578125, -1.03271484375, -0.9530029296875, -0.873291015625, -0.7935791015625, -0.7138671875, -0.6341552734375, -0.554443359375, -0.4747314453125, -0.39501953125, -0.3153076171875, -0.235595703125, -0.1558837890625, -0.076171875, 0.0035400390625, 0.083251953125, 0.1629638671875, 0.24267578125, 0.3223876953125, 0.402099609375, 0.4818115234375, 0.5615234375, 0.6412353515625, 0.720947265625, 0.8006591796875, 0.88037109375, 0.9600830078125, 1.039794921875, 1.1195068359375, 1.19921875, 1.2789306640625, 1.358642578125, 1.4383544921875, 1.51806640625, 1.5977783203125, 1.677490234375, 1.7572021484375, 1.8369140625, 1.9166259765625, 1.996337890625, 2.0760498046875, 2.15576171875, 2.2354736328125, 2.315185546875, 2.3948974609375, 2.474609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 3.0, 5.0, 9.0, 22.0, 15.0, 12.0, 21.0, 24.0, 25.0, 29.0, 32.0, 32.0, 38.0, 37.0, 38.0, 40.0, 41.0, 34.0, 49.0, 37.0, 47.0, 47.0, 30.0, 42.0, 43.0, 37.0, 25.0, 23.0, 21.0, 11.0, 26.0, 14.0, 18.0, 11.0, 9.0, 7.0, 9.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.95928955078125, -3.8209228515625, -3.68255615234375, -3.544189453125, -3.40582275390625, -3.2674560546875, -3.12908935546875, -2.99072265625, -2.85235595703125, -2.7139892578125, -2.57562255859375, -2.437255859375, -2.29888916015625, -2.1605224609375, -2.02215576171875, -1.8837890625, -1.74542236328125, -1.6070556640625, -1.46868896484375, -1.330322265625, -1.19195556640625, -1.0535888671875, -0.91522216796875, -0.77685546875, -0.63848876953125, -0.5001220703125, -0.36175537109375, -0.223388671875, -0.08502197265625, 0.0533447265625, 0.19171142578125, 0.330078125, 0.46844482421875, 0.6068115234375, 0.74517822265625, 0.883544921875, 1.02191162109375, 1.1602783203125, 1.29864501953125, 1.43701171875, 1.57537841796875, 1.7137451171875, 1.85211181640625, 1.990478515625, 2.12884521484375, 2.2672119140625, 2.40557861328125, 2.5439453125, 2.68231201171875, 2.8206787109375, 2.95904541015625, 3.097412109375, 3.23577880859375, 3.3741455078125, 3.51251220703125, 3.65087890625, 3.78924560546875, 3.9276123046875, 4.06597900390625, 4.204345703125, 4.34271240234375, 4.4810791015625, 4.61944580078125, 4.7578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 5.0, 3.0, 14.0, 10.0, 27.0, 29.0, 57.0, 108.0, 199.0, 403.0, 902.0, 2047.0, 5808.0, 19157.0, 85360.0, 476463.0, 371582.0, 63557.0, 14967.0, 4604.0, 1738.0, 725.0, 370.0, 173.0, 91.0, 73.0, 24.0, 22.0, 11.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.619140625, -1.55413818359375, -1.4891357421875, -1.42413330078125, -1.359130859375, -1.29412841796875, -1.2291259765625, -1.16412353515625, -1.09912109375, -1.03411865234375, -0.9691162109375, -0.90411376953125, -0.839111328125, -0.77410888671875, -0.7091064453125, -0.64410400390625, -0.5791015625, -0.51409912109375, -0.4490966796875, -0.38409423828125, -0.319091796875, -0.25408935546875, -0.1890869140625, -0.12408447265625, -0.05908203125, 0.00592041015625, 0.0709228515625, 0.13592529296875, 0.200927734375, 0.26593017578125, 0.3309326171875, 0.39593505859375, 0.4609375, 0.52593994140625, 0.5909423828125, 0.65594482421875, 0.720947265625, 0.78594970703125, 0.8509521484375, 0.91595458984375, 0.98095703125, 1.04595947265625, 1.1109619140625, 1.17596435546875, 1.240966796875, 1.30596923828125, 1.3709716796875, 1.43597412109375, 1.5009765625, 1.56597900390625, 1.6309814453125, 1.69598388671875, 1.760986328125, 1.82598876953125, 1.8909912109375, 1.95599365234375, 2.02099609375, 2.08599853515625, 2.1510009765625, 2.21600341796875, 2.281005859375, 2.34600830078125, 2.4110107421875, 2.47601318359375, 2.541015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 11.0, 6.0, 8.0, 10.0, 15.0, 14.0, 15.0, 20.0, 24.0, 30.0, 34.0, 64.0, 88.0, 101.0, 99.0, 88.0, 78.0, 49.0, 36.0, 42.0, 28.0, 23.0, 22.0, 16.0, 11.0, 14.0, 12.0, 11.0, 5.0, 4.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00029015541076660156, -0.000281263142824173, -0.0002723708748817444, -0.0002634786069393158, -0.0002545863389968872, -0.0002456940710544586, -0.00023680180311203003, -0.00022790953516960144, -0.00021901726722717285, -0.00021012499928474426, -0.00020123273134231567, -0.00019234046339988708, -0.0001834481954574585, -0.0001745559275150299, -0.00016566365957260132, -0.00015677139163017273, -0.00014787912368774414, -0.00013898685574531555, -0.00013009458780288696, -0.00012120231986045837, -0.00011231005191802979, -0.0001034177839756012, -9.452551603317261e-05, -8.563324809074402e-05, -7.674098014831543e-05, -6.784871220588684e-05, -5.895644426345825e-05, -5.006417632102966e-05, -4.1171908378601074e-05, -3.2279640436172485e-05, -2.3387372493743896e-05, -1.4495104551315308e-05, -5.602836608886719e-06, 3.28943133354187e-06, 1.2181699275970459e-05, 2.1073967218399048e-05, 2.9966235160827637e-05, 3.8858503103256226e-05, 4.7750771045684814e-05, 5.66430389881134e-05, 6.553530693054199e-05, 7.442757487297058e-05, 8.331984281539917e-05, 9.221211075782776e-05, 0.00010110437870025635, 0.00010999664664268494, 0.00011888891458511353, 0.00012778118252754211, 0.0001366734504699707, 0.0001455657184123993, 0.00015445798635482788, 0.00016335025429725647, 0.00017224252223968506, 0.00018113479018211365, 0.00019002705812454224, 0.00019891932606697083, 0.00020781159400939941, 0.000216703861951828, 0.0002255961298942566, 0.00023448839783668518, 0.00024338066577911377, 0.00025227293372154236, 0.00026116520166397095, 0.00027005746960639954, 0.0002789497375488281]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 15.0, 16.0, 31.0, 39.0, 61.0, 83.0, 109.0, 184.0, 321.0, 536.0, 979.0, 1835.0, 3818.0, 8687.0, 21300.0, 68558.0, 332414.0, 461374.0, 99731.0, 27974.0, 10774.0, 4746.0, 2278.0, 1168.0, 611.0, 325.0, 191.0, 128.0, 86.0, 43.0, 33.0, 34.0, 15.0, 12.0, 6.0, 8.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.017578125, -1.9566802978515625, -1.895782470703125, -1.8348846435546875, -1.77398681640625, -1.7130889892578125, -1.652191162109375, -1.5912933349609375, -1.5303955078125, -1.4694976806640625, -1.408599853515625, -1.3477020263671875, -1.28680419921875, -1.2259063720703125, -1.165008544921875, -1.1041107177734375, -1.043212890625, -0.9823150634765625, -0.921417236328125, -0.8605194091796875, -0.79962158203125, -0.7387237548828125, -0.677825927734375, -0.6169281005859375, -0.5560302734375, -0.4951324462890625, -0.434234619140625, -0.3733367919921875, -0.31243896484375, -0.2515411376953125, -0.190643310546875, -0.1297454833984375, -0.06884765625, -0.0079498291015625, 0.052947998046875, 0.1138458251953125, 0.17474365234375, 0.2356414794921875, 0.296539306640625, 0.3574371337890625, 0.4183349609375, 0.4792327880859375, 0.540130615234375, 0.6010284423828125, 0.66192626953125, 0.7228240966796875, 0.783721923828125, 0.8446197509765625, 0.905517578125, 0.9664154052734375, 1.027313232421875, 1.0882110595703125, 1.14910888671875, 1.2100067138671875, 1.270904541015625, 1.3318023681640625, 1.3927001953125, 1.4535980224609375, 1.514495849609375, 1.5753936767578125, 1.63629150390625, 1.6971893310546875, 1.758087158203125, 1.8189849853515625, 1.8798828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 7.0, 8.0, 15.0, 13.0, 14.0, 30.0, 34.0, 39.0, 65.0, 77.0, 94.0, 84.0, 83.0, 104.0, 72.0, 57.0, 52.0, 36.0, 20.0, 21.0, 9.0, 12.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.630096435546875, -1.57366943359375, -1.517242431640625, -1.4608154296875, -1.404388427734375, -1.34796142578125, -1.291534423828125, -1.235107421875, -1.178680419921875, -1.12225341796875, -1.065826416015625, -1.0093994140625, -0.952972412109375, -0.89654541015625, -0.840118408203125, -0.78369140625, -0.727264404296875, -0.67083740234375, -0.614410400390625, -0.5579833984375, -0.501556396484375, -0.44512939453125, -0.388702392578125, -0.332275390625, -0.275848388671875, -0.21942138671875, -0.162994384765625, -0.1065673828125, -0.050140380859375, 0.00628662109375, 0.062713623046875, 0.119140625, 0.175567626953125, 0.23199462890625, 0.288421630859375, 0.3448486328125, 0.401275634765625, 0.45770263671875, 0.514129638671875, 0.570556640625, 0.626983642578125, 0.68341064453125, 0.739837646484375, 0.7962646484375, 0.852691650390625, 0.90911865234375, 0.965545654296875, 1.02197265625, 1.078399658203125, 1.13482666015625, 1.191253662109375, 1.2476806640625, 1.304107666015625, 1.36053466796875, 1.416961669921875, 1.473388671875, 1.529815673828125, 1.58624267578125, 1.642669677734375, 1.6990966796875, 1.755523681640625, 1.81195068359375, 1.868377685546875, 1.9248046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 9.0, 12.0, 29.0, 38.0, 72.0, 105.0, 184.0, 177.0, 132.0, 90.0, 48.0, 42.0, 22.0, 15.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.351150512695312, -26.21552276611328, -25.07989501953125, -23.94426918029785, -22.80864143371582, -21.67301368713379, -20.53738784790039, -19.40176010131836, -18.266132354736328, -17.130504608154297, -15.994877815246582, -14.859251022338867, -13.723623275756836, -12.587995529174805, -11.45236873626709, -10.316741943359375, -9.181114196777344, -8.045486450195312, -6.909859657287598, -5.774232387542725, -4.638605117797852, -3.5029778480529785, -2.3673505783081055, -1.2317233085632324, -0.09609603881835938, 1.0395312309265137, 2.1751585006713867, 3.3107857704162598, 4.446413040161133, 5.582040309906006, 6.717667579650879, 7.853294849395752, 8.988922119140625, 10.124549865722656, 11.260176658630371, 12.395803451538086, 13.531431198120117, 14.667058944702148, 15.802685737609863, 16.938312530517578, 18.07394027709961, 19.20956802368164, 20.345195770263672, 21.48082160949707, 22.6164493560791, 23.752077102661133, 24.88770294189453, 26.023330688476562, 27.158958435058594, 28.294586181640625, 29.430213928222656, 30.565839767456055, 31.701467514038086, 32.837093353271484, 33.972721099853516, 35.10834884643555, 36.24397659301758, 37.37960433959961, 38.51523208618164, 39.65085983276367, 40.78648376464844, 41.92211151123047, 43.0577392578125, 44.19336700439453, 45.32899475097656]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 8.0, 10.0, 8.0, 11.0, 14.0, 18.0, 22.0, 23.0, 17.0, 28.0, 27.0, 27.0, 36.0, 38.0, 30.0, 33.0, 34.0, 53.0, 43.0, 49.0, 37.0, 54.0, 41.0, 30.0, 41.0, 37.0, 28.0, 22.0, 18.0, 22.0, 19.0, 15.0, 18.0, 18.0, 16.0, 12.0, 17.0, 6.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.037307739257812, -26.202707290649414, -25.368104934692383, -24.533504486083984, -23.698904037475586, -22.864303588867188, -22.029701232910156, -21.195100784301758, -20.36050033569336, -19.52589988708496, -18.69129753112793, -17.85669708251953, -17.022096633911133, -16.187496185302734, -15.352893829345703, -14.518293380737305, -13.683691024780273, -12.849089622497559, -12.01448917388916, -11.179887771606445, -10.345287322998047, -9.510685920715332, -8.676084518432617, -7.8414835929870605, -7.006882667541504, -6.172281742095947, -5.337680816650391, -4.503079414367676, -3.668478488922119, -2.8338775634765625, -1.9992761611938477, -1.164675235748291, -0.33007240295410156, 0.5045286417007446, 1.3391296863555908, 2.1737308502197266, 3.008331775665283, 3.84293270111084, 4.677534103393555, 5.512135028839111, 6.346735954284668, 7.181336879730225, 8.015937805175781, 8.850539207458496, 9.685140609741211, 10.51974105834961, 11.354342460632324, 12.188943862915039, 13.023544311523438, 13.858145713806152, 14.69274616241455, 15.527347564697266, 16.361948013305664, 17.196548461914062, 18.031150817871094, 18.865751266479492, 19.70035171508789, 20.53495216369629, 21.36955451965332, 22.20415496826172, 23.038755416870117, 23.873355865478516, 24.707958221435547, 25.542558670043945, 26.377161026000977]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 12.0, 10.0, 23.0, 47.0, 65.0, 107.0, 145.0, 280.0, 605.0, 1477.0, 4592.0, 21751.0, 391713.0, 3717046.0, 44627.0, 7534.0, 2410.0, 866.0, 405.0, 210.0, 123.0, 76.0, 46.0, 36.0, 24.0, 10.0, 7.0, 13.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6171875, -8.3218994140625, -8.026611328125, -7.7313232421875, -7.43603515625, -7.1407470703125, -6.845458984375, -6.5501708984375, -6.2548828125, -5.9595947265625, -5.664306640625, -5.3690185546875, -5.07373046875, -4.7784423828125, -4.483154296875, -4.1878662109375, -3.892578125, -3.5972900390625, -3.302001953125, -3.0067138671875, -2.71142578125, -2.4161376953125, -2.120849609375, -1.8255615234375, -1.5302734375, -1.2349853515625, -0.939697265625, -0.6444091796875, -0.34912109375, -0.0538330078125, 0.241455078125, 0.5367431640625, 0.83203125, 1.1273193359375, 1.422607421875, 1.7178955078125, 2.01318359375, 2.3084716796875, 2.603759765625, 2.8990478515625, 3.1943359375, 3.4896240234375, 3.784912109375, 4.0802001953125, 4.37548828125, 4.6707763671875, 4.966064453125, 5.2613525390625, 5.556640625, 5.8519287109375, 6.147216796875, 6.4425048828125, 6.73779296875, 7.0330810546875, 7.328369140625, 7.6236572265625, 7.9189453125, 8.2142333984375, 8.509521484375, 8.8048095703125, 9.10009765625, 9.3953857421875, 9.690673828125, 9.9859619140625, 10.28125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 5.0, 8.0, 14.0, 25.0, 18.0, 30.0, 59.0, 47.0, 46.0, 65.0, 72.0, 84.0, 76.0, 72.0, 82.0, 54.0, 54.0, 48.0, 29.0, 31.0, 18.0, 23.0, 13.0, 5.0, 11.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.92578125, -1.8602294921875, -1.794677734375, -1.7291259765625, -1.66357421875, -1.5980224609375, -1.532470703125, -1.4669189453125, -1.4013671875, -1.3358154296875, -1.270263671875, -1.2047119140625, -1.13916015625, -1.0736083984375, -1.008056640625, -0.9425048828125, -0.876953125, -0.8114013671875, -0.745849609375, -0.6802978515625, -0.61474609375, -0.5491943359375, -0.483642578125, -0.4180908203125, -0.3525390625, -0.2869873046875, -0.221435546875, -0.1558837890625, -0.09033203125, -0.0247802734375, 0.040771484375, 0.1063232421875, 0.171875, 0.2374267578125, 0.302978515625, 0.3685302734375, 0.43408203125, 0.4996337890625, 0.565185546875, 0.6307373046875, 0.6962890625, 0.7618408203125, 0.827392578125, 0.8929443359375, 0.95849609375, 1.0240478515625, 1.089599609375, 1.1551513671875, 1.220703125, 1.2862548828125, 1.351806640625, 1.4173583984375, 1.48291015625, 1.5484619140625, 1.614013671875, 1.6795654296875, 1.7451171875, 1.8106689453125, 1.876220703125, 1.9417724609375, 2.00732421875, 2.0728759765625, 2.138427734375, 2.2039794921875, 2.26953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 13.0, 10.0, 17.0, 33.0, 55.0, 93.0, 169.0, 335.0, 839.0, 2539.0, 10049.0, 86447.0, 3793204.0, 276186.0, 18497.0, 3768.0, 1153.0, 462.0, 185.0, 102.0, 64.0, 25.0, 15.0, 10.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71875, -6.4759521484375, -6.233154296875, -5.9903564453125, -5.74755859375, -5.5047607421875, -5.261962890625, -5.0191650390625, -4.7763671875, -4.5335693359375, -4.290771484375, -4.0479736328125, -3.80517578125, -3.5623779296875, -3.319580078125, -3.0767822265625, -2.833984375, -2.5911865234375, -2.348388671875, -2.1055908203125, -1.86279296875, -1.6199951171875, -1.377197265625, -1.1343994140625, -0.8916015625, -0.6488037109375, -0.406005859375, -0.1632080078125, 0.07958984375, 0.3223876953125, 0.565185546875, 0.8079833984375, 1.05078125, 1.2935791015625, 1.536376953125, 1.7791748046875, 2.02197265625, 2.2647705078125, 2.507568359375, 2.7503662109375, 2.9931640625, 3.2359619140625, 3.478759765625, 3.7215576171875, 3.96435546875, 4.2071533203125, 4.449951171875, 4.6927490234375, 4.935546875, 5.1783447265625, 5.421142578125, 5.6639404296875, 5.90673828125, 6.1495361328125, 6.392333984375, 6.6351318359375, 6.8779296875, 7.1207275390625, 7.363525390625, 7.6063232421875, 7.84912109375, 8.0919189453125, 8.334716796875, 8.5775146484375, 8.8203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 2.0, 12.0, 14.0, 14.0, 24.0, 49.0, 66.0, 151.0, 416.0, 1835.0, 942.0, 266.0, 115.0, 57.0, 38.0, 19.0, 17.0, 6.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.19921875, -4.098785400390625, -3.99835205078125, -3.897918701171875, -3.7974853515625, -3.697052001953125, -3.59661865234375, -3.496185302734375, -3.395751953125, -3.295318603515625, -3.19488525390625, -3.094451904296875, -2.9940185546875, -2.893585205078125, -2.79315185546875, -2.692718505859375, -2.59228515625, -2.491851806640625, -2.39141845703125, -2.290985107421875, -2.1905517578125, -2.090118408203125, -1.98968505859375, -1.889251708984375, -1.788818359375, -1.688385009765625, -1.58795166015625, -1.487518310546875, -1.3870849609375, -1.286651611328125, -1.18621826171875, -1.085784912109375, -0.9853515625, -0.884918212890625, -0.78448486328125, -0.684051513671875, -0.5836181640625, -0.483184814453125, -0.38275146484375, -0.282318115234375, -0.181884765625, -0.081451416015625, 0.01898193359375, 0.119415283203125, 0.2198486328125, 0.320281982421875, 0.42071533203125, 0.521148681640625, 0.62158203125, 0.722015380859375, 0.82244873046875, 0.922882080078125, 1.0233154296875, 1.123748779296875, 1.22418212890625, 1.324615478515625, 1.425048828125, 1.525482177734375, 1.62591552734375, 1.726348876953125, 1.8267822265625, 1.927215576171875, 2.02764892578125, 2.128082275390625, 2.228515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 8.0, 13.0, 15.0, 29.0, 62.0, 87.0, 142.0, 167.0, 170.0, 138.0, 81.0, 44.0, 21.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.0150089263916, -19.56905746459961, -19.12310791015625, -18.677156448364258, -18.2312068939209, -17.785255432128906, -17.339305877685547, -16.893354415893555, -16.447402954101562, -16.00145149230957, -15.555501937866211, -15.109550476074219, -14.663599967956543, -14.217649459838867, -13.771698951721191, -13.325748443603516, -12.87979793548584, -12.433847427368164, -11.987896919250488, -11.541946411132812, -11.09599494934082, -10.650044441223145, -10.204093933105469, -9.758143424987793, -9.312192916870117, -8.866242408752441, -8.420291900634766, -7.974340915679932, -7.528389930725098, -7.082439422607422, -6.636488914489746, -6.19053840637207, -5.744585990905762, -5.298635482788086, -4.852684497833252, -4.406733989715576, -3.9607832431793213, -3.5148324966430664, -3.0688819885253906, -2.6229312419891357, -2.176980495452881, -1.731029748916626, -1.2850791215896606, -0.8391284942626953, -0.39317774772644043, 0.05277299880981445, 0.49872350692749023, 0.9446742534637451, 1.390625, 1.8365757465362549, 2.2825264930725098, 2.7284770011901855, 3.1744277477264404, 3.6203784942626953, 4.066329002380371, 4.512279510498047, 4.958230495452881, 5.404181003570557, 5.850131988525391, 6.296082496643066, 6.742033004760742, 7.187983989715576, 7.633934497833252, 8.079885482788086, 8.525835990905762]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 5.0, 11.0, 18.0, 4.0, 9.0, 26.0, 23.0, 28.0, 27.0, 40.0, 36.0, 44.0, 32.0, 38.0, 41.0, 41.0, 54.0, 51.0, 57.0, 53.0, 39.0, 53.0, 40.0, 41.0, 30.0, 23.0, 18.0, 25.0, 22.0, 11.0, 15.0, 11.0, 16.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.026930809020996, -8.771805763244629, -8.516681671142578, -8.261556625366211, -8.00643253326416, -7.751307964324951, -7.496183395385742, -7.241058349609375, -6.985934257507324, -6.730809688568115, -6.475685119628906, -6.220560550689697, -5.965435981750488, -5.710311412811279, -5.45518684387207, -5.200061798095703, -4.944937229156494, -4.689812660217285, -4.434688091278076, -4.179563522338867, -3.924438953399658, -3.669314384460449, -3.414189577102661, -3.159065008163452, -2.903940439224243, -2.648815870285034, -2.393691301345825, -2.138566493988037, -1.8834420442581177, -1.6283174753189087, -1.3731927871704102, -1.1180682182312012, -0.8629441261291504, -0.6078195571899414, -0.35269492864608765, -0.09757030010223389, 0.1575542688369751, 0.4126788377761841, 0.6678035259246826, 0.9229280948638916, 1.1780526638031006, 1.4331772327423096, 1.6883018016815186, 1.943426489830017, 2.1985511779785156, 2.4536757469177246, 2.7088003158569336, 2.9639248847961426, 3.2190494537353516, 3.4741740226745605, 3.7292985916137695, 3.9844231605529785, 4.2395477294921875, 4.4946722984313965, 4.7497968673706055, 5.004921913146973, 5.260046005249023, 5.515170574188232, 5.770295143127441, 6.02541971206665, 6.280544281005859, 6.535668849945068, 6.790793418884277, 7.0459184646606445, 7.3010430335998535]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 15.0, 10.0, 16.0, 28.0, 32.0, 54.0, 100.0, 170.0, 277.0, 569.0, 1252.0, 3096.0, 8645.0, 28884.0, 124600.0, 566910.0, 243683.0, 48736.0, 13615.0, 4391.0, 1790.0, 764.0, 405.0, 210.0, 125.0, 67.0, 39.0, 28.0, 13.0, 12.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.45758056640625, -6.2471923828125, -6.03680419921875, -5.826416015625, -5.61602783203125, -5.4056396484375, -5.19525146484375, -4.98486328125, -4.77447509765625, -4.5640869140625, -4.35369873046875, -4.143310546875, -3.93292236328125, -3.7225341796875, -3.51214599609375, -3.3017578125, -3.09136962890625, -2.8809814453125, -2.67059326171875, -2.460205078125, -2.24981689453125, -2.0394287109375, -1.82904052734375, -1.61865234375, -1.40826416015625, -1.1978759765625, -0.98748779296875, -0.777099609375, -0.56671142578125, -0.3563232421875, -0.14593505859375, 0.064453125, 0.27484130859375, 0.4852294921875, 0.69561767578125, 0.906005859375, 1.11639404296875, 1.3267822265625, 1.53717041015625, 1.74755859375, 1.95794677734375, 2.1683349609375, 2.37872314453125, 2.589111328125, 2.79949951171875, 3.0098876953125, 3.22027587890625, 3.4306640625, 3.64105224609375, 3.8514404296875, 4.06182861328125, 4.272216796875, 4.48260498046875, 4.6929931640625, 4.90338134765625, 5.11376953125, 5.32415771484375, 5.5345458984375, 5.74493408203125, 5.955322265625, 6.16571044921875, 6.3760986328125, 6.58648681640625, 6.796875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 12.0, 18.0, 22.0, 17.0, 40.0, 26.0, 49.0, 57.0, 50.0, 85.0, 80.0, 71.0, 65.0, 66.0, 59.0, 61.0, 47.0, 41.0, 28.0, 18.0, 24.0, 13.0, 12.0, 11.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83203125, -1.77001953125, -1.7080078125, -1.64599609375, -1.583984375, -1.52197265625, -1.4599609375, -1.39794921875, -1.3359375, -1.27392578125, -1.2119140625, -1.14990234375, -1.087890625, -1.02587890625, -0.9638671875, -0.90185546875, -0.83984375, -0.77783203125, -0.7158203125, -0.65380859375, -0.591796875, -0.52978515625, -0.4677734375, -0.40576171875, -0.34375, -0.28173828125, -0.2197265625, -0.15771484375, -0.095703125, -0.03369140625, 0.0283203125, 0.09033203125, 0.15234375, 0.21435546875, 0.2763671875, 0.33837890625, 0.400390625, 0.46240234375, 0.5244140625, 0.58642578125, 0.6484375, 0.71044921875, 0.7724609375, 0.83447265625, 0.896484375, 0.95849609375, 1.0205078125, 1.08251953125, 1.14453125, 1.20654296875, 1.2685546875, 1.33056640625, 1.392578125, 1.45458984375, 1.5166015625, 1.57861328125, 1.640625, 1.70263671875, 1.7646484375, 1.82666015625, 1.888671875, 1.95068359375, 2.0126953125, 2.07470703125, 2.13671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 6.0, 5.0, 17.0, 12.0, 33.0, 44.0, 61.0, 68.0, 120.0, 191.0, 335.0, 600.0, 1021.0, 2208.0, 4558.0, 11403.0, 32564.0, 109396.0, 399519.0, 347417.0, 92086.0, 28417.0, 10074.0, 4226.0, 1852.0, 983.0, 497.0, 293.0, 183.0, 105.0, 76.0, 57.0, 38.0, 27.0, 12.0, 11.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.44921875, -4.318115234375, -4.18701171875, -4.055908203125, -3.9248046875, -3.793701171875, -3.66259765625, -3.531494140625, -3.400390625, -3.269287109375, -3.13818359375, -3.007080078125, -2.8759765625, -2.744873046875, -2.61376953125, -2.482666015625, -2.3515625, -2.220458984375, -2.08935546875, -1.958251953125, -1.8271484375, -1.696044921875, -1.56494140625, -1.433837890625, -1.302734375, -1.171630859375, -1.04052734375, -0.909423828125, -0.7783203125, -0.647216796875, -0.51611328125, -0.385009765625, -0.25390625, -0.122802734375, 0.00830078125, 0.139404296875, 0.2705078125, 0.401611328125, 0.53271484375, 0.663818359375, 0.794921875, 0.926025390625, 1.05712890625, 1.188232421875, 1.3193359375, 1.450439453125, 1.58154296875, 1.712646484375, 1.84375, 1.974853515625, 2.10595703125, 2.237060546875, 2.3681640625, 2.499267578125, 2.63037109375, 2.761474609375, 2.892578125, 3.023681640625, 3.15478515625, 3.285888671875, 3.4169921875, 3.548095703125, 3.67919921875, 3.810302734375, 3.94140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 3.0, 5.0, 8.0, 11.0, 13.0, 20.0, 16.0, 21.0, 24.0, 32.0, 34.0, 33.0, 49.0, 43.0, 50.0, 56.0, 58.0, 47.0, 48.0, 51.0, 54.0, 36.0, 49.0, 37.0, 28.0, 27.0, 26.0, 28.0, 25.0, 15.0, 6.0, 14.0, 11.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.17218017578125, -5.9888916015625, -5.80560302734375, -5.622314453125, -5.43902587890625, -5.2557373046875, -5.07244873046875, -4.88916015625, -4.70587158203125, -4.5225830078125, -4.33929443359375, -4.156005859375, -3.97271728515625, -3.7894287109375, -3.60614013671875, -3.4228515625, -3.23956298828125, -3.0562744140625, -2.87298583984375, -2.689697265625, -2.50640869140625, -2.3231201171875, -2.13983154296875, -1.95654296875, -1.77325439453125, -1.5899658203125, -1.40667724609375, -1.223388671875, -1.04010009765625, -0.8568115234375, -0.67352294921875, -0.490234375, -0.30694580078125, -0.1236572265625, 0.05963134765625, 0.242919921875, 0.42620849609375, 0.6094970703125, 0.79278564453125, 0.97607421875, 1.15936279296875, 1.3426513671875, 1.52593994140625, 1.709228515625, 1.89251708984375, 2.0758056640625, 2.25909423828125, 2.4423828125, 2.62567138671875, 2.8089599609375, 2.99224853515625, 3.175537109375, 3.35882568359375, 3.5421142578125, 3.72540283203125, 3.90869140625, 4.09197998046875, 4.2752685546875, 4.45855712890625, 4.641845703125, 4.82513427734375, 5.0084228515625, 5.19171142578125, 5.375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 8.0, 10.0, 19.0, 39.0, 81.0, 196.0, 687.0, 4835.0, 752605.0, 285383.0, 3820.0, 549.0, 182.0, 72.0, 26.0, 16.0, 15.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.1041259765625, -9.755126953125, -9.4061279296875, -9.05712890625, -8.7081298828125, -8.359130859375, -8.0101318359375, -7.6611328125, -7.3121337890625, -6.963134765625, -6.6141357421875, -6.26513671875, -5.9161376953125, -5.567138671875, -5.2181396484375, -4.869140625, -4.5201416015625, -4.171142578125, -3.8221435546875, -3.47314453125, -3.1241455078125, -2.775146484375, -2.4261474609375, -2.0771484375, -1.7281494140625, -1.379150390625, -1.0301513671875, -0.68115234375, -0.3321533203125, 0.016845703125, 0.3658447265625, 0.71484375, 1.0638427734375, 1.412841796875, 1.7618408203125, 2.11083984375, 2.4598388671875, 2.808837890625, 3.1578369140625, 3.5068359375, 3.8558349609375, 4.204833984375, 4.5538330078125, 4.90283203125, 5.2518310546875, 5.600830078125, 5.9498291015625, 6.298828125, 6.6478271484375, 6.996826171875, 7.3458251953125, 7.69482421875, 8.0438232421875, 8.392822265625, 8.7418212890625, 9.0908203125, 9.4398193359375, 9.788818359375, 10.1378173828125, 10.48681640625, 10.8358154296875, 11.184814453125, 11.5338134765625, 11.8828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 7.0, 3.0, 5.0, 20.0, 22.0, 39.0, 82.0, 349.0, 289.0, 78.0, 37.0, 29.0, 20.0, 11.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011129379272460938, -0.0010819882154464722, -0.0010510385036468506, -0.001020088791847229, -0.0009891390800476074, -0.0009581893682479858, -0.0009272396564483643, -0.0008962899446487427, -0.0008653402328491211, -0.0008343905210494995, -0.0008034408092498779, -0.0007724910974502563, -0.0007415413856506348, -0.0007105916738510132, -0.0006796419620513916, -0.00064869225025177, -0.0006177425384521484, -0.0005867928266525269, -0.0005558431148529053, -0.0005248934030532837, -0.0004939436912536621, -0.00046299397945404053, -0.00043204426765441895, -0.00040109455585479736, -0.0003701448440551758, -0.0003391951322555542, -0.0003082454204559326, -0.00027729570865631104, -0.00024634599685668945, -0.00021539628505706787, -0.0001844465732574463, -0.0001534968614578247, -0.00012254714965820312, -9.159743785858154e-05, -6.064772605895996e-05, -2.969801425933838e-05, 1.2516975402832031e-06, 3.2201409339904785e-05, 6.315112113952637e-05, 9.410083293914795e-05, 0.00012505054473876953, 0.0001560002565383911, 0.0001869499683380127, 0.00021789968013763428, 0.00024884939193725586, 0.00027979910373687744, 0.000310748815536499, 0.0003416985273361206, 0.0003726482391357422, 0.00040359795093536377, 0.00043454766273498535, 0.00046549737453460693, 0.0004964470863342285, 0.0005273967981338501, 0.0005583465099334717, 0.0005892962217330933, 0.0006202459335327148, 0.0006511956453323364, 0.000682145357131958, 0.0007130950689315796, 0.0007440447807312012, 0.0007749944925308228, 0.0008059442043304443, 0.0008368939161300659, 0.0008678436279296875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 13.0, 25.0, 43.0, 95.0, 158.0, 305.0, 1222.0, 13529.0, 999419.0, 31186.0, 1790.0, 392.0, 183.0, 85.0, 47.0, 30.0, 18.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.859375, -12.4649658203125, -12.070556640625, -11.6761474609375, -11.28173828125, -10.8873291015625, -10.492919921875, -10.0985107421875, -9.7041015625, -9.3096923828125, -8.915283203125, -8.5208740234375, -8.12646484375, -7.7320556640625, -7.337646484375, -6.9432373046875, -6.548828125, -6.1544189453125, -5.760009765625, -5.3656005859375, -4.97119140625, -4.5767822265625, -4.182373046875, -3.7879638671875, -3.3935546875, -2.9991455078125, -2.604736328125, -2.2103271484375, -1.81591796875, -1.4215087890625, -1.027099609375, -0.6326904296875, -0.23828125, 0.1561279296875, 0.550537109375, 0.9449462890625, 1.33935546875, 1.7337646484375, 2.128173828125, 2.5225830078125, 2.9169921875, 3.3114013671875, 3.705810546875, 4.1002197265625, 4.49462890625, 4.8890380859375, 5.283447265625, 5.6778564453125, 6.072265625, 6.4666748046875, 6.861083984375, 7.2554931640625, 7.64990234375, 8.0443115234375, 8.438720703125, 8.8331298828125, 9.2275390625, 9.6219482421875, 10.016357421875, 10.4107666015625, 10.80517578125, 11.1995849609375, 11.593994140625, 11.9884033203125, 12.3828125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 13.0, 19.0, 40.0, 110.0, 360.0, 287.0, 89.0, 46.0, 17.0, 9.0, 11.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.779541015625, -7.53564453125, -7.291748046875, -7.0478515625, -6.803955078125, -6.56005859375, -6.316162109375, -6.072265625, -5.828369140625, -5.58447265625, -5.340576171875, -5.0966796875, -4.852783203125, -4.60888671875, -4.364990234375, -4.12109375, -3.877197265625, -3.63330078125, -3.389404296875, -3.1455078125, -2.901611328125, -2.65771484375, -2.413818359375, -2.169921875, -1.926025390625, -1.68212890625, -1.438232421875, -1.1943359375, -0.950439453125, -0.70654296875, -0.462646484375, -0.21875, 0.025146484375, 0.26904296875, 0.512939453125, 0.7568359375, 1.000732421875, 1.24462890625, 1.488525390625, 1.732421875, 1.976318359375, 2.22021484375, 2.464111328125, 2.7080078125, 2.951904296875, 3.19580078125, 3.439697265625, 3.68359375, 3.927490234375, 4.17138671875, 4.415283203125, 4.6591796875, 4.903076171875, 5.14697265625, 5.390869140625, 5.634765625, 5.878662109375, 6.12255859375, 6.366455078125, 6.6103515625, 6.854248046875, 7.09814453125, 7.342041015625, 7.5859375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 19.0, 81.0, 343.0, 417.0, 119.0, 20.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.73838424682617, -48.73485565185547, -44.731327056884766, -40.72779846191406, -36.724273681640625, -32.720741271972656, -28.71721649169922, -24.713687896728516, -20.710159301757812, -16.70663070678711, -12.703103065490723, -8.699575424194336, -4.696046829223633, -0.6925182342529297, 3.3110084533691406, 7.314537048339844, 11.318065643310547, 15.32159423828125, 19.325122833251953, 23.328649520874023, 27.332178115844727, 31.33570671081543, 35.3392333984375, 39.3427619934082, 43.346290588378906, 47.34981918334961, 51.35334777832031, 55.35687255859375, 59.36040496826172, 63.363929748535156, 67.36746215820312, 71.37098693847656, 75.37452697753906, 79.3780517578125, 83.38158416748047, 87.3851089477539, 91.38864135742188, 95.39216613769531, 99.39569091796875, 103.39922332763672, 107.40275573730469, 111.40628051757812, 115.4098129272461, 119.41333770751953, 123.4168701171875, 127.42039489746094, 131.42391967773438, 135.42745971679688, 139.43096923828125, 143.4344940185547, 147.43801879882812, 151.44155883789062, 155.44508361816406, 159.4486083984375, 163.45213317871094, 167.45565795898438, 171.45919799804688, 175.4627227783203, 179.46624755859375, 183.46978759765625, 187.4733123779297, 191.47683715820312, 195.48036193847656, 199.48388671875, 203.4874267578125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 4.0, 8.0, 4.0, 11.0, 15.0, 11.0, 13.0, 19.0, 18.0, 27.0, 19.0, 25.0, 30.0, 33.0, 42.0, 34.0, 52.0, 36.0, 38.0, 35.0, 52.0, 54.0, 42.0, 35.0, 47.0, 33.0, 36.0, 32.0, 31.0, 28.0, 22.0, 24.0, 22.0, 10.0, 10.0, 5.0, 4.0, 8.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-26.830242156982422, -26.00262451171875, -25.175006866455078, -24.34739112854004, -23.519773483276367, -22.692155838012695, -21.864540100097656, -21.036922454833984, -20.209304809570312, -19.38168716430664, -18.55406951904297, -17.72645378112793, -16.898836135864258, -16.071218490600586, -15.24360179901123, -14.415985107421875, -13.588367462158203, -12.760749816894531, -11.933133125305176, -11.10551643371582, -10.277898788452148, -9.450281143188477, -8.622664451599121, -7.795047283172607, -6.967430114746094, -6.13981294631958, -5.312195777893066, -4.484578609466553, -3.656961441040039, -2.8293442726135254, -2.0017271041870117, -1.174109935760498, -0.3464946746826172, 0.4811224937438965, 1.3087396621704102, 2.136356830596924, 2.9639739990234375, 3.791591167449951, 4.619208335876465, 5.4468255043029785, 6.274442672729492, 7.102059841156006, 7.9296770095825195, 8.757293701171875, 9.584911346435547, 10.412528991699219, 11.240145683288574, 12.06776237487793, 12.895380020141602, 13.722997665405273, 14.550614356994629, 15.378231048583984, 16.205848693847656, 17.033466339111328, 17.861083984375, 18.68869972229004, 19.51631736755371, 20.343935012817383, 21.171550750732422, 21.999168395996094, 22.826786041259766, 23.654403686523438, 24.48202133178711, 25.30963706970215, 26.13725471496582]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 3.0, 12.0, 15.0, 22.0, 22.0, 51.0, 79.0, 129.0, 265.0, 458.0, 1014.0, 2800.0, 10925.0, 87006.0, 3980585.0, 94493.0, 11302.0, 2916.0, 1072.0, 493.0, 251.0, 126.0, 84.0, 63.0, 24.0, 18.0, 17.0, 7.0, 8.0, 12.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9296875, -9.6334228515625, -9.337158203125, -9.0408935546875, -8.74462890625, -8.4483642578125, -8.152099609375, -7.8558349609375, -7.5595703125, -7.2633056640625, -6.967041015625, -6.6707763671875, -6.37451171875, -6.0782470703125, -5.781982421875, -5.4857177734375, -5.189453125, -4.8931884765625, -4.596923828125, -4.3006591796875, -4.00439453125, -3.7081298828125, -3.411865234375, -3.1156005859375, -2.8193359375, -2.5230712890625, -2.226806640625, -1.9305419921875, -1.63427734375, -1.3380126953125, -1.041748046875, -0.7454833984375, -0.44921875, -0.1529541015625, 0.143310546875, 0.4395751953125, 0.73583984375, 1.0321044921875, 1.328369140625, 1.6246337890625, 1.9208984375, 2.2171630859375, 2.513427734375, 2.8096923828125, 3.10595703125, 3.4022216796875, 3.698486328125, 3.9947509765625, 4.291015625, 4.5872802734375, 4.883544921875, 5.1798095703125, 5.47607421875, 5.7723388671875, 6.068603515625, 6.3648681640625, 6.6611328125, 6.9573974609375, 7.253662109375, 7.5499267578125, 7.84619140625, 8.1424560546875, 8.438720703125, 8.7349853515625, 9.03125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 14.0, 12.0, 9.0, 17.0, 27.0, 30.0, 35.0, 36.0, 53.0, 57.0, 45.0, 54.0, 58.0, 54.0, 73.0, 66.0, 50.0, 57.0, 38.0, 45.0, 25.0, 24.0, 25.0, 18.0, 15.0, 15.0, 7.0, 10.0, 7.0, 3.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.816436767578125, -1.75885009765625, -1.701263427734375, -1.6436767578125, -1.586090087890625, -1.52850341796875, -1.470916748046875, -1.413330078125, -1.355743408203125, -1.29815673828125, -1.240570068359375, -1.1829833984375, -1.125396728515625, -1.06781005859375, -1.010223388671875, -0.95263671875, -0.895050048828125, -0.83746337890625, -0.779876708984375, -0.7222900390625, -0.664703369140625, -0.60711669921875, -0.549530029296875, -0.491943359375, -0.434356689453125, -0.37677001953125, -0.319183349609375, -0.2615966796875, -0.204010009765625, -0.14642333984375, -0.088836669921875, -0.03125, 0.026336669921875, 0.08392333984375, 0.141510009765625, 0.1990966796875, 0.256683349609375, 0.31427001953125, 0.371856689453125, 0.429443359375, 0.487030029296875, 0.54461669921875, 0.602203369140625, 0.6597900390625, 0.717376708984375, 0.77496337890625, 0.832550048828125, 0.89013671875, 0.947723388671875, 1.00531005859375, 1.062896728515625, 1.1204833984375, 1.178070068359375, 1.23565673828125, 1.293243408203125, 1.350830078125, 1.408416748046875, 1.46600341796875, 1.523590087890625, 1.5811767578125, 1.638763427734375, 1.69635009765625, 1.753936767578125, 1.8115234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 9.0, 22.0, 26.0, 37.0, 55.0, 91.0, 117.0, 211.0, 321.0, 615.0, 1236.0, 3409.0, 15129.0, 160795.0, 3911641.0, 84588.0, 10750.0, 2753.0, 1046.0, 604.0, 313.0, 170.0, 128.0, 72.0, 37.0, 34.0, 23.0, 10.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0546875, -8.7835693359375, -8.512451171875, -8.2413330078125, -7.97021484375, -7.6990966796875, -7.427978515625, -7.1568603515625, -6.8857421875, -6.6146240234375, -6.343505859375, -6.0723876953125, -5.80126953125, -5.5301513671875, -5.259033203125, -4.9879150390625, -4.716796875, -4.4456787109375, -4.174560546875, -3.9034423828125, -3.63232421875, -3.3612060546875, -3.090087890625, -2.8189697265625, -2.5478515625, -2.2767333984375, -2.005615234375, -1.7344970703125, -1.46337890625, -1.1922607421875, -0.921142578125, -0.6500244140625, -0.37890625, -0.1077880859375, 0.163330078125, 0.4344482421875, 0.70556640625, 0.9766845703125, 1.247802734375, 1.5189208984375, 1.7900390625, 2.0611572265625, 2.332275390625, 2.6033935546875, 2.87451171875, 3.1456298828125, 3.416748046875, 3.6878662109375, 3.958984375, 4.2301025390625, 4.501220703125, 4.7723388671875, 5.04345703125, 5.3145751953125, 5.585693359375, 5.8568115234375, 6.1279296875, 6.3990478515625, 6.670166015625, 6.9412841796875, 7.21240234375, 7.4835205078125, 7.754638671875, 8.0257568359375, 8.296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 8.0, 11.0, 19.0, 29.0, 44.0, 122.0, 427.0, 2423.0, 608.0, 179.0, 76.0, 39.0, 30.0, 21.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9375, -2.834869384765625, -2.73223876953125, -2.629608154296875, -2.5269775390625, -2.424346923828125, -2.32171630859375, -2.219085693359375, -2.116455078125, -2.013824462890625, -1.91119384765625, -1.808563232421875, -1.7059326171875, -1.603302001953125, -1.50067138671875, -1.398040771484375, -1.29541015625, -1.192779541015625, -1.09014892578125, -0.987518310546875, -0.8848876953125, -0.782257080078125, -0.67962646484375, -0.576995849609375, -0.474365234375, -0.371734619140625, -0.26910400390625, -0.166473388671875, -0.0638427734375, 0.038787841796875, 0.14141845703125, 0.244049072265625, 0.3466796875, 0.449310302734375, 0.55194091796875, 0.654571533203125, 0.7572021484375, 0.859832763671875, 0.96246337890625, 1.065093994140625, 1.167724609375, 1.270355224609375, 1.37298583984375, 1.475616455078125, 1.5782470703125, 1.680877685546875, 1.78350830078125, 1.886138916015625, 1.98876953125, 2.091400146484375, 2.19403076171875, 2.296661376953125, 2.3992919921875, 2.501922607421875, 2.60455322265625, 2.707183837890625, 2.809814453125, 2.912445068359375, 3.01507568359375, 3.117706298828125, 3.2203369140625, 3.322967529296875, 3.42559814453125, 3.528228759765625, 3.630859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 13.0, 32.0, 83.0, 140.0, 217.0, 174.0, 176.0, 97.0, 32.0, 7.0, 7.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-28.076038360595703, -27.499469757080078, -26.92289924621582, -26.346330642700195, -25.76976203918457, -25.193193435668945, -24.616622924804688, -24.040054321289062, -23.463485717773438, -22.886917114257812, -22.310346603393555, -21.73377799987793, -21.157209396362305, -20.58064079284668, -20.004070281982422, -19.427501678466797, -18.850933074951172, -18.274364471435547, -17.69779396057129, -17.121225357055664, -16.54465675354004, -15.968087196350098, -15.391517639160156, -14.814949035644531, -14.238378524780273, -13.661808967590332, -13.085240364074707, -12.508670806884766, -11.93210220336914, -11.3555326461792, -10.778963088989258, -10.202394485473633, -9.625824928283691, -9.04925537109375, -8.472686767578125, -7.896117210388184, -7.319548606872559, -6.742979049682617, -6.166409969329834, -5.589840888977051, -5.013271808624268, -4.436702728271484, -3.860133647918701, -3.283564329147339, -2.7069952487945557, -2.1304261684417725, -1.5538568496704102, -0.977287769317627, -0.40071868896484375, 0.17585045099258423, 0.7524195909500122, 1.328988790512085, 1.9055578708648682, 2.4821269512176514, 3.0586962699890137, 3.635265350341797, 4.21183443069458, 4.788403511047363, 5.3649725914001465, 5.94154167175293, 6.518111228942871, 7.094679832458496, 7.6712493896484375, 8.247817993164062, 8.824387550354004]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 11.0, 17.0, 19.0, 35.0, 35.0, 55.0, 61.0, 51.0, 43.0, 55.0, 78.0, 71.0, 65.0, 72.0, 62.0, 36.0, 59.0, 40.0, 28.0, 24.0, 15.0, 21.0, 12.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.687346458435059, -7.387083530426025, -7.086820602416992, -6.786557674407959, -6.486294746398926, -6.186032295227051, -5.885769367218018, -5.585506439208984, -5.285243511199951, -4.984980583190918, -4.684717655181885, -4.384454727172852, -4.084192276000977, -3.7839291095733643, -3.48366641998291, -3.183403491973877, -2.8831405639648438, -2.5828776359558105, -2.2826147079467773, -1.9823520183563232, -1.68208909034729, -1.3818261623382568, -1.0815633535385132, -0.7813005447387695, -0.48103761672973633, -0.1807747483253479, 0.11948812007904053, 0.41975098848342896, 0.7200138568878174, 1.0202767848968506, 1.3205395936965942, 1.620802402496338, 1.9210662841796875, 2.2213292121887207, 2.521592140197754, 2.821854829788208, 3.122117757797241, 3.4223806858062744, 3.7226433753967285, 4.022906303405762, 4.323169231414795, 4.623432159423828, 4.923695087432861, 5.2239580154418945, 5.5242204666137695, 5.824483871459961, 6.124746322631836, 6.425009250640869, 6.725272178649902, 7.0255351066589355, 7.325798034667969, 7.626060962677002, 7.926323890686035, 8.22658634185791, 8.526849746704102, 8.827112197875977, 9.127374649047852, 9.427637100219727, 9.727900505065918, 10.028162956237793, 10.328426361083984, 10.62868881225586, 10.92895221710205, 11.229214668273926, 11.529478073120117]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 13.0, 8.0, 20.0, 29.0, 67.0, 111.0, 253.0, 594.0, 1931.0, 7601.0, 42432.0, 397450.0, 529280.0, 55896.0, 9363.0, 2225.0, 693.0, 261.0, 129.0, 76.0, 42.0, 22.0, 20.0, 13.0, 6.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.90625, -9.58740234375, -9.2685546875, -8.94970703125, -8.630859375, -8.31201171875, -7.9931640625, -7.67431640625, -7.35546875, -7.03662109375, -6.7177734375, -6.39892578125, -6.080078125, -5.76123046875, -5.4423828125, -5.12353515625, -4.8046875, -4.48583984375, -4.1669921875, -3.84814453125, -3.529296875, -3.21044921875, -2.8916015625, -2.57275390625, -2.25390625, -1.93505859375, -1.6162109375, -1.29736328125, -0.978515625, -0.65966796875, -0.3408203125, -0.02197265625, 0.296875, 0.61572265625, 0.9345703125, 1.25341796875, 1.572265625, 1.89111328125, 2.2099609375, 2.52880859375, 2.84765625, 3.16650390625, 3.4853515625, 3.80419921875, 4.123046875, 4.44189453125, 4.7607421875, 5.07958984375, 5.3984375, 5.71728515625, 6.0361328125, 6.35498046875, 6.673828125, 6.99267578125, 7.3115234375, 7.63037109375, 7.94921875, 8.26806640625, 8.5869140625, 8.90576171875, 9.224609375, 9.54345703125, 9.8623046875, 10.18115234375, 10.5]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 17.0, 13.0, 13.0, 20.0, 20.0, 34.0, 41.0, 40.0, 46.0, 40.0, 54.0, 54.0, 61.0, 57.0, 62.0, 53.0, 61.0, 56.0, 47.0, 35.0, 29.0, 28.0, 19.0, 19.0, 10.0, 13.0, 11.0, 9.0, 8.0, 7.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.88671875, -1.830322265625, -1.77392578125, -1.717529296875, -1.6611328125, -1.604736328125, -1.54833984375, -1.491943359375, -1.435546875, -1.379150390625, -1.32275390625, -1.266357421875, -1.2099609375, -1.153564453125, -1.09716796875, -1.040771484375, -0.984375, -0.927978515625, -0.87158203125, -0.815185546875, -0.7587890625, -0.702392578125, -0.64599609375, -0.589599609375, -0.533203125, -0.476806640625, -0.42041015625, -0.364013671875, -0.3076171875, -0.251220703125, -0.19482421875, -0.138427734375, -0.08203125, -0.025634765625, 0.03076171875, 0.087158203125, 0.1435546875, 0.199951171875, 0.25634765625, 0.312744140625, 0.369140625, 0.425537109375, 0.48193359375, 0.538330078125, 0.5947265625, 0.651123046875, 0.70751953125, 0.763916015625, 0.8203125, 0.876708984375, 0.93310546875, 0.989501953125, 1.0458984375, 1.102294921875, 1.15869140625, 1.215087890625, 1.271484375, 1.327880859375, 1.38427734375, 1.440673828125, 1.4970703125, 1.553466796875, 1.60986328125, 1.666259765625, 1.72265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 7.0, 9.0, 13.0, 13.0, 22.0, 40.0, 36.0, 47.0, 77.0, 117.0, 211.0, 334.0, 648.0, 1308.0, 3006.0, 6785.0, 18011.0, 50888.0, 160810.0, 462622.0, 232200.0, 70790.0, 24147.0, 8996.0, 3747.0, 1756.0, 769.0, 420.0, 266.0, 158.0, 87.0, 48.0, 36.0, 21.0, 25.0, 14.0, 17.0, 9.0, 12.0, 8.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0], "bins": [-5.08203125, -4.943359375, -4.8046875, -4.666015625, -4.52734375, -4.388671875, -4.25, -4.111328125, -3.97265625, -3.833984375, -3.6953125, -3.556640625, -3.41796875, -3.279296875, -3.140625, -3.001953125, -2.86328125, -2.724609375, -2.5859375, -2.447265625, -2.30859375, -2.169921875, -2.03125, -1.892578125, -1.75390625, -1.615234375, -1.4765625, -1.337890625, -1.19921875, -1.060546875, -0.921875, -0.783203125, -0.64453125, -0.505859375, -0.3671875, -0.228515625, -0.08984375, 0.048828125, 0.1875, 0.326171875, 0.46484375, 0.603515625, 0.7421875, 0.880859375, 1.01953125, 1.158203125, 1.296875, 1.435546875, 1.57421875, 1.712890625, 1.8515625, 1.990234375, 2.12890625, 2.267578125, 2.40625, 2.544921875, 2.68359375, 2.822265625, 2.9609375, 3.099609375, 3.23828125, 3.376953125, 3.515625, 3.654296875, 3.79296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 2.0, 5.0, 6.0, 3.0, 5.0, 7.0, 18.0, 18.0, 14.0, 19.0, 22.0, 31.0, 28.0, 26.0, 26.0, 44.0, 32.0, 33.0, 35.0, 44.0, 41.0, 53.0, 48.0, 43.0, 37.0, 49.0, 55.0, 32.0, 25.0, 30.0, 20.0, 24.0, 17.0, 17.0, 18.0, 14.0, 12.0, 6.0, 13.0, 4.0, 3.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-5.6015625, -5.43426513671875, -5.2669677734375, -5.09967041015625, -4.932373046875, -4.76507568359375, -4.5977783203125, -4.43048095703125, -4.26318359375, -4.09588623046875, -3.9285888671875, -3.76129150390625, -3.593994140625, -3.42669677734375, -3.2593994140625, -3.09210205078125, -2.9248046875, -2.75750732421875, -2.5902099609375, -2.42291259765625, -2.255615234375, -2.08831787109375, -1.9210205078125, -1.75372314453125, -1.58642578125, -1.41912841796875, -1.2518310546875, -1.08453369140625, -0.917236328125, -0.74993896484375, -0.5826416015625, -0.41534423828125, -0.248046875, -0.08074951171875, 0.0865478515625, 0.25384521484375, 0.421142578125, 0.58843994140625, 0.7557373046875, 0.92303466796875, 1.09033203125, 1.25762939453125, 1.4249267578125, 1.59222412109375, 1.759521484375, 1.92681884765625, 2.0941162109375, 2.26141357421875, 2.4287109375, 2.59600830078125, 2.7633056640625, 2.93060302734375, 3.097900390625, 3.26519775390625, 3.4324951171875, 3.59979248046875, 3.76708984375, 3.93438720703125, 4.1016845703125, 4.26898193359375, 4.436279296875, 4.60357666015625, 4.7708740234375, 4.93817138671875, 5.10546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 10.0, 11.0, 17.0, 11.0, 36.0, 95.0, 142.0, 385.0, 1068.0, 3584.0, 18005.0, 180290.0, 786414.0, 47914.0, 7569.0, 1828.0, 688.0, 241.0, 113.0, 50.0, 32.0, 22.0, 10.0, 12.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69921875, -3.58795166015625, -3.4766845703125, -3.36541748046875, -3.254150390625, -3.14288330078125, -3.0316162109375, -2.92034912109375, -2.80908203125, -2.69781494140625, -2.5865478515625, -2.47528076171875, -2.364013671875, -2.25274658203125, -2.1414794921875, -2.03021240234375, -1.9189453125, -1.80767822265625, -1.6964111328125, -1.58514404296875, -1.473876953125, -1.36260986328125, -1.2513427734375, -1.14007568359375, -1.02880859375, -0.91754150390625, -0.8062744140625, -0.69500732421875, -0.583740234375, -0.47247314453125, -0.3612060546875, -0.24993896484375, -0.138671875, -0.02740478515625, 0.0838623046875, 0.19512939453125, 0.306396484375, 0.41766357421875, 0.5289306640625, 0.64019775390625, 0.75146484375, 0.86273193359375, 0.9739990234375, 1.08526611328125, 1.196533203125, 1.30780029296875, 1.4190673828125, 1.53033447265625, 1.6416015625, 1.75286865234375, 1.8641357421875, 1.97540283203125, 2.086669921875, 2.19793701171875, 2.3092041015625, 2.42047119140625, 2.53173828125, 2.64300537109375, 2.7542724609375, 2.86553955078125, 2.976806640625, 3.08807373046875, 3.1993408203125, 3.31060791015625, 3.421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 5.0, 11.0, 6.0, 17.0, 13.0, 22.0, 44.0, 105.0, 286.0, 250.0, 114.0, 38.0, 33.0, 22.0, 9.0, 6.0, 10.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007410049438476562, -0.0007203966379165649, -0.0006997883319854736, -0.0006791800260543823, -0.000658571720123291, -0.0006379634141921997, -0.0006173551082611084, -0.0005967468023300171, -0.0005761384963989258, -0.0005555301904678345, -0.0005349218845367432, -0.0005143135786056519, -0.0004937052726745605, -0.00047309696674346924, -0.00045248866081237793, -0.0004318803548812866, -0.0004112720489501953, -0.000390663743019104, -0.0003700554370880127, -0.0003494471311569214, -0.0003288388252258301, -0.00030823051929473877, -0.00028762221336364746, -0.00026701390743255615, -0.00024640560150146484, -0.00022579729557037354, -0.00020518898963928223, -0.00018458068370819092, -0.0001639723777770996, -0.0001433640718460083, -0.000122755765914917, -0.00010214745998382568, -8.153915405273438e-05, -6.0930848121643066e-05, -4.032254219055176e-05, -1.971423625946045e-05, 8.940696716308594e-07, 2.1502375602722168e-05, 4.2110681533813477e-05, 6.271898746490479e-05, 8.33272933959961e-05, 0.0001039355993270874, 0.0001245439052581787, 0.00014515221118927002, 0.00016576051712036133, 0.00018636882305145264, 0.00020697712898254395, 0.00022758543491363525, 0.00024819374084472656, 0.00026880204677581787, 0.0002894103527069092, 0.0003100186586380005, 0.0003306269645690918, 0.0003512352705001831, 0.0003718435764312744, 0.0003924518823623657, 0.00041306018829345703, 0.00043366849422454834, 0.00045427680015563965, 0.00047488510608673096, 0.0004954934120178223, 0.0005161017179489136, 0.0005367100238800049, 0.0005573183298110962, 0.0005779266357421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 6.0, 14.0, 29.0, 35.0, 62.0, 98.0, 172.0, 312.0, 500.0, 958.0, 1878.0, 3994.0, 10297.0, 31672.0, 190155.0, 703110.0, 74033.0, 18657.0, 6725.0, 2883.0, 1312.0, 698.0, 367.0, 223.0, 117.0, 83.0, 41.0, 51.0, 22.0, 13.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.79296875, -2.71380615234375, -2.6346435546875, -2.55548095703125, -2.476318359375, -2.39715576171875, -2.3179931640625, -2.23883056640625, -2.15966796875, -2.08050537109375, -2.0013427734375, -1.92218017578125, -1.843017578125, -1.76385498046875, -1.6846923828125, -1.60552978515625, -1.5263671875, -1.44720458984375, -1.3680419921875, -1.28887939453125, -1.209716796875, -1.13055419921875, -1.0513916015625, -0.97222900390625, -0.89306640625, -0.81390380859375, -0.7347412109375, -0.65557861328125, -0.576416015625, -0.49725341796875, -0.4180908203125, -0.33892822265625, -0.259765625, -0.18060302734375, -0.1014404296875, -0.02227783203125, 0.056884765625, 0.13604736328125, 0.2152099609375, 0.29437255859375, 0.37353515625, 0.45269775390625, 0.5318603515625, 0.61102294921875, 0.690185546875, 0.76934814453125, 0.8485107421875, 0.92767333984375, 1.0068359375, 1.08599853515625, 1.1651611328125, 1.24432373046875, 1.323486328125, 1.40264892578125, 1.4818115234375, 1.56097412109375, 1.64013671875, 1.71929931640625, 1.7984619140625, 1.87762451171875, 1.956787109375, 2.03594970703125, 2.1151123046875, 2.19427490234375, 2.2734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 14.0, 17.0, 28.0, 34.0, 67.0, 78.0, 132.0, 150.0, 142.0, 77.0, 74.0, 46.0, 36.0, 19.0, 12.0, 10.0, 6.0, 7.0, 5.0, 5.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.591796875, -2.5167236328125, -2.441650390625, -2.3665771484375, -2.29150390625, -2.2164306640625, -2.141357421875, -2.0662841796875, -1.9912109375, -1.9161376953125, -1.841064453125, -1.7659912109375, -1.69091796875, -1.6158447265625, -1.540771484375, -1.4656982421875, -1.390625, -1.3155517578125, -1.240478515625, -1.1654052734375, -1.09033203125, -1.0152587890625, -0.940185546875, -0.8651123046875, -0.7900390625, -0.7149658203125, -0.639892578125, -0.5648193359375, -0.48974609375, -0.4146728515625, -0.339599609375, -0.2645263671875, -0.189453125, -0.1143798828125, -0.039306640625, 0.0357666015625, 0.11083984375, 0.1859130859375, 0.260986328125, 0.3360595703125, 0.4111328125, 0.4862060546875, 0.561279296875, 0.6363525390625, 0.71142578125, 0.7864990234375, 0.861572265625, 0.9366455078125, 1.01171875, 1.0867919921875, 1.161865234375, 1.2369384765625, 1.31201171875, 1.3870849609375, 1.462158203125, 1.5372314453125, 1.6123046875, 1.6873779296875, 1.762451171875, 1.8375244140625, 1.91259765625, 1.9876708984375, 2.062744140625, 2.1378173828125, 2.212890625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 21.0, 46.0, 91.0, 180.0, 260.0, 200.0, 113.0, 46.0, 22.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.71807861328125, -99.70803833007812, -97.69799041748047, -95.68795013427734, -93.67790985107422, -91.6678695678711, -89.65782165527344, -87.64778137207031, -85.63774108886719, -83.62770080566406, -81.6176528930664, -79.60761260986328, -77.59757232666016, -75.58753204345703, -73.57748413085938, -71.56744384765625, -69.55740356445312, -67.54736328125, -65.53731536865234, -63.52727508544922, -61.517234802246094, -59.5071907043457, -57.49714660644531, -55.48710632324219, -53.47705841064453, -51.46701431274414, -49.456974029541016, -47.446929931640625, -45.4368896484375, -43.42684555053711, -41.41680145263672, -39.406761169433594, -37.396728515625, -35.38668441772461, -33.376644134521484, -31.366600036621094, -29.35655975341797, -27.346515655517578, -25.33647346496582, -23.326431274414062, -21.316387176513672, -19.306344985961914, -17.296302795410156, -15.286259651184082, -13.276217460632324, -11.266175270080566, -9.256132125854492, -7.246089935302734, -5.236047744750977, -3.2260053157806396, -1.2159628868103027, 0.7940797805786133, 2.804121971130371, 4.814164161682129, 6.824207305908203, 8.834249496459961, 10.844291687011719, 12.854333877563477, 14.864376068115234, 16.874420166015625, 18.88446044921875, 20.89450454711914, 22.9045467376709, 24.914588928222656, 26.924631118774414]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 8.0, 7.0, 8.0, 17.0, 9.0, 12.0, 24.0, 28.0, 26.0, 28.0, 30.0, 34.0, 26.0, 29.0, 34.0, 27.0, 30.0, 42.0, 27.0, 44.0, 33.0, 34.0, 31.0, 36.0, 33.0, 31.0, 22.0, 26.0, 26.0, 24.0, 33.0, 24.0, 23.0, 21.0, 12.0, 18.0, 10.0, 10.0, 5.0, 6.0, 7.0, 11.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-23.635513305664062, -22.937578201293945, -22.239643096923828, -21.541709899902344, -20.843774795532227, -20.14583969116211, -19.447904586791992, -18.749969482421875, -18.052034378051758, -17.35409927368164, -16.656164169311523, -15.958230018615723, -15.260294914245605, -14.562360763549805, -13.864425659179688, -13.16649055480957, -12.46855640411377, -11.770621299743652, -11.072687149047852, -10.374752044677734, -9.676816940307617, -8.9788818359375, -8.2809476852417, -7.583012580871582, -6.885077953338623, -6.187143325805664, -5.489208221435547, -4.791273593902588, -4.093338966369629, -3.3954038619995117, -2.6974692344665527, -1.9995341300964355, -1.3015995025634766, -0.6036646962165833, 0.09427011013031006, 0.7922048568725586, 1.4901397228240967, 2.1880745887756348, 2.8860092163085938, 3.583944320678711, 4.28187894821167, 4.979813575744629, 5.677748680114746, 6.375683307647705, 7.073617935180664, 7.771553039550781, 8.469488143920898, 9.167423248291016, 9.865357398986816, 10.563292503356934, 11.261226654052734, 11.959161758422852, 12.657096862792969, 13.355031967163086, 14.052966117858887, 14.750901222229004, 15.448835372924805, 16.146770477294922, 16.84470558166504, 17.542640686035156, 18.24057388305664, 18.938508987426758, 19.636444091796875, 20.334379196166992, 21.03231430053711]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 9.0, 8.0, 13.0, 17.0, 39.0, 48.0, 55.0, 98.0, 143.0, 227.0, 342.0, 667.0, 1273.0, 2733.0, 8548.0, 51196.0, 3993513.0, 114873.0, 13169.0, 3787.0, 1516.0, 770.0, 405.0, 284.0, 158.0, 126.0, 77.0, 49.0, 39.0, 25.0, 19.0, 14.0, 11.0, 6.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.2421875, -13.7774658203125, -13.312744140625, -12.8480224609375, -12.38330078125, -11.9185791015625, -11.453857421875, -10.9891357421875, -10.5244140625, -10.0596923828125, -9.594970703125, -9.1302490234375, -8.66552734375, -8.2008056640625, -7.736083984375, -7.2713623046875, -6.806640625, -6.3419189453125, -5.877197265625, -5.4124755859375, -4.94775390625, -4.4830322265625, -4.018310546875, -3.5535888671875, -3.0888671875, -2.6241455078125, -2.159423828125, -1.6947021484375, -1.22998046875, -0.7652587890625, -0.300537109375, 0.1641845703125, 0.62890625, 1.0936279296875, 1.558349609375, 2.0230712890625, 2.48779296875, 2.9525146484375, 3.417236328125, 3.8819580078125, 4.3466796875, 4.8114013671875, 5.276123046875, 5.7408447265625, 6.20556640625, 6.6702880859375, 7.135009765625, 7.5997314453125, 8.064453125, 8.5291748046875, 8.993896484375, 9.4586181640625, 9.92333984375, 10.3880615234375, 10.852783203125, 11.3175048828125, 11.7822265625, 12.2469482421875, 12.711669921875, 13.1763916015625, 13.64111328125, 14.1058349609375, 14.570556640625, 15.0352783203125, 15.5]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 13.0, 11.0, 19.0, 20.0, 31.0, 38.0, 50.0, 42.0, 43.0, 42.0, 41.0, 70.0, 74.0, 55.0, 49.0, 47.0, 44.0, 46.0, 46.0, 36.0, 29.0, 31.0, 19.0, 16.0, 17.0, 15.0, 9.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.25, -2.192291259765625, -2.13458251953125, -2.076873779296875, -2.0191650390625, -1.961456298828125, -1.90374755859375, -1.846038818359375, -1.788330078125, -1.730621337890625, -1.67291259765625, -1.615203857421875, -1.5574951171875, -1.499786376953125, -1.44207763671875, -1.384368896484375, -1.32666015625, -1.268951416015625, -1.21124267578125, -1.153533935546875, -1.0958251953125, -1.038116455078125, -0.98040771484375, -0.922698974609375, -0.864990234375, -0.807281494140625, -0.74957275390625, -0.691864013671875, -0.6341552734375, -0.576446533203125, -0.51873779296875, -0.461029052734375, -0.4033203125, -0.345611572265625, -0.28790283203125, -0.230194091796875, -0.1724853515625, -0.114776611328125, -0.05706787109375, 0.000640869140625, 0.058349609375, 0.116058349609375, 0.17376708984375, 0.231475830078125, 0.2891845703125, 0.346893310546875, 0.40460205078125, 0.462310791015625, 0.52001953125, 0.577728271484375, 0.63543701171875, 0.693145751953125, 0.7508544921875, 0.808563232421875, 0.86627197265625, 0.923980712890625, 0.981689453125, 1.039398193359375, 1.09710693359375, 1.154815673828125, 1.2125244140625, 1.270233154296875, 1.32794189453125, 1.385650634765625, 1.443359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 16.0, 35.0, 38.0, 61.0, 118.0, 244.0, 367.0, 624.0, 1157.0, 2457.0, 5504.0, 14037.0, 49059.0, 602104.0, 3410937.0, 76364.0, 18394.0, 6706.0, 2830.0, 1478.0, 755.0, 434.0, 232.0, 129.0, 72.0, 43.0, 25.0, 19.0, 15.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.58203125, -6.34808349609375, -6.1141357421875, -5.88018798828125, -5.646240234375, -5.41229248046875, -5.1783447265625, -4.94439697265625, -4.71044921875, -4.47650146484375, -4.2425537109375, -4.00860595703125, -3.774658203125, -3.54071044921875, -3.3067626953125, -3.07281494140625, -2.8388671875, -2.60491943359375, -2.3709716796875, -2.13702392578125, -1.903076171875, -1.66912841796875, -1.4351806640625, -1.20123291015625, -0.96728515625, -0.73333740234375, -0.4993896484375, -0.26544189453125, -0.031494140625, 0.20245361328125, 0.4364013671875, 0.67034912109375, 0.904296875, 1.13824462890625, 1.3721923828125, 1.60614013671875, 1.840087890625, 2.07403564453125, 2.3079833984375, 2.54193115234375, 2.77587890625, 3.00982666015625, 3.2437744140625, 3.47772216796875, 3.711669921875, 3.94561767578125, 4.1795654296875, 4.41351318359375, 4.6474609375, 4.88140869140625, 5.1153564453125, 5.34930419921875, 5.583251953125, 5.81719970703125, 6.0511474609375, 6.28509521484375, 6.51904296875, 6.75299072265625, 6.9869384765625, 7.22088623046875, 7.454833984375, 7.68878173828125, 7.9227294921875, 8.15667724609375, 8.390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 8.0, 15.0, 16.0, 23.0, 31.0, 59.0, 108.0, 254.0, 2047.0, 1078.0, 209.0, 71.0, 49.0, 23.0, 18.0, 9.0, 8.0, 5.0, 7.0, 5.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.3968505859375, -3.293701171875, -3.1905517578125, -3.08740234375, -2.9842529296875, -2.881103515625, -2.7779541015625, -2.6748046875, -2.5716552734375, -2.468505859375, -2.3653564453125, -2.26220703125, -2.1590576171875, -2.055908203125, -1.9527587890625, -1.849609375, -1.7464599609375, -1.643310546875, -1.5401611328125, -1.43701171875, -1.3338623046875, -1.230712890625, -1.1275634765625, -1.0244140625, -0.9212646484375, -0.818115234375, -0.7149658203125, -0.61181640625, -0.5086669921875, -0.405517578125, -0.3023681640625, -0.19921875, -0.0960693359375, 0.007080078125, 0.1102294921875, 0.21337890625, 0.3165283203125, 0.419677734375, 0.5228271484375, 0.6259765625, 0.7291259765625, 0.832275390625, 0.9354248046875, 1.03857421875, 1.1417236328125, 1.244873046875, 1.3480224609375, 1.451171875, 1.5543212890625, 1.657470703125, 1.7606201171875, 1.86376953125, 1.9669189453125, 2.070068359375, 2.1732177734375, 2.2763671875, 2.3795166015625, 2.482666015625, 2.5858154296875, 2.68896484375, 2.7921142578125, 2.895263671875, 2.9984130859375, 3.1015625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 13.0, 11.0, 32.0, 58.0, 116.0, 214.0, 239.0, 171.0, 87.0, 33.0, 12.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.76390075683594, -31.960107803344727, -31.156314849853516, -30.352521896362305, -29.548728942871094, -28.74493408203125, -27.94114112854004, -27.137348175048828, -26.333555221557617, -25.529762268066406, -24.725969314575195, -23.922176361083984, -23.11838150024414, -22.314590454101562, -21.51079559326172, -20.707002639770508, -19.903209686279297, -19.099416732788086, -18.295623779296875, -17.491830825805664, -16.688037872314453, -15.884243965148926, -15.080450057983398, -14.276657104492188, -13.472864151000977, -12.669071197509766, -11.865278244018555, -11.061484336853027, -10.257691383361816, -9.453898429870605, -8.650104522705078, -7.846311569213867, -7.042516708374023, -6.2387237548828125, -5.434930324554443, -4.631136894226074, -3.8273439407348633, -3.0235509872436523, -2.219757556915283, -1.415964126586914, -0.6121711730957031, 0.19162201881408691, 0.995415210723877, 1.799208402633667, 2.603001594543457, 3.406794548034668, 4.210587978363037, 5.014381408691406, 5.818174362182617, 6.621967315673828, 7.425760746002197, 8.229554176330566, 9.033347129821777, 9.837140083312988, 10.640933990478516, 11.444726943969727, 12.248519897460938, 13.052312850952148, 13.85610580444336, 14.659899711608887, 15.463692665100098, 16.267486572265625, 17.071279525756836, 17.875072479248047, 18.678865432739258]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 2.0, 10.0, 7.0, 10.0, 15.0, 14.0, 18.0, 23.0, 26.0, 22.0, 16.0, 16.0, 24.0, 36.0, 36.0, 35.0, 28.0, 23.0, 37.0, 38.0, 46.0, 37.0, 37.0, 26.0, 48.0, 39.0, 27.0, 31.0, 37.0, 27.0, 29.0, 20.0, 21.0, 27.0, 17.0, 19.0, 12.0, 18.0, 6.0, 9.0, 6.0, 5.0, 8.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.768549919128418, -7.523983955383301, -7.279418468475342, -7.034852504730225, -6.790286540985107, -6.545721054077148, -6.301155090332031, -6.056589126586914, -5.812023162841797, -5.56745719909668, -5.322891712188721, -5.0783257484436035, -4.833759784698486, -4.589194297790527, -4.34462833404541, -4.100062370300293, -3.855496883392334, -3.610931158065796, -3.3663651943206787, -3.1217994689941406, -2.8772335052490234, -2.6326677799224854, -2.3881020545959473, -2.14353609085083, -1.898970365524292, -1.6544045209884644, -1.4098386764526367, -1.1652729511260986, -0.920707106590271, -0.6761412620544434, -0.4315755367279053, -0.18700969219207764, 0.05755615234375, 0.30212196707725525, 0.5466877818107605, 0.7912535667419434, 1.035819411277771, 1.2803852558135986, 1.5249509811401367, 1.7695168256759644, 2.014082670211792, 2.25864839553833, 2.5032143592834473, 2.7477800846099854, 2.9923458099365234, 3.2369117736816406, 3.4814774990081787, 3.726043224334717, 3.970609188079834, 4.215175151824951, 4.45974063873291, 4.704306602478027, 4.9488725662231445, 5.193438529968262, 5.438004016876221, 5.682569980621338, 5.927135467529297, 6.171701431274414, 6.416266918182373, 6.66083288192749, 6.905398845672607, 7.149964332580566, 7.394530296325684, 7.639096260070801, 7.883662223815918]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 16.0, 22.0, 34.0, 50.0, 64.0, 104.0, 173.0, 286.0, 463.0, 945.0, 1736.0, 3683.0, 8535.0, 23269.0, 78233.0, 326714.0, 442365.0, 111117.0, 30635.0, 11017.0, 4489.0, 2094.0, 1043.0, 583.0, 353.0, 176.0, 110.0, 73.0, 46.0, 44.0, 27.0, 9.0, 15.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.80859375, -7.5728759765625, -7.337158203125, -7.1014404296875, -6.86572265625, -6.6300048828125, -6.394287109375, -6.1585693359375, -5.9228515625, -5.6871337890625, -5.451416015625, -5.2156982421875, -4.97998046875, -4.7442626953125, -4.508544921875, -4.2728271484375, -4.037109375, -3.8013916015625, -3.565673828125, -3.3299560546875, -3.09423828125, -2.8585205078125, -2.622802734375, -2.3870849609375, -2.1513671875, -1.9156494140625, -1.679931640625, -1.4442138671875, -1.20849609375, -0.9727783203125, -0.737060546875, -0.5013427734375, -0.265625, -0.0299072265625, 0.205810546875, 0.4415283203125, 0.67724609375, 0.9129638671875, 1.148681640625, 1.3843994140625, 1.6201171875, 1.8558349609375, 2.091552734375, 2.3272705078125, 2.56298828125, 2.7987060546875, 3.034423828125, 3.2701416015625, 3.505859375, 3.7415771484375, 3.977294921875, 4.2130126953125, 4.44873046875, 4.6844482421875, 4.920166015625, 5.1558837890625, 5.3916015625, 5.6273193359375, 5.863037109375, 6.0987548828125, 6.33447265625, 6.5701904296875, 6.805908203125, 7.0416259765625, 7.27734375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 6.0, 4.0, 6.0, 7.0, 11.0, 13.0, 17.0, 20.0, 25.0, 24.0, 32.0, 46.0, 41.0, 51.0, 45.0, 52.0, 62.0, 58.0, 52.0, 46.0, 51.0, 46.0, 44.0, 45.0, 36.0, 35.0, 27.0, 16.0, 24.0, 19.0, 9.0, 10.0, 10.0, 6.0, 9.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.126953125, -2.067626953125, -2.00830078125, -1.948974609375, -1.8896484375, -1.830322265625, -1.77099609375, -1.711669921875, -1.65234375, -1.593017578125, -1.53369140625, -1.474365234375, -1.4150390625, -1.355712890625, -1.29638671875, -1.237060546875, -1.177734375, -1.118408203125, -1.05908203125, -0.999755859375, -0.9404296875, -0.881103515625, -0.82177734375, -0.762451171875, -0.703125, -0.643798828125, -0.58447265625, -0.525146484375, -0.4658203125, -0.406494140625, -0.34716796875, -0.287841796875, -0.228515625, -0.169189453125, -0.10986328125, -0.050537109375, 0.0087890625, 0.068115234375, 0.12744140625, 0.186767578125, 0.24609375, 0.305419921875, 0.36474609375, 0.424072265625, 0.4833984375, 0.542724609375, 0.60205078125, 0.661376953125, 0.720703125, 0.780029296875, 0.83935546875, 0.898681640625, 0.9580078125, 1.017333984375, 1.07666015625, 1.135986328125, 1.1953125, 1.254638671875, 1.31396484375, 1.373291015625, 1.4326171875, 1.491943359375, 1.55126953125, 1.610595703125, 1.669921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 1.0, 6.0, 6.0, 8.0, 13.0, 12.0, 25.0, 47.0, 74.0, 115.0, 205.0, 391.0, 711.0, 1533.0, 3881.0, 12997.0, 62778.0, 432086.0, 447519.0, 65846.0, 13079.0, 4092.0, 1549.0, 738.0, 346.0, 179.0, 128.0, 62.0, 41.0, 25.0, 26.0, 8.0, 11.0, 7.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.96875, -6.719970703125, -6.47119140625, -6.222412109375, -5.9736328125, -5.724853515625, -5.47607421875, -5.227294921875, -4.978515625, -4.729736328125, -4.48095703125, -4.232177734375, -3.9833984375, -3.734619140625, -3.48583984375, -3.237060546875, -2.98828125, -2.739501953125, -2.49072265625, -2.241943359375, -1.9931640625, -1.744384765625, -1.49560546875, -1.246826171875, -0.998046875, -0.749267578125, -0.50048828125, -0.251708984375, -0.0029296875, 0.245849609375, 0.49462890625, 0.743408203125, 0.9921875, 1.240966796875, 1.48974609375, 1.738525390625, 1.9873046875, 2.236083984375, 2.48486328125, 2.733642578125, 2.982421875, 3.231201171875, 3.47998046875, 3.728759765625, 3.9775390625, 4.226318359375, 4.47509765625, 4.723876953125, 4.97265625, 5.221435546875, 5.47021484375, 5.718994140625, 5.9677734375, 6.216552734375, 6.46533203125, 6.714111328125, 6.962890625, 7.211669921875, 7.46044921875, 7.709228515625, 7.9580078125, 8.206787109375, 8.45556640625, 8.704345703125, 8.953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 8.0, 17.0, 29.0, 26.0, 30.0, 40.0, 39.0, 58.0, 65.0, 61.0, 76.0, 73.0, 59.0, 59.0, 49.0, 49.0, 52.0, 47.0, 42.0, 27.0, 21.0, 12.0, 13.0, 8.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.3673095703125, -11.039306640625, -10.7113037109375, -10.38330078125, -10.0552978515625, -9.727294921875, -9.3992919921875, -9.0712890625, -8.7432861328125, -8.415283203125, -8.0872802734375, -7.75927734375, -7.4312744140625, -7.103271484375, -6.7752685546875, -6.447265625, -6.1192626953125, -5.791259765625, -5.4632568359375, -5.13525390625, -4.8072509765625, -4.479248046875, -4.1512451171875, -3.8232421875, -3.4952392578125, -3.167236328125, -2.8392333984375, -2.51123046875, -2.1832275390625, -1.855224609375, -1.5272216796875, -1.19921875, -0.8712158203125, -0.543212890625, -0.2152099609375, 0.11279296875, 0.4407958984375, 0.768798828125, 1.0968017578125, 1.4248046875, 1.7528076171875, 2.080810546875, 2.4088134765625, 2.73681640625, 3.0648193359375, 3.392822265625, 3.7208251953125, 4.048828125, 4.3768310546875, 4.704833984375, 5.0328369140625, 5.36083984375, 5.6888427734375, 6.016845703125, 6.3448486328125, 6.6728515625, 7.0008544921875, 7.328857421875, 7.6568603515625, 7.98486328125, 8.3128662109375, 8.640869140625, 8.9688720703125, 9.296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 6.0, 8.0, 14.0, 11.0, 13.0, 26.0, 35.0, 49.0, 61.0, 110.0, 164.0, 304.0, 577.0, 1272.0, 3731.0, 13942.0, 128652.0, 841808.0, 45433.0, 7869.0, 2396.0, 978.0, 459.0, 213.0, 138.0, 81.0, 52.0, 37.0, 34.0, 19.0, 21.0, 10.0, 5.0, 5.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.5625, -9.29168701171875, -9.0208740234375, -8.75006103515625, -8.479248046875, -8.20843505859375, -7.9376220703125, -7.66680908203125, -7.39599609375, -7.12518310546875, -6.8543701171875, -6.58355712890625, -6.312744140625, -6.04193115234375, -5.7711181640625, -5.50030517578125, -5.2294921875, -4.95867919921875, -4.6878662109375, -4.41705322265625, -4.146240234375, -3.87542724609375, -3.6046142578125, -3.33380126953125, -3.06298828125, -2.79217529296875, -2.5213623046875, -2.25054931640625, -1.979736328125, -1.70892333984375, -1.4381103515625, -1.16729736328125, -0.896484375, -0.62567138671875, -0.3548583984375, -0.08404541015625, 0.186767578125, 0.45758056640625, 0.7283935546875, 0.99920654296875, 1.27001953125, 1.54083251953125, 1.8116455078125, 2.08245849609375, 2.353271484375, 2.62408447265625, 2.8948974609375, 3.16571044921875, 3.4365234375, 3.70733642578125, 3.9781494140625, 4.24896240234375, 4.519775390625, 4.79058837890625, 5.0614013671875, 5.33221435546875, 5.60302734375, 5.87384033203125, 6.1446533203125, 6.41546630859375, 6.686279296875, 6.95709228515625, 7.2279052734375, 7.49871826171875, 7.76953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 15.0, 14.0, 12.0, 23.0, 27.0, 30.0, 51.0, 72.0, 102.0, 223.0, 125.0, 74.0, 51.0, 52.0, 34.0, 14.0, 13.0, 8.0, 17.0, 5.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009412765502929688, -0.0009168311953544617, -0.0008923858404159546, -0.0008679404854774475, -0.0008434951305389404, -0.0008190497756004333, -0.0007946044206619263, -0.0007701590657234192, -0.0007457137107849121, -0.000721268355846405, -0.000696823000907898, -0.0006723776459693909, -0.0006479322910308838, -0.0006234869360923767, -0.0005990415811538696, -0.0005745962262153625, -0.0005501508712768555, -0.0005257055163383484, -0.0005012601613998413, -0.00047681480646133423, -0.00045236945152282715, -0.00042792409658432007, -0.000403478741645813, -0.0003790333867073059, -0.00035458803176879883, -0.00033014267683029175, -0.00030569732189178467, -0.0002812519669532776, -0.0002568066120147705, -0.00023236125707626343, -0.00020791590213775635, -0.00018347054719924927, -0.0001590251922607422, -0.0001345798373222351, -0.00011013448238372803, -8.568912744522095e-05, -6.124377250671387e-05, -3.679841756820679e-05, -1.2353062629699707e-05, 1.2092292308807373e-05, 3.653764724731445e-05, 6.098300218582153e-05, 8.542835712432861e-05, 0.0001098737120628357, 0.00013431906700134277, 0.00015876442193984985, 0.00018320977687835693, 0.00020765513181686401, 0.0002321004867553711, 0.0002565458416938782, 0.00028099119663238525, 0.00030543655157089233, 0.0003298819065093994, 0.0003543272614479065, 0.0003787726163864136, 0.00040321797132492065, 0.00042766332626342773, 0.0004521086812019348, 0.0004765540361404419, 0.000500999391078949, 0.0005254447460174561, 0.0005498901009559631, 0.0005743354558944702, 0.0005987808108329773, 0.0006232261657714844]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 6.0, 2.0, 8.0, 8.0, 9.0, 10.0, 23.0, 34.0, 52.0, 69.0, 169.0, 379.0, 622.0, 1539.0, 4229.0, 16813.0, 142488.0, 815066.0, 52646.0, 9375.0, 2787.0, 1105.0, 495.0, 273.0, 135.0, 74.0, 46.0, 28.0, 12.0, 15.0, 10.0, 11.0, 2.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.09375, -9.807861328125, -9.52197265625, -9.236083984375, -8.9501953125, -8.664306640625, -8.37841796875, -8.092529296875, -7.806640625, -7.520751953125, -7.23486328125, -6.948974609375, -6.6630859375, -6.377197265625, -6.09130859375, -5.805419921875, -5.51953125, -5.233642578125, -4.94775390625, -4.661865234375, -4.3759765625, -4.090087890625, -3.80419921875, -3.518310546875, -3.232421875, -2.946533203125, -2.66064453125, -2.374755859375, -2.0888671875, -1.802978515625, -1.51708984375, -1.231201171875, -0.9453125, -0.659423828125, -0.37353515625, -0.087646484375, 0.1982421875, 0.484130859375, 0.77001953125, 1.055908203125, 1.341796875, 1.627685546875, 1.91357421875, 2.199462890625, 2.4853515625, 2.771240234375, 3.05712890625, 3.343017578125, 3.62890625, 3.914794921875, 4.20068359375, 4.486572265625, 4.7724609375, 5.058349609375, 5.34423828125, 5.630126953125, 5.916015625, 6.201904296875, 6.48779296875, 6.773681640625, 7.0595703125, 7.345458984375, 7.63134765625, 7.917236328125, 8.203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 14.0, 18.0, 42.0, 63.0, 163.0, 369.0, 153.0, 65.0, 35.0, 23.0, 8.0, 11.0, 7.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9375, -12.53955078125, -12.1416015625, -11.74365234375, -11.345703125, -10.94775390625, -10.5498046875, -10.15185546875, -9.75390625, -9.35595703125, -8.9580078125, -8.56005859375, -8.162109375, -7.76416015625, -7.3662109375, -6.96826171875, -6.5703125, -6.17236328125, -5.7744140625, -5.37646484375, -4.978515625, -4.58056640625, -4.1826171875, -3.78466796875, -3.38671875, -2.98876953125, -2.5908203125, -2.19287109375, -1.794921875, -1.39697265625, -0.9990234375, -0.60107421875, -0.203125, 0.19482421875, 0.5927734375, 0.99072265625, 1.388671875, 1.78662109375, 2.1845703125, 2.58251953125, 2.98046875, 3.37841796875, 3.7763671875, 4.17431640625, 4.572265625, 4.97021484375, 5.3681640625, 5.76611328125, 6.1640625, 6.56201171875, 6.9599609375, 7.35791015625, 7.755859375, 8.15380859375, 8.5517578125, 8.94970703125, 9.34765625, 9.74560546875, 10.1435546875, 10.54150390625, 10.939453125, 11.33740234375, 11.7353515625, 12.13330078125, 12.53125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 12.0, 20.0, 36.0, 45.0, 84.0, 133.0, 164.0, 143.0, 141.0, 87.0, 50.0, 37.0, 18.0, 7.0, 6.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.37358093261719, -95.91415405273438, -93.4547348022461, -90.99530792236328, -88.53588104248047, -86.07646179199219, -83.61703491210938, -81.15760803222656, -78.69818115234375, -76.23875427246094, -73.77933502197266, -71.31990814208984, -68.86048126220703, -66.40106201171875, -63.94163513183594, -61.482208251953125, -59.022789001464844, -56.5633659362793, -54.103939056396484, -51.64451599121094, -49.185089111328125, -46.72566604614258, -44.26624298095703, -41.80681610107422, -39.34739303588867, -36.887969970703125, -34.42854309082031, -31.969120025634766, -29.509695053100586, -27.050270080566406, -24.59084701538086, -22.13142204284668, -19.67198944091797, -17.21256446838379, -14.753140449523926, -12.293716430664062, -9.834291458129883, -7.374866485595703, -4.91544246673584, -2.4560184478759766, 0.003406524658203125, 2.4628310203552246, 4.922255516052246, 7.381680011749268, 9.841104507446289, 12.300529479980469, 14.759953498840332, 17.219377517700195, 19.678802490234375, 22.138227462768555, 24.597652435302734, 27.05707550048828, 29.51650047302246, 31.97592544555664, 34.43534851074219, 36.894775390625, 39.35419845581055, 41.813621520996094, 44.273048400878906, 46.73247146606445, 49.19189453125, 51.65132141113281, 54.11074447631836, 56.570167541503906, 59.02959442138672]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 10.0, 12.0, 13.0, 27.0, 41.0, 26.0, 51.0, 51.0, 50.0, 72.0, 68.0, 88.0, 74.0, 78.0, 61.0, 52.0, 40.0, 37.0, 31.0, 28.0, 22.0, 12.0, 9.0, 15.0, 5.0, 9.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.62456512451172, -73.2418212890625, -70.85906982421875, -68.47632598876953, -66.09358215332031, -63.71083068847656, -61.328086853027344, -58.94533920288086, -56.562591552734375, -54.17984390258789, -51.797096252441406, -49.41435241699219, -47.0316047668457, -44.64885711669922, -42.26611328125, -39.883365631103516, -37.50061798095703, -35.11787033081055, -32.73512268066406, -30.352378845214844, -27.96963119506836, -25.586883544921875, -23.204137802124023, -20.821392059326172, -18.438644409179688, -16.055896759033203, -13.673151016235352, -11.290404319763184, -8.907657623291016, -6.524910926818848, -4.14216423034668, -1.7594184875488281, 0.6233367919921875, 3.0060834884643555, 5.388830184936523, 7.771576881408691, 10.15432357788086, 12.537070274353027, 14.919816970825195, 17.302562713623047, 19.68531036376953, 22.068058013916016, 24.450803756713867, 26.83354949951172, 29.216297149658203, 31.599044799804688, 33.981788635253906, 36.36453628540039, 38.747283935546875, 41.13003158569336, 43.512779235839844, 45.89552307128906, 48.27827072143555, 50.66101837158203, 53.04376220703125, 55.426509857177734, 57.80925750732422, 60.1920051574707, 62.57475280761719, 64.9574966430664, 67.34024047851562, 69.72299194335938, 72.1057357788086, 74.48847961425781, 76.87123107910156]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 12.0, 27.0, 31.0, 42.0, 59.0, 95.0, 158.0, 287.0, 563.0, 1397.0, 4719.0, 29558.0, 3899255.0, 240417.0, 12952.0, 2740.0, 955.0, 382.0, 227.0, 119.0, 93.0, 42.0, 35.0, 22.0, 20.0, 16.0, 10.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.234375, -12.654052734375, -12.07373046875, -11.493408203125, -10.9130859375, -10.332763671875, -9.75244140625, -9.172119140625, -8.591796875, -8.011474609375, -7.43115234375, -6.850830078125, -6.2705078125, -5.690185546875, -5.10986328125, -4.529541015625, -3.94921875, -3.368896484375, -2.78857421875, -2.208251953125, -1.6279296875, -1.047607421875, -0.46728515625, 0.113037109375, 0.693359375, 1.273681640625, 1.85400390625, 2.434326171875, 3.0146484375, 3.594970703125, 4.17529296875, 4.755615234375, 5.3359375, 5.916259765625, 6.49658203125, 7.076904296875, 7.6572265625, 8.237548828125, 8.81787109375, 9.398193359375, 9.978515625, 10.558837890625, 11.13916015625, 11.719482421875, 12.2998046875, 12.880126953125, 13.46044921875, 14.040771484375, 14.62109375, 15.201416015625, 15.78173828125, 16.362060546875, 16.9423828125, 17.522705078125, 18.10302734375, 18.683349609375, 19.263671875, 19.843994140625, 20.42431640625, 21.004638671875, 21.5849609375, 22.165283203125, 22.74560546875, 23.325927734375, 23.90625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 14.0, 20.0, 17.0, 27.0, 22.0, 36.0, 38.0, 42.0, 49.0, 60.0, 70.0, 74.0, 56.0, 55.0, 53.0, 51.0, 45.0, 50.0, 40.0, 42.0, 27.0, 21.0, 17.0, 13.0, 14.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.096588134765625, -2.01348876953125, -1.930389404296875, -1.8472900390625, -1.764190673828125, -1.68109130859375, -1.597991943359375, -1.514892578125, -1.431793212890625, -1.34869384765625, -1.265594482421875, -1.1824951171875, -1.099395751953125, -1.01629638671875, -0.933197021484375, -0.85009765625, -0.766998291015625, -0.68389892578125, -0.600799560546875, -0.5177001953125, -0.434600830078125, -0.35150146484375, -0.268402099609375, -0.185302734375, -0.102203369140625, -0.01910400390625, 0.063995361328125, 0.1470947265625, 0.230194091796875, 0.31329345703125, 0.396392822265625, 0.4794921875, 0.562591552734375, 0.64569091796875, 0.728790283203125, 0.8118896484375, 0.894989013671875, 0.97808837890625, 1.061187744140625, 1.144287109375, 1.227386474609375, 1.31048583984375, 1.393585205078125, 1.4766845703125, 1.559783935546875, 1.64288330078125, 1.725982666015625, 1.80908203125, 1.892181396484375, 1.97528076171875, 2.058380126953125, 2.1414794921875, 2.224578857421875, 2.30767822265625, 2.390777587890625, 2.473876953125, 2.556976318359375, 2.64007568359375, 2.723175048828125, 2.8062744140625, 2.889373779296875, 2.97247314453125, 3.055572509765625, 3.138671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 13.0, 14.0, 24.0, 29.0, 42.0, 74.0, 117.0, 239.0, 660.0, 2014.0, 8595.0, 84413.0, 3977323.0, 107642.0, 9565.0, 2240.0, 688.0, 238.0, 123.0, 84.0, 38.0, 27.0, 20.0, 21.0, 5.0, 8.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.5048828125, -16.931640625, -16.3583984375, -15.78515625, -15.2119140625, -14.638671875, -14.0654296875, -13.4921875, -12.9189453125, -12.345703125, -11.7724609375, -11.19921875, -10.6259765625, -10.052734375, -9.4794921875, -8.90625, -8.3330078125, -7.759765625, -7.1865234375, -6.61328125, -6.0400390625, -5.466796875, -4.8935546875, -4.3203125, -3.7470703125, -3.173828125, -2.6005859375, -2.02734375, -1.4541015625, -0.880859375, -0.3076171875, 0.265625, 0.8388671875, 1.412109375, 1.9853515625, 2.55859375, 3.1318359375, 3.705078125, 4.2783203125, 4.8515625, 5.4248046875, 5.998046875, 6.5712890625, 7.14453125, 7.7177734375, 8.291015625, 8.8642578125, 9.4375, 10.0107421875, 10.583984375, 11.1572265625, 11.73046875, 12.3037109375, 12.876953125, 13.4501953125, 14.0234375, 14.5966796875, 15.169921875, 15.7431640625, 16.31640625, 16.8896484375, 17.462890625, 18.0361328125, 18.609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 10.0, 15.0, 20.0, 47.0, 95.0, 249.0, 2606.0, 746.0, 164.0, 53.0, 23.0, 15.0, 11.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-13.703125, -13.40362548828125, -13.1041259765625, -12.80462646484375, -12.505126953125, -12.20562744140625, -11.9061279296875, -11.60662841796875, -11.30712890625, -11.00762939453125, -10.7081298828125, -10.40863037109375, -10.109130859375, -9.80963134765625, -9.5101318359375, -9.21063232421875, -8.9111328125, -8.61163330078125, -8.3121337890625, -8.01263427734375, -7.713134765625, -7.41363525390625, -7.1141357421875, -6.81463623046875, -6.51513671875, -6.21563720703125, -5.9161376953125, -5.61663818359375, -5.317138671875, -5.01763916015625, -4.7181396484375, -4.41864013671875, -4.119140625, -3.81964111328125, -3.5201416015625, -3.22064208984375, -2.921142578125, -2.62164306640625, -2.3221435546875, -2.02264404296875, -1.72314453125, -1.42364501953125, -1.1241455078125, -0.82464599609375, -0.525146484375, -0.22564697265625, 0.0738525390625, 0.37335205078125, 0.6728515625, 0.97235107421875, 1.2718505859375, 1.57135009765625, 1.870849609375, 2.17034912109375, 2.4698486328125, 2.76934814453125, 3.06884765625, 3.36834716796875, 3.6678466796875, 3.96734619140625, 4.266845703125, 4.56634521484375, 4.8658447265625, 5.16534423828125, 5.46484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 25.0, 93.0, 234.0, 305.0, 202.0, 99.0, 20.0, 10.0, 11.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.431304931640625, -47.46857452392578, -45.50584030151367, -43.54310607910156, -41.58037567138672, -39.617645263671875, -37.654911041259766, -35.692176818847656, -33.72944641113281, -31.766714096069336, -29.80398178100586, -27.841249465942383, -25.878517150878906, -23.91578483581543, -21.953052520751953, -19.990320205688477, -18.027587890625, -16.064855575561523, -14.102123260498047, -12.13939094543457, -10.176658630371094, -8.213926315307617, -6.251194000244141, -4.288461685180664, -2.3257293701171875, -0.36299705505371094, 1.5997352600097656, 3.562467575073242, 5.525199890136719, 7.487932205200195, 9.450664520263672, 11.413396835327148, 13.376129150390625, 15.338861465454102, 17.301593780517578, 19.264326095581055, 21.22705841064453, 23.189790725708008, 25.152523040771484, 27.11525535583496, 29.077987670898438, 31.040719985961914, 33.00345230102539, 34.9661865234375, 36.928916931152344, 38.89164733886719, 40.8543815612793, 42.817115783691406, 44.77984619140625, 46.742576599121094, 48.7053108215332, 50.66804504394531, 52.630775451660156, 54.593505859375, 56.55624008178711, 58.51897430419922, 60.48170471191406, 62.444435119628906, 64.40716552734375, 66.36990356445312, 68.33263397216797, 70.29536437988281, 72.25810241699219, 74.22083282470703, 76.18356323242188]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 15.0, 9.0, 18.0, 20.0, 20.0, 16.0, 35.0, 32.0, 35.0, 47.0, 58.0, 47.0, 48.0, 44.0, 51.0, 58.0, 45.0, 48.0, 38.0, 45.0, 47.0, 31.0, 34.0, 25.0, 26.0, 20.0, 15.0, 12.0, 12.0, 8.0, 4.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.807159423828125, -16.178470611572266, -15.549779891967773, -14.921090126037598, -14.292400360107422, -13.663711547851562, -13.035021781921387, -12.406332015991211, -11.777642250061035, -11.14895248413086, -10.520262718200684, -9.891572952270508, -9.262884140014648, -8.634193420410156, -8.005504608154297, -7.376814842224121, -6.748125076293945, -6.1194353103637695, -5.490745544433594, -4.862056255340576, -4.2333664894104, -3.6046767234802246, -2.975987195968628, -2.3472976684570312, -1.7186079025268555, -1.0899182558059692, -0.461228609085083, 0.16746103763580322, 0.7961506843566895, 1.4248404502868652, 2.053529977798462, 2.6822195053100586, 3.3109092712402344, 3.93959903717041, 4.568288803100586, 5.1969780921936035, 5.825667858123779, 6.454357624053955, 7.083046913146973, 7.711736679077148, 8.340426445007324, 8.9691162109375, 9.597805976867676, 10.226495742797852, 10.855184555053711, 11.483875274658203, 12.112564086914062, 12.741253852844238, 13.369943618774414, 13.99863338470459, 14.627323150634766, 15.256012916564941, 15.884702682495117, 16.513391494750977, 17.14208221435547, 17.770771026611328, 18.399459838867188, 19.028148651123047, 19.65683937072754, 20.2855281829834, 20.91421890258789, 21.54290771484375, 22.171598434448242, 22.8002872467041, 23.428977966308594]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 14.0, 26.0, 33.0, 48.0, 52.0, 91.0, 142.0, 206.0, 345.0, 540.0, 808.0, 1243.0, 2084.0, 3539.0, 6382.0, 11588.0, 22468.0, 46735.0, 102524.0, 207235.0, 273550.0, 190378.0, 91835.0, 41560.0, 20427.0, 10458.0, 5619.0, 3248.0, 1949.0, 1264.0, 751.0, 467.0, 289.0, 186.0, 141.0, 90.0, 60.0, 40.0, 33.0, 20.0, 13.0, 15.0, 12.0, 4.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.171875, -4.03912353515625, -3.9063720703125, -3.77362060546875, -3.640869140625, -3.50811767578125, -3.3753662109375, -3.24261474609375, -3.10986328125, -2.97711181640625, -2.8443603515625, -2.71160888671875, -2.578857421875, -2.44610595703125, -2.3133544921875, -2.18060302734375, -2.0478515625, -1.91510009765625, -1.7823486328125, -1.64959716796875, -1.516845703125, -1.38409423828125, -1.2513427734375, -1.11859130859375, -0.98583984375, -0.85308837890625, -0.7203369140625, -0.58758544921875, -0.454833984375, -0.32208251953125, -0.1893310546875, -0.05657958984375, 0.076171875, 0.20892333984375, 0.3416748046875, 0.47442626953125, 0.607177734375, 0.73992919921875, 0.8726806640625, 1.00543212890625, 1.13818359375, 1.27093505859375, 1.4036865234375, 1.53643798828125, 1.669189453125, 1.80194091796875, 1.9346923828125, 2.06744384765625, 2.2001953125, 2.33294677734375, 2.4656982421875, 2.59844970703125, 2.731201171875, 2.86395263671875, 2.9967041015625, 3.12945556640625, 3.26220703125, 3.39495849609375, 3.5277099609375, 3.66046142578125, 3.793212890625, 3.92596435546875, 4.0587158203125, 4.19146728515625, 4.32421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 10.0, 11.0, 12.0, 17.0, 11.0, 13.0, 22.0, 22.0, 29.0, 27.0, 40.0, 44.0, 53.0, 45.0, 66.0, 54.0, 52.0, 48.0, 56.0, 52.0, 49.0, 28.0, 39.0, 33.0, 31.0, 31.0, 24.0, 13.0, 17.0, 9.0, 13.0, 7.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.35589599609375, -2.2781982421875, -2.20050048828125, -2.122802734375, -2.04510498046875, -1.9674072265625, -1.88970947265625, -1.81201171875, -1.73431396484375, -1.6566162109375, -1.57891845703125, -1.501220703125, -1.42352294921875, -1.3458251953125, -1.26812744140625, -1.1904296875, -1.11273193359375, -1.0350341796875, -0.95733642578125, -0.879638671875, -0.80194091796875, -0.7242431640625, -0.64654541015625, -0.56884765625, -0.49114990234375, -0.4134521484375, -0.33575439453125, -0.258056640625, -0.18035888671875, -0.1026611328125, -0.02496337890625, 0.052734375, 0.13043212890625, 0.2081298828125, 0.28582763671875, 0.363525390625, 0.44122314453125, 0.5189208984375, 0.59661865234375, 0.67431640625, 0.75201416015625, 0.8297119140625, 0.90740966796875, 0.985107421875, 1.06280517578125, 1.1405029296875, 1.21820068359375, 1.2958984375, 1.37359619140625, 1.4512939453125, 1.52899169921875, 1.606689453125, 1.68438720703125, 1.7620849609375, 1.83978271484375, 1.91748046875, 1.99517822265625, 2.0728759765625, 2.15057373046875, 2.228271484375, 2.30596923828125, 2.3836669921875, 2.46136474609375, 2.5390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 5.0, 11.0, 17.0, 17.0, 37.0, 45.0, 78.0, 121.0, 192.0, 392.0, 894.0, 2109.0, 6402.0, 23298.0, 122211.0, 589259.0, 247245.0, 40712.0, 9884.0, 3160.0, 1154.0, 564.0, 265.0, 157.0, 113.0, 46.0, 45.0, 25.0, 25.0, 10.0, 13.0, 7.0, 3.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.421875, -9.08154296875, -8.7412109375, -8.40087890625, -8.060546875, -7.72021484375, -7.3798828125, -7.03955078125, -6.69921875, -6.35888671875, -6.0185546875, -5.67822265625, -5.337890625, -4.99755859375, -4.6572265625, -4.31689453125, -3.9765625, -3.63623046875, -3.2958984375, -2.95556640625, -2.615234375, -2.27490234375, -1.9345703125, -1.59423828125, -1.25390625, -0.91357421875, -0.5732421875, -0.23291015625, 0.107421875, 0.44775390625, 0.7880859375, 1.12841796875, 1.46875, 1.80908203125, 2.1494140625, 2.48974609375, 2.830078125, 3.17041015625, 3.5107421875, 3.85107421875, 4.19140625, 4.53173828125, 4.8720703125, 5.21240234375, 5.552734375, 5.89306640625, 6.2333984375, 6.57373046875, 6.9140625, 7.25439453125, 7.5947265625, 7.93505859375, 8.275390625, 8.61572265625, 8.9560546875, 9.29638671875, 9.63671875, 9.97705078125, 10.3173828125, 10.65771484375, 10.998046875, 11.33837890625, 11.6787109375, 12.01904296875, 12.359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 7.0, 2.0, 3.0, 6.0, 7.0, 3.0, 7.0, 15.0, 14.0, 21.0, 25.0, 28.0, 31.0, 33.0, 41.0, 43.0, 37.0, 52.0, 58.0, 54.0, 56.0, 49.0, 49.0, 45.0, 50.0, 49.0, 42.0, 30.0, 28.0, 26.0, 23.0, 20.0, 11.0, 13.0, 8.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4375, -13.95068359375, -13.4638671875, -12.97705078125, -12.490234375, -12.00341796875, -11.5166015625, -11.02978515625, -10.54296875, -10.05615234375, -9.5693359375, -9.08251953125, -8.595703125, -8.10888671875, -7.6220703125, -7.13525390625, -6.6484375, -6.16162109375, -5.6748046875, -5.18798828125, -4.701171875, -4.21435546875, -3.7275390625, -3.24072265625, -2.75390625, -2.26708984375, -1.7802734375, -1.29345703125, -0.806640625, -0.31982421875, 0.1669921875, 0.65380859375, 1.140625, 1.62744140625, 2.1142578125, 2.60107421875, 3.087890625, 3.57470703125, 4.0615234375, 4.54833984375, 5.03515625, 5.52197265625, 6.0087890625, 6.49560546875, 6.982421875, 7.46923828125, 7.9560546875, 8.44287109375, 8.9296875, 9.41650390625, 9.9033203125, 10.39013671875, 10.876953125, 11.36376953125, 11.8505859375, 12.33740234375, 12.82421875, 13.31103515625, 13.7978515625, 14.28466796875, 14.771484375, 15.25830078125, 15.7451171875, 16.23193359375, 16.71875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 16.0, 11.0, 22.0, 41.0, 56.0, 89.0, 141.0, 259.0, 565.0, 1325.0, 4702.0, 29540.0, 524099.0, 454925.0, 25944.0, 4360.0, 1278.0, 530.0, 260.0, 166.0, 69.0, 41.0, 29.0, 19.0, 22.0, 9.0, 6.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.8690185546875, -7.597412109375, -7.3258056640625, -7.05419921875, -6.7825927734375, -6.510986328125, -6.2393798828125, -5.9677734375, -5.6961669921875, -5.424560546875, -5.1529541015625, -4.88134765625, -4.6097412109375, -4.338134765625, -4.0665283203125, -3.794921875, -3.5233154296875, -3.251708984375, -2.9801025390625, -2.70849609375, -2.4368896484375, -2.165283203125, -1.8936767578125, -1.6220703125, -1.3504638671875, -1.078857421875, -0.8072509765625, -0.53564453125, -0.2640380859375, 0.007568359375, 0.2791748046875, 0.55078125, 0.8223876953125, 1.093994140625, 1.3656005859375, 1.63720703125, 1.9088134765625, 2.180419921875, 2.4520263671875, 2.7236328125, 2.9952392578125, 3.266845703125, 3.5384521484375, 3.81005859375, 4.0816650390625, 4.353271484375, 4.6248779296875, 4.896484375, 5.1680908203125, 5.439697265625, 5.7113037109375, 5.98291015625, 6.2545166015625, 6.526123046875, 6.7977294921875, 7.0693359375, 7.3409423828125, 7.612548828125, 7.8841552734375, 8.15576171875, 8.4273681640625, 8.698974609375, 8.9705810546875, 9.2421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 2.0, 13.0, 16.0, 17.0, 44.0, 53.0, 88.0, 113.0, 110.0, 137.0, 137.0, 99.0, 54.0, 46.0, 20.0, 13.0, 17.0, 3.0, 4.0, 6.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00133514404296875, -0.0012993142008781433, -0.0012634843587875366, -0.00122765451669693, -0.0011918246746063232, -0.0011559948325157166, -0.0011201649904251099, -0.0010843351483345032, -0.0010485053062438965, -0.0010126754641532898, -0.000976845622062683, -0.0009410157799720764, -0.0009051859378814697, -0.000869356095790863, -0.0008335262537002563, -0.0007976964116096497, -0.000761866569519043, -0.0007260367274284363, -0.0006902068853378296, -0.0006543770432472229, -0.0006185472011566162, -0.0005827173590660095, -0.0005468875169754028, -0.0005110576748847961, -0.00047522783279418945, -0.00043939799070358276, -0.0004035681486129761, -0.0003677383065223694, -0.0003319084644317627, -0.000296078622341156, -0.0002602487802505493, -0.00022441893815994263, -0.00018858909606933594, -0.00015275925397872925, -0.00011692941188812256, -8.109956979751587e-05, -4.526972770690918e-05, -9.43988561630249e-06, 2.63899564743042e-05, 6.221979856491089e-05, 9.804964065551758e-05, 0.00013387948274612427, 0.00016970932483673096, 0.00020553916692733765, 0.00024136900901794434, 0.000277198851108551, 0.0003130286931991577, 0.0003488585352897644, 0.0003846883773803711, 0.0004205182194709778, 0.00045634806156158447, 0.0004921779036521912, 0.0005280077457427979, 0.0005638375878334045, 0.0005996674299240112, 0.0006354972720146179, 0.0006713271141052246, 0.0007071569561958313, 0.000742986798286438, 0.0007788166403770447, 0.0008146464824676514, 0.0008504763245582581, 0.0008863061666488647, 0.0009221360087394714, 0.0009579658508300781]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 10.0, 16.0, 17.0, 30.0, 44.0, 61.0, 122.0, 243.0, 529.0, 1518.0, 5311.0, 28190.0, 302965.0, 627259.0, 68544.0, 9524.0, 2554.0, 861.0, 341.0, 188.0, 87.0, 50.0, 43.0, 16.0, 6.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.62890625, -6.39385986328125, -6.1588134765625, -5.92376708984375, -5.688720703125, -5.45367431640625, -5.2186279296875, -4.98358154296875, -4.74853515625, -4.51348876953125, -4.2784423828125, -4.04339599609375, -3.808349609375, -3.57330322265625, -3.3382568359375, -3.10321044921875, -2.8681640625, -2.63311767578125, -2.3980712890625, -2.16302490234375, -1.927978515625, -1.69293212890625, -1.4578857421875, -1.22283935546875, -0.98779296875, -0.75274658203125, -0.5177001953125, -0.28265380859375, -0.047607421875, 0.18743896484375, 0.4224853515625, 0.65753173828125, 0.892578125, 1.12762451171875, 1.3626708984375, 1.59771728515625, 1.832763671875, 2.06781005859375, 2.3028564453125, 2.53790283203125, 2.77294921875, 3.00799560546875, 3.2430419921875, 3.47808837890625, 3.713134765625, 3.94818115234375, 4.1832275390625, 4.41827392578125, 4.6533203125, 4.88836669921875, 5.1234130859375, 5.35845947265625, 5.593505859375, 5.82855224609375, 6.0635986328125, 6.29864501953125, 6.53369140625, 6.76873779296875, 7.0037841796875, 7.23883056640625, 7.473876953125, 7.70892333984375, 7.9439697265625, 8.17901611328125, 8.4140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 9.0, 6.0, 11.0, 12.0, 28.0, 45.0, 54.0, 72.0, 76.0, 107.0, 108.0, 118.0, 104.0, 66.0, 64.0, 27.0, 31.0, 18.0, 9.0, 6.0, 6.0, 3.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-10.2890625, -10.03662109375, -9.7841796875, -9.53173828125, -9.279296875, -9.02685546875, -8.7744140625, -8.52197265625, -8.26953125, -8.01708984375, -7.7646484375, -7.51220703125, -7.259765625, -7.00732421875, -6.7548828125, -6.50244140625, -6.25, -5.99755859375, -5.7451171875, -5.49267578125, -5.240234375, -4.98779296875, -4.7353515625, -4.48291015625, -4.23046875, -3.97802734375, -3.7255859375, -3.47314453125, -3.220703125, -2.96826171875, -2.7158203125, -2.46337890625, -2.2109375, -1.95849609375, -1.7060546875, -1.45361328125, -1.201171875, -0.94873046875, -0.6962890625, -0.44384765625, -0.19140625, 0.06103515625, 0.3134765625, 0.56591796875, 0.818359375, 1.07080078125, 1.3232421875, 1.57568359375, 1.828125, 2.08056640625, 2.3330078125, 2.58544921875, 2.837890625, 3.09033203125, 3.3427734375, 3.59521484375, 3.84765625, 4.10009765625, 4.3525390625, 4.60498046875, 4.857421875, 5.10986328125, 5.3623046875, 5.61474609375, 5.8671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 32.0, 102.0, 358.0, 365.0, 105.0, 30.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-381.563232421875, -374.3453674316406, -367.1274719238281, -359.90960693359375, -352.69171142578125, -345.4738464355469, -338.2559509277344, -331.0380859375, -323.8201904296875, -316.6023254394531, -309.3844299316406, -302.16656494140625, -294.94866943359375, -287.7308044433594, -280.5129089355469, -273.2950439453125, -266.0771789550781, -258.85931396484375, -251.64141845703125, -244.4235382080078, -237.20565795898438, -229.98779296875, -222.76991271972656, -215.55203247070312, -208.3341522216797, -201.11627197265625, -193.8983917236328, -186.68051147460938, -179.462646484375, -172.2447509765625, -165.02688598632812, -157.8090057373047, -150.5911102294922, -143.37322998046875, -136.1553497314453, -128.93746948242188, -121.71959686279297, -114.50171661376953, -107.28384399414062, -100.06596374511719, -92.84808349609375, -85.63020324707031, -78.41232299804688, -71.19445037841797, -63.97657012939453, -56.758689880371094, -49.54081344604492, -42.32293701171875, -35.10505676269531, -27.887178421020508, -20.669300079345703, -13.451421737670898, -6.233543395996094, 0.9843368530273438, 8.202213287353516, 15.420089721679688, 22.637969970703125, 29.85584831237793, 37.073726654052734, 44.291603088378906, 51.509483337402344, 58.72736358642578, 65.94523620605469, 73.16311645507812, 80.38099670410156]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 7.0, 8.0, 11.0, 11.0, 12.0, 17.0, 18.0, 14.0, 26.0, 35.0, 45.0, 49.0, 44.0, 40.0, 50.0, 49.0, 52.0, 62.0, 52.0, 54.0, 51.0, 47.0, 37.0, 31.0, 31.0, 16.0, 20.0, 17.0, 13.0, 18.0, 7.0, 7.0, 12.0, 9.0, 6.0, 3.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-86.94235229492188, -84.39067077636719, -81.83899688720703, -79.28732299804688, -76.73564147949219, -74.1839599609375, -71.63228607177734, -69.08061218261719, -66.5289306640625, -63.97725296020508, -61.425575256347656, -58.873897552490234, -56.32221984863281, -53.77054214477539, -51.21886444091797, -48.66718673706055, -46.115509033203125, -43.5638313293457, -41.01215362548828, -38.46047592163086, -35.90879821777344, -33.357120513916016, -30.805442810058594, -28.253765106201172, -25.70208740234375, -23.150409698486328, -20.598731994628906, -18.047054290771484, -15.495376586914062, -12.94369888305664, -10.392021179199219, -7.840343475341797, -5.288665771484375, -2.736988067626953, -0.18531036376953125, 2.3663673400878906, 4.9180450439453125, 7.469722747802734, 10.021400451660156, 12.573078155517578, 15.124755859375, 17.676433563232422, 20.228111267089844, 22.779788970947266, 25.331466674804688, 27.88314437866211, 30.43482208251953, 32.98649978637695, 35.538177490234375, 38.0898551940918, 40.64153289794922, 43.19321060180664, 45.74488830566406, 48.296566009521484, 50.848243713378906, 53.39992141723633, 55.95159912109375, 58.50327682495117, 61.054954528808594, 63.606632232666016, 66.15830993652344, 68.70999145507812, 71.26166534423828, 73.81333923339844, 76.36502075195312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 12.0, 11.0, 30.0, 37.0, 87.0, 167.0, 353.0, 814.0, 2620.0, 12684.0, 4027777.0, 139608.0, 6990.0, 1823.0, 684.0, 294.0, 122.0, 58.0, 39.0, 19.0, 15.0, 6.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9296875, -12.2781982421875, -11.626708984375, -10.9752197265625, -10.32373046875, -9.6722412109375, -9.020751953125, -8.3692626953125, -7.7177734375, -7.0662841796875, -6.414794921875, -5.7633056640625, -5.11181640625, -4.4603271484375, -3.808837890625, -3.1573486328125, -2.505859375, -1.8543701171875, -1.202880859375, -0.5513916015625, 0.10009765625, 0.7515869140625, 1.403076171875, 2.0545654296875, 2.7060546875, 3.3575439453125, 4.009033203125, 4.6605224609375, 5.31201171875, 5.9635009765625, 6.614990234375, 7.2664794921875, 7.91796875, 8.5694580078125, 9.220947265625, 9.8724365234375, 10.52392578125, 11.1754150390625, 11.826904296875, 12.4783935546875, 13.1298828125, 13.7813720703125, 14.432861328125, 15.0843505859375, 15.73583984375, 16.3873291015625, 17.038818359375, 17.6903076171875, 18.341796875, 18.9932861328125, 19.644775390625, 20.2962646484375, 20.94775390625, 21.5992431640625, 22.250732421875, 22.9022216796875, 23.5537109375, 24.2052001953125, 24.856689453125, 25.5081787109375, 26.15966796875, 26.8111572265625, 27.462646484375, 28.1141357421875, 28.765625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 7.0, 9.0, 16.0, 25.0, 17.0, 27.0, 39.0, 51.0, 50.0, 54.0, 72.0, 58.0, 66.0, 75.0, 78.0, 61.0, 61.0, 45.0, 40.0, 22.0, 28.0, 21.0, 29.0, 9.0, 15.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.43585205078125, -4.3013916015625, -4.16693115234375, -4.032470703125, -3.89801025390625, -3.7635498046875, -3.62908935546875, -3.49462890625, -3.36016845703125, -3.2257080078125, -3.09124755859375, -2.956787109375, -2.82232666015625, -2.6878662109375, -2.55340576171875, -2.4189453125, -2.28448486328125, -2.1500244140625, -2.01556396484375, -1.881103515625, -1.74664306640625, -1.6121826171875, -1.47772216796875, -1.34326171875, -1.20880126953125, -1.0743408203125, -0.93988037109375, -0.805419921875, -0.67095947265625, -0.5364990234375, -0.40203857421875, -0.267578125, -0.13311767578125, 0.0013427734375, 0.13580322265625, 0.270263671875, 0.40472412109375, 0.5391845703125, 0.67364501953125, 0.80810546875, 0.94256591796875, 1.0770263671875, 1.21148681640625, 1.345947265625, 1.48040771484375, 1.6148681640625, 1.74932861328125, 1.8837890625, 2.01824951171875, 2.1527099609375, 2.28717041015625, 2.421630859375, 2.55609130859375, 2.6905517578125, 2.82501220703125, 2.95947265625, 3.09393310546875, 3.2283935546875, 3.36285400390625, 3.497314453125, 3.63177490234375, 3.7662353515625, 3.90069580078125, 4.03515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 2.0, 6.0, 6.0, 8.0, 21.0, 30.0, 42.0, 67.0, 104.0, 114.0, 186.0, 267.0, 461.0, 893.0, 1780.0, 4454.0, 16115.0, 313246.0, 3820009.0, 25838.0, 5951.0, 2255.0, 1023.0, 514.0, 298.0, 185.0, 137.0, 85.0, 62.0, 36.0, 23.0, 17.0, 18.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2265625, -14.6851806640625, -14.143798828125, -13.6024169921875, -13.06103515625, -12.5196533203125, -11.978271484375, -11.4368896484375, -10.8955078125, -10.3541259765625, -9.812744140625, -9.2713623046875, -8.72998046875, -8.1885986328125, -7.647216796875, -7.1058349609375, -6.564453125, -6.0230712890625, -5.481689453125, -4.9403076171875, -4.39892578125, -3.8575439453125, -3.316162109375, -2.7747802734375, -2.2333984375, -1.6920166015625, -1.150634765625, -0.6092529296875, -0.06787109375, 0.4735107421875, 1.014892578125, 1.5562744140625, 2.09765625, 2.6390380859375, 3.180419921875, 3.7218017578125, 4.26318359375, 4.8045654296875, 5.345947265625, 5.8873291015625, 6.4287109375, 6.9700927734375, 7.511474609375, 8.0528564453125, 8.59423828125, 9.1356201171875, 9.677001953125, 10.2183837890625, 10.759765625, 11.3011474609375, 11.842529296875, 12.3839111328125, 12.92529296875, 13.4666748046875, 14.008056640625, 14.5494384765625, 15.0908203125, 15.6322021484375, 16.173583984375, 16.7149658203125, 17.25634765625, 17.7977294921875, 18.339111328125, 18.8804931640625, 19.421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 11.0, 13.0, 35.0, 201.0, 3446.0, 244.0, 50.0, 31.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.2890625, -6.133819580078125, -5.97857666015625, -5.823333740234375, -5.6680908203125, -5.512847900390625, -5.35760498046875, -5.202362060546875, -5.047119140625, -4.891876220703125, -4.73663330078125, -4.581390380859375, -4.4261474609375, -4.270904541015625, -4.11566162109375, -3.960418701171875, -3.80517578125, -3.649932861328125, -3.49468994140625, -3.339447021484375, -3.1842041015625, -3.028961181640625, -2.87371826171875, -2.718475341796875, -2.563232421875, -2.407989501953125, -2.25274658203125, -2.097503662109375, -1.9422607421875, -1.787017822265625, -1.63177490234375, -1.476531982421875, -1.3212890625, -1.166046142578125, -1.01080322265625, -0.855560302734375, -0.7003173828125, -0.545074462890625, -0.38983154296875, -0.234588623046875, -0.079345703125, 0.075897216796875, 0.23114013671875, 0.386383056640625, 0.5416259765625, 0.696868896484375, 0.85211181640625, 1.007354736328125, 1.16259765625, 1.317840576171875, 1.47308349609375, 1.628326416015625, 1.7835693359375, 1.938812255859375, 2.09405517578125, 2.249298095703125, 2.404541015625, 2.559783935546875, 2.71502685546875, 2.870269775390625, 3.0255126953125, 3.180755615234375, 3.33599853515625, 3.491241455078125, 3.646484375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 14.0, 58.0, 124.0, 283.0, 269.0, 137.0, 74.0, 24.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.465678215026855, -10.735272407531738, -10.004866600036621, -9.27446174621582, -8.544055938720703, -7.813649654388428, -7.083244323730469, -6.352838516235352, -5.622432708740234, -4.892026901245117, -4.16162109375, -3.431215763092041, -2.700809955596924, -1.9704041481018066, -1.2399988174438477, -0.5095930099487305, 0.22081279754638672, 0.9512184858322144, 1.681624174118042, 2.41202974319458, 3.1424355506896973, 3.8728413581848145, 4.603246688842773, 5.333652496337891, 6.064058303833008, 6.794464111328125, 7.524869918823242, 8.25527572631836, 8.985681533813477, 9.716087341308594, 10.446492195129395, 11.176898002624512, 11.907302856445312, 12.63770866394043, 13.368114471435547, 14.098520278930664, 14.828926086425781, 15.559331893920898, 16.289737701416016, 17.0201416015625, 17.75054931640625, 18.480955123901367, 19.211360931396484, 19.9417667388916, 20.67217254638672, 21.402578353881836, 22.132984161376953, 22.863388061523438, 23.593793869018555, 24.324199676513672, 25.05460548400879, 25.785011291503906, 26.515417098999023, 27.24582290649414, 27.976226806640625, 28.706634521484375, 29.43703842163086, 30.167444229125977, 30.897850036621094, 31.62825584411621, 32.35866165161133, 33.08906555175781, 33.81947326660156, 34.54987716674805, 35.2802848815918]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 11.0, 6.0, 14.0, 16.0, 22.0, 28.0, 33.0, 26.0, 27.0, 30.0, 41.0, 37.0, 31.0, 36.0, 49.0, 36.0, 48.0, 37.0, 39.0, 41.0, 48.0, 33.0, 34.0, 33.0, 28.0, 23.0, 27.0, 17.0, 25.0, 21.0, 12.0, 11.0, 12.0, 11.0, 7.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.57032585144043, -7.336163520812988, -7.102000713348389, -6.867838382720947, -6.633675575256348, -6.399513244628906, -6.165350437164307, -5.931188106536865, -5.697025299072266, -5.462862968444824, -5.228700160980225, -4.994537830352783, -4.760375022888184, -4.526212692260742, -4.292049884796143, -4.057887554168701, -3.8237249851226807, -3.58956241607666, -3.3553998470306396, -3.121237277984619, -2.8870747089385986, -2.652912139892578, -2.4187498092651367, -2.184587001800537, -1.9504245519638062, -1.7162619829177856, -1.4820994138717651, -1.2479369640350342, -1.0137743949890137, -0.7796118259429932, -0.5454492568969727, -0.31128668785095215, -0.07712411880493164, 0.15703843533992767, 0.391200989484787, 0.6253635287284851, 0.8595260977745056, 1.0936886072158813, 1.3278511762619019, 1.5620137453079224, 1.7961763143539429, 2.030338764190674, 2.2645013332366943, 2.498663902282715, 2.7328264713287354, 2.966989040374756, 3.2011516094207764, 3.435314178466797, 3.6694767475128174, 3.903639316558838, 4.137801647186279, 4.371964454650879, 4.60612678527832, 4.84028959274292, 5.074451923370361, 5.308614730834961, 5.542777061462402, 5.776939392089844, 6.011102199554443, 6.245264530181885, 6.479427337646484, 6.713589668273926, 6.947752475738525, 7.181914806365967, 7.416077613830566]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 12.0, 19.0, 37.0, 55.0, 75.0, 126.0, 214.0, 409.0, 778.0, 1441.0, 3450.0, 8033.0, 21690.0, 65041.0, 201302.0, 392371.0, 234971.0, 76669.0, 25067.0, 9343.0, 3877.0, 1691.0, 833.0, 437.0, 231.0, 131.0, 86.0, 62.0, 29.0, 21.0, 12.0, 11.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28515625, -7.046875, -6.80859375, -6.5703125, -6.33203125, -6.09375, -5.85546875, -5.6171875, -5.37890625, -5.140625, -4.90234375, -4.6640625, -4.42578125, -4.1875, -3.94921875, -3.7109375, -3.47265625, -3.234375, -2.99609375, -2.7578125, -2.51953125, -2.28125, -2.04296875, -1.8046875, -1.56640625, -1.328125, -1.08984375, -0.8515625, -0.61328125, -0.375, -0.13671875, 0.1015625, 0.33984375, 0.578125, 0.81640625, 1.0546875, 1.29296875, 1.53125, 1.76953125, 2.0078125, 2.24609375, 2.484375, 2.72265625, 2.9609375, 3.19921875, 3.4375, 3.67578125, 3.9140625, 4.15234375, 4.390625, 4.62890625, 4.8671875, 5.10546875, 5.34375, 5.58203125, 5.8203125, 6.05859375, 6.296875, 6.53515625, 6.7734375, 7.01171875, 7.25, 7.48828125, 7.7265625, 7.96484375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 5.0, 9.0, 4.0, 13.0, 24.0, 17.0, 33.0, 30.0, 33.0, 46.0, 40.0, 42.0, 63.0, 48.0, 50.0, 40.0, 66.0, 53.0, 74.0, 53.0, 52.0, 33.0, 23.0, 30.0, 20.0, 31.0, 11.0, 16.0, 7.0, 11.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.576171875, -3.454986572265625, -3.33380126953125, -3.212615966796875, -3.0914306640625, -2.970245361328125, -2.84906005859375, -2.727874755859375, -2.606689453125, -2.485504150390625, -2.36431884765625, -2.243133544921875, -2.1219482421875, -2.000762939453125, -1.87957763671875, -1.758392333984375, -1.63720703125, -1.516021728515625, -1.39483642578125, -1.273651123046875, -1.1524658203125, -1.031280517578125, -0.91009521484375, -0.788909912109375, -0.667724609375, -0.546539306640625, -0.42535400390625, -0.304168701171875, -0.1829833984375, -0.061798095703125, 0.05938720703125, 0.180572509765625, 0.3017578125, 0.422943115234375, 0.54412841796875, 0.665313720703125, 0.7864990234375, 0.907684326171875, 1.02886962890625, 1.150054931640625, 1.271240234375, 1.392425537109375, 1.51361083984375, 1.634796142578125, 1.7559814453125, 1.877166748046875, 1.99835205078125, 2.119537353515625, 2.24072265625, 2.361907958984375, 2.48309326171875, 2.604278564453125, 2.7254638671875, 2.846649169921875, 2.96783447265625, 3.089019775390625, 3.210205078125, 3.331390380859375, 3.45257568359375, 3.573760986328125, 3.6949462890625, 3.816131591796875, 3.93731689453125, 4.058502197265625, 4.1796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 8.0, 19.0, 35.0, 51.0, 46.0, 110.0, 166.0, 296.0, 659.0, 1687.0, 5620.0, 30385.0, 272254.0, 641137.0, 79300.0, 11807.0, 2903.0, 1025.0, 434.0, 215.0, 136.0, 88.0, 44.0, 39.0, 18.0, 12.0, 12.0, 8.0, 4.0, 6.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5, -14.0357666015625, -13.571533203125, -13.1072998046875, -12.64306640625, -12.1788330078125, -11.714599609375, -11.2503662109375, -10.7861328125, -10.3218994140625, -9.857666015625, -9.3934326171875, -8.92919921875, -8.4649658203125, -8.000732421875, -7.5364990234375, -7.072265625, -6.6080322265625, -6.143798828125, -5.6795654296875, -5.21533203125, -4.7510986328125, -4.286865234375, -3.8226318359375, -3.3583984375, -2.8941650390625, -2.429931640625, -1.9656982421875, -1.50146484375, -1.0372314453125, -0.572998046875, -0.1087646484375, 0.35546875, 0.8197021484375, 1.283935546875, 1.7481689453125, 2.21240234375, 2.6766357421875, 3.140869140625, 3.6051025390625, 4.0693359375, 4.5335693359375, 4.997802734375, 5.4620361328125, 5.92626953125, 6.3905029296875, 6.854736328125, 7.3189697265625, 7.783203125, 8.2474365234375, 8.711669921875, 9.1759033203125, 9.64013671875, 10.1043701171875, 10.568603515625, 11.0328369140625, 11.4970703125, 11.9613037109375, 12.425537109375, 12.8897705078125, 13.35400390625, 13.8182373046875, 14.282470703125, 14.7467041015625, 15.2109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 5.0, 7.0, 9.0, 18.0, 20.0, 27.0, 24.0, 24.0, 35.0, 56.0, 48.0, 49.0, 43.0, 61.0, 62.0, 44.0, 55.0, 54.0, 49.0, 55.0, 36.0, 40.0, 28.0, 25.0, 29.0, 30.0, 7.0, 13.0, 10.0, 12.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.796875, -20.130859375, -19.46484375, -18.798828125, -18.1328125, -17.466796875, -16.80078125, -16.134765625, -15.46875, -14.802734375, -14.13671875, -13.470703125, -12.8046875, -12.138671875, -11.47265625, -10.806640625, -10.140625, -9.474609375, -8.80859375, -8.142578125, -7.4765625, -6.810546875, -6.14453125, -5.478515625, -4.8125, -4.146484375, -3.48046875, -2.814453125, -2.1484375, -1.482421875, -0.81640625, -0.150390625, 0.515625, 1.181640625, 1.84765625, 2.513671875, 3.1796875, 3.845703125, 4.51171875, 5.177734375, 5.84375, 6.509765625, 7.17578125, 7.841796875, 8.5078125, 9.173828125, 9.83984375, 10.505859375, 11.171875, 11.837890625, 12.50390625, 13.169921875, 13.8359375, 14.501953125, 15.16796875, 15.833984375, 16.5, 17.166015625, 17.83203125, 18.498046875, 19.1640625, 19.830078125, 20.49609375, 21.162109375, 21.828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 7.0, 9.0, 10.0, 27.0, 39.0, 65.0, 115.0, 264.0, 568.0, 1336.0, 4035.0, 20751.0, 221216.0, 709086.0, 76880.0, 9941.0, 2517.0, 893.0, 366.0, 197.0, 107.0, 45.0, 34.0, 16.0, 11.0, 7.0, 1.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.1104736328125, -4.908447265625, -4.7064208984375, -4.50439453125, -4.3023681640625, -4.100341796875, -3.8983154296875, -3.6962890625, -3.4942626953125, -3.292236328125, -3.0902099609375, -2.88818359375, -2.6861572265625, -2.484130859375, -2.2821044921875, -2.080078125, -1.8780517578125, -1.676025390625, -1.4739990234375, -1.27197265625, -1.0699462890625, -0.867919921875, -0.6658935546875, -0.4638671875, -0.2618408203125, -0.059814453125, 0.1422119140625, 0.34423828125, 0.5462646484375, 0.748291015625, 0.9503173828125, 1.15234375, 1.3543701171875, 1.556396484375, 1.7584228515625, 1.96044921875, 2.1624755859375, 2.364501953125, 2.5665283203125, 2.7685546875, 2.9705810546875, 3.172607421875, 3.3746337890625, 3.57666015625, 3.7786865234375, 3.980712890625, 4.1827392578125, 4.384765625, 4.5867919921875, 4.788818359375, 4.9908447265625, 5.19287109375, 5.3948974609375, 5.596923828125, 5.7989501953125, 6.0009765625, 6.2030029296875, 6.405029296875, 6.6070556640625, 6.80908203125, 7.0111083984375, 7.213134765625, 7.4151611328125, 7.6171875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 8.0, 8.0, 5.0, 6.0, 8.0, 21.0, 36.0, 34.0, 37.0, 60.0, 74.0, 82.0, 94.0, 99.0, 84.0, 66.0, 65.0, 47.0, 37.0, 31.0, 19.0, 16.0, 18.0, 15.0, 13.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000850677490234375, -0.0008278191089630127, -0.0008049607276916504, -0.0007821023464202881, -0.0007592439651489258, -0.0007363855838775635, -0.0007135272026062012, -0.0006906688213348389, -0.0006678104400634766, -0.0006449520587921143, -0.000622093677520752, -0.0005992352962493896, -0.0005763769149780273, -0.000553518533706665, -0.0005306601524353027, -0.0005078017711639404, -0.0004849433898925781, -0.0004620850086212158, -0.0004392266273498535, -0.0004163682460784912, -0.0003935098648071289, -0.0003706514835357666, -0.0003477931022644043, -0.000324934720993042, -0.0003020763397216797, -0.0002792179584503174, -0.0002563595771789551, -0.00023350119590759277, -0.00021064281463623047, -0.00018778443336486816, -0.00016492605209350586, -0.00014206767082214355, -0.00011920928955078125, -9.635090827941895e-05, -7.349252700805664e-05, -5.0634145736694336e-05, -2.777576446533203e-05, -4.9173831939697266e-06, 1.7940998077392578e-05, 4.079937934875488e-05, 6.365776062011719e-05, 8.651614189147949e-05, 0.0001093745231628418, 0.0001322329044342041, 0.0001550912857055664, 0.0001779496669769287, 0.00020080804824829102, 0.00022366642951965332, 0.0002465248107910156, 0.00026938319206237793, 0.00029224157333374023, 0.00031509995460510254, 0.00033795833587646484, 0.00036081671714782715, 0.00038367509841918945, 0.00040653347969055176, 0.00042939186096191406, 0.00045225024223327637, 0.00047510862350463867, 0.000497967004776001, 0.0005208253860473633, 0.0005436837673187256, 0.0005665421485900879, 0.0005894005298614502, 0.0006122589111328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 8.0, 1.0, 3.0, 3.0, 7.0, 11.0, 32.0, 33.0, 72.0, 130.0, 259.0, 590.0, 1838.0, 8213.0, 79356.0, 756652.0, 182426.0, 14674.0, 2684.0, 845.0, 325.0, 172.0, 88.0, 34.0, 36.0, 22.0, 12.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.37408447265625, -6.1348876953125, -5.89569091796875, -5.656494140625, -5.41729736328125, -5.1781005859375, -4.93890380859375, -4.69970703125, -4.46051025390625, -4.2213134765625, -3.98211669921875, -3.742919921875, -3.50372314453125, -3.2645263671875, -3.02532958984375, -2.7861328125, -2.54693603515625, -2.3077392578125, -2.06854248046875, -1.829345703125, -1.59014892578125, -1.3509521484375, -1.11175537109375, -0.87255859375, -0.63336181640625, -0.3941650390625, -0.15496826171875, 0.084228515625, 0.32342529296875, 0.5626220703125, 0.80181884765625, 1.041015625, 1.28021240234375, 1.5194091796875, 1.75860595703125, 1.997802734375, 2.23699951171875, 2.4761962890625, 2.71539306640625, 2.95458984375, 3.19378662109375, 3.4329833984375, 3.67218017578125, 3.911376953125, 4.15057373046875, 4.3897705078125, 4.62896728515625, 4.8681640625, 5.10736083984375, 5.3465576171875, 5.58575439453125, 5.824951171875, 6.06414794921875, 6.3033447265625, 6.54254150390625, 6.78173828125, 7.02093505859375, 7.2601318359375, 7.49932861328125, 7.738525390625, 7.97772216796875, 8.2169189453125, 8.45611572265625, 8.6953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 5.0, 15.0, 18.0, 25.0, 28.0, 43.0, 70.0, 116.0, 163.0, 150.0, 125.0, 78.0, 57.0, 29.0, 24.0, 22.0, 14.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0234375, -11.692138671875, -11.36083984375, -11.029541015625, -10.6982421875, -10.366943359375, -10.03564453125, -9.704345703125, -9.373046875, -9.041748046875, -8.71044921875, -8.379150390625, -8.0478515625, -7.716552734375, -7.38525390625, -7.053955078125, -6.72265625, -6.391357421875, -6.06005859375, -5.728759765625, -5.3974609375, -5.066162109375, -4.73486328125, -4.403564453125, -4.072265625, -3.740966796875, -3.40966796875, -3.078369140625, -2.7470703125, -2.415771484375, -2.08447265625, -1.753173828125, -1.421875, -1.090576171875, -0.75927734375, -0.427978515625, -0.0966796875, 0.234619140625, 0.56591796875, 0.897216796875, 1.228515625, 1.559814453125, 1.89111328125, 2.222412109375, 2.5537109375, 2.885009765625, 3.21630859375, 3.547607421875, 3.87890625, 4.210205078125, 4.54150390625, 4.872802734375, 5.2041015625, 5.535400390625, 5.86669921875, 6.197998046875, 6.529296875, 6.860595703125, 7.19189453125, 7.523193359375, 7.8544921875, 8.185791015625, 8.51708984375, 8.848388671875, 9.1796875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 15.0, 15.0, 31.0, 81.0, 164.0, 236.0, 222.0, 120.0, 60.0, 27.0, 19.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-194.8741455078125, -190.68942260742188, -186.50469970703125, -182.31997680664062, -178.13525390625, -173.95054626464844, -169.7658233642578, -165.5811004638672, -161.39637756347656, -157.21165466308594, -153.0269317626953, -148.8422088623047, -144.65750122070312, -140.4727783203125, -136.28805541992188, -132.10333251953125, -127.91860961914062, -123.73388671875, -119.54916381835938, -115.36444854736328, -111.17972564697266, -106.99500274658203, -102.81028747558594, -98.62556457519531, -94.44084167480469, -90.25611877441406, -86.07139587402344, -81.88668060302734, -77.70195770263672, -73.5172348022461, -69.33251953125, -65.14779663085938, -60.96308135986328, -56.778358459472656, -52.5936393737793, -48.40892028808594, -44.22419738769531, -40.03947448730469, -35.85475540161133, -31.670034408569336, -27.485313415527344, -23.30059242248535, -19.11587142944336, -14.931150436401367, -10.746429443359375, -6.561708450317383, -2.3769874572753906, 1.8077335357666016, 5.992454528808594, 10.177175521850586, 14.361896514892578, 18.54661750793457, 22.731338500976562, 26.916059494018555, 31.100780487060547, 35.285499572753906, 39.47022247314453, 43.654945373535156, 47.839664459228516, 52.024383544921875, 56.2091064453125, 60.393829345703125, 64.57855224609375, 68.76326751708984, 72.94799041748047]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 7.0, 12.0, 12.0, 16.0, 13.0, 23.0, 27.0, 36.0, 28.0, 34.0, 37.0, 47.0, 47.0, 69.0, 69.0, 54.0, 60.0, 68.0, 45.0, 44.0, 42.0, 30.0, 26.0, 28.0, 19.0, 21.0, 18.0, 12.0, 13.0, 6.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.84974670410156, -81.9218978881836, -78.99404907226562, -76.06619262695312, -73.13834381103516, -70.21049499511719, -67.28264617919922, -64.35479736328125, -61.426944732666016, -58.49909591674805, -55.57124328613281, -52.643394470214844, -49.715545654296875, -46.78769302368164, -43.85984420776367, -40.93199157714844, -38.00414276123047, -35.0762939453125, -32.148441314697266, -29.220592498779297, -26.292741775512695, -23.364891052246094, -20.437042236328125, -17.509191513061523, -14.581340789794922, -11.65349006652832, -8.725640296936035, -5.79779052734375, -2.8699398040771484, 0.057910919189453125, 2.985759735107422, 5.913610458374023, 8.841461181640625, 11.769311904907227, 14.697161674499512, 17.625011444091797, 20.5528621673584, 23.480712890625, 26.40856170654297, 29.33641242980957, 32.26426315307617, 35.19211196899414, 38.119964599609375, 41.047813415527344, 43.97566223144531, 46.90351486206055, 49.831363677978516, 52.75921630859375, 55.68706512451172, 58.61491394042969, 61.54276657104492, 64.47061157226562, 67.39846801757812, 70.3263168334961, 73.25416564941406, 76.18201446533203, 79.10986328125, 82.03771209716797, 84.96556091308594, 87.89341735839844, 90.8212661743164, 93.74911499023438, 96.67696380615234, 99.60481262207031, 102.53266906738281]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 11.0, 6.0, 17.0, 27.0, 47.0, 85.0, 159.0, 231.0, 475.0, 865.0, 1792.0, 4257.0, 14868.0, 149728.0, 3962519.0, 45016.0, 8309.0, 3036.0, 1326.0, 673.0, 338.0, 198.0, 120.0, 64.0, 32.0, 25.0, 14.0, 17.0, 8.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.95703125, -7.64251708984375, -7.3280029296875, -7.01348876953125, -6.698974609375, -6.38446044921875, -6.0699462890625, -5.75543212890625, -5.44091796875, -5.12640380859375, -4.8118896484375, -4.49737548828125, -4.182861328125, -3.86834716796875, -3.5538330078125, -3.23931884765625, -2.9248046875, -2.61029052734375, -2.2957763671875, -1.98126220703125, -1.666748046875, -1.35223388671875, -1.0377197265625, -0.72320556640625, -0.40869140625, -0.09417724609375, 0.2203369140625, 0.53485107421875, 0.849365234375, 1.16387939453125, 1.4783935546875, 1.79290771484375, 2.107421875, 2.42193603515625, 2.7364501953125, 3.05096435546875, 3.365478515625, 3.67999267578125, 3.9945068359375, 4.30902099609375, 4.62353515625, 4.93804931640625, 5.2525634765625, 5.56707763671875, 5.881591796875, 6.19610595703125, 6.5106201171875, 6.82513427734375, 7.1396484375, 7.45416259765625, 7.7686767578125, 8.08319091796875, 8.397705078125, 8.71221923828125, 9.0267333984375, 9.34124755859375, 9.65576171875, 9.97027587890625, 10.2847900390625, 10.59930419921875, 10.913818359375, 11.22833251953125, 11.5428466796875, 11.85736083984375, 12.171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 8.0, 12.0, 31.0, 20.0, 28.0, 35.0, 39.0, 57.0, 61.0, 53.0, 52.0, 57.0, 72.0, 83.0, 80.0, 46.0, 43.0, 44.0, 34.0, 32.0, 28.0, 20.0, 16.0, 9.0, 10.0, 5.0, 8.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.0390625, -4.8951416015625, -4.751220703125, -4.6072998046875, -4.46337890625, -4.3194580078125, -4.175537109375, -4.0316162109375, -3.8876953125, -3.7437744140625, -3.599853515625, -3.4559326171875, -3.31201171875, -3.1680908203125, -3.024169921875, -2.8802490234375, -2.736328125, -2.5924072265625, -2.448486328125, -2.3045654296875, -2.16064453125, -2.0167236328125, -1.872802734375, -1.7288818359375, -1.5849609375, -1.4410400390625, -1.297119140625, -1.1531982421875, -1.00927734375, -0.8653564453125, -0.721435546875, -0.5775146484375, -0.43359375, -0.2896728515625, -0.145751953125, -0.0018310546875, 0.14208984375, 0.2860107421875, 0.429931640625, 0.5738525390625, 0.7177734375, 0.8616943359375, 1.005615234375, 1.1495361328125, 1.29345703125, 1.4373779296875, 1.581298828125, 1.7252197265625, 1.869140625, 2.0130615234375, 2.156982421875, 2.3009033203125, 2.44482421875, 2.5887451171875, 2.732666015625, 2.8765869140625, 3.0205078125, 3.1644287109375, 3.308349609375, 3.4522705078125, 3.59619140625, 3.7401123046875, 3.884033203125, 4.0279541015625, 4.171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 3.0, 10.0, 18.0, 29.0, 31.0, 58.0, 79.0, 123.0, 199.0, 283.0, 478.0, 752.0, 1255.0, 2421.0, 5071.0, 12644.0, 45062.0, 492917.0, 3520472.0, 80274.0, 18330.0, 6729.0, 3066.0, 1591.0, 945.0, 493.0, 339.0, 206.0, 138.0, 86.0, 48.0, 32.0, 34.0, 24.0, 7.0, 6.0, 4.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.80078125, -7.55047607421875, -7.3001708984375, -7.04986572265625, -6.799560546875, -6.54925537109375, -6.2989501953125, -6.04864501953125, -5.79833984375, -5.54803466796875, -5.2977294921875, -5.04742431640625, -4.797119140625, -4.54681396484375, -4.2965087890625, -4.04620361328125, -3.7958984375, -3.54559326171875, -3.2952880859375, -3.04498291015625, -2.794677734375, -2.54437255859375, -2.2940673828125, -2.04376220703125, -1.79345703125, -1.54315185546875, -1.2928466796875, -1.04254150390625, -0.792236328125, -0.54193115234375, -0.2916259765625, -0.04132080078125, 0.208984375, 0.45928955078125, 0.7095947265625, 0.95989990234375, 1.210205078125, 1.46051025390625, 1.7108154296875, 1.96112060546875, 2.21142578125, 2.46173095703125, 2.7120361328125, 2.96234130859375, 3.212646484375, 3.46295166015625, 3.7132568359375, 3.96356201171875, 4.2138671875, 4.46417236328125, 4.7144775390625, 4.96478271484375, 5.215087890625, 5.46539306640625, 5.7156982421875, 5.96600341796875, 6.21630859375, 6.46661376953125, 6.7169189453125, 6.96722412109375, 7.217529296875, 7.46783447265625, 7.7181396484375, 7.96844482421875, 8.21875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 7.0, 2.0, 6.0, 11.0, 29.0, 46.0, 91.0, 318.0, 2920.0, 416.0, 110.0, 45.0, 29.0, 13.0, 10.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.326416015625, -3.22119140625, -3.115966796875, -3.0107421875, -2.905517578125, -2.80029296875, -2.695068359375, -2.58984375, -2.484619140625, -2.37939453125, -2.274169921875, -2.1689453125, -2.063720703125, -1.95849609375, -1.853271484375, -1.748046875, -1.642822265625, -1.53759765625, -1.432373046875, -1.3271484375, -1.221923828125, -1.11669921875, -1.011474609375, -0.90625, -0.801025390625, -0.69580078125, -0.590576171875, -0.4853515625, -0.380126953125, -0.27490234375, -0.169677734375, -0.064453125, 0.040771484375, 0.14599609375, 0.251220703125, 0.3564453125, 0.461669921875, 0.56689453125, 0.672119140625, 0.77734375, 0.882568359375, 0.98779296875, 1.093017578125, 1.1982421875, 1.303466796875, 1.40869140625, 1.513916015625, 1.619140625, 1.724365234375, 1.82958984375, 1.934814453125, 2.0400390625, 2.145263671875, 2.25048828125, 2.355712890625, 2.4609375, 2.566162109375, 2.67138671875, 2.776611328125, 2.8818359375, 2.987060546875, 3.09228515625, 3.197509765625, 3.302734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 11.0, 16.0, 19.0, 52.0, 59.0, 113.0, 122.0, 130.0, 116.0, 126.0, 92.0, 67.0, 28.0, 18.0, 5.0, 10.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.685128211975098, -11.318992614746094, -10.95285701751709, -10.586721420288086, -10.220586776733398, -9.854451179504395, -9.48831558227539, -9.122179985046387, -8.756044387817383, -8.389908790588379, -8.023773193359375, -7.657638072967529, -7.291502475738525, -6.9253668785095215, -6.559231758117676, -6.193096160888672, -5.826960563659668, -5.460824966430664, -5.09468936920166, -4.7285542488098145, -4.3624186515808105, -3.9962830543518066, -3.630147695541382, -3.264012336730957, -2.897876739501953, -2.531741142272949, -2.1656057834625244, -1.79947030544281, -1.4333348274230957, -1.0671993494033813, -0.701063871383667, -0.3349285125732422, 0.03120708465576172, 0.3973425626754761, 0.7634780406951904, 1.1296135187149048, 1.4957489967346191, 1.8618844747543335, 2.228019952774048, 2.5941553115844727, 2.9602909088134766, 3.3264265060424805, 3.6925618648529053, 4.05869722366333, 4.424832820892334, 4.790968418121338, 5.157103538513184, 5.5232391357421875, 5.889374732971191, 6.255510330200195, 6.621645927429199, 6.987781047821045, 7.353916645050049, 7.720052242279053, 8.086187362670898, 8.452322959899902, 8.818458557128906, 9.18459415435791, 9.550729751586914, 9.916865348815918, 10.283000946044922, 10.64913558959961, 11.015271186828613, 11.381406784057617, 11.747542381286621]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 2.0, 8.0, 11.0, 8.0, 7.0, 12.0, 17.0, 12.0, 20.0, 24.0, 22.0, 20.0, 27.0, 35.0, 35.0, 39.0, 48.0, 45.0, 40.0, 44.0, 47.0, 58.0, 40.0, 34.0, 32.0, 30.0, 40.0, 34.0, 29.0, 33.0, 14.0, 17.0, 17.0, 14.0, 10.0, 11.0, 4.0, 12.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.698233604431152, -4.536670207977295, -4.375106334686279, -4.213542938232422, -4.051979064941406, -3.890415668487549, -3.7288520336151123, -3.567288398742676, -3.4057250022888184, -3.244161367416382, -3.0825977325439453, -2.921034336090088, -2.7594707012176514, -2.597907066345215, -2.4363434314727783, -2.274779796600342, -2.1132161617279053, -1.9516525268554688, -1.7900890111923218, -1.6285253763198853, -1.4669618606567383, -1.3053982257843018, -1.1438345909118652, -0.9822710752487183, -0.8207074403762817, -0.65914386510849, -0.49758026003837585, -0.3360166549682617, -0.17445307970046997, -0.012889504432678223, 0.1486741304397583, 0.3102376461029053, 0.4718012809753418, 0.6333648562431335, 0.7949284315109253, 0.9564920663833618, 1.1180555820465088, 1.2796192169189453, 1.4411828517913818, 1.6027463674545288, 1.7643100023269653, 1.9258736371994019, 2.087437152862549, 2.2490007877349854, 2.410564422607422, 2.5721278190612793, 2.733691692352295, 2.8952550888061523, 3.056818723678589, 3.2183823585510254, 3.379945993423462, 3.5415096282958984, 3.703073024749756, 3.8646366596221924, 4.026200294494629, 4.187763690948486, 4.349327564239502, 4.510890960693359, 4.672454833984375, 4.834018230438232, 4.995582103729248, 5.1571455001831055, 5.318709373474121, 5.4802727699279785, 5.641836166381836]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 21.0, 19.0, 37.0, 55.0, 102.0, 174.0, 273.0, 598.0, 1138.0, 2467.0, 5746.0, 14423.0, 40051.0, 124097.0, 336015.0, 333638.0, 124455.0, 40121.0, 14484.0, 5737.0, 2481.0, 1093.0, 585.0, 301.0, 170.0, 110.0, 57.0, 36.0, 21.0, 13.0, 7.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.484375, -6.28173828125, -6.0791015625, -5.87646484375, -5.673828125, -5.47119140625, -5.2685546875, -5.06591796875, -4.86328125, -4.66064453125, -4.4580078125, -4.25537109375, -4.052734375, -3.85009765625, -3.6474609375, -3.44482421875, -3.2421875, -3.03955078125, -2.8369140625, -2.63427734375, -2.431640625, -2.22900390625, -2.0263671875, -1.82373046875, -1.62109375, -1.41845703125, -1.2158203125, -1.01318359375, -0.810546875, -0.60791015625, -0.4052734375, -0.20263671875, 0.0, 0.20263671875, 0.4052734375, 0.60791015625, 0.810546875, 1.01318359375, 1.2158203125, 1.41845703125, 1.62109375, 1.82373046875, 2.0263671875, 2.22900390625, 2.431640625, 2.63427734375, 2.8369140625, 3.03955078125, 3.2421875, 3.44482421875, 3.6474609375, 3.85009765625, 4.052734375, 4.25537109375, 4.4580078125, 4.66064453125, 4.86328125, 5.06591796875, 5.2685546875, 5.47119140625, 5.673828125, 5.87646484375, 6.0791015625, 6.28173828125, 6.484375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 7.0, 15.0, 8.0, 30.0, 17.0, 21.0, 31.0, 37.0, 38.0, 55.0, 44.0, 45.0, 73.0, 63.0, 57.0, 68.0, 70.0, 53.0, 48.0, 41.0, 37.0, 37.0, 22.0, 19.0, 11.0, 20.0, 12.0, 10.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.78515625, -4.648284912109375, -4.51141357421875, -4.374542236328125, -4.2376708984375, -4.100799560546875, -3.96392822265625, -3.827056884765625, -3.690185546875, -3.553314208984375, -3.41644287109375, -3.279571533203125, -3.1427001953125, -3.005828857421875, -2.86895751953125, -2.732086181640625, -2.59521484375, -2.458343505859375, -2.32147216796875, -2.184600830078125, -2.0477294921875, -1.910858154296875, -1.77398681640625, -1.637115478515625, -1.500244140625, -1.363372802734375, -1.22650146484375, -1.089630126953125, -0.9527587890625, -0.815887451171875, -0.67901611328125, -0.542144775390625, -0.4052734375, -0.268402099609375, -0.13153076171875, 0.005340576171875, 0.1422119140625, 0.279083251953125, 0.41595458984375, 0.552825927734375, 0.689697265625, 0.826568603515625, 0.96343994140625, 1.100311279296875, 1.2371826171875, 1.374053955078125, 1.51092529296875, 1.647796630859375, 1.78466796875, 1.921539306640625, 2.05841064453125, 2.195281982421875, 2.3321533203125, 2.469024658203125, 2.60589599609375, 2.742767333984375, 2.879638671875, 3.016510009765625, 3.15338134765625, 3.290252685546875, 3.4271240234375, 3.563995361328125, 3.70086669921875, 3.837738037109375, 3.974609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 12.0, 11.0, 22.0, 13.0, 23.0, 28.0, 34.0, 42.0, 64.0, 119.0, 184.0, 342.0, 657.0, 1406.0, 3428.0, 10949.0, 49323.0, 331484.0, 539024.0, 86163.0, 16759.0, 4745.0, 1796.0, 862.0, 408.0, 221.0, 127.0, 92.0, 54.0, 46.0, 23.0, 26.0, 15.0, 9.0, 7.0, 9.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.4296875, -10.1151123046875, -9.800537109375, -9.4859619140625, -9.17138671875, -8.8568115234375, -8.542236328125, -8.2276611328125, -7.9130859375, -7.5985107421875, -7.283935546875, -6.9693603515625, -6.65478515625, -6.3402099609375, -6.025634765625, -5.7110595703125, -5.396484375, -5.0819091796875, -4.767333984375, -4.4527587890625, -4.13818359375, -3.8236083984375, -3.509033203125, -3.1944580078125, -2.8798828125, -2.5653076171875, -2.250732421875, -1.9361572265625, -1.62158203125, -1.3070068359375, -0.992431640625, -0.6778564453125, -0.36328125, -0.0487060546875, 0.265869140625, 0.5804443359375, 0.89501953125, 1.2095947265625, 1.524169921875, 1.8387451171875, 2.1533203125, 2.4678955078125, 2.782470703125, 3.0970458984375, 3.41162109375, 3.7261962890625, 4.040771484375, 4.3553466796875, 4.669921875, 4.9844970703125, 5.299072265625, 5.6136474609375, 5.92822265625, 6.2427978515625, 6.557373046875, 6.8719482421875, 7.1865234375, 7.5010986328125, 7.815673828125, 8.1302490234375, 8.44482421875, 8.7593994140625, 9.073974609375, 9.3885498046875, 9.703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 5.0, 8.0, 15.0, 18.0, 19.0, 23.0, 37.0, 31.0, 34.0, 45.0, 54.0, 54.0, 55.0, 57.0, 60.0, 63.0, 70.0, 49.0, 43.0, 43.0, 36.0, 35.0, 37.0, 23.0, 13.0, 17.0, 12.0, 9.0, 8.0, 10.0, 5.0, 2.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78125, -21.154296875, -20.52734375, -19.900390625, -19.2734375, -18.646484375, -18.01953125, -17.392578125, -16.765625, -16.138671875, -15.51171875, -14.884765625, -14.2578125, -13.630859375, -13.00390625, -12.376953125, -11.75, -11.123046875, -10.49609375, -9.869140625, -9.2421875, -8.615234375, -7.98828125, -7.361328125, -6.734375, -6.107421875, -5.48046875, -4.853515625, -4.2265625, -3.599609375, -2.97265625, -2.345703125, -1.71875, -1.091796875, -0.46484375, 0.162109375, 0.7890625, 1.416015625, 2.04296875, 2.669921875, 3.296875, 3.923828125, 4.55078125, 5.177734375, 5.8046875, 6.431640625, 7.05859375, 7.685546875, 8.3125, 8.939453125, 9.56640625, 10.193359375, 10.8203125, 11.447265625, 12.07421875, 12.701171875, 13.328125, 13.955078125, 14.58203125, 15.208984375, 15.8359375, 16.462890625, 17.08984375, 17.716796875, 18.34375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 8.0, 7.0, 8.0, 7.0, 10.0, 18.0, 23.0, 27.0, 67.0, 151.0, 280.0, 772.0, 3899.0, 57321.0, 909933.0, 70167.0, 4305.0, 878.0, 323.0, 137.0, 79.0, 47.0, 31.0, 13.0, 11.0, 14.0, 6.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5078125, -10.2120361328125, -9.916259765625, -9.6204833984375, -9.32470703125, -9.0289306640625, -8.733154296875, -8.4373779296875, -8.1416015625, -7.8458251953125, -7.550048828125, -7.2542724609375, -6.95849609375, -6.6627197265625, -6.366943359375, -6.0711669921875, -5.775390625, -5.4796142578125, -5.183837890625, -4.8880615234375, -4.59228515625, -4.2965087890625, -4.000732421875, -3.7049560546875, -3.4091796875, -3.1134033203125, -2.817626953125, -2.5218505859375, -2.22607421875, -1.9302978515625, -1.634521484375, -1.3387451171875, -1.04296875, -0.7471923828125, -0.451416015625, -0.1556396484375, 0.14013671875, 0.4359130859375, 0.731689453125, 1.0274658203125, 1.3232421875, 1.6190185546875, 1.914794921875, 2.2105712890625, 2.50634765625, 2.8021240234375, 3.097900390625, 3.3936767578125, 3.689453125, 3.9852294921875, 4.281005859375, 4.5767822265625, 4.87255859375, 5.1683349609375, 5.464111328125, 5.7598876953125, 6.0556640625, 6.3514404296875, 6.647216796875, 6.9429931640625, 7.23876953125, 7.5345458984375, 7.830322265625, 8.1260986328125, 8.421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 10.0, 5.0, 15.0, 15.0, 30.0, 29.0, 48.0, 53.0, 54.0, 70.0, 77.0, 66.0, 70.0, 84.0, 68.0, 62.0, 40.0, 37.0, 37.0, 37.0, 18.0, 18.0, 10.0, 11.0, 6.0, 5.0, 3.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0007157325744628906, -0.0006964579224586487, -0.0006771832704544067, -0.0006579086184501648, -0.0006386339664459229, -0.0006193593144416809, -0.000600084662437439, -0.000580810010433197, -0.0005615353584289551, -0.0005422607064247131, -0.0005229860544204712, -0.0005037114024162292, -0.0004844367504119873, -0.00046516209840774536, -0.0004458874464035034, -0.0004266127943992615, -0.00040733814239501953, -0.0003880634903907776, -0.00036878883838653564, -0.0003495141863822937, -0.00033023953437805176, -0.0003109648823738098, -0.00029169023036956787, -0.00027241557836532593, -0.000253140926361084, -0.00023386627435684204, -0.0002145916223526001, -0.00019531697034835815, -0.0001760423183441162, -0.00015676766633987427, -0.00013749301433563232, -0.00011821836233139038, -9.894371032714844e-05, -7.96690583229065e-05, -6.039440631866455e-05, -4.111975431442261e-05, -2.1845102310180664e-05, -2.5704503059387207e-06, 1.6704201698303223e-05, 3.5978853702545166e-05, 5.525350570678711e-05, 7.452815771102905e-05, 9.3802809715271e-05, 0.00011307746171951294, 0.00013235211372375488, 0.00015162676572799683, 0.00017090141773223877, 0.0001901760697364807, 0.00020945072174072266, 0.0002287253737449646, 0.00024800002574920654, 0.0002672746777534485, 0.00028654932975769043, 0.0003058239817619324, 0.0003250986337661743, 0.00034437328577041626, 0.0003636479377746582, 0.00038292258977890015, 0.0004021972417831421, 0.00042147189378738403, 0.000440746545791626, 0.0004600211977958679, 0.00047929584980010986, 0.0004985705018043518, 0.0005178451538085938]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 7.0, 5.0, 11.0, 9.0, 24.0, 15.0, 35.0, 65.0, 118.0, 175.0, 422.0, 811.0, 1954.0, 7284.0, 58708.0, 727021.0, 229378.0, 16736.0, 3494.0, 1203.0, 495.0, 233.0, 131.0, 85.0, 50.0, 19.0, 19.0, 13.0, 8.0, 11.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.453125, -6.236083984375, -6.01904296875, -5.802001953125, -5.5849609375, -5.367919921875, -5.15087890625, -4.933837890625, -4.716796875, -4.499755859375, -4.28271484375, -4.065673828125, -3.8486328125, -3.631591796875, -3.41455078125, -3.197509765625, -2.98046875, -2.763427734375, -2.54638671875, -2.329345703125, -2.1123046875, -1.895263671875, -1.67822265625, -1.461181640625, -1.244140625, -1.027099609375, -0.81005859375, -0.593017578125, -0.3759765625, -0.158935546875, 0.05810546875, 0.275146484375, 0.4921875, 0.709228515625, 0.92626953125, 1.143310546875, 1.3603515625, 1.577392578125, 1.79443359375, 2.011474609375, 2.228515625, 2.445556640625, 2.66259765625, 2.879638671875, 3.0966796875, 3.313720703125, 3.53076171875, 3.747802734375, 3.96484375, 4.181884765625, 4.39892578125, 4.615966796875, 4.8330078125, 5.050048828125, 5.26708984375, 5.484130859375, 5.701171875, 5.918212890625, 6.13525390625, 6.352294921875, 6.5693359375, 6.786376953125, 7.00341796875, 7.220458984375, 7.4375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 20.0, 21.0, 15.0, 38.0, 45.0, 64.0, 97.0, 99.0, 108.0, 116.0, 99.0, 82.0, 63.0, 39.0, 26.0, 15.0, 11.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.49609375, -7.290283203125, -7.08447265625, -6.878662109375, -6.6728515625, -6.467041015625, -6.26123046875, -6.055419921875, -5.849609375, -5.643798828125, -5.43798828125, -5.232177734375, -5.0263671875, -4.820556640625, -4.61474609375, -4.408935546875, -4.203125, -3.997314453125, -3.79150390625, -3.585693359375, -3.3798828125, -3.174072265625, -2.96826171875, -2.762451171875, -2.556640625, -2.350830078125, -2.14501953125, -1.939208984375, -1.7333984375, -1.527587890625, -1.32177734375, -1.115966796875, -0.91015625, -0.704345703125, -0.49853515625, -0.292724609375, -0.0869140625, 0.118896484375, 0.32470703125, 0.530517578125, 0.736328125, 0.942138671875, 1.14794921875, 1.353759765625, 1.5595703125, 1.765380859375, 1.97119140625, 2.177001953125, 2.3828125, 2.588623046875, 2.79443359375, 3.000244140625, 3.2060546875, 3.411865234375, 3.61767578125, 3.823486328125, 4.029296875, 4.235107421875, 4.44091796875, 4.646728515625, 4.8525390625, 5.058349609375, 5.26416015625, 5.469970703125, 5.67578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 11.0, 14.0, 30.0, 64.0, 132.0, 211.0, 239.0, 143.0, 74.0, 30.0, 16.0, 18.0, 9.0, 8.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.56095886230469, -84.87007904052734, -81.17919921875, -77.48831939697266, -73.79743957519531, -70.10655975341797, -66.41567993164062, -62.724796295166016, -59.03391647338867, -55.34303665161133, -51.652156829833984, -47.961273193359375, -44.27039337158203, -40.57951354980469, -36.888633728027344, -33.19775390625, -29.506874084472656, -25.815994262695312, -22.12511444091797, -18.434232711791992, -14.743352890014648, -11.052473068237305, -7.361591339111328, -3.6707115173339844, 0.020168304443359375, 3.7110486030578613, 7.401928901672363, 11.092809677124023, 14.783689498901367, 18.47456932067871, 22.165451049804688, 25.85633087158203, 29.547210693359375, 33.23809051513672, 36.92897033691406, 40.619850158691406, 44.31072998046875, 48.001609802246094, 51.6924934387207, 55.38337326049805, 59.07425308227539, 62.765132904052734, 66.45601654052734, 70.14689636230469, 73.83777618408203, 77.52865600585938, 81.21953582763672, 84.91041564941406, 88.6012954711914, 92.29217529296875, 95.9830551147461, 99.67393493652344, 103.36481475830078, 107.05569458007812, 110.74658203125, 114.43745422363281, 118.12834167480469, 121.81922149658203, 125.51010131835938, 129.20098876953125, 132.89186096191406, 136.58274841308594, 140.27362060546875, 143.96450805664062, 147.65538024902344]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 5.0, 13.0, 17.0, 18.0, 17.0, 26.0, 31.0, 28.0, 30.0, 27.0, 40.0, 48.0, 36.0, 45.0, 49.0, 51.0, 54.0, 62.0, 51.0, 42.0, 42.0, 37.0, 33.0, 28.0, 23.0, 15.0, 21.0, 21.0, 21.0, 11.0, 13.0, 4.0, 3.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-82.78804016113281, -80.41075134277344, -78.03346252441406, -75.65617370605469, -73.27888488769531, -70.90159606933594, -68.52430725097656, -66.14701843261719, -63.76972961425781, -61.39244079589844, -59.01515197753906, -56.63786315917969, -54.26057434082031, -51.88328552246094, -49.50599670410156, -47.12870788574219, -44.75141906738281, -42.37413024902344, -39.99684143066406, -37.61955261230469, -35.24226379394531, -32.86497497558594, -30.487686157226562, -28.110397338867188, -25.733108520507812, -23.355819702148438, -20.978530883789062, -18.601242065429688, -16.223953247070312, -13.846664428710938, -11.469375610351562, -9.092086791992188, -6.714805603027344, -4.337516784667969, -1.9602279663085938, 0.41706085205078125, 2.7943496704101562, 5.171638488769531, 7.548927307128906, 9.926216125488281, 12.303504943847656, 14.680793762207031, 17.058082580566406, 19.43537139892578, 21.812660217285156, 24.18994903564453, 26.567237854003906, 28.94452667236328, 31.321815490722656, 33.69910430908203, 36.076393127441406, 38.45368194580078, 40.830970764160156, 43.20825958251953, 45.585548400878906, 47.96283721923828, 50.340126037597656, 52.71741485595703, 55.094703674316406, 57.47199249267578, 59.849281311035156, 62.22657012939453, 64.6038589477539, 66.98114776611328, 69.35843658447266]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 13.0, 17.0, 26.0, 33.0, 59.0, 70.0, 131.0, 184.0, 331.0, 535.0, 1026.0, 1973.0, 4596.0, 14555.0, 93138.0, 3992438.0, 65254.0, 12010.0, 3896.0, 1771.0, 902.0, 505.0, 298.0, 197.0, 106.0, 69.0, 45.0, 33.0, 20.0, 19.0, 10.0, 2.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.56640625, -6.31793212890625, -6.0694580078125, -5.82098388671875, -5.572509765625, -5.32403564453125, -5.0755615234375, -4.82708740234375, -4.57861328125, -4.33013916015625, -4.0816650390625, -3.83319091796875, -3.584716796875, -3.33624267578125, -3.0877685546875, -2.83929443359375, -2.5908203125, -2.34234619140625, -2.0938720703125, -1.84539794921875, -1.596923828125, -1.34844970703125, -1.0999755859375, -0.85150146484375, -0.60302734375, -0.35455322265625, -0.1060791015625, 0.14239501953125, 0.390869140625, 0.63934326171875, 0.8878173828125, 1.13629150390625, 1.384765625, 1.63323974609375, 1.8817138671875, 2.13018798828125, 2.378662109375, 2.62713623046875, 2.8756103515625, 3.12408447265625, 3.37255859375, 3.62103271484375, 3.8695068359375, 4.11798095703125, 4.366455078125, 4.61492919921875, 4.8634033203125, 5.11187744140625, 5.3603515625, 5.60882568359375, 5.8572998046875, 6.10577392578125, 6.354248046875, 6.60272216796875, 6.8511962890625, 7.09967041015625, 7.34814453125, 7.59661865234375, 7.8450927734375, 8.09356689453125, 8.342041015625, 8.59051513671875, 8.8389892578125, 9.08746337890625, 9.3359375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 4.0, 6.0, 3.0, 9.0, 10.0, 9.0, 14.0, 21.0, 29.0, 24.0, 22.0, 42.0, 35.0, 41.0, 34.0, 44.0, 41.0, 51.0, 44.0, 45.0, 57.0, 49.0, 31.0, 57.0, 46.0, 31.0, 28.0, 35.0, 18.0, 19.0, 20.0, 15.0, 15.0, 8.0, 7.0, 9.0, 8.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.708984375, -3.60821533203125, -3.5074462890625, -3.40667724609375, -3.305908203125, -3.20513916015625, -3.1043701171875, -3.00360107421875, -2.90283203125, -2.80206298828125, -2.7012939453125, -2.60052490234375, -2.499755859375, -2.39898681640625, -2.2982177734375, -2.19744873046875, -2.0966796875, -1.99591064453125, -1.8951416015625, -1.79437255859375, -1.693603515625, -1.59283447265625, -1.4920654296875, -1.39129638671875, -1.29052734375, -1.18975830078125, -1.0889892578125, -0.98822021484375, -0.887451171875, -0.78668212890625, -0.6859130859375, -0.58514404296875, -0.484375, -0.38360595703125, -0.2828369140625, -0.18206787109375, -0.081298828125, 0.01947021484375, 0.1202392578125, 0.22100830078125, 0.32177734375, 0.42254638671875, 0.5233154296875, 0.62408447265625, 0.724853515625, 0.82562255859375, 0.9263916015625, 1.02716064453125, 1.1279296875, 1.22869873046875, 1.3294677734375, 1.43023681640625, 1.531005859375, 1.63177490234375, 1.7325439453125, 1.83331298828125, 1.93408203125, 2.03485107421875, 2.1356201171875, 2.23638916015625, 2.337158203125, 2.43792724609375, 2.5386962890625, 2.63946533203125, 2.740234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 6.0, 5.0, 13.0, 15.0, 27.0, 38.0, 44.0, 51.0, 70.0, 101.0, 154.0, 227.0, 349.0, 492.0, 805.0, 1376.0, 2769.0, 6123.0, 18437.0, 101080.0, 3875148.0, 149781.0, 22659.0, 7221.0, 3093.0, 1556.0, 901.0, 549.0, 367.0, 236.0, 178.0, 111.0, 87.0, 47.0, 56.0, 32.0, 24.0, 16.0, 10.0, 11.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-8.921875, -8.6844482421875, -8.447021484375, -8.2095947265625, -7.97216796875, -7.7347412109375, -7.497314453125, -7.2598876953125, -7.0224609375, -6.7850341796875, -6.547607421875, -6.3101806640625, -6.07275390625, -5.8353271484375, -5.597900390625, -5.3604736328125, -5.123046875, -4.8856201171875, -4.648193359375, -4.4107666015625, -4.17333984375, -3.9359130859375, -3.698486328125, -3.4610595703125, -3.2236328125, -2.9862060546875, -2.748779296875, -2.5113525390625, -2.27392578125, -2.0364990234375, -1.799072265625, -1.5616455078125, -1.32421875, -1.0867919921875, -0.849365234375, -0.6119384765625, -0.37451171875, -0.1370849609375, 0.100341796875, 0.3377685546875, 0.5751953125, 0.8126220703125, 1.050048828125, 1.2874755859375, 1.52490234375, 1.7623291015625, 1.999755859375, 2.2371826171875, 2.474609375, 2.7120361328125, 2.949462890625, 3.1868896484375, 3.42431640625, 3.6617431640625, 3.899169921875, 4.1365966796875, 4.3740234375, 4.6114501953125, 4.848876953125, 5.0863037109375, 5.32373046875, 5.5611572265625, 5.798583984375, 6.0360107421875, 6.2734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 6.0, 8.0, 24.0, 36.0, 75.0, 158.0, 856.0, 2534.0, 172.0, 83.0, 44.0, 16.0, 13.0, 11.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.462890625, -2.396453857421875, -2.33001708984375, -2.263580322265625, -2.1971435546875, -2.130706787109375, -2.06427001953125, -1.997833251953125, -1.931396484375, -1.864959716796875, -1.79852294921875, -1.732086181640625, -1.6656494140625, -1.599212646484375, -1.53277587890625, -1.466339111328125, -1.39990234375, -1.333465576171875, -1.26702880859375, -1.200592041015625, -1.1341552734375, -1.067718505859375, -1.00128173828125, -0.934844970703125, -0.868408203125, -0.801971435546875, -0.73553466796875, -0.669097900390625, -0.6026611328125, -0.536224365234375, -0.46978759765625, -0.403350830078125, -0.3369140625, -0.270477294921875, -0.20404052734375, -0.137603759765625, -0.0711669921875, -0.004730224609375, 0.06170654296875, 0.128143310546875, 0.194580078125, 0.261016845703125, 0.32745361328125, 0.393890380859375, 0.4603271484375, 0.526763916015625, 0.59320068359375, 0.659637451171875, 0.72607421875, 0.792510986328125, 0.85894775390625, 0.925384521484375, 0.9918212890625, 1.058258056640625, 1.12469482421875, 1.191131591796875, 1.257568359375, 1.324005126953125, 1.39044189453125, 1.456878662109375, 1.5233154296875, 1.589752197265625, 1.65618896484375, 1.722625732421875, 1.7890625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 8.0, 7.0, 16.0, 21.0, 30.0, 47.0, 61.0, 92.0, 110.0, 110.0, 85.0, 111.0, 87.0, 65.0, 42.0, 41.0, 23.0, 13.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9436798095703125, -6.709510803222656, -6.475341320037842, -6.2411723136901855, -6.007002830505371, -5.772833824157715, -5.538664817810059, -5.304495334625244, -5.070326328277588, -4.836157321929932, -4.601987838745117, -4.367818832397461, -4.1336493492126465, -3.8994803428649902, -3.665311098098755, -3.4311418533325195, -3.196972608566284, -2.962803363800049, -2.7286341190338135, -2.494464874267578, -2.260295867919922, -2.0261266231536865, -1.7919573783874512, -1.5577882528305054, -1.32361900806427, -1.0894497632980347, -0.8552806377410889, -0.6211113929748535, -0.38694220781326294, -0.15277302265167236, 0.08139622211456299, 0.3155653476715088, 0.5497345924377441, 0.7839037775993347, 1.0180729627609253, 1.2522422075271606, 1.4864113330841064, 1.7205805778503418, 1.9547498226165771, 2.1889190673828125, 2.4230880737304688, 2.657257318496704, 2.8914265632629395, 3.1255955696105957, 3.359764814376831, 3.5939340591430664, 3.8281033039093018, 4.062272548675537, 4.296442031860352, 4.530611038208008, 4.764780521392822, 4.9989495277404785, 5.233119010925293, 5.467288017272949, 5.7014570236206055, 5.93562650680542, 6.169795513153076, 6.403964519500732, 6.638134002685547, 6.872303009033203, 7.106472492218018, 7.340641498565674, 7.574810981750488, 7.8089799880981445, 8.0431489944458]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 3.0, 11.0, 7.0, 10.0, 14.0, 18.0, 21.0, 27.0, 23.0, 16.0, 36.0, 31.0, 38.0, 38.0, 43.0, 48.0, 41.0, 56.0, 38.0, 48.0, 47.0, 35.0, 47.0, 26.0, 39.0, 40.0, 24.0, 25.0, 22.0, 15.0, 21.0, 11.0, 16.0, 9.0, 7.0, 11.0, 5.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8736374378204346, -3.743974208831787, -3.6143109798431396, -3.484647750854492, -3.3549842834472656, -3.2253212928771973, -3.0956578254699707, -2.9659945964813232, -2.836331367492676, -2.7066681385040283, -2.577004909515381, -2.4473416805267334, -2.317678451538086, -2.1880149841308594, -2.058351755142212, -1.9286885261535645, -1.799025297164917, -1.6693620681762695, -1.539698839187622, -1.410035490989685, -1.2803722620010376, -1.1507090330123901, -1.0210456848144531, -0.8913824558258057, -0.7617192268371582, -0.6320559978485107, -0.5023927092552185, -0.37272945046424866, -0.2430661916732788, -0.11340296268463135, 0.01626032590866089, 0.14592361450195312, 0.2755866050720215, 0.40524986386299133, 0.5349131226539612, 0.6645764112472534, 0.7942396402359009, 0.9239028692245483, 1.0535662174224854, 1.1832294464111328, 1.3128926753997803, 1.4425559043884277, 1.5722191333770752, 1.7018824815750122, 1.8315457105636597, 1.9612089395523071, 2.090872287750244, 2.2205355167388916, 2.350198745727539, 2.4798619747161865, 2.609525203704834, 2.7391884326934814, 2.868851661682129, 2.9985151290893555, 3.128178358078003, 3.2578415870666504, 3.387504816055298, 3.5171680450439453, 3.6468312740325928, 3.7764945030212402, 3.906157970428467, 4.035820960998535, 4.165484428405762, 4.295147895812988, 4.424810886383057]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 7.0, 7.0, 8.0, 15.0, 22.0, 26.0, 31.0, 48.0, 73.0, 116.0, 162.0, 251.0, 365.0, 596.0, 968.0, 1650.0, 2956.0, 5666.0, 10903.0, 22284.0, 47528.0, 104965.0, 219127.0, 289837.0, 181455.0, 83511.0, 38117.0, 17942.0, 8953.0, 4628.0, 2511.0, 1467.0, 820.0, 498.0, 340.0, 234.0, 137.0, 100.0, 63.0, 55.0, 38.0, 19.0, 18.0, 8.0, 12.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-4.15625, -4.031646728515625, -3.90704345703125, -3.782440185546875, -3.6578369140625, -3.533233642578125, -3.40863037109375, -3.284027099609375, -3.159423828125, -3.034820556640625, -2.91021728515625, -2.785614013671875, -2.6610107421875, -2.536407470703125, -2.41180419921875, -2.287200927734375, -2.16259765625, -2.037994384765625, -1.91339111328125, -1.788787841796875, -1.6641845703125, -1.539581298828125, -1.41497802734375, -1.290374755859375, -1.165771484375, -1.041168212890625, -0.91656494140625, -0.791961669921875, -0.6673583984375, -0.542755126953125, -0.41815185546875, -0.293548583984375, -0.1689453125, -0.044342041015625, 0.08026123046875, 0.204864501953125, 0.3294677734375, 0.454071044921875, 0.57867431640625, 0.703277587890625, 0.827880859375, 0.952484130859375, 1.07708740234375, 1.201690673828125, 1.3262939453125, 1.450897216796875, 1.57550048828125, 1.700103759765625, 1.82470703125, 1.949310302734375, 2.07391357421875, 2.198516845703125, 2.3231201171875, 2.447723388671875, 2.57232666015625, 2.696929931640625, 2.821533203125, 2.946136474609375, 3.07073974609375, 3.195343017578125, 3.3199462890625, 3.444549560546875, 3.56915283203125, 3.693756103515625, 3.818359375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 6.0, 8.0, 7.0, 10.0, 12.0, 12.0, 17.0, 25.0, 16.0, 25.0, 37.0, 30.0, 34.0, 33.0, 38.0, 32.0, 41.0, 39.0, 42.0, 39.0, 51.0, 39.0, 36.0, 49.0, 40.0, 34.0, 36.0, 28.0, 23.0, 19.0, 23.0, 19.0, 15.0, 13.0, 16.0, 7.0, 10.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 3.0, 1.0], "bins": [-3.173828125, -3.0811767578125, -2.988525390625, -2.8958740234375, -2.80322265625, -2.7105712890625, -2.617919921875, -2.5252685546875, -2.4326171875, -2.3399658203125, -2.247314453125, -2.1546630859375, -2.06201171875, -1.9693603515625, -1.876708984375, -1.7840576171875, -1.69140625, -1.5987548828125, -1.506103515625, -1.4134521484375, -1.32080078125, -1.2281494140625, -1.135498046875, -1.0428466796875, -0.9501953125, -0.8575439453125, -0.764892578125, -0.6722412109375, -0.57958984375, -0.4869384765625, -0.394287109375, -0.3016357421875, -0.208984375, -0.1163330078125, -0.023681640625, 0.0689697265625, 0.16162109375, 0.2542724609375, 0.346923828125, 0.4395751953125, 0.5322265625, 0.6248779296875, 0.717529296875, 0.8101806640625, 0.90283203125, 0.9954833984375, 1.088134765625, 1.1807861328125, 1.2734375, 1.3660888671875, 1.458740234375, 1.5513916015625, 1.64404296875, 1.7366943359375, 1.829345703125, 1.9219970703125, 2.0146484375, 2.1072998046875, 2.199951171875, 2.2926025390625, 2.38525390625, 2.4779052734375, 2.570556640625, 2.6632080078125, 2.755859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 8.0, 16.0, 13.0, 35.0, 53.0, 78.0, 83.0, 139.0, 249.0, 344.0, 764.0, 1578.0, 4092.0, 14826.0, 84589.0, 609362.0, 282312.0, 36770.0, 7973.0, 2689.0, 1125.0, 555.0, 337.0, 187.0, 115.0, 72.0, 45.0, 51.0, 19.0, 24.0, 15.0, 9.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.9140625, -10.6173095703125, -10.320556640625, -10.0238037109375, -9.72705078125, -9.4302978515625, -9.133544921875, -8.8367919921875, -8.5400390625, -8.2432861328125, -7.946533203125, -7.6497802734375, -7.35302734375, -7.0562744140625, -6.759521484375, -6.4627685546875, -6.166015625, -5.8692626953125, -5.572509765625, -5.2757568359375, -4.97900390625, -4.6822509765625, -4.385498046875, -4.0887451171875, -3.7919921875, -3.4952392578125, -3.198486328125, -2.9017333984375, -2.60498046875, -2.3082275390625, -2.011474609375, -1.7147216796875, -1.41796875, -1.1212158203125, -0.824462890625, -0.5277099609375, -0.23095703125, 0.0657958984375, 0.362548828125, 0.6593017578125, 0.9560546875, 1.2528076171875, 1.549560546875, 1.8463134765625, 2.14306640625, 2.4398193359375, 2.736572265625, 3.0333251953125, 3.330078125, 3.6268310546875, 3.923583984375, 4.2203369140625, 4.51708984375, 4.8138427734375, 5.110595703125, 5.4073486328125, 5.7041015625, 6.0008544921875, 6.297607421875, 6.5943603515625, 6.89111328125, 7.1878662109375, 7.484619140625, 7.7813720703125, 8.078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 8.0, 9.0, 6.0, 6.0, 13.0, 13.0, 12.0, 14.0, 18.0, 20.0, 29.0, 35.0, 35.0, 38.0, 45.0, 42.0, 33.0, 46.0, 56.0, 46.0, 47.0, 46.0, 45.0, 46.0, 46.0, 34.0, 22.0, 30.0, 20.0, 26.0, 9.0, 13.0, 16.0, 18.0, 15.0, 14.0, 9.0, 2.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.234375, -14.7626953125, -14.291015625, -13.8193359375, -13.34765625, -12.8759765625, -12.404296875, -11.9326171875, -11.4609375, -10.9892578125, -10.517578125, -10.0458984375, -9.57421875, -9.1025390625, -8.630859375, -8.1591796875, -7.6875, -7.2158203125, -6.744140625, -6.2724609375, -5.80078125, -5.3291015625, -4.857421875, -4.3857421875, -3.9140625, -3.4423828125, -2.970703125, -2.4990234375, -2.02734375, -1.5556640625, -1.083984375, -0.6123046875, -0.140625, 0.3310546875, 0.802734375, 1.2744140625, 1.74609375, 2.2177734375, 2.689453125, 3.1611328125, 3.6328125, 4.1044921875, 4.576171875, 5.0478515625, 5.51953125, 5.9912109375, 6.462890625, 6.9345703125, 7.40625, 7.8779296875, 8.349609375, 8.8212890625, 9.29296875, 9.7646484375, 10.236328125, 10.7080078125, 11.1796875, 11.6513671875, 12.123046875, 12.5947265625, 13.06640625, 13.5380859375, 14.009765625, 14.4814453125, 14.953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 12.0, 14.0, 15.0, 21.0, 28.0, 58.0, 94.0, 160.0, 333.0, 752.0, 1860.0, 7104.0, 64304.0, 851936.0, 108545.0, 9433.0, 2211.0, 846.0, 351.0, 181.0, 113.0, 61.0, 40.0, 31.0, 16.0, 7.0, 10.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.27734375, -6.07208251953125, -5.8668212890625, -5.66156005859375, -5.456298828125, -5.25103759765625, -5.0457763671875, -4.84051513671875, -4.63525390625, -4.42999267578125, -4.2247314453125, -4.01947021484375, -3.814208984375, -3.60894775390625, -3.4036865234375, -3.19842529296875, -2.9931640625, -2.78790283203125, -2.5826416015625, -2.37738037109375, -2.172119140625, -1.96685791015625, -1.7615966796875, -1.55633544921875, -1.35107421875, -1.14581298828125, -0.9405517578125, -0.73529052734375, -0.530029296875, -0.32476806640625, -0.1195068359375, 0.08575439453125, 0.291015625, 0.49627685546875, 0.7015380859375, 0.90679931640625, 1.112060546875, 1.31732177734375, 1.5225830078125, 1.72784423828125, 1.93310546875, 2.13836669921875, 2.3436279296875, 2.54888916015625, 2.754150390625, 2.95941162109375, 3.1646728515625, 3.36993408203125, 3.5751953125, 3.78045654296875, 3.9857177734375, 4.19097900390625, 4.396240234375, 4.60150146484375, 4.8067626953125, 5.01202392578125, 5.21728515625, 5.42254638671875, 5.6278076171875, 5.83306884765625, 6.038330078125, 6.24359130859375, 6.4488525390625, 6.65411376953125, 6.859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 11.0, 5.0, 13.0, 30.0, 49.0, 76.0, 81.0, 136.0, 165.0, 141.0, 88.0, 81.0, 45.0, 32.0, 14.0, 17.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00072479248046875, -0.0006909668445587158, -0.0006571412086486816, -0.0006233155727386475, -0.0005894899368286133, -0.0005556643009185791, -0.0005218386650085449, -0.00048801302909851074, -0.00045418739318847656, -0.0004203617572784424, -0.0003865361213684082, -0.000352710485458374, -0.00031888484954833984, -0.00028505921363830566, -0.0002512335777282715, -0.0002174079418182373, -0.00018358230590820312, -0.00014975666999816895, -0.00011593103408813477, -8.210539817810059e-05, -4.8279762268066406e-05, -1.4454126358032227e-05, 1.9371509552001953e-05, 5.319714546203613e-05, 8.702278137207031e-05, 0.00012084841728210449, 0.00015467405319213867, 0.00018849968910217285, 0.00022232532501220703, 0.0002561509609222412, 0.0002899765968322754, 0.00032380223274230957, 0.00035762786865234375, 0.00039145350456237793, 0.0004252791404724121, 0.0004591047763824463, 0.0004929304122924805, 0.0005267560482025146, 0.0005605816841125488, 0.000594407320022583, 0.0006282329559326172, 0.0006620585918426514, 0.0006958842277526855, 0.0007297098636627197, 0.0007635354995727539, 0.0007973611354827881, 0.0008311867713928223, 0.0008650124073028564, 0.0008988380432128906, 0.0009326636791229248, 0.000966489315032959, 0.0010003149509429932, 0.0010341405868530273, 0.0010679662227630615, 0.0011017918586730957, 0.0011356174945831299, 0.001169443130493164, 0.0012032687664031982, 0.0012370944023132324, 0.0012709200382232666, 0.0013047456741333008, 0.001338571310043335, 0.0013723969459533691, 0.0014062225818634033, 0.0014400482177734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 12.0, 18.0, 18.0, 34.0, 48.0, 73.0, 109.0, 225.0, 449.0, 881.0, 2137.0, 6736.0, 34496.0, 371707.0, 568461.0, 49797.0, 8659.0, 2601.0, 1018.0, 471.0, 246.0, 137.0, 84.0, 43.0, 33.0, 20.0, 7.0, 7.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.08709716796875, -3.9241943359375, -3.76129150390625, -3.598388671875, -3.43548583984375, -3.2725830078125, -3.10968017578125, -2.94677734375, -2.78387451171875, -2.6209716796875, -2.45806884765625, -2.295166015625, -2.13226318359375, -1.9693603515625, -1.80645751953125, -1.6435546875, -1.48065185546875, -1.3177490234375, -1.15484619140625, -0.991943359375, -0.82904052734375, -0.6661376953125, -0.50323486328125, -0.34033203125, -0.17742919921875, -0.0145263671875, 0.14837646484375, 0.311279296875, 0.47418212890625, 0.6370849609375, 0.79998779296875, 0.962890625, 1.12579345703125, 1.2886962890625, 1.45159912109375, 1.614501953125, 1.77740478515625, 1.9403076171875, 2.10321044921875, 2.26611328125, 2.42901611328125, 2.5919189453125, 2.75482177734375, 2.917724609375, 3.08062744140625, 3.2435302734375, 3.40643310546875, 3.5693359375, 3.73223876953125, 3.8951416015625, 4.05804443359375, 4.220947265625, 4.38385009765625, 4.5467529296875, 4.70965576171875, 4.87255859375, 5.03546142578125, 5.1983642578125, 5.36126708984375, 5.524169921875, 5.68707275390625, 5.8499755859375, 6.01287841796875, 6.17578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 12.0, 13.0, 12.0, 18.0, 30.0, 40.0, 47.0, 62.0, 93.0, 110.0, 106.0, 96.0, 95.0, 68.0, 50.0, 32.0, 28.0, 19.0, 15.0, 9.0, 10.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.75, -5.5833740234375, -5.416748046875, -5.2501220703125, -5.08349609375, -4.9168701171875, -4.750244140625, -4.5836181640625, -4.4169921875, -4.2503662109375, -4.083740234375, -3.9171142578125, -3.75048828125, -3.5838623046875, -3.417236328125, -3.2506103515625, -3.083984375, -2.9173583984375, -2.750732421875, -2.5841064453125, -2.41748046875, -2.2508544921875, -2.084228515625, -1.9176025390625, -1.7509765625, -1.5843505859375, -1.417724609375, -1.2510986328125, -1.08447265625, -0.9178466796875, -0.751220703125, -0.5845947265625, -0.41796875, -0.2513427734375, -0.084716796875, 0.0819091796875, 0.24853515625, 0.4151611328125, 0.581787109375, 0.7484130859375, 0.9150390625, 1.0816650390625, 1.248291015625, 1.4149169921875, 1.58154296875, 1.7481689453125, 1.914794921875, 2.0814208984375, 2.248046875, 2.4146728515625, 2.581298828125, 2.7479248046875, 2.91455078125, 3.0811767578125, 3.247802734375, 3.4144287109375, 3.5810546875, 3.7476806640625, 3.914306640625, 4.0809326171875, 4.24755859375, 4.4141845703125, 4.580810546875, 4.7474365234375, 4.9140625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 11.0, 20.0, 19.0, 58.0, 108.0, 122.0, 168.0, 199.0, 112.0, 70.0, 47.0, 22.0, 13.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-99.09539794921875, -96.62400817871094, -94.15262603759766, -91.68123626708984, -89.20984649658203, -86.73846435546875, -84.26707458496094, -81.79568481445312, -79.32430267333984, -76.85291290283203, -74.38153076171875, -71.91014099121094, -69.43875122070312, -66.96736907958984, -64.49597930908203, -62.024593353271484, -59.55320358276367, -57.081817626953125, -54.61042785644531, -52.139041900634766, -49.66765594482422, -47.196266174316406, -44.72488021850586, -42.25349426269531, -39.7821044921875, -37.31071853637695, -34.83932876586914, -32.367942810058594, -29.896556854248047, -27.425168991088867, -24.953781127929688, -22.48239517211914, -20.011009216308594, -17.539621353149414, -15.068235397338867, -12.596847534179688, -10.125460624694824, -7.654073715209961, -5.182685852050781, -2.7112998962402344, -0.2399120330810547, 2.2314751148223877, 4.70286226272583, 7.174249649047852, 9.645636558532715, 12.117023468017578, 14.588411331176758, 17.059797286987305, 19.531185150146484, 22.002573013305664, 24.47395896911621, 26.94534683227539, 29.416732788085938, 31.888120651245117, 34.3595085144043, 36.830894470214844, 39.302284240722656, 41.7736701965332, 44.245059967041016, 46.71644592285156, 49.18783187866211, 51.659217834472656, 54.13060760498047, 56.601993560791016, 59.07337951660156]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 8.0, 8.0, 12.0, 10.0, 12.0, 18.0, 15.0, 20.0, 23.0, 31.0, 40.0, 43.0, 32.0, 34.0, 43.0, 48.0, 46.0, 63.0, 41.0, 54.0, 40.0, 40.0, 33.0, 39.0, 33.0, 27.0, 22.0, 35.0, 21.0, 18.0, 17.0, 14.0, 6.0, 10.0, 7.0, 9.0, 6.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.31007385253906, -63.313865661621094, -61.31765365600586, -59.32144546508789, -57.32523727416992, -55.32902526855469, -53.33281707763672, -51.33660888671875, -49.34040069580078, -47.34419250488281, -45.34798049926758, -43.35177230834961, -41.35556411743164, -39.359352111816406, -37.36314392089844, -35.36693572998047, -33.370723724365234, -31.374513626098633, -29.378305435180664, -27.382095336914062, -25.385887145996094, -23.389677047729492, -21.39346694946289, -19.397258758544922, -17.40104866027832, -15.404839515686035, -13.40863037109375, -11.412420272827148, -9.416211128234863, -7.420001983642578, -5.423791885375977, -3.4275827407836914, -1.4313735961914062, 0.564835786819458, 2.5610451698303223, 4.557254791259766, 6.553463935852051, 8.549673080444336, 10.545883178710938, 12.542092323303223, 14.538301467895508, 16.53451156616211, 18.530719757080078, 20.52692985534668, 22.52313995361328, 24.51934814453125, 26.51555824279785, 28.511768341064453, 30.507976531982422, 32.50418472290039, 34.500396728515625, 36.496604919433594, 38.49281311035156, 40.48902130126953, 42.485233306884766, 44.481441497802734, 46.47765350341797, 48.47386169433594, 50.47007369995117, 52.46628189086914, 54.46249008178711, 56.458702087402344, 58.45491027832031, 60.45111846923828, 62.44732666015625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 24.0, 29.0, 39.0, 65.0, 95.0, 211.0, 349.0, 701.0, 1645.0, 4105.0, 13059.0, 68639.0, 3906199.0, 168472.0, 20804.0, 5930.0, 2116.0, 893.0, 395.0, 224.0, 122.0, 57.0, 47.0, 24.0, 9.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.666015625, -9.37890625, -9.091796875, -8.8046875, -8.517578125, -8.23046875, -7.943359375, -7.65625, -7.369140625, -7.08203125, -6.794921875, -6.5078125, -6.220703125, -5.93359375, -5.646484375, -5.359375, -5.072265625, -4.78515625, -4.498046875, -4.2109375, -3.923828125, -3.63671875, -3.349609375, -3.0625, -2.775390625, -2.48828125, -2.201171875, -1.9140625, -1.626953125, -1.33984375, -1.052734375, -0.765625, -0.478515625, -0.19140625, 0.095703125, 0.3828125, 0.669921875, 0.95703125, 1.244140625, 1.53125, 1.818359375, 2.10546875, 2.392578125, 2.6796875, 2.966796875, 3.25390625, 3.541015625, 3.828125, 4.115234375, 4.40234375, 4.689453125, 4.9765625, 5.263671875, 5.55078125, 5.837890625, 6.125, 6.412109375, 6.69921875, 6.986328125, 7.2734375, 7.560546875, 7.84765625, 8.134765625, 8.421875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 7.0, 13.0, 6.0, 18.0, 25.0, 28.0, 47.0, 67.0, 81.0, 78.0, 75.0, 103.0, 89.0, 83.0, 62.0, 55.0, 45.0, 44.0, 19.0, 20.0, 12.0, 12.0, 10.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.046875, -7.861358642578125, -7.67584228515625, -7.490325927734375, -7.3048095703125, -7.119293212890625, -6.93377685546875, -6.748260498046875, -6.562744140625, -6.377227783203125, -6.19171142578125, -6.006195068359375, -5.8206787109375, -5.635162353515625, -5.44964599609375, -5.264129638671875, -5.07861328125, -4.893096923828125, -4.70758056640625, -4.522064208984375, -4.3365478515625, -4.151031494140625, -3.96551513671875, -3.779998779296875, -3.594482421875, -3.408966064453125, -3.22344970703125, -3.037933349609375, -2.8524169921875, -2.666900634765625, -2.48138427734375, -2.295867919921875, -2.1103515625, -1.924835205078125, -1.73931884765625, -1.553802490234375, -1.3682861328125, -1.182769775390625, -0.99725341796875, -0.811737060546875, -0.626220703125, -0.440704345703125, -0.25518798828125, -0.069671630859375, 0.1158447265625, 0.301361083984375, 0.48687744140625, 0.672393798828125, 0.85791015625, 1.043426513671875, 1.22894287109375, 1.414459228515625, 1.5999755859375, 1.785491943359375, 1.97100830078125, 2.156524658203125, 2.342041015625, 2.527557373046875, 2.71307373046875, 2.898590087890625, 3.0841064453125, 3.269622802734375, 3.45513916015625, 3.640655517578125, 3.826171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 12.0, 7.0, 14.0, 20.0, 20.0, 46.0, 59.0, 52.0, 98.0, 134.0, 231.0, 308.0, 506.0, 995.0, 2025.0, 6090.0, 25508.0, 343521.0, 3740699.0, 57346.0, 10194.0, 3166.0, 1361.0, 658.0, 401.0, 247.0, 168.0, 97.0, 63.0, 56.0, 45.0, 34.0, 30.0, 16.0, 15.0, 16.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.734375, -10.390380859375, -10.04638671875, -9.702392578125, -9.3583984375, -9.014404296875, -8.67041015625, -8.326416015625, -7.982421875, -7.638427734375, -7.29443359375, -6.950439453125, -6.6064453125, -6.262451171875, -5.91845703125, -5.574462890625, -5.23046875, -4.886474609375, -4.54248046875, -4.198486328125, -3.8544921875, -3.510498046875, -3.16650390625, -2.822509765625, -2.478515625, -2.134521484375, -1.79052734375, -1.446533203125, -1.1025390625, -0.758544921875, -0.41455078125, -0.070556640625, 0.2734375, 0.617431640625, 0.96142578125, 1.305419921875, 1.6494140625, 1.993408203125, 2.33740234375, 2.681396484375, 3.025390625, 3.369384765625, 3.71337890625, 4.057373046875, 4.4013671875, 4.745361328125, 5.08935546875, 5.433349609375, 5.77734375, 6.121337890625, 6.46533203125, 6.809326171875, 7.1533203125, 7.497314453125, 7.84130859375, 8.185302734375, 8.529296875, 8.873291015625, 9.21728515625, 9.561279296875, 9.9052734375, 10.249267578125, 10.59326171875, 10.937255859375, 11.28125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 18.0, 15.0, 24.0, 63.0, 217.0, 2948.0, 576.0, 129.0, 45.0, 18.0, 6.0, 7.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.397705078125, -6.13916015625, -5.880615234375, -5.6220703125, -5.363525390625, -5.10498046875, -4.846435546875, -4.587890625, -4.329345703125, -4.07080078125, -3.812255859375, -3.5537109375, -3.295166015625, -3.03662109375, -2.778076171875, -2.51953125, -2.260986328125, -2.00244140625, -1.743896484375, -1.4853515625, -1.226806640625, -0.96826171875, -0.709716796875, -0.451171875, -0.192626953125, 0.06591796875, 0.324462890625, 0.5830078125, 0.841552734375, 1.10009765625, 1.358642578125, 1.6171875, 1.875732421875, 2.13427734375, 2.392822265625, 2.6513671875, 2.909912109375, 3.16845703125, 3.427001953125, 3.685546875, 3.944091796875, 4.20263671875, 4.461181640625, 4.7197265625, 4.978271484375, 5.23681640625, 5.495361328125, 5.75390625, 6.012451171875, 6.27099609375, 6.529541015625, 6.7880859375, 7.046630859375, 7.30517578125, 7.563720703125, 7.822265625, 8.080810546875, 8.33935546875, 8.597900390625, 8.8564453125, 9.114990234375, 9.37353515625, 9.632080078125, 9.890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 10.0, 18.0, 24.0, 40.0, 65.0, 105.0, 106.0, 124.0, 145.0, 136.0, 77.0, 52.0, 32.0, 22.0, 7.0, 6.0, 8.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.251514434814453, -15.594195365905762, -14.93687629699707, -14.279558181762695, -13.622239112854004, -12.964920043945312, -12.307600975036621, -11.65028190612793, -10.992963790893555, -10.335644721984863, -9.678325653076172, -9.021007537841797, -8.363688468933105, -7.706369400024414, -7.049050331115723, -6.3917317390441895, -5.73441219329834, -5.077093124389648, -4.419774532318115, -3.762455463409424, -3.1051366329193115, -2.447817802429199, -1.7904987335205078, -1.1331801414489746, -0.4758610725402832, 0.18145781755447388, 0.838776707649231, 1.4960956573486328, 2.153414487838745, 2.8107333183288574, 3.468052387237549, 4.125370979309082, 4.782690048217773, 5.440009117126465, 6.097327709197998, 6.7546467781066895, 7.411965370178223, 8.069284439086914, 8.726603507995605, 9.383922576904297, 10.041240692138672, 10.698559761047363, 11.355878829956055, 12.01319694519043, 12.670516014099121, 13.327835083007812, 13.985154151916504, 14.642473220825195, 15.299792289733887, 15.957111358642578, 16.614429473876953, 17.27174949645996, 17.929067611694336, 18.586387634277344, 19.24370574951172, 19.901023864746094, 20.5583438873291, 21.215662002563477, 21.872982025146484, 22.53030014038086, 23.187620162963867, 23.844938278198242, 24.50225830078125, 25.159576416015625, 25.81689453125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 8.0, 9.0, 24.0, 17.0, 18.0, 32.0, 28.0, 36.0, 51.0, 52.0, 39.0, 58.0, 63.0, 73.0, 67.0, 60.0, 63.0, 50.0, 57.0, 37.0, 27.0, 30.0, 25.0, 23.0, 12.0, 13.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.553426742553711, -13.98253345489502, -13.411641120910645, -12.840747833251953, -12.269855499267578, -11.698962211608887, -11.128068923950195, -10.55717658996582, -9.986283302307129, -9.415390014648438, -8.844497680664062, -8.273604393005371, -7.702711582183838, -7.131818771362305, -6.560925483703613, -5.99003267288208, -5.419139862060547, -4.848247051239014, -4.2773542404174805, -3.706460952758789, -3.135568141937256, -2.5646753311157227, -1.9937822818756104, -1.422889232635498, -0.8519964218139648, -0.2811034917831421, 0.28978943824768066, 0.8606823682785034, 1.4315752983093262, 2.0024681091308594, 2.5733611583709717, 3.144254207611084, 3.71514892578125, 4.286041736602783, 4.856934547424316, 5.427827835083008, 5.998720645904541, 6.569613456726074, 7.140506744384766, 7.711399555206299, 8.282292366027832, 8.853185653686523, 9.424077987670898, 9.99497127532959, 10.565864562988281, 11.136756896972656, 11.707650184631348, 12.278543472290039, 12.849435806274414, 13.420329093933105, 13.99122142791748, 14.562114715576172, 15.133007049560547, 15.703900337219238, 16.27479362487793, 16.845685958862305, 17.416580200195312, 17.987472534179688, 18.558366775512695, 19.12925910949707, 19.700151443481445, 20.271045684814453, 20.841938018798828, 21.412830352783203, 21.983722686767578]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 10.0, 15.0, 20.0, 36.0, 43.0, 91.0, 136.0, 264.0, 536.0, 1154.0, 3247.0, 10789.0, 49441.0, 271069.0, 536361.0, 138474.0, 26368.0, 6600.0, 2066.0, 850.0, 425.0, 245.0, 107.0, 77.0, 46.0, 32.0, 14.0, 15.0, 4.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0859375, -6.826416015625, -6.56689453125, -6.307373046875, -6.0478515625, -5.788330078125, -5.52880859375, -5.269287109375, -5.009765625, -4.750244140625, -4.49072265625, -4.231201171875, -3.9716796875, -3.712158203125, -3.45263671875, -3.193115234375, -2.93359375, -2.674072265625, -2.41455078125, -2.155029296875, -1.8955078125, -1.635986328125, -1.37646484375, -1.116943359375, -0.857421875, -0.597900390625, -0.33837890625, -0.078857421875, 0.1806640625, 0.440185546875, 0.69970703125, 0.959228515625, 1.21875, 1.478271484375, 1.73779296875, 1.997314453125, 2.2568359375, 2.516357421875, 2.77587890625, 3.035400390625, 3.294921875, 3.554443359375, 3.81396484375, 4.073486328125, 4.3330078125, 4.592529296875, 4.85205078125, 5.111572265625, 5.37109375, 5.630615234375, 5.89013671875, 6.149658203125, 6.4091796875, 6.668701171875, 6.92822265625, 7.187744140625, 7.447265625, 7.706787109375, 7.96630859375, 8.225830078125, 8.4853515625, 8.744873046875, 9.00439453125, 9.263916015625, 9.5234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 17.0, 27.0, 27.0, 36.0, 40.0, 66.0, 68.0, 63.0, 87.0, 86.0, 94.0, 77.0, 67.0, 59.0, 45.0, 44.0, 21.0, 24.0, 9.0, 17.0, 8.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.87451171875, -6.6865234375, -6.49853515625, -6.310546875, -6.12255859375, -5.9345703125, -5.74658203125, -5.55859375, -5.37060546875, -5.1826171875, -4.99462890625, -4.806640625, -4.61865234375, -4.4306640625, -4.24267578125, -4.0546875, -3.86669921875, -3.6787109375, -3.49072265625, -3.302734375, -3.11474609375, -2.9267578125, -2.73876953125, -2.55078125, -2.36279296875, -2.1748046875, -1.98681640625, -1.798828125, -1.61083984375, -1.4228515625, -1.23486328125, -1.046875, -0.85888671875, -0.6708984375, -0.48291015625, -0.294921875, -0.10693359375, 0.0810546875, 0.26904296875, 0.45703125, 0.64501953125, 0.8330078125, 1.02099609375, 1.208984375, 1.39697265625, 1.5849609375, 1.77294921875, 1.9609375, 2.14892578125, 2.3369140625, 2.52490234375, 2.712890625, 2.90087890625, 3.0888671875, 3.27685546875, 3.46484375, 3.65283203125, 3.8408203125, 4.02880859375, 4.216796875, 4.40478515625, 4.5927734375, 4.78076171875, 4.96875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 13.0, 12.0, 23.0, 19.0, 58.0, 76.0, 127.0, 202.0, 402.0, 804.0, 2079.0, 7730.0, 70663.0, 798547.0, 150931.0, 11998.0, 2749.0, 949.0, 491.0, 275.0, 154.0, 75.0, 47.0, 33.0, 20.0, 18.0, 15.0, 12.0, 7.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.640625, -16.1983642578125, -15.756103515625, -15.3138427734375, -14.87158203125, -14.4293212890625, -13.987060546875, -13.5447998046875, -13.1025390625, -12.6602783203125, -12.218017578125, -11.7757568359375, -11.33349609375, -10.8912353515625, -10.448974609375, -10.0067138671875, -9.564453125, -9.1221923828125, -8.679931640625, -8.2376708984375, -7.79541015625, -7.3531494140625, -6.910888671875, -6.4686279296875, -6.0263671875, -5.5841064453125, -5.141845703125, -4.6995849609375, -4.25732421875, -3.8150634765625, -3.372802734375, -2.9305419921875, -2.48828125, -2.0460205078125, -1.603759765625, -1.1614990234375, -0.71923828125, -0.2769775390625, 0.165283203125, 0.6075439453125, 1.0498046875, 1.4920654296875, 1.934326171875, 2.3765869140625, 2.81884765625, 3.2611083984375, 3.703369140625, 4.1456298828125, 4.587890625, 5.0301513671875, 5.472412109375, 5.9146728515625, 6.35693359375, 6.7991943359375, 7.241455078125, 7.6837158203125, 8.1259765625, 8.5682373046875, 9.010498046875, 9.4527587890625, 9.89501953125, 10.3372802734375, 10.779541015625, 11.2218017578125, 11.6640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 9.0, 20.0, 14.0, 20.0, 30.0, 34.0, 32.0, 44.0, 47.0, 48.0, 70.0, 58.0, 59.0, 67.0, 51.0, 63.0, 52.0, 46.0, 42.0, 30.0, 31.0, 21.0, 22.0, 22.0, 13.0, 12.0, 8.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.390625, -18.783203125, -18.17578125, -17.568359375, -16.9609375, -16.353515625, -15.74609375, -15.138671875, -14.53125, -13.923828125, -13.31640625, -12.708984375, -12.1015625, -11.494140625, -10.88671875, -10.279296875, -9.671875, -9.064453125, -8.45703125, -7.849609375, -7.2421875, -6.634765625, -6.02734375, -5.419921875, -4.8125, -4.205078125, -3.59765625, -2.990234375, -2.3828125, -1.775390625, -1.16796875, -0.560546875, 0.046875, 0.654296875, 1.26171875, 1.869140625, 2.4765625, 3.083984375, 3.69140625, 4.298828125, 4.90625, 5.513671875, 6.12109375, 6.728515625, 7.3359375, 7.943359375, 8.55078125, 9.158203125, 9.765625, 10.373046875, 10.98046875, 11.587890625, 12.1953125, 12.802734375, 13.41015625, 14.017578125, 14.625, 15.232421875, 15.83984375, 16.447265625, 17.0546875, 17.662109375, 18.26953125, 18.876953125, 19.484375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 10.0, 11.0, 10.0, 19.0, 23.0, 41.0, 86.0, 181.0, 426.0, 1185.0, 6110.0, 138020.0, 872239.0, 26263.0, 2679.0, 653.0, 288.0, 144.0, 66.0, 39.0, 25.0, 15.0, 4.0, 6.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9296875, -6.6929931640625, -6.456298828125, -6.2196044921875, -5.98291015625, -5.7462158203125, -5.509521484375, -5.2728271484375, -5.0361328125, -4.7994384765625, -4.562744140625, -4.3260498046875, -4.08935546875, -3.8526611328125, -3.615966796875, -3.3792724609375, -3.142578125, -2.9058837890625, -2.669189453125, -2.4324951171875, -2.19580078125, -1.9591064453125, -1.722412109375, -1.4857177734375, -1.2490234375, -1.0123291015625, -0.775634765625, -0.5389404296875, -0.30224609375, -0.0655517578125, 0.171142578125, 0.4078369140625, 0.64453125, 0.8812255859375, 1.117919921875, 1.3546142578125, 1.59130859375, 1.8280029296875, 2.064697265625, 2.3013916015625, 2.5380859375, 2.7747802734375, 3.011474609375, 3.2481689453125, 3.48486328125, 3.7215576171875, 3.958251953125, 4.1949462890625, 4.431640625, 4.6683349609375, 4.905029296875, 5.1417236328125, 5.37841796875, 5.6151123046875, 5.851806640625, 6.0885009765625, 6.3251953125, 6.5618896484375, 6.798583984375, 7.0352783203125, 7.27197265625, 7.5086669921875, 7.745361328125, 7.9820556640625, 8.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 9.0, 8.0, 12.0, 9.0, 11.0, 15.0, 18.0, 15.0, 28.0, 26.0, 40.0, 41.0, 64.0, 70.0, 129.0, 95.0, 93.0, 53.0, 40.0, 47.0, 33.0, 27.0, 23.0, 21.0, 12.0, 11.0, 14.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006079673767089844, -0.0005870312452316284, -0.0005660951137542725, -0.0005451589822769165, -0.0005242228507995605, -0.0005032867193222046, -0.00048235058784484863, -0.0004614144563674927, -0.0004404783248901367, -0.00041954219341278076, -0.0003986060619354248, -0.00037766993045806885, -0.0003567337989807129, -0.00033579766750335693, -0.000314861536026001, -0.000293925404548645, -0.00027298927307128906, -0.0002520531415939331, -0.00023111701011657715, -0.0002101808786392212, -0.00018924474716186523, -0.00016830861568450928, -0.00014737248420715332, -0.00012643635272979736, -0.0001055002212524414, -8.456408977508545e-05, -6.362795829772949e-05, -4.2691826820373535e-05, -2.1755695343017578e-05, -8.195638656616211e-07, 2.0116567611694336e-05, 4.105269908905029e-05, 6.198883056640625e-05, 8.292496204376221e-05, 0.00010386109352111816, 0.00012479722499847412, 0.00014573335647583008, 0.00016666948795318604, 0.000187605619430542, 0.00020854175090789795, 0.0002294778823852539, 0.00025041401386260986, 0.0002713501453399658, 0.0002922862768173218, 0.00031322240829467773, 0.0003341585397720337, 0.00035509467124938965, 0.0003760308027267456, 0.00039696693420410156, 0.0004179030656814575, 0.0004388391971588135, 0.00045977532863616943, 0.0004807114601135254, 0.0005016475915908813, 0.0005225837230682373, 0.0005435198545455933, 0.0005644559860229492, 0.0005853921175003052, 0.0006063282489776611, 0.0006272643804550171, 0.000648200511932373, 0.000669136643409729, 0.000690072774887085, 0.0007110089063644409, 0.0007319450378417969]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 8.0, 8.0, 12.0, 17.0, 31.0, 53.0, 105.0, 211.0, 477.0, 1113.0, 3396.0, 18832.0, 301730.0, 680317.0, 34584.0, 5018.0, 1506.0, 574.0, 257.0, 125.0, 67.0, 40.0, 21.0, 12.0, 8.0, 4.0, 9.0, 5.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.828125, -6.6337890625, -6.439453125, -6.2451171875, -6.05078125, -5.8564453125, -5.662109375, -5.4677734375, -5.2734375, -5.0791015625, -4.884765625, -4.6904296875, -4.49609375, -4.3017578125, -4.107421875, -3.9130859375, -3.71875, -3.5244140625, -3.330078125, -3.1357421875, -2.94140625, -2.7470703125, -2.552734375, -2.3583984375, -2.1640625, -1.9697265625, -1.775390625, -1.5810546875, -1.38671875, -1.1923828125, -0.998046875, -0.8037109375, -0.609375, -0.4150390625, -0.220703125, -0.0263671875, 0.16796875, 0.3623046875, 0.556640625, 0.7509765625, 0.9453125, 1.1396484375, 1.333984375, 1.5283203125, 1.72265625, 1.9169921875, 2.111328125, 2.3056640625, 2.5, 2.6943359375, 2.888671875, 3.0830078125, 3.27734375, 3.4716796875, 3.666015625, 3.8603515625, 4.0546875, 4.2490234375, 4.443359375, 4.6376953125, 4.83203125, 5.0263671875, 5.220703125, 5.4150390625, 5.609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 8.0, 18.0, 16.0, 19.0, 36.0, 35.0, 49.0, 79.0, 95.0, 110.0, 103.0, 120.0, 72.0, 61.0, 52.0, 28.0, 29.0, 18.0, 17.0, 12.0, 2.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.96539306640625, -5.8057861328125, -5.64617919921875, -5.486572265625, -5.32696533203125, -5.1673583984375, -5.00775146484375, -4.84814453125, -4.68853759765625, -4.5289306640625, -4.36932373046875, -4.209716796875, -4.05010986328125, -3.8905029296875, -3.73089599609375, -3.5712890625, -3.41168212890625, -3.2520751953125, -3.09246826171875, -2.932861328125, -2.77325439453125, -2.6136474609375, -2.45404052734375, -2.29443359375, -2.13482666015625, -1.9752197265625, -1.81561279296875, -1.656005859375, -1.49639892578125, -1.3367919921875, -1.17718505859375, -1.017578125, -0.85797119140625, -0.6983642578125, -0.53875732421875, -0.379150390625, -0.21954345703125, -0.0599365234375, 0.09967041015625, 0.25927734375, 0.41888427734375, 0.5784912109375, 0.73809814453125, 0.897705078125, 1.05731201171875, 1.2169189453125, 1.37652587890625, 1.5361328125, 1.69573974609375, 1.8553466796875, 2.01495361328125, 2.174560546875, 2.33416748046875, 2.4937744140625, 2.65338134765625, 2.81298828125, 2.97259521484375, 3.1322021484375, 3.29180908203125, 3.451416015625, 3.61102294921875, 3.7706298828125, 3.93023681640625, 4.08984375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 14.0, 25.0, 63.0, 140.0, 170.0, 202.0, 173.0, 90.0, 54.0, 22.0, 9.0, 4.0, 8.0, 8.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-125.43487548828125, -122.29891204833984, -119.16295623779297, -116.02699279785156, -112.89102935791016, -109.75507354736328, -106.61911010742188, -103.483154296875, -100.3471908569336, -97.21122741699219, -94.07527160644531, -90.9393081665039, -87.8033447265625, -84.66738891601562, -81.53142547607422, -78.39546203613281, -75.25950622558594, -72.12354278564453, -68.98758697509766, -65.85162353515625, -62.71566390991211, -59.57970428466797, -56.44374084472656, -53.30778121948242, -50.17181396484375, -47.03585433959961, -43.8998908996582, -40.76393127441406, -37.62797164916992, -34.49201202392578, -31.356048583984375, -28.220088958740234, -25.084129333496094, -21.94816780090332, -18.81220817565918, -15.676246643066406, -12.54028606414795, -9.404325485229492, -6.268363952636719, -3.132404327392578, 0.0035572052001953125, 3.1395180225372314, 6.275478839874268, 9.411439895629883, 12.54740047454834, 15.683361053466797, 18.81932258605957, 21.95528221130371, 25.091243743896484, 28.227205276489258, 31.3631649017334, 34.49912643432617, 37.63508605957031, 40.77104949951172, 43.90700912475586, 47.04296875, 50.178932189941406, 53.31489181518555, 56.45085525512695, 59.586814880371094, 62.722774505615234, 65.85873413085938, 68.99469757080078, 72.13066101074219, 75.26661682128906]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 11.0, 3.0, 3.0, 2.0, 7.0, 15.0, 18.0, 16.0, 26.0, 25.0, 23.0, 15.0, 19.0, 43.0, 37.0, 37.0, 35.0, 53.0, 53.0, 44.0, 46.0, 54.0, 52.0, 44.0, 36.0, 46.0, 35.0, 31.0, 29.0, 27.0, 20.0, 22.0, 15.0, 15.0, 8.0, 9.0, 6.0, 5.0, 3.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-72.56350708007812, -70.47933197021484, -68.39515686035156, -66.31098937988281, -64.22681427001953, -62.14263916015625, -60.05846405029297, -57.97428894042969, -55.890113830566406, -53.805938720703125, -51.72176742553711, -49.63759231567383, -47.55341720581055, -45.46924591064453, -43.38507080078125, -41.30089569091797, -39.21672439575195, -37.13254928588867, -35.048377990722656, -32.964202880859375, -30.880027770996094, -28.795854568481445, -26.711681365966797, -24.627506256103516, -22.543333053588867, -20.45915985107422, -18.374984741210938, -16.29081153869629, -14.206637382507324, -12.12246322631836, -10.038290023803711, -7.954115867614746, -5.869945526123047, -3.785771608352661, -1.7015976905822754, 0.38257598876953125, 2.466750144958496, 4.550924301147461, 6.635097503662109, 8.719271659851074, 10.803445816040039, 12.887619972229004, 14.971794128417969, 17.055967330932617, 19.140140533447266, 21.224315643310547, 23.308488845825195, 25.392662048339844, 27.476837158203125, 29.561010360717773, 31.645185470581055, 33.7293586730957, 35.813533782958984, 37.897705078125, 39.98188018798828, 42.06605529785156, 44.150230407714844, 46.234405517578125, 48.31857681274414, 50.40275192260742, 52.4869270324707, 54.57109832763672, 56.6552734375, 58.73944854736328, 60.8236198425293]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 10.0, 11.0, 9.0, 20.0, 28.0, 33.0, 51.0, 79.0, 166.0, 257.0, 506.0, 935.0, 2124.0, 5446.0, 17966.0, 111379.0, 2667598.0, 1299682.0, 66438.0, 13622.0, 4473.0, 1729.0, 823.0, 379.0, 208.0, 112.0, 63.0, 52.0, 24.0, 10.0, 14.0, 8.0, 4.0, 7.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.72265625, -6.52423095703125, -6.3258056640625, -6.12738037109375, -5.928955078125, -5.73052978515625, -5.5321044921875, -5.33367919921875, -5.13525390625, -4.93682861328125, -4.7384033203125, -4.53997802734375, -4.341552734375, -4.14312744140625, -3.9447021484375, -3.74627685546875, -3.5478515625, -3.34942626953125, -3.1510009765625, -2.95257568359375, -2.754150390625, -2.55572509765625, -2.3572998046875, -2.15887451171875, -1.96044921875, -1.76202392578125, -1.5635986328125, -1.36517333984375, -1.166748046875, -0.96832275390625, -0.7698974609375, -0.57147216796875, -0.373046875, -0.17462158203125, 0.0238037109375, 0.22222900390625, 0.420654296875, 0.61907958984375, 0.8175048828125, 1.01593017578125, 1.21435546875, 1.41278076171875, 1.6112060546875, 1.80963134765625, 2.008056640625, 2.20648193359375, 2.4049072265625, 2.60333251953125, 2.8017578125, 3.00018310546875, 3.1986083984375, 3.39703369140625, 3.595458984375, 3.79388427734375, 3.9923095703125, 4.19073486328125, 4.38916015625, 4.58758544921875, 4.7860107421875, 4.98443603515625, 5.182861328125, 5.38128662109375, 5.5797119140625, 5.77813720703125, 5.9765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 6.0, 8.0, 4.0, 7.0, 7.0, 11.0, 12.0, 23.0, 20.0, 33.0, 33.0, 41.0, 47.0, 57.0, 43.0, 50.0, 58.0, 60.0, 56.0, 61.0, 54.0, 46.0, 51.0, 29.0, 46.0, 25.0, 20.0, 24.0, 18.0, 17.0, 8.0, 8.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.796875, -3.676849365234375, -3.55682373046875, -3.436798095703125, -3.3167724609375, -3.196746826171875, -3.07672119140625, -2.956695556640625, -2.836669921875, -2.716644287109375, -2.59661865234375, -2.476593017578125, -2.3565673828125, -2.236541748046875, -2.11651611328125, -1.996490478515625, -1.87646484375, -1.756439208984375, -1.63641357421875, -1.516387939453125, -1.3963623046875, -1.276336669921875, -1.15631103515625, -1.036285400390625, -0.916259765625, -0.796234130859375, -0.67620849609375, -0.556182861328125, -0.4361572265625, -0.316131591796875, -0.19610595703125, -0.076080322265625, 0.0439453125, 0.163970947265625, 0.28399658203125, 0.404022216796875, 0.5240478515625, 0.644073486328125, 0.76409912109375, 0.884124755859375, 1.004150390625, 1.124176025390625, 1.24420166015625, 1.364227294921875, 1.4842529296875, 1.604278564453125, 1.72430419921875, 1.844329833984375, 1.96435546875, 2.084381103515625, 2.20440673828125, 2.324432373046875, 2.4444580078125, 2.564483642578125, 2.68450927734375, 2.804534912109375, 2.924560546875, 3.044586181640625, 3.16461181640625, 3.284637451171875, 3.4046630859375, 3.524688720703125, 3.64471435546875, 3.764739990234375, 3.884765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 8.0, 16.0, 27.0, 27.0, 41.0, 82.0, 106.0, 267.0, 625.0, 1626.0, 5389.0, 24889.0, 276876.0, 3706919.0, 153122.0, 17822.0, 4202.0, 1262.0, 488.0, 207.0, 111.0, 56.0, 30.0, 17.0, 14.0, 7.0, 16.0, 9.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0546875, -7.7376708984375, -7.420654296875, -7.1036376953125, -6.78662109375, -6.4696044921875, -6.152587890625, -5.8355712890625, -5.5185546875, -5.2015380859375, -4.884521484375, -4.5675048828125, -4.25048828125, -3.9334716796875, -3.616455078125, -3.2994384765625, -2.982421875, -2.6654052734375, -2.348388671875, -2.0313720703125, -1.71435546875, -1.3973388671875, -1.080322265625, -0.7633056640625, -0.4462890625, -0.1292724609375, 0.187744140625, 0.5047607421875, 0.82177734375, 1.1387939453125, 1.455810546875, 1.7728271484375, 2.08984375, 2.4068603515625, 2.723876953125, 3.0408935546875, 3.35791015625, 3.6749267578125, 3.991943359375, 4.3089599609375, 4.6259765625, 4.9429931640625, 5.260009765625, 5.5770263671875, 5.89404296875, 6.2110595703125, 6.528076171875, 6.8450927734375, 7.162109375, 7.4791259765625, 7.796142578125, 8.1131591796875, 8.43017578125, 8.7471923828125, 9.064208984375, 9.3812255859375, 9.6982421875, 10.0152587890625, 10.332275390625, 10.6492919921875, 10.96630859375, 11.2833251953125, 11.600341796875, 11.9173583984375, 12.234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 5.0, 6.0, 9.0, 11.0, 15.0, 19.0, 25.0, 37.0, 61.0, 90.0, 206.0, 474.0, 983.0, 1071.0, 506.0, 227.0, 131.0, 67.0, 38.0, 28.0, 11.0, 14.0, 11.0, 7.0, 3.0, 6.0, 2.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8359375, -9.5286865234375, -9.221435546875, -8.9141845703125, -8.60693359375, -8.2996826171875, -7.992431640625, -7.6851806640625, -7.3779296875, -7.0706787109375, -6.763427734375, -6.4561767578125, -6.14892578125, -5.8416748046875, -5.534423828125, -5.2271728515625, -4.919921875, -4.6126708984375, -4.305419921875, -3.9981689453125, -3.69091796875, -3.3836669921875, -3.076416015625, -2.7691650390625, -2.4619140625, -2.1546630859375, -1.847412109375, -1.5401611328125, -1.23291015625, -0.9256591796875, -0.618408203125, -0.3111572265625, -0.00390625, 0.3033447265625, 0.610595703125, 0.9178466796875, 1.22509765625, 1.5323486328125, 1.839599609375, 2.1468505859375, 2.4541015625, 2.7613525390625, 3.068603515625, 3.3758544921875, 3.68310546875, 3.9903564453125, 4.297607421875, 4.6048583984375, 4.912109375, 5.2193603515625, 5.526611328125, 5.8338623046875, 6.14111328125, 6.4483642578125, 6.755615234375, 7.0628662109375, 7.3701171875, 7.6773681640625, 7.984619140625, 8.2918701171875, 8.59912109375, 8.9063720703125, 9.213623046875, 9.5208740234375, 9.828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 11.0, 10.0, 16.0, 34.0, 59.0, 113.0, 167.0, 147.0, 163.0, 104.0, 64.0, 41.0, 22.0, 13.0, 10.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.25428009033203, -49.22071075439453, -47.18714141845703, -45.1535758972168, -43.1200065612793, -41.0864372253418, -39.05287170410156, -37.01930236816406, -34.98573303222656, -32.95216369628906, -30.918596267700195, -28.885028839111328, -26.851459503173828, -24.817890167236328, -22.78432273864746, -20.750755310058594, -18.717185974121094, -16.683616638183594, -14.650049209594727, -12.616480827331543, -10.58291244506836, -8.549344062805176, -6.515775680541992, -4.482207298278809, -2.448638916015625, -0.4150705337524414, 1.6184978485107422, 3.652066230773926, 5.685634613037109, 7.719202995300293, 9.752771377563477, 11.78633975982666, 13.819900512695312, 15.853468894958496, 17.88703727722168, 19.920604705810547, 21.954174041748047, 23.987743377685547, 26.021310806274414, 28.05487823486328, 30.08844757080078, 32.12201690673828, 34.15558624267578, 36.189151763916016, 38.222721099853516, 40.256290435791016, 42.28985595703125, 44.32342529296875, 46.35699462890625, 48.39056396484375, 50.42413330078125, 52.457698822021484, 54.491268157958984, 56.524837493896484, 58.55840301513672, 60.59197235107422, 62.62554168701172, 64.65911102294922, 66.69268035888672, 68.72624969482422, 70.75981140136719, 72.79338073730469, 74.82695007324219, 76.86051940917969, 78.89408874511719]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 7.0, 9.0, 13.0, 16.0, 15.0, 25.0, 33.0, 32.0, 38.0, 44.0, 32.0, 51.0, 42.0, 59.0, 50.0, 65.0, 47.0, 44.0, 38.0, 47.0, 39.0, 42.0, 32.0, 26.0, 27.0, 24.0, 23.0, 19.0, 17.0, 8.0, 5.0, 9.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.69305419921875, -45.42817306518555, -44.16329574584961, -42.898414611816406, -41.63353729248047, -40.368656158447266, -39.10377502441406, -37.838897705078125, -36.57401657104492, -35.30913543701172, -34.04425811767578, -32.77937698364258, -31.514497756958008, -30.249618530273438, -28.984737396240234, -27.719858169555664, -26.454978942871094, -25.190099716186523, -23.925220489501953, -22.66033935546875, -21.39546012878418, -20.13058090209961, -18.865699768066406, -17.600820541381836, -16.335941314697266, -15.071062088012695, -13.806181907653809, -12.541301727294922, -11.276422500610352, -10.011543273925781, -8.746663093566895, -7.481782913208008, -6.216907501220703, -4.952027797698975, -3.687148094177246, -2.4222683906555176, -1.157388687133789, 0.10749101638793945, 1.372370719909668, 2.6372509002685547, 3.902130126953125, 5.1670098304748535, 6.431889533996582, 7.6967692375183105, 8.961648941040039, 10.22652816772461, 11.491408348083496, 12.756288528442383, 14.021167755126953, 15.286046981811523, 16.550926208496094, 17.815807342529297, 19.080686569213867, 20.345565795898438, 21.61044692993164, 22.87532615661621, 24.14020538330078, 25.40508460998535, 26.669963836669922, 27.934844970703125, 29.199724197387695, 30.464603424072266, 31.72948455810547, 32.994361877441406, 34.25924301147461]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 2.0, 9.0, 4.0, 10.0, 15.0, 21.0, 34.0, 56.0, 84.0, 101.0, 164.0, 243.0, 354.0, 619.0, 915.0, 1577.0, 2604.0, 4471.0, 7903.0, 14019.0, 26372.0, 50693.0, 97250.0, 182971.0, 255718.0, 187599.0, 100678.0, 52316.0, 27921.0, 14454.0, 7969.0, 4525.0, 2621.0, 1565.0, 963.0, 620.0, 379.0, 238.0, 157.0, 112.0, 64.0, 50.0, 39.0, 28.0, 14.0, 17.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.62890625, -2.5367431640625, -2.444580078125, -2.3524169921875, -2.26025390625, -2.1680908203125, -2.075927734375, -1.9837646484375, -1.8916015625, -1.7994384765625, -1.707275390625, -1.6151123046875, -1.52294921875, -1.4307861328125, -1.338623046875, -1.2464599609375, -1.154296875, -1.0621337890625, -0.969970703125, -0.8778076171875, -0.78564453125, -0.6934814453125, -0.601318359375, -0.5091552734375, -0.4169921875, -0.3248291015625, -0.232666015625, -0.1405029296875, -0.04833984375, 0.0438232421875, 0.135986328125, 0.2281494140625, 0.3203125, 0.4124755859375, 0.504638671875, 0.5968017578125, 0.68896484375, 0.7811279296875, 0.873291015625, 0.9654541015625, 1.0576171875, 1.1497802734375, 1.241943359375, 1.3341064453125, 1.42626953125, 1.5184326171875, 1.610595703125, 1.7027587890625, 1.794921875, 1.8870849609375, 1.979248046875, 2.0714111328125, 2.16357421875, 2.2557373046875, 2.347900390625, 2.4400634765625, 2.5322265625, 2.6243896484375, 2.716552734375, 2.8087158203125, 2.90087890625, 2.9930419921875, 3.085205078125, 3.1773681640625, 3.26953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 4.0, 14.0, 16.0, 7.0, 21.0, 16.0, 27.0, 25.0, 27.0, 43.0, 49.0, 41.0, 41.0, 43.0, 36.0, 64.0, 49.0, 51.0, 46.0, 47.0, 33.0, 38.0, 32.0, 36.0, 33.0, 29.0, 22.0, 22.0, 16.0, 13.0, 8.0, 15.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0], "bins": [-3.96875, -3.86480712890625, -3.7608642578125, -3.65692138671875, -3.552978515625, -3.44903564453125, -3.3450927734375, -3.24114990234375, -3.13720703125, -3.03326416015625, -2.9293212890625, -2.82537841796875, -2.721435546875, -2.61749267578125, -2.5135498046875, -2.40960693359375, -2.3056640625, -2.20172119140625, -2.0977783203125, -1.99383544921875, -1.889892578125, -1.78594970703125, -1.6820068359375, -1.57806396484375, -1.47412109375, -1.37017822265625, -1.2662353515625, -1.16229248046875, -1.058349609375, -0.95440673828125, -0.8504638671875, -0.74652099609375, -0.642578125, -0.53863525390625, -0.4346923828125, -0.33074951171875, -0.226806640625, -0.12286376953125, -0.0189208984375, 0.08502197265625, 0.18896484375, 0.29290771484375, 0.3968505859375, 0.50079345703125, 0.604736328125, 0.70867919921875, 0.8126220703125, 0.91656494140625, 1.0205078125, 1.12445068359375, 1.2283935546875, 1.33233642578125, 1.436279296875, 1.54022216796875, 1.6441650390625, 1.74810791015625, 1.85205078125, 1.95599365234375, 2.0599365234375, 2.16387939453125, 2.267822265625, 2.37176513671875, 2.4757080078125, 2.57965087890625, 2.68359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 5.0, 5.0, 8.0, 11.0, 9.0, 11.0, 31.0, 33.0, 49.0, 56.0, 88.0, 158.0, 248.0, 429.0, 851.0, 1774.0, 4999.0, 28960.0, 463717.0, 507850.0, 30135.0, 5118.0, 1845.0, 856.0, 495.0, 283.0, 167.0, 120.0, 58.0, 51.0, 36.0, 29.0, 18.0, 12.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.046875, -10.6524658203125, -10.258056640625, -9.8636474609375, -9.46923828125, -9.0748291015625, -8.680419921875, -8.2860107421875, -7.8916015625, -7.4971923828125, -7.102783203125, -6.7083740234375, -6.31396484375, -5.9195556640625, -5.525146484375, -5.1307373046875, -4.736328125, -4.3419189453125, -3.947509765625, -3.5531005859375, -3.15869140625, -2.7642822265625, -2.369873046875, -1.9754638671875, -1.5810546875, -1.1866455078125, -0.792236328125, -0.3978271484375, -0.00341796875, 0.3909912109375, 0.785400390625, 1.1798095703125, 1.57421875, 1.9686279296875, 2.363037109375, 2.7574462890625, 3.15185546875, 3.5462646484375, 3.940673828125, 4.3350830078125, 4.7294921875, 5.1239013671875, 5.518310546875, 5.9127197265625, 6.30712890625, 6.7015380859375, 7.095947265625, 7.4903564453125, 7.884765625, 8.2791748046875, 8.673583984375, 9.0679931640625, 9.46240234375, 9.8568115234375, 10.251220703125, 10.6456298828125, 11.0400390625, 11.4344482421875, 11.828857421875, 12.2232666015625, 12.61767578125, 13.0120849609375, 13.406494140625, 13.8009033203125, 14.1953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 9.0, 15.0, 7.0, 19.0, 14.0, 14.0, 23.0, 22.0, 35.0, 44.0, 28.0, 36.0, 52.0, 55.0, 54.0, 65.0, 51.0, 62.0, 35.0, 53.0, 52.0, 35.0, 30.0, 32.0, 32.0, 35.0, 17.0, 15.0, 12.0, 5.0, 7.0, 10.0, 3.0, 5.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.7596435546875, -13.261474609375, -12.7633056640625, -12.26513671875, -11.7669677734375, -11.268798828125, -10.7706298828125, -10.2724609375, -9.7742919921875, -9.276123046875, -8.7779541015625, -8.27978515625, -7.7816162109375, -7.283447265625, -6.7852783203125, -6.287109375, -5.7889404296875, -5.290771484375, -4.7926025390625, -4.29443359375, -3.7962646484375, -3.298095703125, -2.7999267578125, -2.3017578125, -1.8035888671875, -1.305419921875, -0.8072509765625, -0.30908203125, 0.1890869140625, 0.687255859375, 1.1854248046875, 1.68359375, 2.1817626953125, 2.679931640625, 3.1781005859375, 3.67626953125, 4.1744384765625, 4.672607421875, 5.1707763671875, 5.6689453125, 6.1671142578125, 6.665283203125, 7.1634521484375, 7.66162109375, 8.1597900390625, 8.657958984375, 9.1561279296875, 9.654296875, 10.1524658203125, 10.650634765625, 11.1488037109375, 11.64697265625, 12.1451416015625, 12.643310546875, 13.1414794921875, 13.6396484375, 14.1378173828125, 14.635986328125, 15.1341552734375, 15.63232421875, 16.1304931640625, 16.628662109375, 17.1268310546875, 17.625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 17.0, 25.0, 46.0, 58.0, 104.0, 179.0, 326.0, 714.0, 1950.0, 6777.0, 45098.0, 769729.0, 199910.0, 17728.0, 3600.0, 1198.0, 465.0, 262.0, 134.0, 68.0, 40.0, 33.0, 22.0, 14.0, 14.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.13671875, -5.943603515625, -5.75048828125, -5.557373046875, -5.3642578125, -5.171142578125, -4.97802734375, -4.784912109375, -4.591796875, -4.398681640625, -4.20556640625, -4.012451171875, -3.8193359375, -3.626220703125, -3.43310546875, -3.239990234375, -3.046875, -2.853759765625, -2.66064453125, -2.467529296875, -2.2744140625, -2.081298828125, -1.88818359375, -1.695068359375, -1.501953125, -1.308837890625, -1.11572265625, -0.922607421875, -0.7294921875, -0.536376953125, -0.34326171875, -0.150146484375, 0.04296875, 0.236083984375, 0.42919921875, 0.622314453125, 0.8154296875, 1.008544921875, 1.20166015625, 1.394775390625, 1.587890625, 1.781005859375, 1.97412109375, 2.167236328125, 2.3603515625, 2.553466796875, 2.74658203125, 2.939697265625, 3.1328125, 3.325927734375, 3.51904296875, 3.712158203125, 3.9052734375, 4.098388671875, 4.29150390625, 4.484619140625, 4.677734375, 4.870849609375, 5.06396484375, 5.257080078125, 5.4501953125, 5.643310546875, 5.83642578125, 6.029541015625, 6.22265625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 6.0, 10.0, 14.0, 12.0, 20.0, 22.0, 32.0, 39.0, 75.0, 114.0, 156.0, 145.0, 98.0, 60.0, 47.0, 40.0, 23.0, 11.0, 16.0, 7.0, 13.0, 12.0, 6.0, 4.0, 4.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0014009475708007812, -0.0013674795627593994, -0.0013340115547180176, -0.0013005435466766357, -0.001267075538635254, -0.001233607530593872, -0.0012001395225524902, -0.0011666715145111084, -0.0011332035064697266, -0.0010997354984283447, -0.0010662674903869629, -0.001032799482345581, -0.0009993314743041992, -0.0009658634662628174, -0.0009323954582214355, -0.0008989274501800537, -0.0008654594421386719, -0.00083199143409729, -0.0007985234260559082, -0.0007650554180145264, -0.0007315874099731445, -0.0006981194019317627, -0.0006646513938903809, -0.000631183385848999, -0.0005977153778076172, -0.0005642473697662354, -0.0005307793617248535, -0.0004973113536834717, -0.00046384334564208984, -0.000430375337600708, -0.00039690732955932617, -0.00036343932151794434, -0.0003299713134765625, -0.00029650330543518066, -0.00026303529739379883, -0.000229567289352417, -0.00019609928131103516, -0.00016263127326965332, -0.00012916326522827148, -9.569525718688965e-05, -6.222724914550781e-05, -2.8759241104125977e-05, 4.708766937255859e-06, 3.8176774978637695e-05, 7.164478302001953e-05, 0.00010511279106140137, 0.0001385807991027832, 0.00017204880714416504, 0.00020551681518554688, 0.0002389848232269287, 0.00027245283126831055, 0.0003059208393096924, 0.0003393888473510742, 0.00037285685539245605, 0.0004063248634338379, 0.0004397928714752197, 0.00047326087951660156, 0.0005067288875579834, 0.0005401968955993652, 0.0005736649036407471, 0.0006071329116821289, 0.0006406009197235107, 0.0006740689277648926, 0.0007075369358062744, 0.0007410049438476562]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 16.0, 11.0, 15.0, 25.0, 52.0, 59.0, 126.0, 208.0, 368.0, 674.0, 1399.0, 3474.0, 13306.0, 86020.0, 795038.0, 123156.0, 16882.0, 4505.0, 1558.0, 749.0, 361.0, 207.0, 148.0, 75.0, 43.0, 24.0, 20.0, 14.0, 5.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.625, -4.4288330078125, -4.232666015625, -4.0364990234375, -3.84033203125, -3.6441650390625, -3.447998046875, -3.2518310546875, -3.0556640625, -2.8594970703125, -2.663330078125, -2.4671630859375, -2.27099609375, -2.0748291015625, -1.878662109375, -1.6824951171875, -1.486328125, -1.2901611328125, -1.093994140625, -0.8978271484375, -0.70166015625, -0.5054931640625, -0.309326171875, -0.1131591796875, 0.0830078125, 0.2791748046875, 0.475341796875, 0.6715087890625, 0.86767578125, 1.0638427734375, 1.260009765625, 1.4561767578125, 1.65234375, 1.8485107421875, 2.044677734375, 2.2408447265625, 2.43701171875, 2.6331787109375, 2.829345703125, 3.0255126953125, 3.2216796875, 3.4178466796875, 3.614013671875, 3.8101806640625, 4.00634765625, 4.2025146484375, 4.398681640625, 4.5948486328125, 4.791015625, 4.9871826171875, 5.183349609375, 5.3795166015625, 5.57568359375, 5.7718505859375, 5.968017578125, 6.1641845703125, 6.3603515625, 6.5565185546875, 6.752685546875, 6.9488525390625, 7.14501953125, 7.3411865234375, 7.537353515625, 7.7335205078125, 7.9296875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 7.0, 9.0, 13.0, 18.0, 18.0, 20.0, 46.0, 59.0, 64.0, 84.0, 114.0, 132.0, 94.0, 78.0, 61.0, 53.0, 30.0, 29.0, 12.0, 15.0, 11.0, 5.0, 7.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90234375, -3.71917724609375, -3.5360107421875, -3.35284423828125, -3.169677734375, -2.98651123046875, -2.8033447265625, -2.62017822265625, -2.43701171875, -2.25384521484375, -2.0706787109375, -1.88751220703125, -1.704345703125, -1.52117919921875, -1.3380126953125, -1.15484619140625, -0.9716796875, -0.78851318359375, -0.6053466796875, -0.42218017578125, -0.239013671875, -0.05584716796875, 0.1273193359375, 0.31048583984375, 0.49365234375, 0.67681884765625, 0.8599853515625, 1.04315185546875, 1.226318359375, 1.40948486328125, 1.5926513671875, 1.77581787109375, 1.958984375, 2.14215087890625, 2.3253173828125, 2.50848388671875, 2.691650390625, 2.87481689453125, 3.0579833984375, 3.24114990234375, 3.42431640625, 3.60748291015625, 3.7906494140625, 3.97381591796875, 4.156982421875, 4.34014892578125, 4.5233154296875, 4.70648193359375, 4.8896484375, 5.07281494140625, 5.2559814453125, 5.43914794921875, 5.622314453125, 5.80548095703125, 5.9886474609375, 6.17181396484375, 6.35498046875, 6.53814697265625, 6.7213134765625, 6.90447998046875, 7.087646484375, 7.27081298828125, 7.4539794921875, 7.63714599609375, 7.8203125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 25.0, 66.0, 215.0, 371.0, 183.0, 71.0, 26.0, 17.0, 8.0, 4.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.49900817871094, -143.09243774414062, -138.6858673095703, -134.279296875, -129.8727264404297, -125.46615600585938, -121.05958557128906, -116.65301513671875, -112.24644470214844, -107.83987426757812, -103.43330383300781, -99.0267333984375, -94.62016296386719, -90.21359252929688, -85.80702209472656, -81.40045166015625, -76.99388122558594, -72.58731079101562, -68.18074035644531, -63.774169921875, -59.36759948730469, -54.961029052734375, -50.55445861816406, -46.14788818359375, -41.74131774902344, -37.334747314453125, -32.92817687988281, -28.5216064453125, -24.115036010742188, -19.708465576171875, -15.301895141601562, -10.89532470703125, -6.48876953125, -2.0821990966796875, 2.324371337890625, 6.7309417724609375, 11.13751220703125, 15.544082641601562, 19.950653076171875, 24.357223510742188, 28.7637939453125, 33.17036437988281, 37.576934814453125, 41.98350524902344, 46.39007568359375, 50.79664611816406, 55.203216552734375, 59.60978698730469, 64.016357421875, 68.42292785644531, 72.82949829101562, 77.23606872558594, 81.64263916015625, 86.04920959472656, 90.45578002929688, 94.86235046386719, 99.2689208984375, 103.67549133300781, 108.08206176757812, 112.48863220214844, 116.89520263671875, 121.30177307128906, 125.70834350585938, 130.1149139404297, 134.521484375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 2.0, 6.0, 7.0, 15.0, 23.0, 12.0, 14.0, 28.0, 25.0, 29.0, 30.0, 32.0, 33.0, 36.0, 51.0, 43.0, 64.0, 38.0, 63.0, 53.0, 45.0, 39.0, 48.0, 32.0, 30.0, 31.0, 17.0, 21.0, 21.0, 20.0, 10.0, 8.0, 10.0, 8.0, 10.0, 14.0, 7.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.07443618774414, -57.34138870239258, -55.608341217041016, -53.87529754638672, -52.142250061035156, -50.409202575683594, -48.67615509033203, -46.94310760498047, -45.210060119628906, -43.477012634277344, -41.74396514892578, -40.01091766357422, -38.27787399291992, -36.54482650756836, -34.8117790222168, -33.078731536865234, -31.345687866210938, -29.612640380859375, -27.879594802856445, -26.146547317504883, -24.413501739501953, -22.68045425415039, -20.947406768798828, -19.214359283447266, -17.481313705444336, -15.74826717376709, -14.015220642089844, -12.282173156738281, -10.549126625061035, -8.816080093383789, -7.083032608032227, -5.3499860763549805, -3.616943359375, -1.8838965892791748, -0.1508498191833496, 1.5821971893310547, 3.315243721008301, 5.048290252685547, 6.781337738037109, 8.514384269714355, 10.247430801391602, 11.980477333068848, 13.713523864746094, 15.446571350097656, 17.17961883544922, 18.91266441345215, 20.64571189880371, 22.37875747680664, 24.111804962158203, 25.844852447509766, 27.577898025512695, 29.310945510864258, 31.043991088867188, 32.77703857421875, 34.51008605957031, 36.243133544921875, 37.97618103027344, 39.709228515625, 41.44227600097656, 43.175323486328125, 44.90836715698242, 46.641414642333984, 48.37446212768555, 50.10750961303711, 51.840553283691406]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 14.0, 14.0, 22.0, 30.0, 50.0, 82.0, 137.0, 253.0, 1639.0, 1248495.0, 2941079.0, 1770.0, 317.0, 147.0, 81.0, 44.0, 39.0, 17.0, 14.0, 12.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.890625, -22.972900390625, -22.05517578125, -21.137451171875, -20.2197265625, -19.302001953125, -18.38427734375, -17.466552734375, -16.548828125, -15.631103515625, -14.71337890625, -13.795654296875, -12.8779296875, -11.960205078125, -11.04248046875, -10.124755859375, -9.20703125, -8.289306640625, -7.37158203125, -6.453857421875, -5.5361328125, -4.618408203125, -3.70068359375, -2.782958984375, -1.865234375, -0.947509765625, -0.02978515625, 0.887939453125, 1.8056640625, 2.723388671875, 3.64111328125, 4.558837890625, 5.4765625, 6.394287109375, 7.31201171875, 8.229736328125, 9.1474609375, 10.065185546875, 10.98291015625, 11.900634765625, 12.818359375, 13.736083984375, 14.65380859375, 15.571533203125, 16.4892578125, 17.406982421875, 18.32470703125, 19.242431640625, 20.16015625, 21.077880859375, 21.99560546875, 22.913330078125, 23.8310546875, 24.748779296875, 25.66650390625, 26.584228515625, 27.501953125, 28.419677734375, 29.33740234375, 30.255126953125, 31.1728515625, 32.090576171875, 33.00830078125, 33.926025390625, 34.84375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 6.0, 5.0, 0.0, 1.0, 2.0, 8.0, 8.0, 6.0, 5.0, 16.0, 23.0, 25.0, 25.0, 42.0, 29.0, 29.0, 46.0, 46.0, 54.0, 57.0, 62.0, 53.0, 47.0, 59.0, 45.0, 44.0, 42.0, 52.0, 32.0, 29.0, 27.0, 20.0, 13.0, 21.0, 11.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.46875, -4.35498046875, -4.2412109375, -4.12744140625, -4.013671875, -3.89990234375, -3.7861328125, -3.67236328125, -3.55859375, -3.44482421875, -3.3310546875, -3.21728515625, -3.103515625, -2.98974609375, -2.8759765625, -2.76220703125, -2.6484375, -2.53466796875, -2.4208984375, -2.30712890625, -2.193359375, -2.07958984375, -1.9658203125, -1.85205078125, -1.73828125, -1.62451171875, -1.5107421875, -1.39697265625, -1.283203125, -1.16943359375, -1.0556640625, -0.94189453125, -0.828125, -0.71435546875, -0.6005859375, -0.48681640625, -0.373046875, -0.25927734375, -0.1455078125, -0.03173828125, 0.08203125, 0.19580078125, 0.3095703125, 0.42333984375, 0.537109375, 0.65087890625, 0.7646484375, 0.87841796875, 0.9921875, 1.10595703125, 1.2197265625, 1.33349609375, 1.447265625, 1.56103515625, 1.6748046875, 1.78857421875, 1.90234375, 2.01611328125, 2.1298828125, 2.24365234375, 2.357421875, 2.47119140625, 2.5849609375, 2.69873046875, 2.8125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 9.0, 11.0, 15.0, 14.0, 42.0, 44.0, 81.0, 151.0, 222.0, 463.0, 878.0, 1666.0, 3966.0, 10174.0, 34389.0, 214353.0, 2951054.0, 873902.0, 74277.0, 17620.0, 5951.0, 2389.0, 1151.0, 622.0, 297.0, 188.0, 120.0, 89.0, 47.0, 28.0, 15.0, 16.0, 7.0, 7.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4765625, -5.2791748046875, -5.081787109375, -4.8843994140625, -4.68701171875, -4.4896240234375, -4.292236328125, -4.0948486328125, -3.8974609375, -3.7000732421875, -3.502685546875, -3.3052978515625, -3.10791015625, -2.9105224609375, -2.713134765625, -2.5157470703125, -2.318359375, -2.1209716796875, -1.923583984375, -1.7261962890625, -1.52880859375, -1.3314208984375, -1.134033203125, -0.9366455078125, -0.7392578125, -0.5418701171875, -0.344482421875, -0.1470947265625, 0.05029296875, 0.2476806640625, 0.445068359375, 0.6424560546875, 0.83984375, 1.0372314453125, 1.234619140625, 1.4320068359375, 1.62939453125, 1.8267822265625, 2.024169921875, 2.2215576171875, 2.4189453125, 2.6163330078125, 2.813720703125, 3.0111083984375, 3.20849609375, 3.4058837890625, 3.603271484375, 3.8006591796875, 3.998046875, 4.1954345703125, 4.392822265625, 4.5902099609375, 4.78759765625, 4.9849853515625, 5.182373046875, 5.3797607421875, 5.5771484375, 5.7745361328125, 5.971923828125, 6.1693115234375, 6.36669921875, 6.5640869140625, 6.761474609375, 6.9588623046875, 7.15625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 7.0, 7.0, 14.0, 12.0, 21.0, 38.0, 52.0, 87.0, 143.0, 269.0, 462.0, 705.0, 822.0, 580.0, 340.0, 186.0, 107.0, 53.0, 44.0, 38.0, 17.0, 8.0, 18.0, 6.0, 5.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5859375, -6.3753662109375, -6.164794921875, -5.9542236328125, -5.74365234375, -5.5330810546875, -5.322509765625, -5.1119384765625, -4.9013671875, -4.6907958984375, -4.480224609375, -4.2696533203125, -4.05908203125, -3.8485107421875, -3.637939453125, -3.4273681640625, -3.216796875, -3.0062255859375, -2.795654296875, -2.5850830078125, -2.37451171875, -2.1639404296875, -1.953369140625, -1.7427978515625, -1.5322265625, -1.3216552734375, -1.111083984375, -0.9005126953125, -0.68994140625, -0.4793701171875, -0.268798828125, -0.0582275390625, 0.15234375, 0.3629150390625, 0.573486328125, 0.7840576171875, 0.99462890625, 1.2052001953125, 1.415771484375, 1.6263427734375, 1.8369140625, 2.0474853515625, 2.258056640625, 2.4686279296875, 2.67919921875, 2.8897705078125, 3.100341796875, 3.3109130859375, 3.521484375, 3.7320556640625, 3.942626953125, 4.1531982421875, 4.36376953125, 4.5743408203125, 4.784912109375, 4.9954833984375, 5.2060546875, 5.4166259765625, 5.627197265625, 5.8377685546875, 6.04833984375, 6.2589111328125, 6.469482421875, 6.6800537109375, 6.890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 16.0, 27.0, 48.0, 85.0, 167.0, 207.0, 180.0, 146.0, 56.0, 24.0, 11.0, 10.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.01990509033203, -64.9867172241211, -62.95352554321289, -60.92033386230469, -58.88714599609375, -56.85395431518555, -54.820762634277344, -52.787574768066406, -50.75438690185547, -48.721195220947266, -46.68800735473633, -44.654815673828125, -42.62162780761719, -40.588436126708984, -38.55524444580078, -36.522056579589844, -34.48886489868164, -32.45567321777344, -30.4224853515625, -28.389293670654297, -26.35610580444336, -24.322914123535156, -22.289724349975586, -20.256534576416016, -18.223344802856445, -16.190155029296875, -14.156965255737305, -12.123774528503418, -10.090584754943848, -8.057394981384277, -6.024204254150391, -3.9910144805908203, -1.9578208923339844, 0.07536911964416504, 2.1085591316223145, 4.141749382019043, 6.174939155578613, 8.208128929138184, 10.24131965637207, 12.27450942993164, 14.307699203491211, 16.34088897705078, 18.37407875061035, 20.407268524169922, 22.440460205078125, 24.473648071289062, 26.506839752197266, 28.540029525756836, 30.573219299316406, 32.60641098022461, 34.63959884643555, 36.67279052734375, 38.70597839355469, 40.73917007446289, 42.772361755371094, 44.80554962158203, 46.83873748779297, 48.87192916870117, 50.90511703491211, 52.93830871582031, 54.97149658203125, 57.00468826293945, 59.037879943847656, 61.071067810058594, 63.1042594909668]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 7.0, 12.0, 12.0, 12.0, 15.0, 21.0, 20.0, 19.0, 27.0, 31.0, 21.0, 34.0, 38.0, 47.0, 50.0, 42.0, 51.0, 52.0, 48.0, 38.0, 33.0, 46.0, 47.0, 41.0, 33.0, 29.0, 26.0, 27.0, 27.0, 12.0, 15.0, 10.0, 10.0, 6.0, 4.0, 5.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.61740493774414, -22.8070068359375, -21.99660873413086, -21.18621063232422, -20.375810623168945, -19.565412521362305, -18.755014419555664, -17.944616317749023, -17.13421630859375, -16.32381820678711, -15.513419151306152, -14.703021049499512, -13.892621994018555, -13.082223892211914, -12.271825790405273, -11.461427688598633, -10.651029586791992, -9.840631484985352, -9.030232429504395, -8.219834327697754, -7.409435749053955, -6.599037170410156, -5.788639068603516, -4.978240489959717, -4.167841911315918, -3.357443332672119, -2.5470449924468994, -1.7366466522216797, -0.9262480735778809, -0.11584949493408203, 0.6945486068725586, 1.5049471855163574, 2.3153457641601562, 3.125744342803955, 3.936142683029175, 4.7465410232543945, 5.556939601898193, 6.367338180541992, 7.177736282348633, 7.988134860992432, 8.79853343963623, 9.608931541442871, 10.419330596923828, 11.229728698730469, 12.04012680053711, 12.850525856018066, 13.660923957824707, 14.471323013305664, 15.281721115112305, 16.092119216918945, 16.902517318725586, 17.71291732788086, 18.5233154296875, 19.33371353149414, 20.14411163330078, 20.954509735107422, 21.764907836914062, 22.575305938720703, 23.385704040527344, 24.196102142333984, 25.006502151489258, 25.8169002532959, 26.62729835510254, 27.43769645690918, 28.248096466064453]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 12.0, 5.0, 10.0, 18.0, 13.0, 39.0, 41.0, 81.0, 106.0, 175.0, 242.0, 396.0, 677.0, 1181.0, 1882.0, 3507.0, 6548.0, 12387.0, 24335.0, 51175.0, 116088.0, 260839.0, 299696.0, 144679.0, 63278.0, 29183.0, 14607.0, 7535.0, 4131.0, 2259.0, 1374.0, 757.0, 487.0, 268.0, 185.0, 129.0, 71.0, 45.0, 31.0, 22.0, 19.0, 16.0, 4.0, 14.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.08984375, -3.973419189453125, -3.85699462890625, -3.740570068359375, -3.6241455078125, -3.507720947265625, -3.39129638671875, -3.274871826171875, -3.158447265625, -3.042022705078125, -2.92559814453125, -2.809173583984375, -2.6927490234375, -2.576324462890625, -2.45989990234375, -2.343475341796875, -2.22705078125, -2.110626220703125, -1.99420166015625, -1.877777099609375, -1.7613525390625, -1.644927978515625, -1.52850341796875, -1.412078857421875, -1.295654296875, -1.179229736328125, -1.06280517578125, -0.946380615234375, -0.8299560546875, -0.713531494140625, -0.59710693359375, -0.480682373046875, -0.3642578125, -0.247833251953125, -0.13140869140625, -0.014984130859375, 0.1014404296875, 0.217864990234375, 0.33428955078125, 0.450714111328125, 0.567138671875, 0.683563232421875, 0.79998779296875, 0.916412353515625, 1.0328369140625, 1.149261474609375, 1.26568603515625, 1.382110595703125, 1.49853515625, 1.614959716796875, 1.73138427734375, 1.847808837890625, 1.9642333984375, 2.080657958984375, 2.19708251953125, 2.313507080078125, 2.429931640625, 2.546356201171875, 2.66278076171875, 2.779205322265625, 2.8956298828125, 3.012054443359375, 3.12847900390625, 3.244903564453125, 3.361328125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 10.0, 7.0, 8.0, 14.0, 15.0, 15.0, 16.0, 25.0, 28.0, 25.0, 28.0, 29.0, 36.0, 47.0, 35.0, 42.0, 50.0, 47.0, 40.0, 48.0, 45.0, 44.0, 37.0, 28.0, 29.0, 29.0, 32.0, 25.0, 36.0, 19.0, 29.0, 15.0, 14.0, 9.0, 6.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.775634765625, -2.68408203125, -2.592529296875, -2.5009765625, -2.409423828125, -2.31787109375, -2.226318359375, -2.134765625, -2.043212890625, -1.95166015625, -1.860107421875, -1.7685546875, -1.677001953125, -1.58544921875, -1.493896484375, -1.40234375, -1.310791015625, -1.21923828125, -1.127685546875, -1.0361328125, -0.944580078125, -0.85302734375, -0.761474609375, -0.669921875, -0.578369140625, -0.48681640625, -0.395263671875, -0.3037109375, -0.212158203125, -0.12060546875, -0.029052734375, 0.0625, 0.154052734375, 0.24560546875, 0.337158203125, 0.4287109375, 0.520263671875, 0.61181640625, 0.703369140625, 0.794921875, 0.886474609375, 0.97802734375, 1.069580078125, 1.1611328125, 1.252685546875, 1.34423828125, 1.435791015625, 1.52734375, 1.618896484375, 1.71044921875, 1.802001953125, 1.8935546875, 1.985107421875, 2.07666015625, 2.168212890625, 2.259765625, 2.351318359375, 2.44287109375, 2.534423828125, 2.6259765625, 2.717529296875, 2.80908203125, 2.900634765625, 2.9921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 9.0, 20.0, 20.0, 43.0, 74.0, 114.0, 203.0, 363.0, 872.0, 2449.0, 9593.0, 66058.0, 772733.0, 171693.0, 18153.0, 3768.0, 1227.0, 517.0, 247.0, 155.0, 67.0, 47.0, 23.0, 30.0, 15.0, 16.0, 6.0, 1.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0859375, -14.6632080078125, -14.240478515625, -13.8177490234375, -13.39501953125, -12.9722900390625, -12.549560546875, -12.1268310546875, -11.7041015625, -11.2813720703125, -10.858642578125, -10.4359130859375, -10.01318359375, -9.5904541015625, -9.167724609375, -8.7449951171875, -8.322265625, -7.8995361328125, -7.476806640625, -7.0540771484375, -6.63134765625, -6.2086181640625, -5.785888671875, -5.3631591796875, -4.9404296875, -4.5177001953125, -4.094970703125, -3.6722412109375, -3.24951171875, -2.8267822265625, -2.404052734375, -1.9813232421875, -1.55859375, -1.1358642578125, -0.713134765625, -0.2904052734375, 0.13232421875, 0.5550537109375, 0.977783203125, 1.4005126953125, 1.8232421875, 2.2459716796875, 2.668701171875, 3.0914306640625, 3.51416015625, 3.9368896484375, 4.359619140625, 4.7823486328125, 5.205078125, 5.6278076171875, 6.050537109375, 6.4732666015625, 6.89599609375, 7.3187255859375, 7.741455078125, 8.1641845703125, 8.5869140625, 9.0096435546875, 9.432373046875, 9.8551025390625, 10.27783203125, 10.7005615234375, 11.123291015625, 11.5460205078125, 11.96875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 8.0, 9.0, 10.0, 13.0, 14.0, 16.0, 18.0, 30.0, 19.0, 30.0, 29.0, 35.0, 57.0, 62.0, 54.0, 62.0, 74.0, 71.0, 51.0, 42.0, 37.0, 40.0, 31.0, 22.0, 37.0, 20.0, 19.0, 18.0, 15.0, 10.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.052978515625, -14.59814453125, -14.143310546875, -13.6884765625, -13.233642578125, -12.77880859375, -12.323974609375, -11.869140625, -11.414306640625, -10.95947265625, -10.504638671875, -10.0498046875, -9.594970703125, -9.14013671875, -8.685302734375, -8.23046875, -7.775634765625, -7.32080078125, -6.865966796875, -6.4111328125, -5.956298828125, -5.50146484375, -5.046630859375, -4.591796875, -4.136962890625, -3.68212890625, -3.227294921875, -2.7724609375, -2.317626953125, -1.86279296875, -1.407958984375, -0.953125, -0.498291015625, -0.04345703125, 0.411376953125, 0.8662109375, 1.321044921875, 1.77587890625, 2.230712890625, 2.685546875, 3.140380859375, 3.59521484375, 4.050048828125, 4.5048828125, 4.959716796875, 5.41455078125, 5.869384765625, 6.32421875, 6.779052734375, 7.23388671875, 7.688720703125, 8.1435546875, 8.598388671875, 9.05322265625, 9.508056640625, 9.962890625, 10.417724609375, 10.87255859375, 11.327392578125, 11.7822265625, 12.237060546875, 12.69189453125, 13.146728515625, 13.6015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 18.0, 24.0, 62.0, 136.0, 417.0, 1534.0, 11937.0, 406207.0, 611973.0, 13860.0, 1693.0, 418.0, 137.0, 54.0, 26.0, 11.0, 13.0, 6.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.75390625, -7.41717529296875, -7.0804443359375, -6.74371337890625, -6.406982421875, -6.07025146484375, -5.7335205078125, -5.39678955078125, -5.06005859375, -4.72332763671875, -4.3865966796875, -4.04986572265625, -3.713134765625, -3.37640380859375, -3.0396728515625, -2.70294189453125, -2.3662109375, -2.02947998046875, -1.6927490234375, -1.35601806640625, -1.019287109375, -0.68255615234375, -0.3458251953125, -0.00909423828125, 0.32763671875, 0.66436767578125, 1.0010986328125, 1.33782958984375, 1.674560546875, 2.01129150390625, 2.3480224609375, 2.68475341796875, 3.021484375, 3.35821533203125, 3.6949462890625, 4.03167724609375, 4.368408203125, 4.70513916015625, 5.0418701171875, 5.37860107421875, 5.71533203125, 6.05206298828125, 6.3887939453125, 6.72552490234375, 7.062255859375, 7.39898681640625, 7.7357177734375, 8.07244873046875, 8.4091796875, 8.74591064453125, 9.0826416015625, 9.41937255859375, 9.756103515625, 10.09283447265625, 10.4295654296875, 10.76629638671875, 11.10302734375, 11.43975830078125, 11.7764892578125, 12.11322021484375, 12.449951171875, 12.78668212890625, 13.1234130859375, 13.46014404296875, 13.796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 9.0, 4.0, 8.0, 12.0, 10.0, 20.0, 17.0, 41.0, 52.0, 66.0, 102.0, 146.0, 112.0, 128.0, 66.0, 37.0, 31.0, 26.0, 18.0, 21.0, 18.0, 7.0, 8.0, 7.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010356903076171875, -0.0010033398866653442, -0.000970989465713501, -0.0009386390447616577, -0.0009062886238098145, -0.0008739382028579712, -0.0008415877819061279, -0.0008092373609542847, -0.0007768869400024414, -0.0007445365190505981, -0.0007121860980987549, -0.0006798356771469116, -0.0006474852561950684, -0.0006151348352432251, -0.0005827844142913818, -0.0005504339933395386, -0.0005180835723876953, -0.00048573315143585205, -0.0004533827304840088, -0.00042103230953216553, -0.00038868188858032227, -0.000356331467628479, -0.00032398104667663574, -0.0002916306257247925, -0.0002592802047729492, -0.00022692978382110596, -0.0001945793628692627, -0.00016222894191741943, -0.00012987852096557617, -9.752810001373291e-05, -6.517767906188965e-05, -3.282725811004639e-05, -4.76837158203125e-07, 3.187358379364014e-05, 6.42240047454834e-05, 9.657442569732666e-05, 0.00012892484664916992, 0.00016127526760101318, 0.00019362568855285645, 0.0002259761095046997, 0.00025832653045654297, 0.00029067695140838623, 0.0003230273723602295, 0.00035537779331207275, 0.000387728214263916, 0.0004200786352157593, 0.00045242905616760254, 0.0004847794771194458, 0.0005171298980712891, 0.0005494803190231323, 0.0005818307399749756, 0.0006141811609268188, 0.0006465315818786621, 0.0006788820028305054, 0.0007112324237823486, 0.0007435828447341919, 0.0007759332656860352, 0.0008082836866378784, 0.0008406341075897217, 0.0008729845285415649, 0.0009053349494934082, 0.0009376853704452515, 0.0009700357913970947, 0.001002386212348938, 0.0010347366333007812]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 3.0, 11.0, 9.0, 22.0, 27.0, 35.0, 50.0, 80.0, 135.0, 173.0, 341.0, 582.0, 1146.0, 2604.0, 7201.0, 23943.0, 119765.0, 710470.0, 141890.0, 26643.0, 7809.0, 2737.0, 1265.0, 641.0, 337.0, 198.0, 138.0, 91.0, 59.0, 28.0, 34.0, 23.0, 21.0, 13.0, 11.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.2608642578125, -4.111572265625, -3.9622802734375, -3.81298828125, -3.6636962890625, -3.514404296875, -3.3651123046875, -3.2158203125, -3.0665283203125, -2.917236328125, -2.7679443359375, -2.61865234375, -2.4693603515625, -2.320068359375, -2.1707763671875, -2.021484375, -1.8721923828125, -1.722900390625, -1.5736083984375, -1.42431640625, -1.2750244140625, -1.125732421875, -0.9764404296875, -0.8271484375, -0.6778564453125, -0.528564453125, -0.3792724609375, -0.22998046875, -0.0806884765625, 0.068603515625, 0.2178955078125, 0.3671875, 0.5164794921875, 0.665771484375, 0.8150634765625, 0.96435546875, 1.1136474609375, 1.262939453125, 1.4122314453125, 1.5615234375, 1.7108154296875, 1.860107421875, 2.0093994140625, 2.15869140625, 2.3079833984375, 2.457275390625, 2.6065673828125, 2.755859375, 2.9051513671875, 3.054443359375, 3.2037353515625, 3.35302734375, 3.5023193359375, 3.651611328125, 3.8009033203125, 3.9501953125, 4.0994873046875, 4.248779296875, 4.3980712890625, 4.54736328125, 4.6966552734375, 4.845947265625, 4.9952392578125, 5.14453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 6.0, 3.0, 6.0, 4.0, 10.0, 5.0, 11.0, 13.0, 24.0, 27.0, 42.0, 49.0, 75.0, 82.0, 95.0, 91.0, 99.0, 66.0, 85.0, 51.0, 46.0, 25.0, 18.0, 23.0, 14.0, 4.0, 2.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.62652587890625, -4.4835205078125, -4.34051513671875, -4.197509765625, -4.05450439453125, -3.9114990234375, -3.76849365234375, -3.62548828125, -3.48248291015625, -3.3394775390625, -3.19647216796875, -3.053466796875, -2.91046142578125, -2.7674560546875, -2.62445068359375, -2.4814453125, -2.33843994140625, -2.1954345703125, -2.05242919921875, -1.909423828125, -1.76641845703125, -1.6234130859375, -1.48040771484375, -1.33740234375, -1.19439697265625, -1.0513916015625, -0.90838623046875, -0.765380859375, -0.62237548828125, -0.4793701171875, -0.33636474609375, -0.193359375, -0.05035400390625, 0.0926513671875, 0.23565673828125, 0.378662109375, 0.52166748046875, 0.6646728515625, 0.80767822265625, 0.95068359375, 1.09368896484375, 1.2366943359375, 1.37969970703125, 1.522705078125, 1.66571044921875, 1.8087158203125, 1.95172119140625, 2.0947265625, 2.23773193359375, 2.3807373046875, 2.52374267578125, 2.666748046875, 2.80975341796875, 2.9527587890625, 3.09576416015625, 3.23876953125, 3.38177490234375, 3.5247802734375, 3.66778564453125, 3.810791015625, 3.95379638671875, 4.0968017578125, 4.23980712890625, 4.3828125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 8.0, 11.0, 26.0, 48.0, 142.0, 338.0, 224.0, 130.0, 44.0, 20.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.65896606445312, -73.74069213867188, -69.8224105834961, -65.90413665771484, -61.98585510253906, -58.06758117675781, -54.1493034362793, -50.23102569580078, -46.312747955322266, -42.39447021484375, -38.476192474365234, -34.55791473388672, -30.639638900756836, -26.72136116027832, -22.803085327148438, -18.884807586669922, -14.966529846191406, -11.04825210571289, -7.129975318908691, -3.211698532104492, 0.7065792083740234, 4.624856948852539, 8.543132781982422, 12.461410522460938, 16.379688262939453, 20.29796600341797, 24.216243743896484, 28.134519577026367, 32.05279541015625, 35.97107696533203, 39.88935089111328, 43.8076286315918, 47.72590637207031, 51.64418411254883, 55.562461853027344, 59.480735778808594, 63.399017333984375, 67.31729125976562, 71.23556518554688, 75.15384674072266, 79.07212829589844, 82.99040222167969, 86.90868377685547, 90.82695770263672, 94.7452392578125, 98.66351318359375, 102.581787109375, 106.50006866455078, 110.41834259033203, 114.33661651611328, 118.25489807128906, 122.17317199707031, 126.0914535522461, 130.00973510742188, 133.92800903320312, 137.84628295898438, 141.76455688476562, 145.68283081054688, 149.60110473632812, 153.51939392089844, 157.4376678466797, 161.35594177246094, 165.2742156982422, 169.1925048828125, 173.11077880859375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 7.0, 5.0, 9.0, 11.0, 9.0, 15.0, 20.0, 18.0, 19.0, 28.0, 31.0, 32.0, 33.0, 25.0, 40.0, 41.0, 54.0, 46.0, 37.0, 65.0, 47.0, 58.0, 47.0, 33.0, 37.0, 36.0, 32.0, 25.0, 20.0, 27.0, 17.0, 15.0, 11.0, 11.0, 6.0, 9.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.30426025390625, -43.69240188598633, -42.080543518066406, -40.468685150146484, -38.85682678222656, -37.24496841430664, -35.63311004638672, -34.0212516784668, -32.409393310546875, -30.797534942626953, -29.18567657470703, -27.57381820678711, -25.961959838867188, -24.350101470947266, -22.738243103027344, -21.126384735107422, -19.514528274536133, -17.90266990661621, -16.29081153869629, -14.678953170776367, -13.067094802856445, -11.45523738861084, -9.843379020690918, -8.231520652770996, -6.619662284851074, -5.007803916931152, -3.3959457874298096, -1.7840876579284668, -0.17222929000854492, 1.4396286010742188, 3.0514869689941406, 4.6633453369140625, 6.275203704833984, 7.887062072753906, 9.498920440673828, 11.11077880859375, 12.722637176513672, 14.334494590759277, 15.9463529586792, 17.558212280273438, 19.17007064819336, 20.78192901611328, 22.393787384033203, 24.005645751953125, 25.617504119873047, 27.22936248779297, 28.84122085571289, 30.453079223632812, 32.06493377685547, 33.67679214477539, 35.28865051269531, 36.900508880615234, 38.512367248535156, 40.12422561645508, 41.736083984375, 43.34794235229492, 44.959800720214844, 46.571659088134766, 48.18351745605469, 49.79537582397461, 51.40723419189453, 53.01909255981445, 54.630950927734375, 56.2428092956543, 57.85466766357422]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 6.0, 6.0, 9.0, 10.0, 18.0, 23.0, 38.0, 56.0, 83.0, 131.0, 257.0, 362.0, 791.0, 1474.0, 2941.0, 6677.0, 17368.0, 56378.0, 294909.0, 1984249.0, 1545879.0, 212504.0, 44781.0, 14182.0, 5643.0, 2555.0, 1246.0, 664.0, 402.0, 220.0, 137.0, 87.0, 45.0, 50.0, 24.0, 25.0, 14.0, 7.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.28125, -4.15118408203125, -4.0211181640625, -3.89105224609375, -3.760986328125, -3.63092041015625, -3.5008544921875, -3.37078857421875, -3.24072265625, -3.11065673828125, -2.9805908203125, -2.85052490234375, -2.720458984375, -2.59039306640625, -2.4603271484375, -2.33026123046875, -2.2001953125, -2.07012939453125, -1.9400634765625, -1.80999755859375, -1.679931640625, -1.54986572265625, -1.4197998046875, -1.28973388671875, -1.15966796875, -1.02960205078125, -0.8995361328125, -0.76947021484375, -0.639404296875, -0.50933837890625, -0.3792724609375, -0.24920654296875, -0.119140625, 0.01092529296875, 0.1409912109375, 0.27105712890625, 0.401123046875, 0.53118896484375, 0.6612548828125, 0.79132080078125, 0.92138671875, 1.05145263671875, 1.1815185546875, 1.31158447265625, 1.441650390625, 1.57171630859375, 1.7017822265625, 1.83184814453125, 1.9619140625, 2.09197998046875, 2.2220458984375, 2.35211181640625, 2.482177734375, 2.61224365234375, 2.7423095703125, 2.87237548828125, 3.00244140625, 3.13250732421875, 3.2625732421875, 3.39263916015625, 3.522705078125, 3.65277099609375, 3.7828369140625, 3.91290283203125, 4.04296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 11.0, 21.0, 11.0, 19.0, 30.0, 32.0, 35.0, 35.0, 33.0, 33.0, 45.0, 46.0, 52.0, 46.0, 47.0, 48.0, 49.0, 31.0, 57.0, 45.0, 34.0, 33.0, 36.0, 34.0, 26.0, 17.0, 12.0, 20.0, 15.0, 10.0, 1.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.525390625, -3.426300048828125, -3.32720947265625, -3.228118896484375, -3.1290283203125, -3.029937744140625, -2.93084716796875, -2.831756591796875, -2.732666015625, -2.633575439453125, -2.53448486328125, -2.435394287109375, -2.3363037109375, -2.237213134765625, -2.13812255859375, -2.039031982421875, -1.93994140625, -1.840850830078125, -1.74176025390625, -1.642669677734375, -1.5435791015625, -1.444488525390625, -1.34539794921875, -1.246307373046875, -1.147216796875, -1.048126220703125, -0.94903564453125, -0.849945068359375, -0.7508544921875, -0.651763916015625, -0.55267333984375, -0.453582763671875, -0.3544921875, -0.255401611328125, -0.15631103515625, -0.057220458984375, 0.0418701171875, 0.140960693359375, 0.24005126953125, 0.339141845703125, 0.438232421875, 0.537322998046875, 0.63641357421875, 0.735504150390625, 0.8345947265625, 0.933685302734375, 1.03277587890625, 1.131866455078125, 1.23095703125, 1.330047607421875, 1.42913818359375, 1.528228759765625, 1.6273193359375, 1.726409912109375, 1.82550048828125, 1.924591064453125, 2.023681640625, 2.122772216796875, 2.22186279296875, 2.320953369140625, 2.4200439453125, 2.519134521484375, 2.61822509765625, 2.717315673828125, 2.81640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 3.0, 7.0, 5.0, 13.0, 15.0, 19.0, 52.0, 106.0, 187.0, 489.0, 1769.0, 9368.0, 93839.0, 3547178.0, 512619.0, 23521.0, 3418.0, 924.0, 367.0, 205.0, 74.0, 48.0, 23.0, 10.0, 10.0, 3.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.466796875, -8.05859375, -7.650390625, -7.2421875, -6.833984375, -6.42578125, -6.017578125, -5.609375, -5.201171875, -4.79296875, -4.384765625, -3.9765625, -3.568359375, -3.16015625, -2.751953125, -2.34375, -1.935546875, -1.52734375, -1.119140625, -0.7109375, -0.302734375, 0.10546875, 0.513671875, 0.921875, 1.330078125, 1.73828125, 2.146484375, 2.5546875, 2.962890625, 3.37109375, 3.779296875, 4.1875, 4.595703125, 5.00390625, 5.412109375, 5.8203125, 6.228515625, 6.63671875, 7.044921875, 7.453125, 7.861328125, 8.26953125, 8.677734375, 9.0859375, 9.494140625, 9.90234375, 10.310546875, 10.71875, 11.126953125, 11.53515625, 11.943359375, 12.3515625, 12.759765625, 13.16796875, 13.576171875, 13.984375, 14.392578125, 14.80078125, 15.208984375, 15.6171875, 16.025390625, 16.43359375, 16.841796875, 17.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 15.0, 14.0, 31.0, 38.0, 45.0, 60.0, 99.0, 152.0, 277.0, 476.0, 803.0, 759.0, 537.0, 295.0, 155.0, 105.0, 56.0, 39.0, 32.0, 22.0, 15.0, 9.0, 8.0, 3.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.10546875, -5.81658935546875, -5.5277099609375, -5.23883056640625, -4.949951171875, -4.66107177734375, -4.3721923828125, -4.08331298828125, -3.79443359375, -3.50555419921875, -3.2166748046875, -2.92779541015625, -2.638916015625, -2.35003662109375, -2.0611572265625, -1.77227783203125, -1.4833984375, -1.19451904296875, -0.9056396484375, -0.61676025390625, -0.327880859375, -0.03900146484375, 0.2498779296875, 0.53875732421875, 0.82763671875, 1.11651611328125, 1.4053955078125, 1.69427490234375, 1.983154296875, 2.27203369140625, 2.5609130859375, 2.84979248046875, 3.138671875, 3.42755126953125, 3.7164306640625, 4.00531005859375, 4.294189453125, 4.58306884765625, 4.8719482421875, 5.16082763671875, 5.44970703125, 5.73858642578125, 6.0274658203125, 6.31634521484375, 6.605224609375, 6.89410400390625, 7.1829833984375, 7.47186279296875, 7.7607421875, 8.04962158203125, 8.3385009765625, 8.62738037109375, 8.916259765625, 9.20513916015625, 9.4940185546875, 9.78289794921875, 10.07177734375, 10.36065673828125, 10.6495361328125, 10.93841552734375, 11.227294921875, 11.51617431640625, 11.8050537109375, 12.09393310546875, 12.3828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 23.0, 26.0, 47.0, 62.0, 111.0, 162.0, 130.0, 126.0, 102.0, 59.0, 46.0, 28.0, 13.0, 6.0, 8.0, 3.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.352508544921875, -57.27739715576172, -55.2022819519043, -53.127166748046875, -51.05205535888672, -48.97694396972656, -46.90182876586914, -44.82671356201172, -42.75160217285156, -40.676490783691406, -38.601375579833984, -36.52626037597656, -34.451148986816406, -32.37603759765625, -30.300922393798828, -28.22580909729004, -26.15069580078125, -24.07558250427246, -22.000469207763672, -19.925355911254883, -17.850242614746094, -15.775129318237305, -13.700016021728516, -11.624902725219727, -9.549789428710938, -7.474676132202148, -5.399562835693359, -3.3244495391845703, -1.2493362426757812, 0.8257770538330078, 2.900890350341797, 4.976003646850586, 7.051109313964844, 9.126222610473633, 11.201335906982422, 13.276449203491211, 15.3515625, 17.42667579650879, 19.501789093017578, 21.576902389526367, 23.652015686035156, 25.727128982543945, 27.802242279052734, 29.877355575561523, 31.952468872070312, 34.02758026123047, 36.10269546508789, 38.17781066894531, 40.25292205810547, 42.328033447265625, 44.40314865112305, 46.47826385498047, 48.553375244140625, 50.62848663330078, 52.7036018371582, 54.778717041015625, 56.85382843017578, 58.92893981933594, 61.00405502319336, 63.07917022705078, 65.15428161621094, 67.2293930053711, 69.30450439453125, 71.37962341308594, 73.4547348022461]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 7.0, 5.0, 8.0, 9.0, 10.0, 8.0, 18.0, 14.0, 29.0, 27.0, 25.0, 34.0, 26.0, 33.0, 36.0, 45.0, 32.0, 47.0, 40.0, 48.0, 35.0, 51.0, 42.0, 46.0, 42.0, 40.0, 39.0, 27.0, 23.0, 21.0, 20.0, 22.0, 20.0, 16.0, 7.0, 17.0, 14.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.987953186035156, -34.789764404296875, -33.591575622558594, -32.39338302612305, -31.195194244384766, -29.997005462646484, -28.79881477355957, -27.600624084472656, -26.402435302734375, -25.204246520996094, -24.00605583190918, -22.807865142822266, -21.609676361083984, -20.411487579345703, -19.21329689025879, -18.015106201171875, -16.816917419433594, -15.618727684020996, -14.420537948608398, -13.2223482131958, -12.024158477783203, -10.825968742370605, -9.627779006958008, -8.42958927154541, -7.2313995361328125, -6.033209800720215, -4.835020065307617, -3.6368303298950195, -2.438640594482422, -1.2404508590698242, -0.04226112365722656, 1.155928611755371, 2.3541221618652344, 3.552311897277832, 4.75050163269043, 5.948691368103027, 7.146881103515625, 8.345070838928223, 9.54326057434082, 10.741450309753418, 11.939640045166016, 13.137829780578613, 14.336019515991211, 15.534209251403809, 16.732398986816406, 17.930587768554688, 19.1287784576416, 20.326969146728516, 21.525157928466797, 22.723346710205078, 23.921537399291992, 25.119728088378906, 26.317916870117188, 27.51610565185547, 28.714296340942383, 29.912487030029297, 31.110675811767578, 32.30886459350586, 33.507057189941406, 34.70524597167969, 35.90343475341797, 37.10162353515625, 38.29981231689453, 39.49800491333008, 40.69619369506836]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 0.0, 3.0, 8.0, 8.0, 17.0, 17.0, 18.0, 18.0, 39.0, 57.0, 119.0, 179.0, 289.0, 430.0, 750.0, 1337.0, 2370.0, 4686.0, 9465.0, 20552.0, 44445.0, 100904.0, 226102.0, 315433.0, 177058.0, 78156.0, 34412.0, 15901.0, 7519.0, 3646.0, 1985.0, 1051.0, 551.0, 389.0, 218.0, 141.0, 104.0, 58.0, 35.0, 29.0, 22.0, 10.0, 4.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8359375, -3.7052001953125, -3.574462890625, -3.4437255859375, -3.31298828125, -3.1822509765625, -3.051513671875, -2.9207763671875, -2.7900390625, -2.6593017578125, -2.528564453125, -2.3978271484375, -2.26708984375, -2.1363525390625, -2.005615234375, -1.8748779296875, -1.744140625, -1.6134033203125, -1.482666015625, -1.3519287109375, -1.22119140625, -1.0904541015625, -0.959716796875, -0.8289794921875, -0.6982421875, -0.5675048828125, -0.436767578125, -0.3060302734375, -0.17529296875, -0.0445556640625, 0.086181640625, 0.2169189453125, 0.34765625, 0.4783935546875, 0.609130859375, 0.7398681640625, 0.87060546875, 1.0013427734375, 1.132080078125, 1.2628173828125, 1.3935546875, 1.5242919921875, 1.655029296875, 1.7857666015625, 1.91650390625, 2.0472412109375, 2.177978515625, 2.3087158203125, 2.439453125, 2.5701904296875, 2.700927734375, 2.8316650390625, 2.96240234375, 3.0931396484375, 3.223876953125, 3.3546142578125, 3.4853515625, 3.6160888671875, 3.746826171875, 3.8775634765625, 4.00830078125, 4.1390380859375, 4.269775390625, 4.4005126953125, 4.53125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 17.0, 13.0, 7.0, 14.0, 20.0, 19.0, 22.0, 31.0, 35.0, 31.0, 38.0, 43.0, 39.0, 43.0, 38.0, 58.0, 34.0, 39.0, 42.0, 43.0, 35.0, 41.0, 32.0, 33.0, 28.0, 21.0, 35.0, 18.0, 17.0, 18.0, 10.0, 14.0, 12.0, 8.0, 3.0, 8.0, 3.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.818359375, -2.73150634765625, -2.6446533203125, -2.55780029296875, -2.470947265625, -2.38409423828125, -2.2972412109375, -2.21038818359375, -2.12353515625, -2.03668212890625, -1.9498291015625, -1.86297607421875, -1.776123046875, -1.68927001953125, -1.6024169921875, -1.51556396484375, -1.4287109375, -1.34185791015625, -1.2550048828125, -1.16815185546875, -1.081298828125, -0.99444580078125, -0.9075927734375, -0.82073974609375, -0.73388671875, -0.64703369140625, -0.5601806640625, -0.47332763671875, -0.386474609375, -0.29962158203125, -0.2127685546875, -0.12591552734375, -0.0390625, 0.04779052734375, 0.1346435546875, 0.22149658203125, 0.308349609375, 0.39520263671875, 0.4820556640625, 0.56890869140625, 0.65576171875, 0.74261474609375, 0.8294677734375, 0.91632080078125, 1.003173828125, 1.09002685546875, 1.1768798828125, 1.26373291015625, 1.3505859375, 1.43743896484375, 1.5242919921875, 1.61114501953125, 1.697998046875, 1.78485107421875, 1.8717041015625, 1.95855712890625, 2.04541015625, 2.13226318359375, 2.2191162109375, 2.30596923828125, 2.392822265625, 2.47967529296875, 2.5665283203125, 2.65338134765625, 2.740234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 10.0, 9.0, 13.0, 12.0, 14.0, 19.0, 35.0, 63.0, 81.0, 141.0, 192.0, 349.0, 565.0, 1082.0, 2426.0, 6518.0, 31169.0, 319643.0, 623961.0, 47800.0, 8546.0, 2961.0, 1266.0, 678.0, 371.0, 202.0, 145.0, 85.0, 66.0, 37.0, 33.0, 16.0, 10.0, 8.0, 7.0, 10.0, 6.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6015625, -12.1964111328125, -11.791259765625, -11.3861083984375, -10.98095703125, -10.5758056640625, -10.170654296875, -9.7655029296875, -9.3603515625, -8.9552001953125, -8.550048828125, -8.1448974609375, -7.73974609375, -7.3345947265625, -6.929443359375, -6.5242919921875, -6.119140625, -5.7139892578125, -5.308837890625, -4.9036865234375, -4.49853515625, -4.0933837890625, -3.688232421875, -3.2830810546875, -2.8779296875, -2.4727783203125, -2.067626953125, -1.6624755859375, -1.25732421875, -0.8521728515625, -0.447021484375, -0.0418701171875, 0.36328125, 0.7684326171875, 1.173583984375, 1.5787353515625, 1.98388671875, 2.3890380859375, 2.794189453125, 3.1993408203125, 3.6044921875, 4.0096435546875, 4.414794921875, 4.8199462890625, 5.22509765625, 5.6302490234375, 6.035400390625, 6.4405517578125, 6.845703125, 7.2508544921875, 7.656005859375, 8.0611572265625, 8.46630859375, 8.8714599609375, 9.276611328125, 9.6817626953125, 10.0869140625, 10.4920654296875, 10.897216796875, 11.3023681640625, 11.70751953125, 12.1126708984375, 12.517822265625, 12.9229736328125, 13.328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 6.0, 2.0, 2.0, 7.0, 9.0, 10.0, 9.0, 19.0, 19.0, 31.0, 23.0, 41.0, 45.0, 49.0, 55.0, 50.0, 55.0, 42.0, 62.0, 52.0, 54.0, 48.0, 49.0, 40.0, 36.0, 34.0, 34.0, 24.0, 26.0, 20.0, 10.0, 17.0, 3.0, 4.0, 6.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.15625, -15.6763916015625, -15.196533203125, -14.7166748046875, -14.23681640625, -13.7569580078125, -13.277099609375, -12.7972412109375, -12.3173828125, -11.8375244140625, -11.357666015625, -10.8778076171875, -10.39794921875, -9.9180908203125, -9.438232421875, -8.9583740234375, -8.478515625, -7.9986572265625, -7.518798828125, -7.0389404296875, -6.55908203125, -6.0792236328125, -5.599365234375, -5.1195068359375, -4.6396484375, -4.1597900390625, -3.679931640625, -3.2000732421875, -2.72021484375, -2.2403564453125, -1.760498046875, -1.2806396484375, -0.80078125, -0.3209228515625, 0.158935546875, 0.6387939453125, 1.11865234375, 1.5985107421875, 2.078369140625, 2.5582275390625, 3.0380859375, 3.5179443359375, 3.997802734375, 4.4776611328125, 4.95751953125, 5.4373779296875, 5.917236328125, 6.3970947265625, 6.876953125, 7.3568115234375, 7.836669921875, 8.3165283203125, 8.79638671875, 9.2762451171875, 9.756103515625, 10.2359619140625, 10.7158203125, 11.1956787109375, 11.675537109375, 12.1553955078125, 12.63525390625, 13.1151123046875, 13.594970703125, 14.0748291015625, 14.5546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 3.0, 6.0, 13.0, 17.0, 17.0, 39.0, 32.0, 55.0, 72.0, 97.0, 179.0, 241.0, 379.0, 626.0, 997.0, 1799.0, 3759.0, 8757.0, 25082.0, 85721.0, 541910.0, 279767.0, 64801.0, 19549.0, 7287.0, 3132.0, 1614.0, 931.0, 576.0, 344.0, 232.0, 170.0, 110.0, 73.0, 45.0, 36.0, 36.0, 15.0, 8.0, 7.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73828125, -3.61322021484375, -3.4881591796875, -3.36309814453125, -3.238037109375, -3.11297607421875, -2.9879150390625, -2.86285400390625, -2.73779296875, -2.61273193359375, -2.4876708984375, -2.36260986328125, -2.237548828125, -2.11248779296875, -1.9874267578125, -1.86236572265625, -1.7373046875, -1.61224365234375, -1.4871826171875, -1.36212158203125, -1.237060546875, -1.11199951171875, -0.9869384765625, -0.86187744140625, -0.73681640625, -0.61175537109375, -0.4866943359375, -0.36163330078125, -0.236572265625, -0.11151123046875, 0.0135498046875, 0.13861083984375, 0.263671875, 0.38873291015625, 0.5137939453125, 0.63885498046875, 0.763916015625, 0.88897705078125, 1.0140380859375, 1.13909912109375, 1.26416015625, 1.38922119140625, 1.5142822265625, 1.63934326171875, 1.764404296875, 1.88946533203125, 2.0145263671875, 2.13958740234375, 2.2646484375, 2.38970947265625, 2.5147705078125, 2.63983154296875, 2.764892578125, 2.88995361328125, 3.0150146484375, 3.14007568359375, 3.26513671875, 3.39019775390625, 3.5152587890625, 3.64031982421875, 3.765380859375, 3.89044189453125, 4.0155029296875, 4.14056396484375, 4.265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 2.0, 6.0, 4.0, 9.0, 16.0, 12.0, 11.0, 24.0, 29.0, 40.0, 46.0, 54.0, 54.0, 111.0, 148.0, 108.0, 65.0, 39.0, 40.0, 20.0, 32.0, 26.0, 17.0, 12.0, 19.0, 8.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0014753341674804688, -0.0014349520206451416, -0.0013945698738098145, -0.0013541877269744873, -0.0013138055801391602, -0.001273423433303833, -0.0012330412864685059, -0.0011926591396331787, -0.0011522769927978516, -0.0011118948459625244, -0.0010715126991271973, -0.0010311305522918701, -0.000990748405456543, -0.0009503662586212158, -0.0009099841117858887, -0.0008696019649505615, -0.0008292198181152344, -0.0007888376712799072, -0.0007484555244445801, -0.0007080733776092529, -0.0006676912307739258, -0.0006273090839385986, -0.0005869269371032715, -0.0005465447902679443, -0.0005061626434326172, -0.00046578049659729004, -0.0004253983497619629, -0.00038501620292663574, -0.0003446340560913086, -0.00030425190925598145, -0.0002638697624206543, -0.00022348761558532715, -0.00018310546875, -0.00014272332191467285, -0.0001023411750793457, -6.195902824401855e-05, -2.1576881408691406e-05, 1.8805265426635742e-05, 5.918741226196289e-05, 9.956955909729004e-05, 0.0001399517059326172, 0.00018033385276794434, 0.00022071599960327148, 0.00026109814643859863, 0.0003014802932739258, 0.00034186244010925293, 0.0003822445869445801, 0.0004226267337799072, 0.0004630088806152344, 0.0005033910274505615, 0.0005437731742858887, 0.0005841553211212158, 0.000624537467956543, 0.0006649196147918701, 0.0007053017616271973, 0.0007456839084625244, 0.0007860660552978516, 0.0008264482021331787, 0.0008668303489685059, 0.000907212495803833, 0.0009475946426391602, 0.0009879767894744873, 0.0010283589363098145, 0.0010687410831451416, 0.0011091232299804688]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 11.0, 0.0, 5.0, 13.0, 18.0, 30.0, 39.0, 56.0, 88.0, 127.0, 163.0, 258.0, 392.0, 593.0, 1057.0, 1931.0, 4585.0, 12766.0, 46389.0, 238761.0, 622563.0, 85148.0, 20646.0, 6752.0, 2746.0, 1351.0, 743.0, 448.0, 286.0, 177.0, 116.0, 72.0, 68.0, 42.0, 30.0, 25.0, 15.0, 11.0, 11.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.626708984375, -4.46826171875, -4.309814453125, -4.1513671875, -3.992919921875, -3.83447265625, -3.676025390625, -3.517578125, -3.359130859375, -3.20068359375, -3.042236328125, -2.8837890625, -2.725341796875, -2.56689453125, -2.408447265625, -2.25, -2.091552734375, -1.93310546875, -1.774658203125, -1.6162109375, -1.457763671875, -1.29931640625, -1.140869140625, -0.982421875, -0.823974609375, -0.66552734375, -0.507080078125, -0.3486328125, -0.190185546875, -0.03173828125, 0.126708984375, 0.28515625, 0.443603515625, 0.60205078125, 0.760498046875, 0.9189453125, 1.077392578125, 1.23583984375, 1.394287109375, 1.552734375, 1.711181640625, 1.86962890625, 2.028076171875, 2.1865234375, 2.344970703125, 2.50341796875, 2.661865234375, 2.8203125, 2.978759765625, 3.13720703125, 3.295654296875, 3.4541015625, 3.612548828125, 3.77099609375, 3.929443359375, 4.087890625, 4.246337890625, 4.40478515625, 4.563232421875, 4.7216796875, 4.880126953125, 5.03857421875, 5.197021484375, 5.35546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 15.0, 17.0, 15.0, 21.0, 18.0, 27.0, 35.0, 29.0, 44.0, 60.0, 90.0, 93.0, 92.0, 75.0, 65.0, 51.0, 45.0, 36.0, 26.0, 23.0, 20.0, 18.0, 11.0, 6.0, 8.0, 7.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.69140625, -4.54937744140625, -4.4073486328125, -4.26531982421875, -4.123291015625, -3.98126220703125, -3.8392333984375, -3.69720458984375, -3.55517578125, -3.41314697265625, -3.2711181640625, -3.12908935546875, -2.987060546875, -2.84503173828125, -2.7030029296875, -2.56097412109375, -2.4189453125, -2.27691650390625, -2.1348876953125, -1.99285888671875, -1.850830078125, -1.70880126953125, -1.5667724609375, -1.42474365234375, -1.28271484375, -1.14068603515625, -0.9986572265625, -0.85662841796875, -0.714599609375, -0.57257080078125, -0.4305419921875, -0.28851318359375, -0.146484375, -0.00445556640625, 0.1375732421875, 0.27960205078125, 0.421630859375, 0.56365966796875, 0.7056884765625, 0.84771728515625, 0.98974609375, 1.13177490234375, 1.2738037109375, 1.41583251953125, 1.557861328125, 1.69989013671875, 1.8419189453125, 1.98394775390625, 2.1259765625, 2.26800537109375, 2.4100341796875, 2.55206298828125, 2.694091796875, 2.83612060546875, 2.9781494140625, 3.12017822265625, 3.26220703125, 3.40423583984375, 3.5462646484375, 3.68829345703125, 3.830322265625, 3.97235107421875, 4.1143798828125, 4.25640869140625, 4.3984375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 8.0, 4.0, 3.0, 7.0, 9.0, 11.0, 44.0, 92.0, 147.0, 259.0, 189.0, 100.0, 65.0, 18.0, 21.0, 6.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-118.05953979492188, -114.7703628540039, -111.48119354248047, -108.1920166015625, -104.90284729003906, -101.6136703491211, -98.32449340820312, -95.03532409667969, -91.74614715576172, -88.45697021484375, -85.16780090332031, -81.87862396240234, -78.58944702148438, -75.30027770996094, -72.01110076904297, -68.721923828125, -65.43275451660156, -62.14358139038086, -58.854408264160156, -55.56523132324219, -52.276058197021484, -48.98688507080078, -45.69770812988281, -42.40853500366211, -39.119361877441406, -35.8301887512207, -32.541015625, -29.25183868408203, -25.962665557861328, -22.673492431640625, -19.38431739807129, -16.095142364501953, -12.805961608886719, -9.5167875289917, -6.22761344909668, -2.93843936920166, 0.3507347106933594, 3.6399078369140625, 6.929082870483398, 10.218257904052734, 13.507431030273438, 16.79660415649414, 20.085779190063477, 23.374954223632812, 26.664127349853516, 29.95330047607422, 33.24247741699219, 36.53165054321289, 39.820823669433594, 43.1099967956543, 46.399169921875, 49.68834686279297, 52.97751998901367, 56.266693115234375, 59.555870056152344, 62.84504318237305, 66.13421630859375, 69.42339324951172, 72.71256256103516, 76.00173950195312, 79.29090881347656, 82.58008575439453, 85.8692626953125, 89.15843200683594, 92.4476089477539]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 6.0, 10.0, 4.0, 11.0, 5.0, 7.0, 21.0, 15.0, 10.0, 18.0, 20.0, 32.0, 28.0, 33.0, 30.0, 30.0, 34.0, 36.0, 50.0, 48.0, 79.0, 57.0, 59.0, 33.0, 36.0, 32.0, 27.0, 29.0, 22.0, 24.0, 24.0, 26.0, 8.0, 14.0, 17.0, 13.0, 7.0, 7.0, 9.0, 6.0, 11.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-49.10178756713867, -47.68122100830078, -46.260650634765625, -44.84008026123047, -43.41951370239258, -41.99894714355469, -40.57837677001953, -39.157806396484375, -37.737239837646484, -36.316673278808594, -34.89610290527344, -33.47553253173828, -32.05496597290039, -30.634397506713867, -29.213829040527344, -27.79326057434082, -26.372692108154297, -24.952123641967773, -23.53155517578125, -22.110986709594727, -20.690418243408203, -19.26984977722168, -17.849281311035156, -16.428712844848633, -15.00814437866211, -13.587575912475586, -12.167007446289062, -10.746438980102539, -9.325870513916016, -7.905302047729492, -6.484733581542969, -5.064165115356445, -3.6436004638671875, -2.223031997680664, -0.8024635314941406, 0.6181049346923828, 2.0386734008789062, 3.4592418670654297, 4.879810333251953, 6.300378799438477, 7.720947265625, 9.141515731811523, 10.562084197998047, 11.98265266418457, 13.403221130371094, 14.823789596557617, 16.24435806274414, 17.664926528930664, 19.085494995117188, 20.50606346130371, 21.926631927490234, 23.347200393676758, 24.76776885986328, 26.188337326049805, 27.608905792236328, 29.02947425842285, 30.450042724609375, 31.8706111907959, 33.29117965698242, 34.71174621582031, 36.13231658935547, 37.552886962890625, 38.973453521728516, 40.394020080566406, 41.81459045410156]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 1.0, 14.0, 10.0, 17.0, 16.0, 30.0, 35.0, 75.0, 108.0, 178.0, 309.0, 582.0, 1150.0, 2432.0, 6325.0, 20025.0, 98394.0, 1223594.0, 2539467.0, 249981.0, 36085.0, 9327.0, 3156.0, 1417.0, 671.0, 359.0, 190.0, 115.0, 69.0, 53.0, 26.0, 23.0, 15.0, 11.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.12890625, -4.9532470703125, -4.777587890625, -4.6019287109375, -4.42626953125, -4.2506103515625, -4.074951171875, -3.8992919921875, -3.7236328125, -3.5479736328125, -3.372314453125, -3.1966552734375, -3.02099609375, -2.8453369140625, -2.669677734375, -2.4940185546875, -2.318359375, -2.1427001953125, -1.967041015625, -1.7913818359375, -1.61572265625, -1.4400634765625, -1.264404296875, -1.0887451171875, -0.9130859375, -0.7374267578125, -0.561767578125, -0.3861083984375, -0.21044921875, -0.0347900390625, 0.140869140625, 0.3165283203125, 0.4921875, 0.6678466796875, 0.843505859375, 1.0191650390625, 1.19482421875, 1.3704833984375, 1.546142578125, 1.7218017578125, 1.8974609375, 2.0731201171875, 2.248779296875, 2.4244384765625, 2.60009765625, 2.7757568359375, 2.951416015625, 3.1270751953125, 3.302734375, 3.4783935546875, 3.654052734375, 3.8297119140625, 4.00537109375, 4.1810302734375, 4.356689453125, 4.5323486328125, 4.7080078125, 4.8836669921875, 5.059326171875, 5.2349853515625, 5.41064453125, 5.5863037109375, 5.761962890625, 5.9376220703125, 6.11328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 8.0, 11.0, 11.0, 9.0, 12.0, 15.0, 32.0, 33.0, 38.0, 33.0, 53.0, 54.0, 42.0, 59.0, 71.0, 59.0, 57.0, 56.0, 61.0, 38.0, 45.0, 41.0, 41.0, 26.0, 21.0, 10.0, 19.0, 9.0, 6.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.00189208984375, -2.8865966796875, -2.77130126953125, -2.656005859375, -2.54071044921875, -2.4254150390625, -2.31011962890625, -2.19482421875, -2.07952880859375, -1.9642333984375, -1.84893798828125, -1.733642578125, -1.61834716796875, -1.5030517578125, -1.38775634765625, -1.2724609375, -1.15716552734375, -1.0418701171875, -0.92657470703125, -0.811279296875, -0.69598388671875, -0.5806884765625, -0.46539306640625, -0.35009765625, -0.23480224609375, -0.1195068359375, -0.00421142578125, 0.111083984375, 0.22637939453125, 0.3416748046875, 0.45697021484375, 0.572265625, 0.68756103515625, 0.8028564453125, 0.91815185546875, 1.033447265625, 1.14874267578125, 1.2640380859375, 1.37933349609375, 1.49462890625, 1.60992431640625, 1.7252197265625, 1.84051513671875, 1.955810546875, 2.07110595703125, 2.1864013671875, 2.30169677734375, 2.4169921875, 2.53228759765625, 2.6475830078125, 2.76287841796875, 2.878173828125, 2.99346923828125, 3.1087646484375, 3.22406005859375, 3.33935546875, 3.45465087890625, 3.5699462890625, 3.68524169921875, 3.800537109375, 3.91583251953125, 4.0311279296875, 4.14642333984375, 4.26171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 11.0, 5.0, 14.0, 17.0, 32.0, 64.0, 66.0, 168.0, 276.0, 541.0, 1290.0, 3430.0, 12040.0, 59669.0, 812959.0, 3091720.0, 176051.0, 25616.0, 6178.0, 2060.0, 885.0, 448.0, 263.0, 165.0, 111.0, 59.0, 49.0, 37.0, 21.0, 12.0, 6.0, 9.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1953125, -7.93310546875, -7.6708984375, -7.40869140625, -7.146484375, -6.88427734375, -6.6220703125, -6.35986328125, -6.09765625, -5.83544921875, -5.5732421875, -5.31103515625, -5.048828125, -4.78662109375, -4.5244140625, -4.26220703125, -4.0, -3.73779296875, -3.4755859375, -3.21337890625, -2.951171875, -2.68896484375, -2.4267578125, -2.16455078125, -1.90234375, -1.64013671875, -1.3779296875, -1.11572265625, -0.853515625, -0.59130859375, -0.3291015625, -0.06689453125, 0.1953125, 0.45751953125, 0.7197265625, 0.98193359375, 1.244140625, 1.50634765625, 1.7685546875, 2.03076171875, 2.29296875, 2.55517578125, 2.8173828125, 3.07958984375, 3.341796875, 3.60400390625, 3.8662109375, 4.12841796875, 4.390625, 4.65283203125, 4.9150390625, 5.17724609375, 5.439453125, 5.70166015625, 5.9638671875, 6.22607421875, 6.48828125, 6.75048828125, 7.0126953125, 7.27490234375, 7.537109375, 7.79931640625, 8.0615234375, 8.32373046875, 8.5859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 12.0, 19.0, 25.0, 59.0, 113.0, 159.0, 290.0, 611.0, 958.0, 812.0, 487.0, 227.0, 117.0, 55.0, 42.0, 25.0, 13.0, 14.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.5963134765625, -7.262939453125, -6.9295654296875, -6.59619140625, -6.2628173828125, -5.929443359375, -5.5960693359375, -5.2626953125, -4.9293212890625, -4.595947265625, -4.2625732421875, -3.92919921875, -3.5958251953125, -3.262451171875, -2.9290771484375, -2.595703125, -2.2623291015625, -1.928955078125, -1.5955810546875, -1.26220703125, -0.9288330078125, -0.595458984375, -0.2620849609375, 0.0712890625, 0.4046630859375, 0.738037109375, 1.0714111328125, 1.40478515625, 1.7381591796875, 2.071533203125, 2.4049072265625, 2.73828125, 3.0716552734375, 3.405029296875, 3.7384033203125, 4.07177734375, 4.4051513671875, 4.738525390625, 5.0718994140625, 5.4052734375, 5.7386474609375, 6.072021484375, 6.4053955078125, 6.73876953125, 7.0721435546875, 7.405517578125, 7.7388916015625, 8.072265625, 8.4056396484375, 8.739013671875, 9.0723876953125, 9.40576171875, 9.7391357421875, 10.072509765625, 10.4058837890625, 10.7392578125, 11.0726318359375, 11.406005859375, 11.7393798828125, 12.07275390625, 12.4061279296875, 12.739501953125, 13.0728759765625, 13.40625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 21.0, 31.0, 81.0, 138.0, 230.0, 227.0, 152.0, 59.0, 22.0, 11.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-141.0215301513672, -137.81118774414062, -134.600830078125, -131.39048767089844, -128.1801300048828, -124.96978759765625, -121.75943756103516, -118.54908752441406, -115.33873748779297, -112.12838745117188, -108.91803741455078, -105.70768737792969, -102.49734497070312, -99.28699493408203, -96.07664489746094, -92.86629486083984, -89.65594482421875, -86.44559478759766, -83.23524475097656, -80.02490234375, -76.8145523071289, -73.60420227050781, -70.39385223388672, -67.18350219726562, -63.97315979003906, -60.76280975341797, -57.55246353149414, -54.34211349487305, -51.13176345825195, -47.921417236328125, -44.71106719970703, -41.50071716308594, -38.290367126464844, -35.08001708984375, -31.86966896057129, -28.659320831298828, -25.448970794677734, -22.238622665405273, -19.028274536132812, -15.817924499511719, -12.607576370239258, -9.39722728729248, -6.186878681182861, -2.976530075073242, 0.23381900787353516, 3.4441680908203125, 6.654516220092773, 9.864866256713867, 13.075214385986328, 16.28556251525879, 19.495912551879883, 22.706260681152344, 25.916610717773438, 29.1269588470459, 32.33730697631836, 35.54765701293945, 38.75800323486328, 41.968353271484375, 45.1786994934082, 48.3890495300293, 51.59939956665039, 54.80974578857422, 58.02009582519531, 61.230445861816406, 64.4407958984375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 8.0, 9.0, 24.0, 25.0, 41.0, 46.0, 57.0, 76.0, 92.0, 81.0, 93.0, 97.0, 75.0, 75.0, 56.0, 54.0, 27.0, 29.0, 13.0, 12.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.31664276123047, -71.4379653930664, -69.55928039550781, -67.68060302734375, -65.80192565917969, -63.923240661621094, -62.04456329345703, -60.1658821105957, -58.287200927734375, -56.40851974487305, -54.529842376708984, -52.651161193847656, -50.77248001098633, -48.893798828125, -47.01512145996094, -45.13644027709961, -43.25775909423828, -41.37907791137695, -39.50040054321289, -37.62171936035156, -35.743038177490234, -33.864356994628906, -31.985679626464844, -30.106998443603516, -28.228321075439453, -26.349641799926758, -24.47096061706543, -22.592281341552734, -20.713600158691406, -18.83492088317871, -16.956241607666016, -15.077560424804688, -13.19887924194336, -11.320199012756348, -9.441518783569336, -7.562839031219482, -5.684158802032471, -3.805479049682617, -1.9267988204956055, -0.04811859130859375, 1.830561637878418, 3.7092418670654297, 5.587922096252441, 7.466601848602295, 9.345281600952148, 11.22396183013916, 13.102642059326172, 14.981322288513184, 16.860002517700195, 18.73868179321289, 20.61736297607422, 22.496042251586914, 24.374723434448242, 26.253402709960938, 28.132083892822266, 30.01076316833496, 31.889442443847656, 33.768123626708984, 35.64680099487305, 37.525482177734375, 39.4041633605957, 41.28284454345703, 43.161521911621094, 45.04020309448242, 46.91888427734375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 18.0, 4.0, 25.0, 21.0, 35.0, 41.0, 61.0, 96.0, 136.0, 210.0, 408.0, 705.0, 1406.0, 3004.0, 7098.0, 18265.0, 51425.0, 151955.0, 385561.0, 279027.0, 94863.0, 32555.0, 12178.0, 4918.0, 2152.0, 1015.0, 537.0, 290.0, 176.0, 117.0, 73.0, 41.0, 44.0, 21.0, 19.0, 13.0, 8.0, 11.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.27734375, -5.08740234375, -4.8974609375, -4.70751953125, -4.517578125, -4.32763671875, -4.1376953125, -3.94775390625, -3.7578125, -3.56787109375, -3.3779296875, -3.18798828125, -2.998046875, -2.80810546875, -2.6181640625, -2.42822265625, -2.23828125, -2.04833984375, -1.8583984375, -1.66845703125, -1.478515625, -1.28857421875, -1.0986328125, -0.90869140625, -0.71875, -0.52880859375, -0.3388671875, -0.14892578125, 0.041015625, 0.23095703125, 0.4208984375, 0.61083984375, 0.80078125, 0.99072265625, 1.1806640625, 1.37060546875, 1.560546875, 1.75048828125, 1.9404296875, 2.13037109375, 2.3203125, 2.51025390625, 2.7001953125, 2.89013671875, 3.080078125, 3.27001953125, 3.4599609375, 3.64990234375, 3.83984375, 4.02978515625, 4.2197265625, 4.40966796875, 4.599609375, 4.78955078125, 4.9794921875, 5.16943359375, 5.359375, 5.54931640625, 5.7392578125, 5.92919921875, 6.119140625, 6.30908203125, 6.4990234375, 6.68896484375, 6.87890625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 7.0, 8.0, 12.0, 14.0, 12.0, 18.0, 16.0, 24.0, 28.0, 25.0, 38.0, 33.0, 26.0, 42.0, 48.0, 44.0, 52.0, 46.0, 49.0, 43.0, 56.0, 44.0, 36.0, 25.0, 27.0, 31.0, 29.0, 24.0, 20.0, 26.0, 11.0, 14.0, 12.0, 9.0, 5.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.677703857421875, -2.58978271484375, -2.501861572265625, -2.4139404296875, -2.326019287109375, -2.23809814453125, -2.150177001953125, -2.062255859375, -1.974334716796875, -1.88641357421875, -1.798492431640625, -1.7105712890625, -1.622650146484375, -1.53472900390625, -1.446807861328125, -1.35888671875, -1.270965576171875, -1.18304443359375, -1.095123291015625, -1.0072021484375, -0.919281005859375, -0.83135986328125, -0.743438720703125, -0.655517578125, -0.567596435546875, -0.47967529296875, -0.391754150390625, -0.3038330078125, -0.215911865234375, -0.12799072265625, -0.040069580078125, 0.0478515625, 0.135772705078125, 0.22369384765625, 0.311614990234375, 0.3995361328125, 0.487457275390625, 0.57537841796875, 0.663299560546875, 0.751220703125, 0.839141845703125, 0.92706298828125, 1.014984130859375, 1.1029052734375, 1.190826416015625, 1.27874755859375, 1.366668701171875, 1.45458984375, 1.542510986328125, 1.63043212890625, 1.718353271484375, 1.8062744140625, 1.894195556640625, 1.98211669921875, 2.070037841796875, 2.157958984375, 2.245880126953125, 2.33380126953125, 2.421722412109375, 2.5096435546875, 2.597564697265625, 2.68548583984375, 2.773406982421875, 2.861328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 11.0, 18.0, 21.0, 41.0, 63.0, 78.0, 75.0, 143.0, 234.0, 400.0, 786.0, 1801.0, 5094.0, 22990.0, 262390.0, 699722.0, 42592.0, 7410.0, 2346.0, 1026.0, 478.0, 266.0, 166.0, 94.0, 79.0, 53.0, 40.0, 35.0, 20.0, 15.0, 12.0, 10.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.2265625, -14.7215576171875, -14.216552734375, -13.7115478515625, -13.20654296875, -12.7015380859375, -12.196533203125, -11.6915283203125, -11.1865234375, -10.6815185546875, -10.176513671875, -9.6715087890625, -9.16650390625, -8.6614990234375, -8.156494140625, -7.6514892578125, -7.146484375, -6.6414794921875, -6.136474609375, -5.6314697265625, -5.12646484375, -4.6214599609375, -4.116455078125, -3.6114501953125, -3.1064453125, -2.6014404296875, -2.096435546875, -1.5914306640625, -1.08642578125, -0.5814208984375, -0.076416015625, 0.4285888671875, 0.93359375, 1.4385986328125, 1.943603515625, 2.4486083984375, 2.95361328125, 3.4586181640625, 3.963623046875, 4.4686279296875, 4.9736328125, 5.4786376953125, 5.983642578125, 6.4886474609375, 6.99365234375, 7.4986572265625, 8.003662109375, 8.5086669921875, 9.013671875, 9.5186767578125, 10.023681640625, 10.5286865234375, 11.03369140625, 11.5386962890625, 12.043701171875, 12.5487060546875, 13.0537109375, 13.5587158203125, 14.063720703125, 14.5687255859375, 15.07373046875, 15.5787353515625, 16.083740234375, 16.5887451171875, 17.09375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 5.0, 8.0, 12.0, 16.0, 15.0, 29.0, 15.0, 22.0, 30.0, 25.0, 34.0, 41.0, 45.0, 42.0, 55.0, 52.0, 47.0, 45.0, 46.0, 41.0, 39.0, 40.0, 44.0, 43.0, 23.0, 32.0, 24.0, 19.0, 15.0, 19.0, 13.0, 10.0, 8.0, 10.0, 7.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4453125, -10.0689697265625, -9.692626953125, -9.3162841796875, -8.93994140625, -8.5635986328125, -8.187255859375, -7.8109130859375, -7.4345703125, -7.0582275390625, -6.681884765625, -6.3055419921875, -5.92919921875, -5.5528564453125, -5.176513671875, -4.8001708984375, -4.423828125, -4.0474853515625, -3.671142578125, -3.2947998046875, -2.91845703125, -2.5421142578125, -2.165771484375, -1.7894287109375, -1.4130859375, -1.0367431640625, -0.660400390625, -0.2840576171875, 0.09228515625, 0.4686279296875, 0.844970703125, 1.2213134765625, 1.59765625, 1.9739990234375, 2.350341796875, 2.7266845703125, 3.10302734375, 3.4793701171875, 3.855712890625, 4.2320556640625, 4.6083984375, 4.9847412109375, 5.361083984375, 5.7374267578125, 6.11376953125, 6.4901123046875, 6.866455078125, 7.2427978515625, 7.619140625, 7.9954833984375, 8.371826171875, 8.7481689453125, 9.12451171875, 9.5008544921875, 9.877197265625, 10.2535400390625, 10.6298828125, 11.0062255859375, 11.382568359375, 11.7589111328125, 12.13525390625, 12.5115966796875, 12.887939453125, 13.2642822265625, 13.640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 4.0, 11.0, 14.0, 9.0, 13.0, 28.0, 38.0, 54.0, 101.0, 127.0, 206.0, 331.0, 644.0, 1649.0, 5197.0, 21656.0, 125957.0, 778997.0, 89913.0, 16582.0, 4204.0, 1409.0, 599.0, 291.0, 180.0, 100.0, 75.0, 39.0, 35.0, 32.0, 17.0, 7.0, 6.0, 8.0, 4.0, 6.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4609375, -5.25421142578125, -5.0474853515625, -4.84075927734375, -4.634033203125, -4.42730712890625, -4.2205810546875, -4.01385498046875, -3.80712890625, -3.60040283203125, -3.3936767578125, -3.18695068359375, -2.980224609375, -2.77349853515625, -2.5667724609375, -2.36004638671875, -2.1533203125, -1.94659423828125, -1.7398681640625, -1.53314208984375, -1.326416015625, -1.11968994140625, -0.9129638671875, -0.70623779296875, -0.49951171875, -0.29278564453125, -0.0860595703125, 0.12066650390625, 0.327392578125, 0.53411865234375, 0.7408447265625, 0.94757080078125, 1.154296875, 1.36102294921875, 1.5677490234375, 1.77447509765625, 1.981201171875, 2.18792724609375, 2.3946533203125, 2.60137939453125, 2.80810546875, 3.01483154296875, 3.2215576171875, 3.42828369140625, 3.635009765625, 3.84173583984375, 4.0484619140625, 4.25518798828125, 4.4619140625, 4.66864013671875, 4.8753662109375, 5.08209228515625, 5.288818359375, 5.49554443359375, 5.7022705078125, 5.90899658203125, 6.11572265625, 6.32244873046875, 6.5291748046875, 6.73590087890625, 6.942626953125, 7.14935302734375, 7.3560791015625, 7.56280517578125, 7.76953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 5.0, 9.0, 6.0, 13.0, 18.0, 30.0, 30.0, 56.0, 82.0, 161.0, 234.0, 116.0, 64.0, 30.0, 39.0, 27.0, 17.0, 11.0, 8.0, 11.0, 7.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020313262939453125, -0.001968294382095337, -0.0019052624702453613, -0.0018422305583953857, -0.0017791986465454102, -0.0017161667346954346, -0.001653134822845459, -0.0015901029109954834, -0.0015270709991455078, -0.0014640390872955322, -0.0014010071754455566, -0.001337975263595581, -0.0012749433517456055, -0.0012119114398956299, -0.0011488795280456543, -0.0010858476161956787, -0.0010228157043457031, -0.0009597837924957275, -0.000896751880645752, -0.0008337199687957764, -0.0007706880569458008, -0.0007076561450958252, -0.0006446242332458496, -0.000581592321395874, -0.0005185604095458984, -0.00045552849769592285, -0.00039249658584594727, -0.0003294646739959717, -0.0002664327621459961, -0.0002034008502960205, -0.00014036893844604492, -7.733702659606934e-05, -1.430511474609375e-05, 4.8726797103881836e-05, 0.00011175870895385742, 0.000174790620803833, 0.0002378225326538086, 0.0003008544445037842, 0.00036388635635375977, 0.00042691826820373535, 0.0004899501800537109, 0.0005529820919036865, 0.0006160140037536621, 0.0006790459156036377, 0.0007420778274536133, 0.0008051097393035889, 0.0008681416511535645, 0.00093117356300354, 0.0009942054748535156, 0.0010572373867034912, 0.0011202692985534668, 0.0011833012104034424, 0.001246333122253418, 0.0013093650341033936, 0.0013723969459533691, 0.0014354288578033447, 0.0014984607696533203, 0.001561492681503296, 0.0016245245933532715, 0.001687556505203247, 0.0017505884170532227, 0.0018136203289031982, 0.0018766522407531738, 0.0019396841526031494, 0.002002716064453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 7.0, 5.0, 8.0, 8.0, 12.0, 20.0, 33.0, 33.0, 62.0, 69.0, 99.0, 163.0, 238.0, 342.0, 516.0, 890.0, 1884.0, 4569.0, 13609.0, 46619.0, 249356.0, 622222.0, 75506.0, 20171.0, 6614.0, 2503.0, 1236.0, 588.0, 360.0, 250.0, 179.0, 111.0, 81.0, 66.0, 34.0, 23.0, 20.0, 16.0, 4.0, 10.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.765625, -4.61273193359375, -4.4598388671875, -4.30694580078125, -4.154052734375, -4.00115966796875, -3.8482666015625, -3.69537353515625, -3.54248046875, -3.38958740234375, -3.2366943359375, -3.08380126953125, -2.930908203125, -2.77801513671875, -2.6251220703125, -2.47222900390625, -2.3193359375, -2.16644287109375, -2.0135498046875, -1.86065673828125, -1.707763671875, -1.55487060546875, -1.4019775390625, -1.24908447265625, -1.09619140625, -0.94329833984375, -0.7904052734375, -0.63751220703125, -0.484619140625, -0.33172607421875, -0.1788330078125, -0.02593994140625, 0.126953125, 0.27984619140625, 0.4327392578125, 0.58563232421875, 0.738525390625, 0.89141845703125, 1.0443115234375, 1.19720458984375, 1.35009765625, 1.50299072265625, 1.6558837890625, 1.80877685546875, 1.961669921875, 2.11456298828125, 2.2674560546875, 2.42034912109375, 2.5732421875, 2.72613525390625, 2.8790283203125, 3.03192138671875, 3.184814453125, 3.33770751953125, 3.4906005859375, 3.64349365234375, 3.79638671875, 3.94927978515625, 4.1021728515625, 4.25506591796875, 4.407958984375, 4.56085205078125, 4.7137451171875, 4.86663818359375, 5.01953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 5.0, 11.0, 11.0, 20.0, 21.0, 16.0, 20.0, 30.0, 34.0, 49.0, 45.0, 49.0, 77.0, 95.0, 96.0, 79.0, 65.0, 50.0, 43.0, 28.0, 28.0, 19.0, 15.0, 5.0, 16.0, 9.0, 5.0, 7.0, 5.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-3.47265625, -3.360565185546875, -3.24847412109375, -3.136383056640625, -3.0242919921875, -2.912200927734375, -2.80010986328125, -2.688018798828125, -2.575927734375, -2.463836669921875, -2.35174560546875, -2.239654541015625, -2.1275634765625, -2.015472412109375, -1.90338134765625, -1.791290283203125, -1.67919921875, -1.567108154296875, -1.45501708984375, -1.342926025390625, -1.2308349609375, -1.118743896484375, -1.00665283203125, -0.894561767578125, -0.782470703125, -0.670379638671875, -0.55828857421875, -0.446197509765625, -0.3341064453125, -0.222015380859375, -0.10992431640625, 0.002166748046875, 0.1142578125, 0.226348876953125, 0.33843994140625, 0.450531005859375, 0.5626220703125, 0.674713134765625, 0.78680419921875, 0.898895263671875, 1.010986328125, 1.123077392578125, 1.23516845703125, 1.347259521484375, 1.4593505859375, 1.571441650390625, 1.68353271484375, 1.795623779296875, 1.90771484375, 2.019805908203125, 2.13189697265625, 2.243988037109375, 2.3560791015625, 2.468170166015625, 2.58026123046875, 2.692352294921875, 2.804443359375, 2.916534423828125, 3.02862548828125, 3.140716552734375, 3.2528076171875, 3.364898681640625, 3.47698974609375, 3.589080810546875, 3.701171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 14.0, 17.0, 54.0, 126.0, 263.0, 263.0, 127.0, 59.0, 20.0, 18.0, 10.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-123.2546615600586, -119.6417236328125, -116.02877807617188, -112.41583251953125, -108.80289459228516, -105.18995666503906, -101.57701110839844, -97.96406555175781, -94.35112762451172, -90.73818969726562, -87.125244140625, -83.51229858398438, -79.89936065673828, -76.28642272949219, -72.67347717285156, -69.06053161621094, -65.44759368896484, -61.834651947021484, -58.221710205078125, -54.608768463134766, -50.995826721191406, -47.38288497924805, -43.76994323730469, -40.15700149536133, -36.54405975341797, -32.93111801147461, -29.31817626953125, -25.70523452758789, -22.09229278564453, -18.479351043701172, -14.866409301757812, -11.253467559814453, -7.640525817871094, -4.027584075927734, -0.414642333984375, 3.1982994079589844, 6.811241149902344, 10.424182891845703, 14.037124633789062, 17.650066375732422, 21.26300811767578, 24.87594985961914, 28.4888916015625, 32.10183334350586, 35.71477508544922, 39.32771682739258, 42.94065856933594, 46.5536003112793, 50.166542053222656, 53.779483795166016, 57.392425537109375, 61.005367279052734, 64.6183090209961, 68.23124694824219, 71.84419250488281, 75.45713806152344, 79.07007598876953, 82.68301391601562, 86.29595947265625, 89.90890502929688, 93.52184295654297, 97.13478088378906, 100.74772644042969, 104.36067199707031, 107.9736099243164]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 8.0, 4.0, 2.0, 1.0, 8.0, 12.0, 13.0, 12.0, 10.0, 14.0, 19.0, 15.0, 18.0, 31.0, 31.0, 29.0, 42.0, 34.0, 45.0, 59.0, 63.0, 53.0, 64.0, 69.0, 42.0, 42.0, 32.0, 24.0, 23.0, 27.0, 21.0, 28.0, 15.0, 13.0, 18.0, 15.0, 11.0, 6.0, 9.0, 6.0, 2.0, 8.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.525146484375, -42.01411819458008, -40.503089904785156, -38.992061614990234, -37.48103332519531, -35.970001220703125, -34.4589729309082, -32.94794464111328, -31.43691635131836, -29.925888061523438, -28.414859771728516, -26.90382957458496, -25.39280128479004, -23.881772994995117, -22.370742797851562, -20.85971450805664, -19.34868621826172, -17.837657928466797, -16.326629638671875, -14.81559944152832, -13.304571151733398, -11.793542861938477, -10.282513618469238, -8.771484375, -7.260456085205078, -5.749427318572998, -4.238398551940918, -2.727369785308838, -1.2163410186767578, 0.29468774795532227, 1.8057165145874023, 3.3167457580566406, 4.8277740478515625, 6.338802814483643, 7.849831581115723, 9.360860824584961, 10.871889114379883, 12.382917404174805, 13.893946647644043, 15.404975891113281, 16.916004180908203, 18.427032470703125, 19.938060760498047, 21.4490909576416, 22.960119247436523, 24.471147537231445, 25.982177734375, 27.493206024169922, 29.004234313964844, 30.515262603759766, 32.02629089355469, 33.53731918334961, 35.04834747314453, 36.55937957763672, 38.07040786743164, 39.58143615722656, 41.092464447021484, 42.603492736816406, 44.11452102661133, 45.62554931640625, 47.13658142089844, 48.64760971069336, 50.15863800048828, 51.6696662902832, 53.180694580078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 13.0, 16.0, 18.0, 31.0, 33.0, 67.0, 98.0, 161.0, 230.0, 477.0, 918.0, 1828.0, 4594.0, 13422.0, 59088.0, 698442.0, 3020474.0, 341547.0, 37277.0, 9252.0, 3221.0, 1374.0, 689.0, 323.0, 227.0, 159.0, 84.0, 62.0, 42.0, 32.0, 15.0, 14.0, 9.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.58203125, -6.39056396484375, -6.1990966796875, -6.00762939453125, -5.816162109375, -5.62469482421875, -5.4332275390625, -5.24176025390625, -5.05029296875, -4.85882568359375, -4.6673583984375, -4.47589111328125, -4.284423828125, -4.09295654296875, -3.9014892578125, -3.71002197265625, -3.5185546875, -3.32708740234375, -3.1356201171875, -2.94415283203125, -2.752685546875, -2.56121826171875, -2.3697509765625, -2.17828369140625, -1.98681640625, -1.79534912109375, -1.6038818359375, -1.41241455078125, -1.220947265625, -1.02947998046875, -0.8380126953125, -0.64654541015625, -0.455078125, -0.26361083984375, -0.0721435546875, 0.11932373046875, 0.310791015625, 0.50225830078125, 0.6937255859375, 0.88519287109375, 1.07666015625, 1.26812744140625, 1.4595947265625, 1.65106201171875, 1.842529296875, 2.03399658203125, 2.2254638671875, 2.41693115234375, 2.6083984375, 2.79986572265625, 2.9913330078125, 3.18280029296875, 3.374267578125, 3.56573486328125, 3.7572021484375, 3.94866943359375, 4.14013671875, 4.33160400390625, 4.5230712890625, 4.71453857421875, 4.906005859375, 5.09747314453125, 5.2889404296875, 5.48040771484375, 5.671875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 6.0, 3.0, 4.0, 4.0, 11.0, 11.0, 30.0, 21.0, 28.0, 50.0, 56.0, 49.0, 57.0, 66.0, 64.0, 66.0, 74.0, 66.0, 68.0, 61.0, 49.0, 38.0, 29.0, 27.0, 21.0, 16.0, 14.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.363677978515625, -2.22930908203125, -2.094940185546875, -1.9605712890625, -1.826202392578125, -1.69183349609375, -1.557464599609375, -1.423095703125, -1.288726806640625, -1.15435791015625, -1.019989013671875, -0.8856201171875, -0.751251220703125, -0.61688232421875, -0.482513427734375, -0.34814453125, -0.213775634765625, -0.07940673828125, 0.054962158203125, 0.1893310546875, 0.323699951171875, 0.45806884765625, 0.592437744140625, 0.726806640625, 0.861175537109375, 0.99554443359375, 1.129913330078125, 1.2642822265625, 1.398651123046875, 1.53302001953125, 1.667388916015625, 1.8017578125, 1.936126708984375, 2.07049560546875, 2.204864501953125, 2.3392333984375, 2.473602294921875, 2.60797119140625, 2.742340087890625, 2.876708984375, 3.011077880859375, 3.14544677734375, 3.279815673828125, 3.4141845703125, 3.548553466796875, 3.68292236328125, 3.817291259765625, 3.95166015625, 4.086029052734375, 4.22039794921875, 4.354766845703125, 4.4891357421875, 4.623504638671875, 4.75787353515625, 4.892242431640625, 5.026611328125, 5.160980224609375, 5.29534912109375, 5.429718017578125, 5.5640869140625, 5.698455810546875, 5.83282470703125, 5.967193603515625, 6.1015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 8.0, 11.0, 15.0, 27.0, 47.0, 81.0, 133.0, 294.0, 610.0, 1349.0, 3511.0, 16487.0, 271368.0, 3771930.0, 112049.0, 10959.0, 2904.0, 1221.0, 587.0, 282.0, 191.0, 86.0, 42.0, 27.0, 16.0, 14.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.8515625, -14.443359375, -14.03515625, -13.626953125, -13.21875, -12.810546875, -12.40234375, -11.994140625, -11.5859375, -11.177734375, -10.76953125, -10.361328125, -9.953125, -9.544921875, -9.13671875, -8.728515625, -8.3203125, -7.912109375, -7.50390625, -7.095703125, -6.6875, -6.279296875, -5.87109375, -5.462890625, -5.0546875, -4.646484375, -4.23828125, -3.830078125, -3.421875, -3.013671875, -2.60546875, -2.197265625, -1.7890625, -1.380859375, -0.97265625, -0.564453125, -0.15625, 0.251953125, 0.66015625, 1.068359375, 1.4765625, 1.884765625, 2.29296875, 2.701171875, 3.109375, 3.517578125, 3.92578125, 4.333984375, 4.7421875, 5.150390625, 5.55859375, 5.966796875, 6.375, 6.783203125, 7.19140625, 7.599609375, 8.0078125, 8.416015625, 8.82421875, 9.232421875, 9.640625, 10.048828125, 10.45703125, 10.865234375, 11.2734375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 8.0, 14.0, 15.0, 23.0, 40.0, 85.0, 155.0, 333.0, 639.0, 1066.0, 797.0, 402.0, 219.0, 104.0, 63.0, 31.0, 17.0, 19.0, 11.0, 9.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.765625, -9.436767578125, -9.10791015625, -8.779052734375, -8.4501953125, -8.121337890625, -7.79248046875, -7.463623046875, -7.134765625, -6.805908203125, -6.47705078125, -6.148193359375, -5.8193359375, -5.490478515625, -5.16162109375, -4.832763671875, -4.50390625, -4.175048828125, -3.84619140625, -3.517333984375, -3.1884765625, -2.859619140625, -2.53076171875, -2.201904296875, -1.873046875, -1.544189453125, -1.21533203125, -0.886474609375, -0.5576171875, -0.228759765625, 0.10009765625, 0.428955078125, 0.7578125, 1.086669921875, 1.41552734375, 1.744384765625, 2.0732421875, 2.402099609375, 2.73095703125, 3.059814453125, 3.388671875, 3.717529296875, 4.04638671875, 4.375244140625, 4.7041015625, 5.032958984375, 5.36181640625, 5.690673828125, 6.01953125, 6.348388671875, 6.67724609375, 7.006103515625, 7.3349609375, 7.663818359375, 7.99267578125, 8.321533203125, 8.650390625, 8.979248046875, 9.30810546875, 9.636962890625, 9.9658203125, 10.294677734375, 10.62353515625, 10.952392578125, 11.28125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 16.0, 41.0, 182.0, 343.0, 286.0, 86.0, 21.0, 9.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.53707885742188, -187.4213409423828, -182.3055877685547, -177.18984985351562, -172.0740966796875, -166.95835876464844, -161.84262084960938, -156.72686767578125, -151.6111297607422, -146.49539184570312, -141.379638671875, -136.26390075683594, -131.14816284179688, -126.03240966796875, -120.91667175292969, -115.8009262084961, -110.6851806640625, -105.5694351196289, -100.45368957519531, -95.33795166015625, -90.22220611572266, -85.10646057128906, -79.99072265625, -74.8749771118164, -69.75923156738281, -64.64348602294922, -59.52774429321289, -54.41200256347656, -49.29625701904297, -44.180511474609375, -39.06476974487305, -33.94902801513672, -28.833267211914062, -23.7175235748291, -18.60177993774414, -13.48603630065918, -8.370292663574219, -3.254549026489258, 1.8611946105957031, 6.976936340332031, 12.092681884765625, 17.208425521850586, 22.324169158935547, 27.439912796020508, 32.55565643310547, 37.67140197753906, 42.78714370727539, 47.90288543701172, 53.01863098144531, 58.134376525878906, 63.250118255615234, 68.36585998535156, 73.48160552978516, 78.59735107421875, 83.71308898925781, 88.8288345336914, 93.944580078125, 99.0603256225586, 104.17607116699219, 109.29180908203125, 114.40755462646484, 119.52330017089844, 124.6390380859375, 129.75479125976562, 134.8705291748047]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 10.0, 18.0, 20.0, 26.0, 33.0, 35.0, 38.0, 48.0, 65.0, 72.0, 78.0, 83.0, 69.0, 63.0, 71.0, 59.0, 52.0, 49.0, 34.0, 21.0, 16.0, 16.0, 7.0, 8.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.65948486328125, -29.259729385375977, -27.859973907470703, -26.460220336914062, -25.06046485900879, -23.660709381103516, -22.260953903198242, -20.86119842529297, -19.461444854736328, -18.061689376831055, -16.66193389892578, -15.262179374694824, -13.862424850463867, -12.462669372558594, -11.06291389465332, -9.663159370422363, -8.263402938842773, -6.863647937774658, -5.463892936706543, -4.0641374588012695, -2.6643824577331543, -1.264627456665039, 0.13512802124023438, 1.5348825454711914, 2.934638023376465, 4.33439302444458, 5.734148025512695, 7.133903503417969, 8.533658981323242, 9.9334135055542, 11.333168983459473, 12.73292350769043, 14.132678985595703, 15.532434463500977, 16.93218994140625, 18.33194351196289, 19.731698989868164, 21.131454467773438, 22.53120994567871, 23.930965423583984, 25.330718994140625, 26.7304744720459, 28.130229949951172, 29.529983520507812, 30.929738998413086, 32.32949447631836, 33.729248046875, 35.129005432128906, 36.52876281738281, 37.92851638793945, 39.32827377319336, 40.72802734375, 42.127784729003906, 43.52753829956055, 44.92729187011719, 46.327049255371094, 47.726802825927734, 49.126556396484375, 50.52631378173828, 51.92606735229492, 53.32582473754883, 54.72557830810547, 56.125335693359375, 57.525089263916016, 58.924842834472656]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 9.0, 9.0, 24.0, 26.0, 54.0, 80.0, 135.0, 260.0, 663.0, 1928.0, 7149.0, 37819.0, 265645.0, 593287.0, 116801.0, 18444.0, 3920.0, 1275.0, 480.0, 234.0, 119.0, 73.0, 43.0, 28.0, 13.0, 11.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.3338623046875, -10.003662109375, -9.6734619140625, -9.34326171875, -9.0130615234375, -8.682861328125, -8.3526611328125, -8.0224609375, -7.6922607421875, -7.362060546875, -7.0318603515625, -6.70166015625, -6.3714599609375, -6.041259765625, -5.7110595703125, -5.380859375, -5.0506591796875, -4.720458984375, -4.3902587890625, -4.06005859375, -3.7298583984375, -3.399658203125, -3.0694580078125, -2.7392578125, -2.4090576171875, -2.078857421875, -1.7486572265625, -1.41845703125, -1.0882568359375, -0.758056640625, -0.4278564453125, -0.09765625, 0.2325439453125, 0.562744140625, 0.8929443359375, 1.22314453125, 1.5533447265625, 1.883544921875, 2.2137451171875, 2.5439453125, 2.8741455078125, 3.204345703125, 3.5345458984375, 3.86474609375, 4.1949462890625, 4.525146484375, 4.8553466796875, 5.185546875, 5.5157470703125, 5.845947265625, 6.1761474609375, 6.50634765625, 6.8365478515625, 7.166748046875, 7.4969482421875, 7.8271484375, 8.1573486328125, 8.487548828125, 8.8177490234375, 9.14794921875, 9.4781494140625, 9.808349609375, 10.1385498046875, 10.46875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 5.0, 18.0, 17.0, 22.0, 36.0, 41.0, 53.0, 53.0, 69.0, 81.0, 81.0, 81.0, 74.0, 69.0, 68.0, 52.0, 43.0, 44.0, 27.0, 22.0, 16.0, 18.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.217926025390625, -3.05108642578125, -2.884246826171875, -2.7174072265625, -2.550567626953125, -2.38372802734375, -2.216888427734375, -2.050048828125, -1.883209228515625, -1.71636962890625, -1.549530029296875, -1.3826904296875, -1.215850830078125, -1.04901123046875, -0.882171630859375, -0.71533203125, -0.548492431640625, -0.38165283203125, -0.214813232421875, -0.0479736328125, 0.118865966796875, 0.28570556640625, 0.452545166015625, 0.619384765625, 0.786224365234375, 0.95306396484375, 1.119903564453125, 1.2867431640625, 1.453582763671875, 1.62042236328125, 1.787261962890625, 1.9541015625, 2.120941162109375, 2.28778076171875, 2.454620361328125, 2.6214599609375, 2.788299560546875, 2.95513916015625, 3.121978759765625, 3.288818359375, 3.455657958984375, 3.62249755859375, 3.789337158203125, 3.9561767578125, 4.123016357421875, 4.28985595703125, 4.456695556640625, 4.62353515625, 4.790374755859375, 4.95721435546875, 5.124053955078125, 5.2908935546875, 5.457733154296875, 5.62457275390625, 5.791412353515625, 5.958251953125, 6.125091552734375, 6.29193115234375, 6.458770751953125, 6.6256103515625, 6.792449951171875, 6.95928955078125, 7.126129150390625, 7.29296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 11.0, 16.0, 12.0, 19.0, 23.0, 47.0, 57.0, 83.0, 152.0, 230.0, 544.0, 1111.0, 2751.0, 7916.0, 29921.0, 171892.0, 672343.0, 126882.0, 23566.0, 6581.0, 2326.0, 984.0, 454.0, 238.0, 128.0, 84.0, 58.0, 37.0, 26.0, 15.0, 11.0, 9.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0703125, -8.7816162109375, -8.492919921875, -8.2042236328125, -7.91552734375, -7.6268310546875, -7.338134765625, -7.0494384765625, -6.7607421875, -6.4720458984375, -6.183349609375, -5.8946533203125, -5.60595703125, -5.3172607421875, -5.028564453125, -4.7398681640625, -4.451171875, -4.1624755859375, -3.873779296875, -3.5850830078125, -3.29638671875, -3.0076904296875, -2.718994140625, -2.4302978515625, -2.1416015625, -1.8529052734375, -1.564208984375, -1.2755126953125, -0.98681640625, -0.6981201171875, -0.409423828125, -0.1207275390625, 0.16796875, 0.4566650390625, 0.745361328125, 1.0340576171875, 1.32275390625, 1.6114501953125, 1.900146484375, 2.1888427734375, 2.4775390625, 2.7662353515625, 3.054931640625, 3.3436279296875, 3.63232421875, 3.9210205078125, 4.209716796875, 4.4984130859375, 4.787109375, 5.0758056640625, 5.364501953125, 5.6531982421875, 5.94189453125, 6.2305908203125, 6.519287109375, 6.8079833984375, 7.0966796875, 7.3853759765625, 7.674072265625, 7.9627685546875, 8.25146484375, 8.5401611328125, 8.828857421875, 9.1175537109375, 9.40625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 14.0, 15.0, 13.0, 22.0, 25.0, 28.0, 38.0, 31.0, 44.0, 43.0, 37.0, 42.0, 62.0, 55.0, 50.0, 58.0, 49.0, 42.0, 38.0, 29.0, 40.0, 34.0, 21.0, 27.0, 25.0, 24.0, 15.0, 8.0, 6.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.96875, -12.5740966796875, -12.179443359375, -11.7847900390625, -11.39013671875, -10.9954833984375, -10.600830078125, -10.2061767578125, -9.8115234375, -9.4168701171875, -9.022216796875, -8.6275634765625, -8.23291015625, -7.8382568359375, -7.443603515625, -7.0489501953125, -6.654296875, -6.2596435546875, -5.864990234375, -5.4703369140625, -5.07568359375, -4.6810302734375, -4.286376953125, -3.8917236328125, -3.4970703125, -3.1024169921875, -2.707763671875, -2.3131103515625, -1.91845703125, -1.5238037109375, -1.129150390625, -0.7344970703125, -0.33984375, 0.0548095703125, 0.449462890625, 0.8441162109375, 1.23876953125, 1.6334228515625, 2.028076171875, 2.4227294921875, 2.8173828125, 3.2120361328125, 3.606689453125, 4.0013427734375, 4.39599609375, 4.7906494140625, 5.185302734375, 5.5799560546875, 5.974609375, 6.3692626953125, 6.763916015625, 7.1585693359375, 7.55322265625, 7.9478759765625, 8.342529296875, 8.7371826171875, 9.1318359375, 9.5264892578125, 9.921142578125, 10.3157958984375, 10.71044921875, 11.1051025390625, 11.499755859375, 11.8944091796875, 12.2890625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 7.0, 1.0, 10.0, 10.0, 19.0, 24.0, 37.0, 75.0, 137.0, 204.0, 409.0, 812.0, 1552.0, 3434.0, 8215.0, 27099.0, 144869.0, 683105.0, 137752.0, 26276.0, 7939.0, 3397.0, 1517.0, 778.0, 372.0, 207.0, 121.0, 71.0, 41.0, 20.0, 10.0, 12.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23046875, -3.1170654296875, -3.003662109375, -2.8902587890625, -2.77685546875, -2.6634521484375, -2.550048828125, -2.4366455078125, -2.3232421875, -2.2098388671875, -2.096435546875, -1.9830322265625, -1.86962890625, -1.7562255859375, -1.642822265625, -1.5294189453125, -1.416015625, -1.3026123046875, -1.189208984375, -1.0758056640625, -0.96240234375, -0.8489990234375, -0.735595703125, -0.6221923828125, -0.5087890625, -0.3953857421875, -0.281982421875, -0.1685791015625, -0.05517578125, 0.0582275390625, 0.171630859375, 0.2850341796875, 0.3984375, 0.5118408203125, 0.625244140625, 0.7386474609375, 0.85205078125, 0.9654541015625, 1.078857421875, 1.1922607421875, 1.3056640625, 1.4190673828125, 1.532470703125, 1.6458740234375, 1.75927734375, 1.8726806640625, 1.986083984375, 2.0994873046875, 2.212890625, 2.3262939453125, 2.439697265625, 2.5531005859375, 2.66650390625, 2.7799072265625, 2.893310546875, 3.0067138671875, 3.1201171875, 3.2335205078125, 3.346923828125, 3.4603271484375, 3.57373046875, 3.6871337890625, 3.800537109375, 3.9139404296875, 4.02734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 0.0, 2.0, 8.0, 5.0, 9.0, 15.0, 28.0, 34.0, 45.0, 76.0, 119.0, 150.0, 166.0, 111.0, 73.0, 54.0, 34.0, 18.0, 11.0, 10.0, 6.0, 9.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014047622680664062, -0.0013645291328430176, -0.001324295997619629, -0.0012840628623962402, -0.0012438297271728516, -0.0012035965919494629, -0.0011633634567260742, -0.0011231303215026855, -0.0010828971862792969, -0.0010426640510559082, -0.0010024309158325195, -0.0009621977806091309, -0.0009219646453857422, -0.0008817315101623535, -0.0008414983749389648, -0.0008012652397155762, -0.0007610321044921875, -0.0007207989692687988, -0.0006805658340454102, -0.0006403326988220215, -0.0006000995635986328, -0.0005598664283752441, -0.0005196332931518555, -0.0004794001579284668, -0.0004391670227050781, -0.00039893388748168945, -0.0003587007522583008, -0.0003184676170349121, -0.00027823448181152344, -0.00023800134658813477, -0.0001977682113647461, -0.00015753507614135742, -0.00011730194091796875, -7.706880569458008e-05, -3.6835670471191406e-05, 3.3974647521972656e-06, 4.363059997558594e-05, 8.386373519897461e-05, 0.00012409687042236328, 0.00016433000564575195, 0.00020456314086914062, 0.0002447962760925293, 0.00028502941131591797, 0.00032526254653930664, 0.0003654956817626953, 0.000405728816986084, 0.00044596195220947266, 0.00048619508743286133, 0.00052642822265625, 0.0005666613578796387, 0.0006068944931030273, 0.000647127628326416, 0.0006873607635498047, 0.0007275938987731934, 0.000767827033996582, 0.0008080601692199707, 0.0008482933044433594, 0.000888526439666748, 0.0009287595748901367, 0.0009689927101135254, 0.001009225845336914, 0.0010494589805603027, 0.0010896921157836914, 0.00112992525100708, 0.0011701583862304688]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 3.0, 9.0, 12.0, 16.0, 30.0, 29.0, 84.0, 117.0, 224.0, 417.0, 822.0, 1720.0, 4135.0, 10639.0, 36547.0, 178926.0, 636136.0, 134407.0, 28968.0, 8849.0, 3379.0, 1505.0, 735.0, 349.0, 183.0, 113.0, 64.0, 41.0, 24.0, 17.0, 10.0, 8.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.203582763671875, -3.09466552734375, -2.985748291015625, -2.8768310546875, -2.767913818359375, -2.65899658203125, -2.550079345703125, -2.441162109375, -2.332244873046875, -2.22332763671875, -2.114410400390625, -2.0054931640625, -1.896575927734375, -1.78765869140625, -1.678741455078125, -1.56982421875, -1.460906982421875, -1.35198974609375, -1.243072509765625, -1.1341552734375, -1.025238037109375, -0.91632080078125, -0.807403564453125, -0.698486328125, -0.589569091796875, -0.48065185546875, -0.371734619140625, -0.2628173828125, -0.153900146484375, -0.04498291015625, 0.063934326171875, 0.1728515625, 0.281768798828125, 0.39068603515625, 0.499603271484375, 0.6085205078125, 0.717437744140625, 0.82635498046875, 0.935272216796875, 1.044189453125, 1.153106689453125, 1.26202392578125, 1.370941162109375, 1.4798583984375, 1.588775634765625, 1.69769287109375, 1.806610107421875, 1.91552734375, 2.024444580078125, 2.13336181640625, 2.242279052734375, 2.3511962890625, 2.460113525390625, 2.56903076171875, 2.677947998046875, 2.786865234375, 2.895782470703125, 3.00469970703125, 3.113616943359375, 3.2225341796875, 3.331451416015625, 3.44036865234375, 3.549285888671875, 3.658203125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 9.0, 9.0, 8.0, 14.0, 24.0, 23.0, 40.0, 32.0, 61.0, 78.0, 76.0, 81.0, 85.0, 76.0, 82.0, 62.0, 55.0, 40.0, 27.0, 34.0, 17.0, 12.0, 9.0, 8.0, 10.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.177734375, -3.0760498046875, -2.974365234375, -2.8726806640625, -2.77099609375, -2.6693115234375, -2.567626953125, -2.4659423828125, -2.3642578125, -2.2625732421875, -2.160888671875, -2.0592041015625, -1.95751953125, -1.8558349609375, -1.754150390625, -1.6524658203125, -1.55078125, -1.4490966796875, -1.347412109375, -1.2457275390625, -1.14404296875, -1.0423583984375, -0.940673828125, -0.8389892578125, -0.7373046875, -0.6356201171875, -0.533935546875, -0.4322509765625, -0.33056640625, -0.2288818359375, -0.127197265625, -0.0255126953125, 0.076171875, 0.1778564453125, 0.279541015625, 0.3812255859375, 0.48291015625, 0.5845947265625, 0.686279296875, 0.7879638671875, 0.8896484375, 0.9913330078125, 1.093017578125, 1.1947021484375, 1.29638671875, 1.3980712890625, 1.499755859375, 1.6014404296875, 1.703125, 1.8048095703125, 1.906494140625, 2.0081787109375, 2.10986328125, 2.2115478515625, 2.313232421875, 2.4149169921875, 2.5166015625, 2.6182861328125, 2.719970703125, 2.8216552734375, 2.92333984375, 3.0250244140625, 3.126708984375, 3.2283935546875, 3.330078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 14.0, 27.0, 85.0, 219.0, 428.0, 147.0, 47.0, 18.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.21112060546875, -159.68402099609375, -155.1569366455078, -150.6298370361328, -146.10275268554688, -141.57565307617188, -137.04856872558594, -132.52146911621094, -127.994384765625, -123.46729278564453, -118.94020080566406, -114.4131088256836, -109.88601684570312, -105.35892486572266, -100.83183288574219, -96.30473327636719, -91.77764129638672, -87.25054931640625, -82.72345733642578, -78.19636535644531, -73.66927337646484, -69.14218139648438, -64.61508178710938, -60.08799362182617, -55.5609016418457, -51.033809661865234, -46.506717681884766, -41.97962188720703, -37.45252990722656, -32.925437927246094, -28.398345947265625, -23.871253967285156, -19.344161987304688, -14.817070007324219, -10.289977073669434, -5.762884140014648, -1.2357921600341797, 3.291299819946289, 7.818393707275391, 12.34548568725586, 16.872577667236328, 21.399669647216797, 25.926761627197266, 30.453855514526367, 34.98094940185547, 39.50804138183594, 44.035133361816406, 48.562225341796875, 53.089317321777344, 57.61640930175781, 62.14350128173828, 66.67059326171875, 71.19768524169922, 75.72477722167969, 80.25187683105469, 84.77896118164062, 89.30606079101562, 93.8331527709961, 98.36024475097656, 102.88733673095703, 107.4144287109375, 111.94152069091797, 116.46861267089844, 120.99571228027344, 125.52279663085938]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 6.0, 7.0, 11.0, 17.0, 14.0, 34.0, 27.0, 34.0, 35.0, 42.0, 51.0, 66.0, 101.0, 119.0, 83.0, 52.0, 53.0, 43.0, 37.0, 29.0, 29.0, 17.0, 23.0, 20.0, 15.0, 9.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-84.99681091308594, -82.939697265625, -80.88258361816406, -78.82546997070312, -76.76835632324219, -74.71125030517578, -72.65413665771484, -70.5970230102539, -68.53990936279297, -66.48279571533203, -64.4256820678711, -62.36857223510742, -60.311458587646484, -58.25434494018555, -56.197235107421875, -54.14012145996094, -52.0830078125, -50.02589416503906, -47.968780517578125, -45.91167068481445, -43.854557037353516, -41.79744338989258, -39.740333557128906, -37.68321990966797, -35.62610626220703, -33.568992614746094, -31.51188087463379, -29.454769134521484, -27.397655487060547, -25.34054183959961, -23.283430099487305, -21.226318359375, -19.169200897216797, -17.11208724975586, -15.054975509643555, -12.997862815856934, -10.940750122070312, -8.883637428283691, -6.82652473449707, -4.769412040710449, -2.712299346923828, -0.655186653137207, 1.401926040649414, 3.459038734436035, 5.516151428222656, 7.573264122009277, 9.630376815795898, 11.68748950958252, 13.74460220336914, 15.801714897155762, 17.858827590942383, 19.915939331054688, 21.973052978515625, 24.030166625976562, 26.087278366088867, 28.144390106201172, 30.20150375366211, 32.25861740112305, 34.31572723388672, 36.372840881347656, 38.429954528808594, 40.48706817626953, 42.54418182373047, 44.60129165649414, 46.65840530395508]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 13.0, 20.0, 26.0, 33.0, 45.0, 96.0, 165.0, 331.0, 804.0, 2006.0, 7290.0, 44841.0, 1067719.0, 2935887.0, 116864.0, 13012.0, 3117.0, 1095.0, 401.0, 208.0, 116.0, 72.0, 52.0, 24.0, 11.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.72900390625, -8.4736328125, -8.21826171875, -7.962890625, -7.70751953125, -7.4521484375, -7.19677734375, -6.94140625, -6.68603515625, -6.4306640625, -6.17529296875, -5.919921875, -5.66455078125, -5.4091796875, -5.15380859375, -4.8984375, -4.64306640625, -4.3876953125, -4.13232421875, -3.876953125, -3.62158203125, -3.3662109375, -3.11083984375, -2.85546875, -2.60009765625, -2.3447265625, -2.08935546875, -1.833984375, -1.57861328125, -1.3232421875, -1.06787109375, -0.8125, -0.55712890625, -0.3017578125, -0.04638671875, 0.208984375, 0.46435546875, 0.7197265625, 0.97509765625, 1.23046875, 1.48583984375, 1.7412109375, 1.99658203125, 2.251953125, 2.50732421875, 2.7626953125, 3.01806640625, 3.2734375, 3.52880859375, 3.7841796875, 4.03955078125, 4.294921875, 4.55029296875, 4.8056640625, 5.06103515625, 5.31640625, 5.57177734375, 5.8271484375, 6.08251953125, 6.337890625, 6.59326171875, 6.8486328125, 7.10400390625, 7.359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 1.0, 8.0, 10.0, 9.0, 6.0, 20.0, 27.0, 19.0, 25.0, 29.0, 32.0, 50.0, 55.0, 61.0, 53.0, 63.0, 54.0, 59.0, 55.0, 57.0, 58.0, 48.0, 33.0, 30.0, 27.0, 26.0, 30.0, 19.0, 9.0, 10.0, 8.0, 3.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.478515625, -3.356475830078125, -3.23443603515625, -3.112396240234375, -2.9903564453125, -2.868316650390625, -2.74627685546875, -2.624237060546875, -2.502197265625, -2.380157470703125, -2.25811767578125, -2.136077880859375, -2.0140380859375, -1.891998291015625, -1.76995849609375, -1.647918701171875, -1.52587890625, -1.403839111328125, -1.28179931640625, -1.159759521484375, -1.0377197265625, -0.915679931640625, -0.79364013671875, -0.671600341796875, -0.549560546875, -0.427520751953125, -0.30548095703125, -0.183441162109375, -0.0614013671875, 0.060638427734375, 0.18267822265625, 0.304718017578125, 0.4267578125, 0.548797607421875, 0.67083740234375, 0.792877197265625, 0.9149169921875, 1.036956787109375, 1.15899658203125, 1.281036376953125, 1.403076171875, 1.525115966796875, 1.64715576171875, 1.769195556640625, 1.8912353515625, 2.013275146484375, 2.13531494140625, 2.257354736328125, 2.37939453125, 2.501434326171875, 2.62347412109375, 2.745513916015625, 2.8675537109375, 2.989593505859375, 3.11163330078125, 3.233673095703125, 3.355712890625, 3.477752685546875, 3.59979248046875, 3.721832275390625, 3.8438720703125, 3.965911865234375, 4.08795166015625, 4.209991455078125, 4.33203125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 4.0, 4.0, 8.0, 14.0, 22.0, 35.0, 76.0, 219.0, 640.0, 3555.0, 76061.0, 3985436.0, 122095.0, 4782.0, 842.0, 295.0, 109.0, 49.0, 18.0, 12.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.5, -21.95849609375, -21.4169921875, -20.87548828125, -20.333984375, -19.79248046875, -19.2509765625, -18.70947265625, -18.16796875, -17.62646484375, -17.0849609375, -16.54345703125, -16.001953125, -15.46044921875, -14.9189453125, -14.37744140625, -13.8359375, -13.29443359375, -12.7529296875, -12.21142578125, -11.669921875, -11.12841796875, -10.5869140625, -10.04541015625, -9.50390625, -8.96240234375, -8.4208984375, -7.87939453125, -7.337890625, -6.79638671875, -6.2548828125, -5.71337890625, -5.171875, -4.63037109375, -4.0888671875, -3.54736328125, -3.005859375, -2.46435546875, -1.9228515625, -1.38134765625, -0.83984375, -0.29833984375, 0.2431640625, 0.78466796875, 1.326171875, 1.86767578125, 2.4091796875, 2.95068359375, 3.4921875, 4.03369140625, 4.5751953125, 5.11669921875, 5.658203125, 6.19970703125, 6.7412109375, 7.28271484375, 7.82421875, 8.36572265625, 8.9072265625, 9.44873046875, 9.990234375, 10.53173828125, 11.0732421875, 11.61474609375, 12.15625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 15.0, 19.0, 53.0, 53.0, 104.0, 169.0, 279.0, 469.0, 735.0, 823.0, 563.0, 308.0, 169.0, 104.0, 57.0, 40.0, 32.0, 16.0, 14.0, 16.0, 6.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.015625, -4.753173828125, -4.49072265625, -4.228271484375, -3.9658203125, -3.703369140625, -3.44091796875, -3.178466796875, -2.916015625, -2.653564453125, -2.39111328125, -2.128662109375, -1.8662109375, -1.603759765625, -1.34130859375, -1.078857421875, -0.81640625, -0.553955078125, -0.29150390625, -0.029052734375, 0.2333984375, 0.495849609375, 0.75830078125, 1.020751953125, 1.283203125, 1.545654296875, 1.80810546875, 2.070556640625, 2.3330078125, 2.595458984375, 2.85791015625, 3.120361328125, 3.3828125, 3.645263671875, 3.90771484375, 4.170166015625, 4.4326171875, 4.695068359375, 4.95751953125, 5.219970703125, 5.482421875, 5.744873046875, 6.00732421875, 6.269775390625, 6.5322265625, 6.794677734375, 7.05712890625, 7.319580078125, 7.58203125, 7.844482421875, 8.10693359375, 8.369384765625, 8.6318359375, 8.894287109375, 9.15673828125, 9.419189453125, 9.681640625, 9.944091796875, 10.20654296875, 10.468994140625, 10.7314453125, 10.993896484375, 11.25634765625, 11.518798828125, 11.78125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 41.0, 117.0, 237.0, 260.0, 181.0, 92.0, 39.0, 18.0, 9.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.1497802734375, -111.68578338623047, -108.22178649902344, -104.75778198242188, -101.29378509521484, -97.82978820800781, -94.36578369140625, -90.90178680419922, -87.43778991699219, -83.97379302978516, -80.50979614257812, -77.04579162597656, -73.58179473876953, -70.1177978515625, -66.65379333496094, -63.189796447753906, -59.725799560546875, -56.261802673339844, -52.79780197143555, -49.33380126953125, -45.86980438232422, -42.40580749511719, -38.94180679321289, -35.477806091308594, -32.01380920410156, -28.5498104095459, -25.085811614990234, -21.62181282043457, -18.157814025878906, -14.693815231323242, -11.229816436767578, -7.765817642211914, -4.30181884765625, -0.8378200531005859, 2.626178741455078, 6.090177536010742, 9.554176330566406, 13.01817512512207, 16.482173919677734, 19.9461727142334, 23.410171508789062, 26.874170303344727, 30.33816909790039, 33.80216979980469, 37.26616668701172, 40.73016357421875, 44.19416427612305, 47.658164978027344, 51.122161865234375, 54.586158752441406, 58.0501594543457, 61.51416015625, 64.97815704345703, 68.44215393066406, 71.90615844726562, 75.37015533447266, 78.83415222167969, 82.29814910888672, 85.76214599609375, 89.22615051269531, 92.69014739990234, 96.15414428710938, 99.61814880371094, 103.08214569091797, 106.546142578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 7.0, 9.0, 12.0, 8.0, 15.0, 18.0, 21.0, 20.0, 24.0, 35.0, 30.0, 29.0, 58.0, 44.0, 57.0, 61.0, 61.0, 38.0, 38.0, 45.0, 37.0, 47.0, 43.0, 42.0, 36.0, 29.0, 39.0, 17.0, 15.0, 12.0, 18.0, 12.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.70735168457031, -38.657447814941406, -37.607540130615234, -36.55763626098633, -35.507728576660156, -34.45782470703125, -33.40791702270508, -32.35801315307617, -31.30810546875, -30.25819969177246, -29.208293914794922, -28.158388137817383, -27.108482360839844, -26.058576583862305, -25.008670806884766, -23.95876693725586, -22.90886116027832, -21.85895538330078, -20.809049606323242, -19.759143829345703, -18.709238052368164, -17.659332275390625, -16.60942840576172, -15.559521675109863, -14.509615898132324, -13.459710121154785, -12.409804344177246, -11.359899520874023, -10.309993743896484, -9.260087966918945, -8.210182189941406, -7.160276412963867, -6.110372543334961, -5.060466766357422, -4.010560989379883, -2.960655689239502, -1.910749912261963, -0.8608441352844238, 0.18906116485595703, 1.238966941833496, 2.288872718811035, 3.338778495788574, 4.388684272766113, 5.438589572906494, 6.488495349884033, 7.538401126861572, 8.588306427001953, 9.638212203979492, 10.688117980957031, 11.73802375793457, 12.78792953491211, 13.837835311889648, 14.887741088867188, 15.937646865844727, 16.987552642822266, 18.037456512451172, 19.087364196777344, 20.137269973754883, 21.187175750732422, 22.23708152770996, 23.2869873046875, 24.33689308166504, 25.386798858642578, 26.436702728271484, 27.486608505249023]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 13.0, 30.0, 39.0, 54.0, 111.0, 215.0, 420.0, 879.0, 1985.0, 4688.0, 13104.0, 42365.0, 171197.0, 513677.0, 220865.0, 53178.0, 15947.0, 5654.0, 2170.0, 936.0, 437.0, 256.0, 127.0, 72.0, 44.0, 24.0, 11.0, 17.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.34375, -6.121826171875, -5.89990234375, -5.677978515625, -5.4560546875, -5.234130859375, -5.01220703125, -4.790283203125, -4.568359375, -4.346435546875, -4.12451171875, -3.902587890625, -3.6806640625, -3.458740234375, -3.23681640625, -3.014892578125, -2.79296875, -2.571044921875, -2.34912109375, -2.127197265625, -1.9052734375, -1.683349609375, -1.46142578125, -1.239501953125, -1.017578125, -0.795654296875, -0.57373046875, -0.351806640625, -0.1298828125, 0.092041015625, 0.31396484375, 0.535888671875, 0.7578125, 0.979736328125, 1.20166015625, 1.423583984375, 1.6455078125, 1.867431640625, 2.08935546875, 2.311279296875, 2.533203125, 2.755126953125, 2.97705078125, 3.198974609375, 3.4208984375, 3.642822265625, 3.86474609375, 4.086669921875, 4.30859375, 4.530517578125, 4.75244140625, 4.974365234375, 5.1962890625, 5.418212890625, 5.64013671875, 5.862060546875, 6.083984375, 6.305908203125, 6.52783203125, 6.749755859375, 6.9716796875, 7.193603515625, 7.41552734375, 7.637451171875, 7.859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 11.0, 8.0, 11.0, 16.0, 12.0, 19.0, 27.0, 33.0, 46.0, 45.0, 46.0, 50.0, 53.0, 61.0, 64.0, 58.0, 57.0, 65.0, 50.0, 51.0, 39.0, 34.0, 27.0, 32.0, 26.0, 14.0, 11.0, 14.0, 5.0, 4.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.170013427734375, -4.04315185546875, -3.916290283203125, -3.7894287109375, -3.662567138671875, -3.53570556640625, -3.408843994140625, -3.281982421875, -3.155120849609375, -3.02825927734375, -2.901397705078125, -2.7745361328125, -2.647674560546875, -2.52081298828125, -2.393951416015625, -2.26708984375, -2.140228271484375, -2.01336669921875, -1.886505126953125, -1.7596435546875, -1.632781982421875, -1.50592041015625, -1.379058837890625, -1.252197265625, -1.125335693359375, -0.99847412109375, -0.871612548828125, -0.7447509765625, -0.617889404296875, -0.49102783203125, -0.364166259765625, -0.2373046875, -0.110443115234375, 0.01641845703125, 0.143280029296875, 0.2701416015625, 0.397003173828125, 0.52386474609375, 0.650726318359375, 0.777587890625, 0.904449462890625, 1.03131103515625, 1.158172607421875, 1.2850341796875, 1.411895751953125, 1.53875732421875, 1.665618896484375, 1.79248046875, 1.919342041015625, 2.04620361328125, 2.173065185546875, 2.2999267578125, 2.426788330078125, 2.55364990234375, 2.680511474609375, 2.807373046875, 2.934234619140625, 3.06109619140625, 3.187957763671875, 3.3148193359375, 3.441680908203125, 3.56854248046875, 3.695404052734375, 3.822265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 6.0, 8.0, 12.0, 7.0, 16.0, 19.0, 23.0, 28.0, 41.0, 62.0, 59.0, 100.0, 147.0, 244.0, 361.0, 537.0, 1072.0, 2354.0, 6036.0, 20216.0, 104308.0, 714054.0, 158114.0, 27090.0, 7603.0, 2807.0, 1313.0, 697.0, 381.0, 237.0, 158.0, 130.0, 80.0, 56.0, 49.0, 33.0, 23.0, 11.0, 17.0, 4.0, 7.0, 11.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8515625, -8.580078125, -8.30859375, -8.037109375, -7.765625, -7.494140625, -7.22265625, -6.951171875, -6.6796875, -6.408203125, -6.13671875, -5.865234375, -5.59375, -5.322265625, -5.05078125, -4.779296875, -4.5078125, -4.236328125, -3.96484375, -3.693359375, -3.421875, -3.150390625, -2.87890625, -2.607421875, -2.3359375, -2.064453125, -1.79296875, -1.521484375, -1.25, -0.978515625, -0.70703125, -0.435546875, -0.1640625, 0.107421875, 0.37890625, 0.650390625, 0.921875, 1.193359375, 1.46484375, 1.736328125, 2.0078125, 2.279296875, 2.55078125, 2.822265625, 3.09375, 3.365234375, 3.63671875, 3.908203125, 4.1796875, 4.451171875, 4.72265625, 4.994140625, 5.265625, 5.537109375, 5.80859375, 6.080078125, 6.3515625, 6.623046875, 6.89453125, 7.166015625, 7.4375, 7.708984375, 7.98046875, 8.251953125, 8.5234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 8.0, 11.0, 12.0, 14.0, 10.0, 18.0, 16.0, 18.0, 18.0, 30.0, 23.0, 39.0, 38.0, 44.0, 54.0, 41.0, 60.0, 52.0, 44.0, 51.0, 53.0, 42.0, 45.0, 32.0, 35.0, 33.0, 22.0, 22.0, 20.0, 9.0, 10.0, 12.0, 13.0, 6.0, 2.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.069091796875, -9.70068359375, -9.332275390625, -8.9638671875, -8.595458984375, -8.22705078125, -7.858642578125, -7.490234375, -7.121826171875, -6.75341796875, -6.385009765625, -6.0166015625, -5.648193359375, -5.27978515625, -4.911376953125, -4.54296875, -4.174560546875, -3.80615234375, -3.437744140625, -3.0693359375, -2.700927734375, -2.33251953125, -1.964111328125, -1.595703125, -1.227294921875, -0.85888671875, -0.490478515625, -0.1220703125, 0.246337890625, 0.61474609375, 0.983154296875, 1.3515625, 1.719970703125, 2.08837890625, 2.456787109375, 2.8251953125, 3.193603515625, 3.56201171875, 3.930419921875, 4.298828125, 4.667236328125, 5.03564453125, 5.404052734375, 5.7724609375, 6.140869140625, 6.50927734375, 6.877685546875, 7.24609375, 7.614501953125, 7.98291015625, 8.351318359375, 8.7197265625, 9.088134765625, 9.45654296875, 9.824951171875, 10.193359375, 10.561767578125, 10.93017578125, 11.298583984375, 11.6669921875, 12.035400390625, 12.40380859375, 12.772216796875, 13.140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 8.0, 6.0, 11.0, 11.0, 26.0, 40.0, 46.0, 65.0, 126.0, 187.0, 357.0, 638.0, 1297.0, 2634.0, 6145.0, 15337.0, 43755.0, 170960.0, 651824.0, 103945.0, 30622.0, 11412.0, 4668.0, 2144.0, 990.0, 520.0, 282.0, 178.0, 108.0, 59.0, 43.0, 27.0, 27.0, 14.0, 5.0, 5.0, 4.0, 2.0, 1.0, 5.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.851287841796875, -2.76312255859375, -2.674957275390625, -2.5867919921875, -2.498626708984375, -2.41046142578125, -2.322296142578125, -2.234130859375, -2.145965576171875, -2.05780029296875, -1.969635009765625, -1.8814697265625, -1.793304443359375, -1.70513916015625, -1.616973876953125, -1.52880859375, -1.440643310546875, -1.35247802734375, -1.264312744140625, -1.1761474609375, -1.087982177734375, -0.99981689453125, -0.911651611328125, -0.823486328125, -0.735321044921875, -0.64715576171875, -0.558990478515625, -0.4708251953125, -0.382659912109375, -0.29449462890625, -0.206329345703125, -0.1181640625, -0.029998779296875, 0.05816650390625, 0.146331787109375, 0.2344970703125, 0.322662353515625, 0.41082763671875, 0.498992919921875, 0.587158203125, 0.675323486328125, 0.76348876953125, 0.851654052734375, 0.9398193359375, 1.027984619140625, 1.11614990234375, 1.204315185546875, 1.29248046875, 1.380645751953125, 1.46881103515625, 1.556976318359375, 1.6451416015625, 1.733306884765625, 1.82147216796875, 1.909637451171875, 1.997802734375, 2.085968017578125, 2.17413330078125, 2.262298583984375, 2.3504638671875, 2.438629150390625, 2.52679443359375, 2.614959716796875, 2.703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 10.0, 18.0, 23.0, 38.0, 35.0, 47.0, 77.0, 124.0, 107.0, 131.0, 92.0, 68.0, 44.0, 25.0, 30.0, 25.0, 15.0, 11.0, 5.0, 5.0, 8.0, 5.0, 5.0, 1.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008645057678222656, -0.0008373931050300598, -0.000810280442237854, -0.0007831677794456482, -0.0007560551166534424, -0.0007289424538612366, -0.0007018297910690308, -0.000674717128276825, -0.0006476044654846191, -0.0006204918026924133, -0.0005933791399002075, -0.0005662664771080017, -0.0005391538143157959, -0.0005120411515235901, -0.0004849284887313843, -0.00045781582593917847, -0.00043070316314697266, -0.00040359050035476685, -0.00037647783756256104, -0.0003493651747703552, -0.0003222525119781494, -0.0002951398491859436, -0.0002680271863937378, -0.00024091452360153198, -0.00021380186080932617, -0.00018668919801712036, -0.00015957653522491455, -0.00013246387243270874, -0.00010535120964050293, -7.823854684829712e-05, -5.112588405609131e-05, -2.4013221263885498e-05, 3.0994415283203125e-06, 3.0212104320526123e-05, 5.7324767112731934e-05, 8.443742990493774e-05, 0.00011155009269714355, 0.00013866275548934937, 0.00016577541828155518, 0.00019288808107376099, 0.0002200007438659668, 0.0002471134066581726, 0.0002742260694503784, 0.00030133873224258423, 0.00032845139503479004, 0.00035556405782699585, 0.00038267672061920166, 0.00040978938341140747, 0.0004369020462036133, 0.0004640147089958191, 0.0004911273717880249, 0.0005182400345802307, 0.0005453526973724365, 0.0005724653601646423, 0.0005995780229568481, 0.000626690685749054, 0.0006538033485412598, 0.0006809160113334656, 0.0007080286741256714, 0.0007351413369178772, 0.000762253999710083, 0.0007893666625022888, 0.0008164793252944946, 0.0008435919880867004, 0.0008707046508789062]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 6.0, 17.0, 13.0, 13.0, 29.0, 32.0, 48.0, 98.0, 154.0, 290.0, 500.0, 947.0, 1965.0, 4770.0, 12714.0, 41747.0, 193268.0, 664169.0, 89964.0, 23685.0, 8070.0, 3112.0, 1368.0, 679.0, 346.0, 173.0, 135.0, 82.0, 51.0, 31.0, 19.0, 21.0, 15.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.347442626953125, -3.24371337890625, -3.139984130859375, -3.0362548828125, -2.932525634765625, -2.82879638671875, -2.725067138671875, -2.621337890625, -2.517608642578125, -2.41387939453125, -2.310150146484375, -2.2064208984375, -2.102691650390625, -1.99896240234375, -1.895233154296875, -1.79150390625, -1.687774658203125, -1.58404541015625, -1.480316162109375, -1.3765869140625, -1.272857666015625, -1.16912841796875, -1.065399169921875, -0.961669921875, -0.857940673828125, -0.75421142578125, -0.650482177734375, -0.5467529296875, -0.443023681640625, -0.33929443359375, -0.235565185546875, -0.1318359375, -0.028106689453125, 0.07562255859375, 0.179351806640625, 0.2830810546875, 0.386810302734375, 0.49053955078125, 0.594268798828125, 0.697998046875, 0.801727294921875, 0.90545654296875, 1.009185791015625, 1.1129150390625, 1.216644287109375, 1.32037353515625, 1.424102783203125, 1.52783203125, 1.631561279296875, 1.73529052734375, 1.839019775390625, 1.9427490234375, 2.046478271484375, 2.15020751953125, 2.253936767578125, 2.357666015625, 2.461395263671875, 2.56512451171875, 2.668853759765625, 2.7725830078125, 2.876312255859375, 2.98004150390625, 3.083770751953125, 3.1875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 9.0, 15.0, 13.0, 9.0, 9.0, 27.0, 37.0, 40.0, 65.0, 93.0, 110.0, 114.0, 109.0, 69.0, 56.0, 48.0, 40.0, 24.0, 21.0, 14.0, 14.0, 5.0, 14.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.968109130859375, -2.86395263671875, -2.759796142578125, -2.6556396484375, -2.551483154296875, -2.44732666015625, -2.343170166015625, -2.239013671875, -2.134857177734375, -2.03070068359375, -1.926544189453125, -1.8223876953125, -1.718231201171875, -1.61407470703125, -1.509918212890625, -1.40576171875, -1.301605224609375, -1.19744873046875, -1.093292236328125, -0.9891357421875, -0.884979248046875, -0.78082275390625, -0.676666259765625, -0.572509765625, -0.468353271484375, -0.36419677734375, -0.260040283203125, -0.1558837890625, -0.051727294921875, 0.05242919921875, 0.156585693359375, 0.2607421875, 0.364898681640625, 0.46905517578125, 0.573211669921875, 0.6773681640625, 0.781524658203125, 0.88568115234375, 0.989837646484375, 1.093994140625, 1.198150634765625, 1.30230712890625, 1.406463623046875, 1.5106201171875, 1.614776611328125, 1.71893310546875, 1.823089599609375, 1.92724609375, 2.031402587890625, 2.13555908203125, 2.239715576171875, 2.3438720703125, 2.448028564453125, 2.55218505859375, 2.656341552734375, 2.760498046875, 2.864654541015625, 2.96881103515625, 3.072967529296875, 3.1771240234375, 3.281280517578125, 3.38543701171875, 3.489593505859375, 3.59375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 7.0, 15.0, 21.0, 59.0, 96.0, 248.0, 261.0, 115.0, 70.0, 52.0, 25.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.06014633178711, -56.257965087890625, -53.45578384399414, -50.653602600097656, -47.85142135620117, -45.04924011230469, -42.2470588684082, -39.44487762451172, -36.642696380615234, -33.84051513671875, -31.038333892822266, -28.23615264892578, -25.433971405029297, -22.631790161132812, -19.829608917236328, -17.027427673339844, -14.22524642944336, -11.423065185546875, -8.62088394165039, -5.818702697753906, -3.016521453857422, -0.2143402099609375, 2.587841033935547, 5.390022277832031, 8.192203521728516, 10.994384765625, 13.796566009521484, 16.59874725341797, 19.400928497314453, 22.203109741210938, 25.005290985107422, 27.807472229003906, 30.609649658203125, 33.41183090209961, 36.214012145996094, 39.01619338989258, 41.81837463378906, 44.62055587768555, 47.42273712158203, 50.224918365478516, 53.027099609375, 55.829280853271484, 58.63146209716797, 61.43364334106445, 64.23582458496094, 67.03800964355469, 69.8401870727539, 72.64236450195312, 75.44454956054688, 78.24673461914062, 81.04891204833984, 83.85108947753906, 86.65327453613281, 89.45545959472656, 92.25763702392578, 95.059814453125, 97.86199951171875, 100.6641845703125, 103.46636199951172, 106.26853942871094, 109.07072448730469, 111.87290954589844, 114.67508697509766, 117.47726440429688, 120.27944946289062]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 1.0, 4.0, 6.0, 10.0, 10.0, 13.0, 9.0, 18.0, 21.0, 30.0, 18.0, 26.0, 21.0, 28.0, 30.0, 35.0, 44.0, 78.0, 90.0, 104.0, 71.0, 38.0, 32.0, 29.0, 20.0, 26.0, 33.0, 24.0, 18.0, 19.0, 15.0, 11.0, 11.0, 9.0, 7.0, 13.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-49.99598693847656, -48.56504821777344, -47.13410568237305, -45.70316696166992, -44.2722282409668, -42.84128952026367, -41.41034698486328, -39.979408264160156, -38.54846954345703, -37.117530822753906, -35.686588287353516, -34.25564956665039, -32.824710845947266, -31.393770217895508, -29.96282958984375, -28.531890869140625, -27.100950241088867, -25.67000961303711, -24.239070892333984, -22.808130264282227, -21.3771915435791, -19.946250915527344, -18.51531219482422, -17.08437156677246, -15.65343189239502, -14.222492218017578, -12.791552543640137, -11.360612869262695, -9.929672241210938, -8.498733520507812, -7.067792892456055, -5.636853218078613, -4.205913543701172, -2.7749738693237305, -1.34403395652771, 0.08690595626831055, 1.517845630645752, 2.9487853050231934, 4.379725456237793, 5.810665130615234, 7.241604804992676, 8.672544479370117, 10.103484153747559, 11.534423828125, 12.965364456176758, 14.396303176879883, 15.82724380493164, 17.258182525634766, 18.689123153686523, 20.12006378173828, 21.551002502441406, 22.981943130493164, 24.41288185119629, 25.843822479248047, 27.274761199951172, 28.70570182800293, 30.136642456054688, 31.567583084106445, 32.9985237121582, 34.42946243286133, 35.86040115356445, 37.29133987426758, 38.72228240966797, 40.153221130371094, 41.58415985107422]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 6.0, 3.0, 9.0, 15.0, 18.0, 21.0, 30.0, 55.0, 79.0, 143.0, 261.0, 441.0, 954.0, 2224.0, 7361.0, 40800.0, 676812.0, 3137830.0, 292734.0, 25673.0, 5422.0, 1865.0, 644.0, 370.0, 183.0, 126.0, 66.0, 44.0, 26.0, 20.0, 17.0, 10.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.125, -9.8677978515625, -9.610595703125, -9.3533935546875, -9.09619140625, -8.8389892578125, -8.581787109375, -8.3245849609375, -8.0673828125, -7.8101806640625, -7.552978515625, -7.2957763671875, -7.03857421875, -6.7813720703125, -6.524169921875, -6.2669677734375, -6.009765625, -5.7525634765625, -5.495361328125, -5.2381591796875, -4.98095703125, -4.7237548828125, -4.466552734375, -4.2093505859375, -3.9521484375, -3.6949462890625, -3.437744140625, -3.1805419921875, -2.92333984375, -2.6661376953125, -2.408935546875, -2.1517333984375, -1.89453125, -1.6373291015625, -1.380126953125, -1.1229248046875, -0.86572265625, -0.6085205078125, -0.351318359375, -0.0941162109375, 0.1630859375, 0.4202880859375, 0.677490234375, 0.9346923828125, 1.19189453125, 1.4490966796875, 1.706298828125, 1.9635009765625, 2.220703125, 2.4779052734375, 2.735107421875, 2.9923095703125, 3.24951171875, 3.5067138671875, 3.763916015625, 4.0211181640625, 4.2783203125, 4.5355224609375, 4.792724609375, 5.0499267578125, 5.30712890625, 5.5643310546875, 5.821533203125, 6.0787353515625, 6.3359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 16.0, 12.0, 18.0, 16.0, 20.0, 18.0, 31.0, 29.0, 27.0, 37.0, 41.0, 35.0, 49.0, 50.0, 57.0, 65.0, 55.0, 48.0, 46.0, 47.0, 44.0, 44.0, 34.0, 41.0, 31.0, 24.0, 16.0, 15.0, 7.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0], "bins": [-4.953125, -4.838714599609375, -4.72430419921875, -4.609893798828125, -4.4954833984375, -4.381072998046875, -4.26666259765625, -4.152252197265625, -4.037841796875, -3.923431396484375, -3.80902099609375, -3.694610595703125, -3.5802001953125, -3.465789794921875, -3.35137939453125, -3.236968994140625, -3.12255859375, -3.008148193359375, -2.89373779296875, -2.779327392578125, -2.6649169921875, -2.550506591796875, -2.43609619140625, -2.321685791015625, -2.207275390625, -2.092864990234375, -1.97845458984375, -1.864044189453125, -1.7496337890625, -1.635223388671875, -1.52081298828125, -1.406402587890625, -1.2919921875, -1.177581787109375, -1.06317138671875, -0.948760986328125, -0.8343505859375, -0.719940185546875, -0.60552978515625, -0.491119384765625, -0.376708984375, -0.262298583984375, -0.14788818359375, -0.033477783203125, 0.0809326171875, 0.195343017578125, 0.30975341796875, 0.424163818359375, 0.53857421875, 0.652984619140625, 0.76739501953125, 0.881805419921875, 0.9962158203125, 1.110626220703125, 1.22503662109375, 1.339447021484375, 1.453857421875, 1.568267822265625, 1.68267822265625, 1.797088623046875, 1.9114990234375, 2.025909423828125, 2.14031982421875, 2.254730224609375, 2.369140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 9.0, 14.0, 16.0, 26.0, 59.0, 73.0, 133.0, 294.0, 592.0, 1529.0, 5109.0, 33945.0, 1137549.0, 2937632.0, 66290.0, 7705.0, 1907.0, 702.0, 341.0, 142.0, 67.0, 46.0, 22.0, 14.0, 20.0, 6.0, 5.0, 5.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.7421875, -13.3720703125, -13.001953125, -12.6318359375, -12.26171875, -11.8916015625, -11.521484375, -11.1513671875, -10.78125, -10.4111328125, -10.041015625, -9.6708984375, -9.30078125, -8.9306640625, -8.560546875, -8.1904296875, -7.8203125, -7.4501953125, -7.080078125, -6.7099609375, -6.33984375, -5.9697265625, -5.599609375, -5.2294921875, -4.859375, -4.4892578125, -4.119140625, -3.7490234375, -3.37890625, -3.0087890625, -2.638671875, -2.2685546875, -1.8984375, -1.5283203125, -1.158203125, -0.7880859375, -0.41796875, -0.0478515625, 0.322265625, 0.6923828125, 1.0625, 1.4326171875, 1.802734375, 2.1728515625, 2.54296875, 2.9130859375, 3.283203125, 3.6533203125, 4.0234375, 4.3935546875, 4.763671875, 5.1337890625, 5.50390625, 5.8740234375, 6.244140625, 6.6142578125, 6.984375, 7.3544921875, 7.724609375, 8.0947265625, 8.46484375, 8.8349609375, 9.205078125, 9.5751953125, 9.9453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 12.0, 18.0, 10.0, 23.0, 16.0, 34.0, 55.0, 97.0, 147.0, 204.0, 313.0, 492.0, 588.0, 641.0, 476.0, 314.0, 198.0, 151.0, 82.0, 54.0, 43.0, 29.0, 22.0, 16.0, 10.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.703125, -8.44671630859375, -8.1903076171875, -7.93389892578125, -7.677490234375, -7.42108154296875, -7.1646728515625, -6.90826416015625, -6.65185546875, -6.39544677734375, -6.1390380859375, -5.88262939453125, -5.626220703125, -5.36981201171875, -5.1134033203125, -4.85699462890625, -4.6005859375, -4.34417724609375, -4.0877685546875, -3.83135986328125, -3.574951171875, -3.31854248046875, -3.0621337890625, -2.80572509765625, -2.54931640625, -2.29290771484375, -2.0364990234375, -1.78009033203125, -1.523681640625, -1.26727294921875, -1.0108642578125, -0.75445556640625, -0.498046875, -0.24163818359375, 0.0147705078125, 0.27117919921875, 0.527587890625, 0.78399658203125, 1.0404052734375, 1.29681396484375, 1.55322265625, 1.80963134765625, 2.0660400390625, 2.32244873046875, 2.578857421875, 2.83526611328125, 3.0916748046875, 3.34808349609375, 3.6044921875, 3.86090087890625, 4.1173095703125, 4.37371826171875, 4.630126953125, 4.88653564453125, 5.1429443359375, 5.39935302734375, 5.65576171875, 5.91217041015625, 6.1685791015625, 6.42498779296875, 6.681396484375, 6.93780517578125, 7.1942138671875, 7.45062255859375, 7.70703125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 21.0, 32.0, 48.0, 62.0, 67.0, 98.0, 113.0, 104.0, 120.0, 91.0, 68.0, 39.0, 30.0, 27.0, 15.0, 12.0, 9.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.77815246582031, -63.20740509033203, -61.63665771484375, -60.065914154052734, -58.49516677856445, -56.92441940307617, -55.353675842285156, -53.782928466796875, -52.212181091308594, -50.64143371582031, -49.07068634033203, -47.499942779541016, -45.929195404052734, -44.35844802856445, -42.78770446777344, -41.216957092285156, -39.646209716796875, -38.075462341308594, -36.50471496582031, -34.9339714050293, -33.363224029541016, -31.792476654052734, -30.221731185913086, -28.650985717773438, -27.080238342285156, -25.509490966796875, -23.938745498657227, -22.368000030517578, -20.797252655029297, -19.226505279541016, -17.655759811401367, -16.08501434326172, -14.514266967773438, -12.943520545959473, -11.372774124145508, -9.802027702331543, -8.231281280517578, -6.660534858703613, -5.089788436889648, -3.5190420150756836, -1.9482955932617188, -0.3775491714477539, 1.193197250366211, 2.763943672180176, 4.334690093994141, 5.9054365158081055, 7.47618293762207, 9.046929359436035, 10.61767578125, 12.188422203063965, 13.75916862487793, 15.329915046691895, 16.90066146850586, 18.47140884399414, 20.04215431213379, 21.612899780273438, 23.18364715576172, 24.75439453125, 26.32513999938965, 27.895885467529297, 29.466632843017578, 31.03738021850586, 32.608123779296875, 34.178871154785156, 35.74961853027344]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 6.0, 7.0, 10.0, 5.0, 10.0, 10.0, 17.0, 11.0, 15.0, 19.0, 18.0, 24.0, 21.0, 35.0, 41.0, 42.0, 45.0, 54.0, 46.0, 45.0, 55.0, 59.0, 54.0, 39.0, 30.0, 27.0, 45.0, 24.0, 32.0, 23.0, 27.0, 15.0, 9.0, 14.0, 10.0, 12.0, 4.0, 9.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 4.0], "bins": [-34.2764892578125, -33.23725128173828, -32.19801712036133, -31.15877914428711, -30.11954116821289, -29.080305099487305, -28.04106903076172, -27.0018310546875, -25.96259307861328, -24.923357009887695, -23.884119033813477, -22.84488296508789, -21.805644989013672, -20.766408920288086, -19.7271728515625, -18.68793487548828, -17.648698806762695, -16.60946273803711, -15.57022476196289, -14.530988693237305, -13.491750717163086, -12.4525146484375, -11.413277626037598, -10.374040603637695, -9.334803581237793, -8.29556655883789, -7.256329536437988, -6.217092990875244, -5.177855968475342, -4.1386189460754395, -3.0993824005126953, -2.060145378112793, -1.0209083557128906, 0.018328547477722168, 1.057565450668335, 2.096802234649658, 3.1360392570495605, 4.175276279449463, 5.214512825012207, 6.253749847412109, 7.292986869812012, 8.332223892211914, 9.371460914611816, 10.410697937011719, 11.449934005737305, 12.489171981811523, 13.52840805053711, 14.567645072937012, 15.606882095336914, 16.6461181640625, 17.68535614013672, 18.724592208862305, 19.763830184936523, 20.80306625366211, 21.842304229736328, 22.881540298461914, 23.9207763671875, 24.960012435913086, 25.999250411987305, 27.03848648071289, 28.07772445678711, 29.116960525512695, 30.15619659423828, 31.1954345703125, 32.23467254638672]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 9.0, 14.0, 24.0, 42.0, 69.0, 112.0, 182.0, 317.0, 500.0, 888.0, 1615.0, 3063.0, 6142.0, 13162.0, 31156.0, 83115.0, 256549.0, 399892.0, 157401.0, 53599.0, 21477.0, 9498.0, 4442.0, 2337.0, 1185.0, 682.0, 432.0, 229.0, 132.0, 104.0, 53.0, 37.0, 22.0, 21.0, 12.0, 5.0, 9.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.80078125, -3.65618896484375, -3.5115966796875, -3.36700439453125, -3.222412109375, -3.07781982421875, -2.9332275390625, -2.78863525390625, -2.64404296875, -2.49945068359375, -2.3548583984375, -2.21026611328125, -2.065673828125, -1.92108154296875, -1.7764892578125, -1.63189697265625, -1.4873046875, -1.34271240234375, -1.1981201171875, -1.05352783203125, -0.908935546875, -0.76434326171875, -0.6197509765625, -0.47515869140625, -0.33056640625, -0.18597412109375, -0.0413818359375, 0.10321044921875, 0.247802734375, 0.39239501953125, 0.5369873046875, 0.68157958984375, 0.826171875, 0.97076416015625, 1.1153564453125, 1.25994873046875, 1.404541015625, 1.54913330078125, 1.6937255859375, 1.83831787109375, 1.98291015625, 2.12750244140625, 2.2720947265625, 2.41668701171875, 2.561279296875, 2.70587158203125, 2.8504638671875, 2.99505615234375, 3.1396484375, 3.28424072265625, 3.4288330078125, 3.57342529296875, 3.718017578125, 3.86260986328125, 4.0072021484375, 4.15179443359375, 4.29638671875, 4.44097900390625, 4.5855712890625, 4.73016357421875, 4.874755859375, 5.01934814453125, 5.1639404296875, 5.30853271484375, 5.453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 4.0, 10.0, 7.0, 9.0, 13.0, 23.0, 12.0, 19.0, 34.0, 26.0, 43.0, 50.0, 45.0, 37.0, 52.0, 41.0, 57.0, 43.0, 52.0, 52.0, 48.0, 35.0, 31.0, 29.0, 34.0, 45.0, 24.0, 23.0, 20.0, 19.0, 19.0, 16.0, 4.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.3046875, -4.1925048828125, -4.080322265625, -3.9681396484375, -3.85595703125, -3.7437744140625, -3.631591796875, -3.5194091796875, -3.4072265625, -3.2950439453125, -3.182861328125, -3.0706787109375, -2.95849609375, -2.8463134765625, -2.734130859375, -2.6219482421875, -2.509765625, -2.3975830078125, -2.285400390625, -2.1732177734375, -2.06103515625, -1.9488525390625, -1.836669921875, -1.7244873046875, -1.6123046875, -1.5001220703125, -1.387939453125, -1.2757568359375, -1.16357421875, -1.0513916015625, -0.939208984375, -0.8270263671875, -0.71484375, -0.6026611328125, -0.490478515625, -0.3782958984375, -0.26611328125, -0.1539306640625, -0.041748046875, 0.0704345703125, 0.1826171875, 0.2947998046875, 0.406982421875, 0.5191650390625, 0.63134765625, 0.7435302734375, 0.855712890625, 0.9678955078125, 1.080078125, 1.1922607421875, 1.304443359375, 1.4166259765625, 1.52880859375, 1.6409912109375, 1.753173828125, 1.8653564453125, 1.9775390625, 2.0897216796875, 2.201904296875, 2.3140869140625, 2.42626953125, 2.5384521484375, 2.650634765625, 2.7628173828125, 2.875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 10.0, 17.0, 16.0, 23.0, 36.0, 37.0, 63.0, 72.0, 96.0, 200.0, 263.0, 415.0, 710.0, 1403.0, 4067.0, 20331.0, 257431.0, 720710.0, 33111.0, 5644.0, 1688.0, 860.0, 477.0, 287.0, 182.0, 105.0, 80.0, 51.0, 58.0, 26.0, 22.0, 13.0, 15.0, 9.0, 9.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.1007080078125, -11.756103515625, -11.4114990234375, -11.06689453125, -10.7222900390625, -10.377685546875, -10.0330810546875, -9.6884765625, -9.3438720703125, -8.999267578125, -8.6546630859375, -8.31005859375, -7.9654541015625, -7.620849609375, -7.2762451171875, -6.931640625, -6.5870361328125, -6.242431640625, -5.8978271484375, -5.55322265625, -5.2086181640625, -4.864013671875, -4.5194091796875, -4.1748046875, -3.8302001953125, -3.485595703125, -3.1409912109375, -2.79638671875, -2.4517822265625, -2.107177734375, -1.7625732421875, -1.41796875, -1.0733642578125, -0.728759765625, -0.3841552734375, -0.03955078125, 0.3050537109375, 0.649658203125, 0.9942626953125, 1.3388671875, 1.6834716796875, 2.028076171875, 2.3726806640625, 2.71728515625, 3.0618896484375, 3.406494140625, 3.7510986328125, 4.095703125, 4.4403076171875, 4.784912109375, 5.1295166015625, 5.47412109375, 5.8187255859375, 6.163330078125, 6.5079345703125, 6.8525390625, 7.1971435546875, 7.541748046875, 7.8863525390625, 8.23095703125, 8.5755615234375, 8.920166015625, 9.2647705078125, 9.609375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 10.0, 10.0, 4.0, 17.0, 16.0, 20.0, 15.0, 25.0, 28.0, 33.0, 34.0, 29.0, 48.0, 48.0, 62.0, 46.0, 40.0, 49.0, 35.0, 52.0, 36.0, 45.0, 41.0, 24.0, 33.0, 26.0, 26.0, 20.0, 22.0, 11.0, 14.0, 11.0, 6.0, 9.0, 6.0, 4.0, 2.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.1015625, -11.7421875, -11.3828125, -11.0234375, -10.6640625, -10.3046875, -9.9453125, -9.5859375, -9.2265625, -8.8671875, -8.5078125, -8.1484375, -7.7890625, -7.4296875, -7.0703125, -6.7109375, -6.3515625, -5.9921875, -5.6328125, -5.2734375, -4.9140625, -4.5546875, -4.1953125, -3.8359375, -3.4765625, -3.1171875, -2.7578125, -2.3984375, -2.0390625, -1.6796875, -1.3203125, -0.9609375, -0.6015625, -0.2421875, 0.1171875, 0.4765625, 0.8359375, 1.1953125, 1.5546875, 1.9140625, 2.2734375, 2.6328125, 2.9921875, 3.3515625, 3.7109375, 4.0703125, 4.4296875, 4.7890625, 5.1484375, 5.5078125, 5.8671875, 6.2265625, 6.5859375, 6.9453125, 7.3046875, 7.6640625, 8.0234375, 8.3828125, 8.7421875, 9.1015625, 9.4609375, 9.8203125, 10.1796875, 10.5390625, 10.8984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 5.0, 11.0, 21.0, 39.0, 46.0, 70.0, 133.0, 250.0, 782.0, 3105.0, 21680.0, 908550.0, 104336.0, 7211.0, 1402.0, 437.0, 184.0, 98.0, 55.0, 38.0, 30.0, 22.0, 15.0, 8.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.10784912109375, -5.8953857421875, -5.68292236328125, -5.470458984375, -5.25799560546875, -5.0455322265625, -4.83306884765625, -4.62060546875, -4.40814208984375, -4.1956787109375, -3.98321533203125, -3.770751953125, -3.55828857421875, -3.3458251953125, -3.13336181640625, -2.9208984375, -2.70843505859375, -2.4959716796875, -2.28350830078125, -2.071044921875, -1.85858154296875, -1.6461181640625, -1.43365478515625, -1.22119140625, -1.00872802734375, -0.7962646484375, -0.58380126953125, -0.371337890625, -0.15887451171875, 0.0535888671875, 0.26605224609375, 0.478515625, 0.69097900390625, 0.9034423828125, 1.11590576171875, 1.328369140625, 1.54083251953125, 1.7532958984375, 1.96575927734375, 2.17822265625, 2.39068603515625, 2.6031494140625, 2.81561279296875, 3.028076171875, 3.24053955078125, 3.4530029296875, 3.66546630859375, 3.8779296875, 4.09039306640625, 4.3028564453125, 4.51531982421875, 4.727783203125, 4.94024658203125, 5.1527099609375, 5.36517333984375, 5.57763671875, 5.79010009765625, 6.0025634765625, 6.21502685546875, 6.427490234375, 6.63995361328125, 6.8524169921875, 7.06488037109375, 7.27734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 4.0, 3.0, 2.0, 2.0, 8.0, 9.0, 10.0, 4.0, 18.0, 30.0, 36.0, 74.0, 88.0, 182.0, 183.0, 136.0, 72.0, 30.0, 28.0, 17.0, 17.0, 6.0, 7.0, 10.0, 6.0, 6.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009889602661132812, -0.0009551644325256348, -0.0009213685989379883, -0.0008875727653503418, -0.0008537769317626953, -0.0008199810981750488, -0.0007861852645874023, -0.0007523894309997559, -0.0007185935974121094, -0.0006847977638244629, -0.0006510019302368164, -0.0006172060966491699, -0.0005834102630615234, -0.000549614429473877, -0.0005158185958862305, -0.000482022762298584, -0.0004482269287109375, -0.000414431095123291, -0.00038063526153564453, -0.00034683942794799805, -0.00031304359436035156, -0.0002792477607727051, -0.0002454519271850586, -0.0002116560935974121, -0.00017786026000976562, -0.00014406442642211914, -0.00011026859283447266, -7.647275924682617e-05, -4.267692565917969e-05, -8.881092071533203e-06, 2.491474151611328e-05, 5.8710575103759766e-05, 9.250640869140625e-05, 0.00012630224227905273, 0.00016009807586669922, 0.0001938939094543457, 0.0002276897430419922, 0.00026148557662963867, 0.00029528141021728516, 0.00032907724380493164, 0.0003628730773925781, 0.0003966689109802246, 0.0004304647445678711, 0.0004642605781555176, 0.0004980564117431641, 0.0005318522453308105, 0.000565648078918457, 0.0005994439125061035, 0.00063323974609375, 0.0006670355796813965, 0.000700831413269043, 0.0007346272468566895, 0.0007684230804443359, 0.0008022189140319824, 0.0008360147476196289, 0.0008698105812072754, 0.0009036064147949219, 0.0009374022483825684, 0.0009711980819702148, 0.0010049939155578613, 0.0010387897491455078, 0.0010725855827331543, 0.0011063814163208008, 0.0011401772499084473, 0.0011739730834960938]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 2.0, 7.0, 6.0, 9.0, 14.0, 10.0, 13.0, 25.0, 41.0, 49.0, 87.0, 125.0, 143.0, 302.0, 476.0, 979.0, 1942.0, 4578.0, 12866.0, 44461.0, 246592.0, 643617.0, 64204.0, 17024.0, 5836.0, 2424.0, 1138.0, 617.0, 343.0, 211.0, 120.0, 87.0, 60.0, 38.0, 28.0, 20.0, 14.0, 8.0, 10.0, 7.0, 9.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.52734375, -2.44866943359375, -2.3699951171875, -2.29132080078125, -2.212646484375, -2.13397216796875, -2.0552978515625, -1.97662353515625, -1.89794921875, -1.81927490234375, -1.7406005859375, -1.66192626953125, -1.583251953125, -1.50457763671875, -1.4259033203125, -1.34722900390625, -1.2685546875, -1.18988037109375, -1.1112060546875, -1.03253173828125, -0.953857421875, -0.87518310546875, -0.7965087890625, -0.71783447265625, -0.63916015625, -0.56048583984375, -0.4818115234375, -0.40313720703125, -0.324462890625, -0.24578857421875, -0.1671142578125, -0.08843994140625, -0.009765625, 0.06890869140625, 0.1475830078125, 0.22625732421875, 0.304931640625, 0.38360595703125, 0.4622802734375, 0.54095458984375, 0.61962890625, 0.69830322265625, 0.7769775390625, 0.85565185546875, 0.934326171875, 1.01300048828125, 1.0916748046875, 1.17034912109375, 1.2490234375, 1.32769775390625, 1.4063720703125, 1.48504638671875, 1.563720703125, 1.64239501953125, 1.7210693359375, 1.79974365234375, 1.87841796875, 1.95709228515625, 2.0357666015625, 2.11444091796875, 2.193115234375, 2.27178955078125, 2.3504638671875, 2.42913818359375, 2.5078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 7.0, 13.0, 11.0, 8.0, 22.0, 23.0, 36.0, 31.0, 47.0, 77.0, 78.0, 89.0, 92.0, 93.0, 86.0, 78.0, 44.0, 37.0, 23.0, 18.0, 19.0, 11.0, 8.0, 10.0, 9.0, 4.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.3006591796875, -2.222412109375, -2.1441650390625, -2.06591796875, -1.9876708984375, -1.909423828125, -1.8311767578125, -1.7529296875, -1.6746826171875, -1.596435546875, -1.5181884765625, -1.43994140625, -1.3616943359375, -1.283447265625, -1.2052001953125, -1.126953125, -1.0487060546875, -0.970458984375, -0.8922119140625, -0.81396484375, -0.7357177734375, -0.657470703125, -0.5792236328125, -0.5009765625, -0.4227294921875, -0.344482421875, -0.2662353515625, -0.18798828125, -0.1097412109375, -0.031494140625, 0.0467529296875, 0.125, 0.2032470703125, 0.281494140625, 0.3597412109375, 0.43798828125, 0.5162353515625, 0.594482421875, 0.6727294921875, 0.7509765625, 0.8292236328125, 0.907470703125, 0.9857177734375, 1.06396484375, 1.1422119140625, 1.220458984375, 1.2987060546875, 1.376953125, 1.4552001953125, 1.533447265625, 1.6116943359375, 1.68994140625, 1.7681884765625, 1.846435546875, 1.9246826171875, 2.0029296875, 2.0811767578125, 2.159423828125, 2.2376708984375, 2.31591796875, 2.3941650390625, 2.472412109375, 2.5506591796875, 2.62890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 12.0, 24.0, 146.0, 606.0, 163.0, 33.0, 12.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.89833068847656, -201.08966064453125, -195.28099060058594, -189.47232055664062, -183.66366577148438, -177.85499572753906, -172.04632568359375, -166.23765563964844, -160.42898559570312, -154.6203155517578, -148.8116455078125, -143.00299072265625, -137.19432067871094, -131.38565063476562, -125.57698059082031, -119.768310546875, -113.95965576171875, -108.15098571777344, -102.34232330322266, -96.53365325927734, -90.72499084472656, -84.91632080078125, -79.10765075683594, -73.29898071289062, -67.49031829833984, -61.6816520690918, -55.87298583984375, -50.06431579589844, -44.25564956665039, -38.446983337402344, -32.63831329345703, -26.829647064208984, -21.020965576171875, -15.212298393249512, -9.403631210327148, -3.5949630737304688, 2.213703155517578, 8.022369384765625, 13.831039428710938, 19.639705657958984, 25.44837188720703, 31.257038116455078, 37.065704345703125, 42.87437438964844, 48.683040618896484, 54.49170684814453, 60.300376892089844, 66.10903930664062, 71.91770935058594, 77.72637939453125, 83.53504180908203, 89.34371185302734, 95.15237426757812, 100.96104431152344, 106.76971435546875, 112.57838439941406, 118.38704681396484, 124.19571685791016, 130.00437927246094, 135.81304931640625, 141.62171936035156, 147.43038940429688, 153.23904418945312, 159.04771423339844, 164.85638427734375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 8.0, 8.0, 5.0, 12.0, 14.0, 13.0, 14.0, 22.0, 20.0, 26.0, 28.0, 44.0, 25.0, 43.0, 42.0, 73.0, 165.0, 118.0, 50.0, 35.0, 46.0, 30.0, 21.0, 23.0, 24.0, 12.0, 16.0, 9.0, 14.0, 12.0, 4.0, 6.0, 12.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.14698791503906, -44.415069580078125, -42.68315124511719, -40.95123291015625, -39.21931457519531, -37.487396240234375, -35.75547790527344, -34.0235595703125, -32.29164123535156, -30.559722900390625, -28.827804565429688, -27.09588623046875, -25.363967895507812, -23.632049560546875, -21.900131225585938, -20.168212890625, -18.436294555664062, -16.704376220703125, -14.972457885742188, -13.24053955078125, -11.508621215820312, -9.776702880859375, -8.044784545898438, -6.3128662109375, -4.5809478759765625, -2.849029541015625, -1.1171112060546875, 0.61480712890625, 2.3467254638671875, 4.078643798828125, 5.8105621337890625, 7.54248046875, 9.274398803710938, 11.006317138671875, 12.738235473632812, 14.47015380859375, 16.202072143554688, 17.933990478515625, 19.665908813476562, 21.3978271484375, 23.129745483398438, 24.861663818359375, 26.593582153320312, 28.32550048828125, 30.057418823242188, 31.789337158203125, 33.52125549316406, 35.253173828125, 36.98509216308594, 38.717010498046875, 40.44892883300781, 42.18084716796875, 43.91276550292969, 45.644683837890625, 47.37660217285156, 49.1085205078125, 50.84043884277344, 52.572357177734375, 54.30427551269531, 56.03619384765625, 57.76811218261719, 59.500030517578125, 61.23194885253906, 62.9638671875, 64.69578552246094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 8.0, 22.0, 23.0, 44.0, 63.0, 104.0, 180.0, 271.0, 560.0, 1174.0, 2431.0, 5605.0, 16767.0, 75687.0, 502315.0, 2066373.0, 1264051.0, 206461.0, 35192.0, 9777.0, 3711.0, 1696.0, 747.0, 417.0, 221.0, 143.0, 85.0, 60.0, 26.0, 19.0, 12.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.58984375, -7.37158203125, -7.1533203125, -6.93505859375, -6.716796875, -6.49853515625, -6.2802734375, -6.06201171875, -5.84375, -5.62548828125, -5.4072265625, -5.18896484375, -4.970703125, -4.75244140625, -4.5341796875, -4.31591796875, -4.09765625, -3.87939453125, -3.6611328125, -3.44287109375, -3.224609375, -3.00634765625, -2.7880859375, -2.56982421875, -2.3515625, -2.13330078125, -1.9150390625, -1.69677734375, -1.478515625, -1.26025390625, -1.0419921875, -0.82373046875, -0.60546875, -0.38720703125, -0.1689453125, 0.04931640625, 0.267578125, 0.48583984375, 0.7041015625, 0.92236328125, 1.140625, 1.35888671875, 1.5771484375, 1.79541015625, 2.013671875, 2.23193359375, 2.4501953125, 2.66845703125, 2.88671875, 3.10498046875, 3.3232421875, 3.54150390625, 3.759765625, 3.97802734375, 4.1962890625, 4.41455078125, 4.6328125, 4.85107421875, 5.0693359375, 5.28759765625, 5.505859375, 5.72412109375, 5.9423828125, 6.16064453125, 6.37890625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 3.0, 9.0, 11.0, 4.0, 7.0, 12.0, 18.0, 20.0, 26.0, 14.0, 23.0, 21.0, 40.0, 29.0, 36.0, 35.0, 43.0, 26.0, 47.0, 51.0, 46.0, 36.0, 30.0, 40.0, 33.0, 45.0, 38.0, 32.0, 34.0, 27.0, 21.0, 19.0, 17.0, 13.0, 20.0, 11.0, 16.0, 10.0, 10.0, 9.0, 2.0, 3.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.232421875, -3.1390380859375, -3.045654296875, -2.9522705078125, -2.85888671875, -2.7655029296875, -2.672119140625, -2.5787353515625, -2.4853515625, -2.3919677734375, -2.298583984375, -2.2052001953125, -2.11181640625, -2.0184326171875, -1.925048828125, -1.8316650390625, -1.73828125, -1.6448974609375, -1.551513671875, -1.4581298828125, -1.36474609375, -1.2713623046875, -1.177978515625, -1.0845947265625, -0.9912109375, -0.8978271484375, -0.804443359375, -0.7110595703125, -0.61767578125, -0.5242919921875, -0.430908203125, -0.3375244140625, -0.244140625, -0.1507568359375, -0.057373046875, 0.0360107421875, 0.12939453125, 0.2227783203125, 0.316162109375, 0.4095458984375, 0.5029296875, 0.5963134765625, 0.689697265625, 0.7830810546875, 0.87646484375, 0.9698486328125, 1.063232421875, 1.1566162109375, 1.25, 1.3433837890625, 1.436767578125, 1.5301513671875, 1.62353515625, 1.7169189453125, 1.810302734375, 1.9036865234375, 1.9970703125, 2.0904541015625, 2.183837890625, 2.2772216796875, 2.37060546875, 2.4639892578125, 2.557373046875, 2.6507568359375, 2.744140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 9.0, 7.0, 18.0, 29.0, 47.0, 96.0, 210.0, 656.0, 2032.0, 14262.0, 4073343.0, 98343.0, 3692.0, 903.0, 374.0, 140.0, 56.0, 24.0, 16.0, 4.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.3125, -34.12353515625, -32.9345703125, -31.74560546875, -30.556640625, -29.36767578125, -28.1787109375, -26.98974609375, -25.80078125, -24.61181640625, -23.4228515625, -22.23388671875, -21.044921875, -19.85595703125, -18.6669921875, -17.47802734375, -16.2890625, -15.10009765625, -13.9111328125, -12.72216796875, -11.533203125, -10.34423828125, -9.1552734375, -7.96630859375, -6.77734375, -5.58837890625, -4.3994140625, -3.21044921875, -2.021484375, -0.83251953125, 0.3564453125, 1.54541015625, 2.734375, 3.92333984375, 5.1123046875, 6.30126953125, 7.490234375, 8.67919921875, 9.8681640625, 11.05712890625, 12.24609375, 13.43505859375, 14.6240234375, 15.81298828125, 17.001953125, 18.19091796875, 19.3798828125, 20.56884765625, 21.7578125, 22.94677734375, 24.1357421875, 25.32470703125, 26.513671875, 27.70263671875, 28.8916015625, 30.08056640625, 31.26953125, 32.45849609375, 33.6474609375, 34.83642578125, 36.025390625, 37.21435546875, 38.4033203125, 39.59228515625, 40.78125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 13.0, 21.0, 58.0, 101.0, 261.0, 468.0, 870.0, 1000.0, 669.0, 340.0, 143.0, 67.0, 38.0, 17.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.890625, -29.110595703125, -28.33056640625, -27.550537109375, -26.7705078125, -25.990478515625, -25.21044921875, -24.430419921875, -23.650390625, -22.870361328125, -22.09033203125, -21.310302734375, -20.5302734375, -19.750244140625, -18.97021484375, -18.190185546875, -17.41015625, -16.630126953125, -15.85009765625, -15.070068359375, -14.2900390625, -13.510009765625, -12.72998046875, -11.949951171875, -11.169921875, -10.389892578125, -9.60986328125, -8.829833984375, -8.0498046875, -7.269775390625, -6.48974609375, -5.709716796875, -4.9296875, -4.149658203125, -3.36962890625, -2.589599609375, -1.8095703125, -1.029541015625, -0.24951171875, 0.530517578125, 1.310546875, 2.090576171875, 2.87060546875, 3.650634765625, 4.4306640625, 5.210693359375, 5.99072265625, 6.770751953125, 7.55078125, 8.330810546875, 9.11083984375, 9.890869140625, 10.6708984375, 11.450927734375, 12.23095703125, 13.010986328125, 13.791015625, 14.571044921875, 15.35107421875, 16.131103515625, 16.9111328125, 17.691162109375, 18.47119140625, 19.251220703125, 20.03125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 10.0, 10.0, 22.0, 33.0, 66.0, 135.0, 240.0, 230.0, 137.0, 49.0, 26.0, 13.0, 10.0, 5.0, 8.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-307.7391357421875, -301.7035217285156, -295.6678771972656, -289.63226318359375, -283.5966491699219, -277.5610046386719, -271.525390625, -265.4897766113281, -259.4541320800781, -253.4185028076172, -247.3828887939453, -241.34725952148438, -235.31163024902344, -229.2760009765625, -223.24038696289062, -217.2047576904297, -211.1691436767578, -205.13351440429688, -199.097900390625, -193.06227111816406, -187.02664184570312, -180.99102783203125, -174.9553985595703, -168.91976928710938, -162.8841552734375, -156.84852600097656, -150.8129119873047, -144.77728271484375, -138.7416534423828, -132.70602416992188, -126.67041015625, -120.63478088378906, -114.59915161132812, -108.56352996826172, -102.52790069580078, -96.49227905273438, -90.45664978027344, -84.42102813720703, -78.38540649414062, -72.34977722167969, -66.31415557861328, -60.27853012084961, -54.24290466308594, -48.20728302001953, -42.17165756225586, -36.13603210449219, -30.10041046142578, -24.06478500366211, -18.029159545898438, -11.993535041809082, -5.957910537719727, 0.0777130126953125, 6.113338470458984, 12.148963928222656, 18.184585571289062, 24.220211029052734, 30.255836486816406, 36.29146194458008, 42.32708740234375, 48.362709045410156, 54.39833450317383, 60.4339599609375, 66.4695816040039, 72.50520324707031, 78.54083251953125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 4.0, 3.0, 8.0, 24.0, 21.0, 21.0, 31.0, 37.0, 38.0, 34.0, 43.0, 44.0, 47.0, 69.0, 72.0, 74.0, 61.0, 45.0, 51.0, 43.0, 32.0, 32.0, 28.0, 29.0, 20.0, 8.0, 11.0, 16.0, 12.0, 11.0, 4.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.11773681640625, -72.55535888671875, -69.99298095703125, -67.43060302734375, -64.86823272705078, -62.30585479736328, -59.74347686767578, -57.18109893798828, -54.61872100830078, -52.05634307861328, -49.49396896362305, -46.93159103393555, -44.36921310424805, -41.80683898925781, -39.24446105957031, -36.68208312988281, -34.11970901489258, -31.55733299255371, -28.99495506286621, -26.432579040527344, -23.870201110839844, -21.307825088500977, -18.74544906616211, -16.18307113647461, -13.620695114135742, -11.058318138122559, -8.495941162109375, -5.933565139770508, -3.371188163757324, -0.8088111877441406, 1.7535648345947266, 4.315942764282227, 6.878318786621094, 9.440695762634277, 12.003072738647461, 14.565448760986328, 17.127826690673828, 19.690202713012695, 22.252578735351562, 24.814956665039062, 27.37733268737793, 29.939708709716797, 32.5020866394043, 35.06446075439453, 37.62683868408203, 40.18921661376953, 42.75159454345703, 45.31397247314453, 47.876346588134766, 50.438724517822266, 53.0010986328125, 55.5634765625, 58.1258544921875, 60.688232421875, 63.250606536865234, 65.81298828125, 68.37535858154297, 70.93773651123047, 73.50011444091797, 76.06248474121094, 78.62486267089844, 81.18724060058594, 83.74961853027344, 86.31199645996094, 88.87437438964844]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 8.0, 11.0, 19.0, 31.0, 32.0, 54.0, 81.0, 125.0, 170.0, 322.0, 469.0, 851.0, 1579.0, 3023.0, 6857.0, 17587.0, 52685.0, 207330.0, 568920.0, 128472.0, 36209.0, 12696.0, 5240.0, 2483.0, 1317.0, 738.0, 434.0, 275.0, 174.0, 87.0, 69.0, 58.0, 38.0, 35.0, 14.0, 14.0, 9.0, 3.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.0560302734375, -3.889404296875, -3.7227783203125, -3.55615234375, -3.3895263671875, -3.222900390625, -3.0562744140625, -2.8896484375, -2.7230224609375, -2.556396484375, -2.3897705078125, -2.22314453125, -2.0565185546875, -1.889892578125, -1.7232666015625, -1.556640625, -1.3900146484375, -1.223388671875, -1.0567626953125, -0.89013671875, -0.7235107421875, -0.556884765625, -0.3902587890625, -0.2236328125, -0.0570068359375, 0.109619140625, 0.2762451171875, 0.44287109375, 0.6094970703125, 0.776123046875, 0.9427490234375, 1.109375, 1.2760009765625, 1.442626953125, 1.6092529296875, 1.77587890625, 1.9425048828125, 2.109130859375, 2.2757568359375, 2.4423828125, 2.6090087890625, 2.775634765625, 2.9422607421875, 3.10888671875, 3.2755126953125, 3.442138671875, 3.6087646484375, 3.775390625, 3.9420166015625, 4.108642578125, 4.2752685546875, 4.44189453125, 4.6085205078125, 4.775146484375, 4.9417724609375, 5.1083984375, 5.2750244140625, 5.441650390625, 5.6082763671875, 5.77490234375, 5.9415283203125, 6.108154296875, 6.2747802734375, 6.44140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 3.0, 10.0, 13.0, 9.0, 13.0, 26.0, 27.0, 38.0, 44.0, 54.0, 69.0, 76.0, 68.0, 72.0, 80.0, 58.0, 52.0, 42.0, 48.0, 33.0, 31.0, 25.0, 24.0, 23.0, 15.0, 13.0, 10.0, 9.0, 7.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.10546875, -5.901611328125, -5.69775390625, -5.493896484375, -5.2900390625, -5.086181640625, -4.88232421875, -4.678466796875, -4.474609375, -4.270751953125, -4.06689453125, -3.863037109375, -3.6591796875, -3.455322265625, -3.25146484375, -3.047607421875, -2.84375, -2.639892578125, -2.43603515625, -2.232177734375, -2.0283203125, -1.824462890625, -1.62060546875, -1.416748046875, -1.212890625, -1.009033203125, -0.80517578125, -0.601318359375, -0.3974609375, -0.193603515625, 0.01025390625, 0.214111328125, 0.41796875, 0.621826171875, 0.82568359375, 1.029541015625, 1.2333984375, 1.437255859375, 1.64111328125, 1.844970703125, 2.048828125, 2.252685546875, 2.45654296875, 2.660400390625, 2.8642578125, 3.068115234375, 3.27197265625, 3.475830078125, 3.6796875, 3.883544921875, 4.08740234375, 4.291259765625, 4.4951171875, 4.698974609375, 4.90283203125, 5.106689453125, 5.310546875, 5.514404296875, 5.71826171875, 5.922119140625, 6.1259765625, 6.329833984375, 6.53369140625, 6.737548828125, 6.94140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 7.0, 14.0, 18.0, 29.0, 38.0, 46.0, 74.0, 108.0, 207.0, 310.0, 788.0, 2157.0, 12386.0, 342593.0, 672668.0, 13263.0, 2210.0, 758.0, 324.0, 179.0, 122.0, 85.0, 49.0, 33.0, 23.0, 20.0, 11.0, 12.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0859375, -9.7498779296875, -9.413818359375, -9.0777587890625, -8.74169921875, -8.4056396484375, -8.069580078125, -7.7335205078125, -7.3974609375, -7.0614013671875, -6.725341796875, -6.3892822265625, -6.05322265625, -5.7171630859375, -5.381103515625, -5.0450439453125, -4.708984375, -4.3729248046875, -4.036865234375, -3.7008056640625, -3.36474609375, -3.0286865234375, -2.692626953125, -2.3565673828125, -2.0205078125, -1.6844482421875, -1.348388671875, -1.0123291015625, -0.67626953125, -0.3402099609375, -0.004150390625, 0.3319091796875, 0.66796875, 1.0040283203125, 1.340087890625, 1.6761474609375, 2.01220703125, 2.3482666015625, 2.684326171875, 3.0203857421875, 3.3564453125, 3.6925048828125, 4.028564453125, 4.3646240234375, 4.70068359375, 5.0367431640625, 5.372802734375, 5.7088623046875, 6.044921875, 6.3809814453125, 6.717041015625, 7.0531005859375, 7.38916015625, 7.7252197265625, 8.061279296875, 8.3973388671875, 8.7333984375, 9.0694580078125, 9.405517578125, 9.7415771484375, 10.07763671875, 10.4136962890625, 10.749755859375, 11.0858154296875, 11.421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 3.0, 12.0, 13.0, 17.0, 24.0, 18.0, 31.0, 29.0, 38.0, 45.0, 52.0, 62.0, 80.0, 103.0, 83.0, 63.0, 64.0, 38.0, 36.0, 33.0, 23.0, 20.0, 12.0, 20.0, 20.0, 12.0, 10.0, 8.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.21875, -20.586181640625, -19.95361328125, -19.321044921875, -18.6884765625, -18.055908203125, -17.42333984375, -16.790771484375, -16.158203125, -15.525634765625, -14.89306640625, -14.260498046875, -13.6279296875, -12.995361328125, -12.36279296875, -11.730224609375, -11.09765625, -10.465087890625, -9.83251953125, -9.199951171875, -8.5673828125, -7.934814453125, -7.30224609375, -6.669677734375, -6.037109375, -5.404541015625, -4.77197265625, -4.139404296875, -3.5068359375, -2.874267578125, -2.24169921875, -1.609130859375, -0.9765625, -0.343994140625, 0.28857421875, 0.921142578125, 1.5537109375, 2.186279296875, 2.81884765625, 3.451416015625, 4.083984375, 4.716552734375, 5.34912109375, 5.981689453125, 6.6142578125, 7.246826171875, 7.87939453125, 8.511962890625, 9.14453125, 9.777099609375, 10.40966796875, 11.042236328125, 11.6748046875, 12.307373046875, 12.93994140625, 13.572509765625, 14.205078125, 14.837646484375, 15.47021484375, 16.102783203125, 16.7353515625, 17.367919921875, 18.00048828125, 18.633056640625, 19.265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 6.0, 9.0, 10.0, 14.0, 29.0, 59.0, 105.0, 197.0, 472.0, 1288.0, 4854.0, 32320.0, 899592.0, 96278.0, 9924.0, 2113.0, 732.0, 262.0, 129.0, 57.0, 40.0, 25.0, 13.0, 7.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.93194580078125, -1.8746337890625, -1.81732177734375, -1.760009765625, -1.70269775390625, -1.6453857421875, -1.58807373046875, -1.53076171875, -1.47344970703125, -1.4161376953125, -1.35882568359375, -1.301513671875, -1.24420166015625, -1.1868896484375, -1.12957763671875, -1.072265625, -1.01495361328125, -0.9576416015625, -0.90032958984375, -0.843017578125, -0.78570556640625, -0.7283935546875, -0.67108154296875, -0.61376953125, -0.55645751953125, -0.4991455078125, -0.44183349609375, -0.384521484375, -0.32720947265625, -0.2698974609375, -0.21258544921875, -0.1552734375, -0.09796142578125, -0.0406494140625, 0.01666259765625, 0.073974609375, 0.13128662109375, 0.1885986328125, 0.24591064453125, 0.30322265625, 0.36053466796875, 0.4178466796875, 0.47515869140625, 0.532470703125, 0.58978271484375, 0.6470947265625, 0.70440673828125, 0.76171875, 0.81903076171875, 0.8763427734375, 0.93365478515625, 0.990966796875, 1.04827880859375, 1.1055908203125, 1.16290283203125, 1.22021484375, 1.27752685546875, 1.3348388671875, 1.39215087890625, 1.449462890625, 1.50677490234375, 1.5640869140625, 1.62139892578125, 1.6787109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 2.0, 8.0, 4.0, 7.0, 13.0, 15.0, 17.0, 29.0, 30.0, 46.0, 39.0, 68.0, 77.0, 110.0, 115.0, 78.0, 83.0, 63.0, 32.0, 36.0, 30.0, 14.0, 19.0, 11.0, 8.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003216266632080078, -0.0003116726875305176, -0.00030171871185302734, -0.0002917647361755371, -0.0002818107604980469, -0.00027185678482055664, -0.0002619028091430664, -0.00025194883346557617, -0.00024199485778808594, -0.0002320408821105957, -0.00022208690643310547, -0.00021213293075561523, -0.000202178955078125, -0.00019222497940063477, -0.00018227100372314453, -0.0001723170280456543, -0.00016236305236816406, -0.00015240907669067383, -0.0001424551010131836, -0.00013250112533569336, -0.00012254714965820312, -0.00011259317398071289, -0.00010263919830322266, -9.268522262573242e-05, -8.273124694824219e-05, -7.277727127075195e-05, -6.282329559326172e-05, -5.2869319915771484e-05, -4.291534423828125e-05, -3.2961368560791016e-05, -2.300739288330078e-05, -1.3053417205810547e-05, -3.0994415283203125e-06, 6.854534149169922e-06, 1.6808509826660156e-05, 2.676248550415039e-05, 3.6716461181640625e-05, 4.667043685913086e-05, 5.6624412536621094e-05, 6.657838821411133e-05, 7.653236389160156e-05, 8.64863395690918e-05, 9.644031524658203e-05, 0.00010639429092407227, 0.0001163482666015625, 0.00012630224227905273, 0.00013625621795654297, 0.0001462101936340332, 0.00015616416931152344, 0.00016611814498901367, 0.0001760721206665039, 0.00018602609634399414, 0.00019598007202148438, 0.0002059340476989746, 0.00021588802337646484, 0.00022584199905395508, 0.0002357959747314453, 0.00024574995040893555, 0.0002557039260864258, 0.000265657901763916, 0.00027561187744140625, 0.0002855658531188965, 0.0002955198287963867, 0.00030547380447387695, 0.0003154277801513672]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 9.0, 19.0, 25.0, 48.0, 74.0, 113.0, 197.0, 441.0, 913.0, 2499.0, 7410.0, 28366.0, 253530.0, 710558.0, 31667.0, 8055.0, 2621.0, 1037.0, 444.0, 230.0, 116.0, 66.0, 37.0, 26.0, 15.0, 12.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3798828125, -1.3339385986328125, -1.287994384765625, -1.2420501708984375, -1.19610595703125, -1.1501617431640625, -1.104217529296875, -1.0582733154296875, -1.0123291015625, -0.9663848876953125, -0.920440673828125, -0.8744964599609375, -0.82855224609375, -0.7826080322265625, -0.736663818359375, -0.6907196044921875, -0.644775390625, -0.5988311767578125, -0.552886962890625, -0.5069427490234375, -0.46099853515625, -0.4150543212890625, -0.369110107421875, -0.3231658935546875, -0.2772216796875, -0.2312774658203125, -0.185333251953125, -0.1393890380859375, -0.09344482421875, -0.0475006103515625, -0.001556396484375, 0.0443878173828125, 0.09033203125, 0.1362762451171875, 0.182220458984375, 0.2281646728515625, 0.27410888671875, 0.3200531005859375, 0.365997314453125, 0.4119415283203125, 0.4578857421875, 0.5038299560546875, 0.549774169921875, 0.5957183837890625, 0.64166259765625, 0.6876068115234375, 0.733551025390625, 0.7794952392578125, 0.825439453125, 0.8713836669921875, 0.917327880859375, 0.9632720947265625, 1.00921630859375, 1.0551605224609375, 1.101104736328125, 1.1470489501953125, 1.1929931640625, 1.2389373779296875, 1.284881591796875, 1.3308258056640625, 1.37677001953125, 1.4227142333984375, 1.468658447265625, 1.5146026611328125, 1.560546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 10.0, 8.0, 10.0, 16.0, 18.0, 23.0, 38.0, 67.0, 113.0, 157.0, 174.0, 124.0, 85.0, 39.0, 28.0, 20.0, 21.0, 13.0, 4.0, 12.0, 3.0, 6.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6083984375, -1.5393218994140625, -1.470245361328125, -1.4011688232421875, -1.33209228515625, -1.2630157470703125, -1.193939208984375, -1.1248626708984375, -1.0557861328125, -0.9867095947265625, -0.917633056640625, -0.8485565185546875, -0.77947998046875, -0.7104034423828125, -0.641326904296875, -0.5722503662109375, -0.503173828125, -0.4340972900390625, -0.365020751953125, -0.2959442138671875, -0.22686767578125, -0.1577911376953125, -0.088714599609375, -0.0196380615234375, 0.0494384765625, 0.1185150146484375, 0.187591552734375, 0.2566680908203125, 0.32574462890625, 0.3948211669921875, 0.463897705078125, 0.5329742431640625, 0.60205078125, 0.6711273193359375, 0.740203857421875, 0.8092803955078125, 0.87835693359375, 0.9474334716796875, 1.016510009765625, 1.0855865478515625, 1.1546630859375, 1.2237396240234375, 1.292816162109375, 1.3618927001953125, 1.43096923828125, 1.5000457763671875, 1.569122314453125, 1.6381988525390625, 1.707275390625, 1.7763519287109375, 1.845428466796875, 1.9145050048828125, 1.98358154296875, 2.0526580810546875, 2.121734619140625, 2.1908111572265625, 2.2598876953125, 2.3289642333984375, 2.398040771484375, 2.4671173095703125, 2.53619384765625, 2.6052703857421875, 2.674346923828125, 2.7434234619140625, 2.8125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 10.0, 32.0, 40.0, 76.0, 289.0, 405.0, 68.0, 40.0, 17.0, 10.0, 9.0, 2.0, 3.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.4432373046875, -111.95817565917969, -109.47310638427734, -106.988037109375, -104.50297546386719, -102.01791381835938, -99.53284454345703, -97.04777526855469, -94.56271362304688, -92.07765197753906, -89.59258270263672, -87.10751342773438, -84.62245178222656, -82.13739013671875, -79.6523208618164, -77.16725158691406, -74.68218994140625, -72.19712829589844, -69.7120590209961, -67.22698974609375, -64.74192810058594, -62.25686264038086, -59.77179718017578, -57.2867317199707, -54.801666259765625, -52.31660079956055, -49.83153533935547, -47.34646987915039, -44.86140441894531, -42.376338958740234, -39.891273498535156, -37.40620803833008, -34.92115020751953, -32.43608474731445, -29.951019287109375, -27.465953826904297, -24.98088836669922, -22.49582290649414, -20.010757446289062, -17.525691986083984, -15.040626525878906, -12.555561065673828, -10.07049560546875, -7.585430145263672, -5.100364685058594, -2.6152992248535156, -0.1302337646484375, 2.3548316955566406, 4.839897155761719, 7.324962615966797, 9.810028076171875, 12.295093536376953, 14.780158996582031, 17.26522445678711, 19.750289916992188, 22.235355377197266, 24.720420837402344, 27.205486297607422, 29.6905517578125, 32.17561721801758, 34.660682678222656, 37.145748138427734, 39.63081359863281, 42.11587905883789, 44.60094451904297]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 4.0, 9.0, 7.0, 12.0, 11.0, 8.0, 11.0, 10.0, 25.0, 11.0, 11.0, 25.0, 19.0, 21.0, 33.0, 89.0, 170.0, 180.0, 87.0, 33.0, 26.0, 39.0, 27.0, 15.0, 12.0, 14.0, 12.0, 9.0, 14.0, 6.0, 10.0, 10.0, 6.0, 1.0, 9.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.523048400878906, -45.11537551879883, -43.70770263671875, -42.30002975463867, -40.892356872558594, -39.48468780517578, -38.07701110839844, -36.669342041015625, -35.26166915893555, -33.85399627685547, -32.44632339477539, -31.038650512695312, -29.630979537963867, -28.22330665588379, -26.81563377380371, -25.407962799072266, -24.000288009643555, -22.592615127563477, -21.1849422454834, -19.777271270751953, -18.369598388671875, -16.961925506591797, -15.554252624511719, -14.146580696105957, -12.738907814025879, -11.3312349319458, -9.923563003540039, -8.515890121459961, -7.108217716217041, -5.700545310974121, -4.292872428894043, -2.8852005004882812, -1.4775276184082031, -0.06985509395599365, 1.3378174304962158, 2.745490074157715, 4.153162479400635, 5.560834884643555, 6.968507766723633, 8.376179695129395, 9.783852577209473, 11.19152545928955, 12.599197387695312, 14.00687026977539, 15.414543151855469, 16.822216033935547, 18.229888916015625, 19.63755989074707, 21.04523277282715, 22.452905654907227, 23.860578536987305, 25.26824951171875, 26.675922393798828, 28.083595275878906, 29.491268157958984, 30.898941040039062, 32.30661392211914, 33.71428680419922, 35.1219596862793, 36.529632568359375, 37.93730545043945, 39.34497833251953, 40.752647399902344, 42.16032028198242, 43.5679931640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 2.0, 9.0, 11.0, 14.0, 12.0, 11.0, 7.0, 16.0, 21.0, 23.0, 39.0, 23.0, 30.0, 30.0, 47.0, 49.0, 162.0, 156.0, 61.0, 32.0, 32.0, 27.0, 27.0, 18.0, 26.0, 20.0, 15.0, 12.0, 8.0, 12.0, 3.0, 6.0, 7.0, 4.0, 1.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.7734375, -4.6328125, -4.4921875, -4.3515625, -4.2109375, -4.0703125, -3.9296875, -3.7890625, -3.6484375, -3.5078125, -3.3671875, -3.2265625, -3.0859375, -2.9453125, -2.8046875, -2.6640625, -2.5234375, -2.3828125, -2.2421875, -2.1015625, -1.9609375, -1.8203125, -1.6796875, -1.5390625, -1.3984375, -1.2578125, -1.1171875, -0.9765625, -0.8359375, -0.6953125, -0.5546875, -0.4140625, -0.2734375, -0.1328125, 0.0078125, 0.1484375, 0.2890625, 0.4296875, 0.5703125, 0.7109375, 0.8515625, 0.9921875, 1.1328125, 1.2734375, 1.4140625, 1.5546875, 1.6953125, 1.8359375, 1.9765625, 2.1171875, 2.2578125, 2.3984375, 2.5390625, 2.6796875, 2.8203125, 2.9609375, 3.1015625, 3.2421875, 3.3828125, 3.5234375, 3.6640625, 3.8046875, 3.9453125, 4.0859375, 4.2265625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 11.0, 2.0, 3.0, 7.0, 19.0, 12.0, 28.0, 29.0, 60.0, 90.0, 188.0, 457.0, 1906.0, 14915.0, 8357494.0, 11014.0, 1579.0, 421.0, 142.0, 69.0, 39.0, 26.0, 21.0, 17.0, 17.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-56.41648864746094, -54.67768859863281, -52.93889236450195, -51.200096130371094, -49.46129608154297, -47.722496032714844, -45.983699798583984, -44.244903564453125, -42.506103515625, -40.767303466796875, -39.028507232666016, -37.289710998535156, -35.55091094970703, -33.812110900878906, -32.07331466674805, -30.334516525268555, -28.595718383789062, -26.85692024230957, -25.118122100830078, -23.379323959350586, -21.640525817871094, -19.9017276763916, -18.16292953491211, -16.424131393432617, -14.685333251953125, -12.946535110473633, -11.20773696899414, -9.468938827514648, -7.730140686035156, -5.991342544555664, -4.252544403076172, -2.5137462615966797, -0.7749443054199219, 0.9638538360595703, 2.7026519775390625, 4.441450119018555, 6.180248260498047, 7.919046401977539, 9.657844543457031, 11.396642684936523, 13.135440826416016, 14.874238967895508, 16.613037109375, 18.351835250854492, 20.090633392333984, 21.829431533813477, 23.56822967529297, 25.30702781677246, 27.045825958251953, 28.784624099731445, 30.523422241210938, 32.26222229003906, 34.00101852416992, 35.73981475830078, 37.478614807128906, 39.21741485595703, 40.95621109008789, 42.69500732421875, 44.433807373046875, 46.172607421875, 47.91140365600586, 49.65019989013672, 51.388999938964844, 53.12779998779297, 54.86659622192383]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 5.0, 4.0, 2.0, 6.0, 7.0, 9.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-104.98562622070312, -101.93575286865234, -98.88587951660156, -95.83599853515625, -92.78612518310547, -89.73625183105469, -86.6863784790039, -83.63650512695312, -80.58662414550781, -77.53675079345703, -74.48687744140625, -71.43699645996094, -68.38712310791016, -65.33724975585938, -62.287376403808594, -59.23749923706055, -56.187625885009766, -53.137752532958984, -50.08787536621094, -47.038002014160156, -43.98812484741211, -40.93825149536133, -37.88837432861328, -34.8385009765625, -31.788625717163086, -28.738750457763672, -25.688875198364258, -22.638999938964844, -19.589126586914062, -16.539249420166016, -13.489376068115234, -10.43950080871582, -7.389625549316406, -4.339750289916992, -1.2898755073547363, 1.7599992752075195, 4.809874534606934, 7.859749794006348, 10.909624099731445, 13.95949935913086, 17.009374618530273, 20.059249877929688, 23.1091251373291, 26.159000396728516, 29.208873748779297, 32.258750915527344, 35.308624267578125, 38.358497619628906, 41.40837478637695, 44.458248138427734, 47.50812530517578, 50.55799865722656, 53.60787582397461, 56.65774917602539, 59.70762634277344, 62.75749969482422, 65.807373046875, 68.85724639892578, 71.90711975097656, 74.95700073242188, 78.00687408447266, 81.05674743652344, 84.10662078857422, 87.156494140625, 90.20637512207031]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 7.0, 11.0, 14.0, 23.0, 20.0, 24.0, 32.0, 42.0, 43.0, 47.0, 59.0, 60.0, 62.0, 65.0, 57.0, 69.0, 61.0, 51.0, 41.0, 31.0, 29.0, 23.0, 26.0, 21.0, 23.0, 13.0, 9.0, 3.0, 5.0, 7.0, 5.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.421875, -2.32037353515625, -2.2188720703125, -2.11737060546875, -2.015869140625, -1.91436767578125, -1.8128662109375, -1.71136474609375, -1.60986328125, -1.50836181640625, -1.4068603515625, -1.30535888671875, -1.203857421875, -1.10235595703125, -1.0008544921875, -0.89935302734375, -0.7978515625, -0.69635009765625, -0.5948486328125, -0.49334716796875, -0.391845703125, -0.29034423828125, -0.1888427734375, -0.08734130859375, 0.01416015625, 0.11566162109375, 0.2171630859375, 0.31866455078125, 0.420166015625, 0.52166748046875, 0.6231689453125, 0.72467041015625, 0.826171875, 0.92767333984375, 1.0291748046875, 1.13067626953125, 1.232177734375, 1.33367919921875, 1.4351806640625, 1.53668212890625, 1.63818359375, 1.73968505859375, 1.8411865234375, 1.94268798828125, 2.044189453125, 2.14569091796875, 2.2471923828125, 2.34869384765625, 2.4501953125, 2.55169677734375, 2.6531982421875, 2.75469970703125, 2.856201171875, 2.95770263671875, 3.0592041015625, 3.16070556640625, 3.26220703125, 3.36370849609375, 3.4652099609375, 3.56671142578125, 3.668212890625, 3.76971435546875, 3.8712158203125, 3.97271728515625, 4.07421875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 7.0, 13.0, 10.0, 14.0, 18.0, 34.0, 44.0, 50.0, 67.0, 99.0, 138.0, 243.0, 474.0, 861.0, 1871.0, 3982.0, 9090.0, 21861.0, 53430.0, 127267.0, 162883.0, 83381.0, 33403.0, 13733.0, 5812.0, 2608.0, 1251.0, 580.0, 346.0, 211.0, 142.0, 77.0, 73.0, 34.0, 44.0, 30.0, 22.0, 15.0, 11.0, 6.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.953125, -22.167724609375, -21.38232421875, -20.596923828125, -19.8115234375, -19.026123046875, -18.24072265625, -17.455322265625, -16.669921875, -15.884521484375, -15.09912109375, -14.313720703125, -13.5283203125, -12.742919921875, -11.95751953125, -11.172119140625, -10.38671875, -9.601318359375, -8.81591796875, -8.030517578125, -7.2451171875, -6.459716796875, -5.67431640625, -4.888916015625, -4.103515625, -3.318115234375, -2.53271484375, -1.747314453125, -0.9619140625, -0.176513671875, 0.60888671875, 1.394287109375, 2.1796875, 2.965087890625, 3.75048828125, 4.535888671875, 5.3212890625, 6.106689453125, 6.89208984375, 7.677490234375, 8.462890625, 9.248291015625, 10.03369140625, 10.819091796875, 11.6044921875, 12.389892578125, 13.17529296875, 13.960693359375, 14.74609375, 15.531494140625, 16.31689453125, 17.102294921875, 17.8876953125, 18.673095703125, 19.45849609375, 20.243896484375, 21.029296875, 21.814697265625, 22.60009765625, 23.385498046875, 24.1708984375, 24.956298828125, 25.74169921875, 26.527099609375, 27.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 7.0, 8.0, 20.0, 20.0, 17.0, 27.0, 36.0, 43.0, 65.0, 63.0, 61.0, 62.0, 81.0, 60.0, 69.0, 66.0, 50.0, 38.0, 40.0, 37.0, 28.0, 21.0, 12.0, 10.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.0933837890625, -4.925048828125, -4.7567138671875, -4.58837890625, -4.4200439453125, -4.251708984375, -4.0833740234375, -3.9150390625, -3.7467041015625, -3.578369140625, -3.4100341796875, -3.24169921875, -3.0733642578125, -2.905029296875, -2.7366943359375, -2.568359375, -2.4000244140625, -2.231689453125, -2.0633544921875, -1.89501953125, -1.7266845703125, -1.558349609375, -1.3900146484375, -1.2216796875, -1.0533447265625, -0.885009765625, -0.7166748046875, -0.54833984375, -0.3800048828125, -0.211669921875, -0.0433349609375, 0.125, 0.2933349609375, 0.461669921875, 0.6300048828125, 0.79833984375, 0.9666748046875, 1.135009765625, 1.3033447265625, 1.4716796875, 1.6400146484375, 1.808349609375, 1.9766845703125, 2.14501953125, 2.3133544921875, 2.481689453125, 2.6500244140625, 2.818359375, 2.9866943359375, 3.155029296875, 3.3233642578125, 3.49169921875, 3.6600341796875, 3.828369140625, 3.9967041015625, 4.1650390625, 4.3333740234375, 4.501708984375, 4.6700439453125, 4.83837890625, 5.0067138671875, 5.175048828125, 5.3433837890625, 5.51171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 3.0, 6.0, 20.0, 24.0, 44.0, 65.0, 83.0, 67.0, 51.0, 39.0, 27.0, 11.0, 5.0, 5.0, 10.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-45.1645622253418, -44.09144973754883, -43.01833724975586, -41.94522476196289, -40.87211227416992, -39.79899597167969, -38.72588348388672, -37.65277099609375, -36.57965850830078, -35.50654602050781, -34.433433532714844, -33.360321044921875, -32.287208557128906, -31.214094161987305, -30.140981674194336, -29.067869186401367, -27.9947566986084, -26.92164421081543, -25.84853172302246, -24.77541732788086, -23.70230484008789, -22.629192352294922, -21.556079864501953, -20.482967376708984, -19.409854888916016, -18.336742401123047, -17.263629913330078, -16.19051742553711, -15.117403030395508, -14.044290542602539, -12.97117805480957, -11.898065567016602, -10.824951171875, -9.751838684082031, -8.678725242614746, -7.605612754821777, -6.53249979019165, -5.459386825561523, -4.386274337768555, -3.3131613731384277, -2.240048408508301, -1.1669355630874634, -0.09382271766662598, 0.9792900085449219, 2.052402973175049, 3.125515937805176, 4.1986284255981445, 5.2717413902282715, 6.344854354858398, 7.417967319488525, 8.491080284118652, 9.564192771911621, 10.637306213378906, 11.710418701171875, 12.783531188964844, 13.856643676757812, 14.929757118225098, 16.002870559692383, 17.07598304748535, 18.14909553527832, 19.22220802307129, 20.29532241821289, 21.36843490600586, 22.441547393798828, 23.514659881591797]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 5.0, 3.0, 0.0, 6.0, 1.0, 6.0, 3.0, 5.0, 11.0, 15.0, 34.0, 49.0, 67.0, 71.0, 55.0, 49.0, 29.0, 16.0, 8.0, 6.0, 1.0, 7.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.482685089111328, -22.64385414123535, -21.805023193359375, -20.96619415283203, -20.127363204956055, -19.288532257080078, -18.449703216552734, -17.610872268676758, -16.77204132080078, -15.933210372924805, -15.094380378723145, -14.255550384521484, -13.416719436645508, -12.577888488769531, -11.739058494567871, -10.900228500366211, -10.061397552490234, -9.222566604614258, -8.383736610412598, -7.544906139373779, -6.706075668334961, -5.867245197296143, -5.028414726257324, -4.189584255218506, -3.3507537841796875, -2.511923313140869, -1.6730928421020508, -0.8342623710632324, 0.0045680999755859375, 0.8433985710144043, 1.6822290420532227, 2.521059513092041, 3.359891891479492, 4.1987223625183105, 5.037552833557129, 5.876383304595947, 6.715213775634766, 7.554044246673584, 8.392874717712402, 9.231704711914062, 10.070535659790039, 10.909366607666016, 11.748196601867676, 12.587026596069336, 13.425857543945312, 14.264688491821289, 15.10351848602295, 15.94234848022461, 16.781179428100586, 17.620010375976562, 18.458839416503906, 19.297670364379883, 20.13650131225586, 20.975332260131836, 21.814163208007812, 22.652992248535156, 23.491823196411133, 24.33065414428711, 25.169483184814453, 26.00831413269043, 26.847145080566406, 27.685976028442383, 28.52480697631836, 29.363636016845703, 30.20246696472168]}, "eval/loss": 6.056567668914795, "eval/wer": 1.275446251487505, "eval/runtime": 640.1555, "eval/samples_per_second": 4.127, "eval/steps_per_second": 0.517} \ No newline at end of file